From c7ba58f07c6583614f74d906bbce796e24042522 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 1 Nov 2021 16:12:39 -0400
Subject: [PATCH 01/46] Initial draft of a DFT interface and FFTW
 implementation

---
 aux/inc/WireCellAux/FftwDFT.h    |  42 ++++++++++++
 aux/src/FftwDFT.cxx              | 113 +++++++++++++++++++++++++++++++
 iface/README.org                 |  59 ++++++++++++++++
 iface/inc/WireCellIface/IDFT.h   |  56 +++++++++++++++
 iface/src/IDFT.cxx               |  25 +++++++
 util/inc/WireCellUtil/Waveform.h |   4 ++
 util/src/Waveform.cxx            |  16 +++++
 7 files changed, 315 insertions(+)
 create mode 100644 aux/inc/WireCellAux/FftwDFT.h
 create mode 100644 aux/src/FftwDFT.cxx
 create mode 100644 iface/inc/WireCellIface/IDFT.h
 create mode 100644 iface/src/IDFT.cxx
diff --git a/aux/inc/WireCellAux/FftwDFT.h b/aux/inc/WireCellAux/FftwDFT.h
new file mode 100644
index 000000000..ad265eef7
--- /dev/null
+++ b/aux/inc/WireCellAux/FftwDFT.h
@@ -0,0 +1,42 @@
+#ifndef WIRECELLAUX_FFTWDFT
+#define WIRECELLAUX_FFTWDFT
+
+#include "WireCellIface/IDFT.h"
+
+namespace WireCell::Aux {
+
+    /** 
+        FftwDFT provides IDFT based on FFTW3.        
+    */
+    class FftwDFT : public IDFT {
+      public:
+        
+        FftwDFT();
+        virtual ~FftwDFT();
+
+        // 1d 
+
+        virtual 
+        void fwd1d(const complex_t* in, complex_t* out,
+                   int stride) const = 0;
+
+        virtual 
+        void inv1d(const complex_t* in, complex_t* out,
+                   int stride) const = 0;
+
+        // batched 1D ("1b") - rely on base implementation
+
+        // 2d
+
+        virtual 
+        void fwd2d(const complex_t* in, complex_t* out,
+                   int stride, int nstrides) const = 0;
+        virtual 
+        void inv2d(const complex_t* in, complex_t* out,
+                   int stride, int nstrides) const = 0;
+
+
+    };
+}
+
+#endif
diff --git a/aux/src/FftwDFT.cxx b/aux/src/FftwDFT.cxx
new file mode 100644
index 000000000..85f6b0820
--- /dev/null
+++ b/aux/src/FftwDFT.cxx
@@ -0,0 +1,113 @@
+#include "WireCellAux/FftwDFT.h"
+#include <fftw3.h>
+#include <mutex>
+#include <shared_mutex>
+#include <unordered_map>
+
+
+using namespace WireCell;
+
+using plan_key_t = int64_t;
+using plan_type = fftwf_plan;
+using plan_map_t = std::unordered_map<plan_key_t, plan_type>;
+using plan_val_t = fftwf_complex;
+
+static
+plan_key_t make_key(bool inverse, const void * src, void * dst, int n0, int n1)
+{
+    bool inplace = (dst==src);
+    bool aligned = ( (reinterpret_cast<size_t>(src)&15) | (reinterpret_cast<size_t>(dst)&15) ) == 0;
+    int64_t key = ( ( (((int64_t)n0) << 30)|(n1<<3 ) | (inverse<<2) | (inplace<<1) | aligned ) << 1 ) + 1;
+    return key;
+}
+
+static
+plan_type get_plan(std::shared_mutex& mutex, plan_map_t& plans, plan_key_t key)
+{
+    std::shared_lock lock(mutex);
+    auto it = plans.find(key);
+    if (it == plans.end()) {
+        return NULL;
+    }
+    return it->second;
+}
+
+
+template<typename planner_function>
+void doit(std::shared_mutex& mutex, plan_map_t& plans, 
+                int fwdrev, plan_val_t* src, plan_val_t* dst, int stride, int nstrides,
+                planner_function make_plan)
+{
+    auto key = make_key(fwdrev == FFTW_BACKWARD, src, dst, stride, nstrides);
+    auto plan = get_plan(mutex, plans, key);
+    if (!plan) {
+        std::unique_lock lock(mutex);
+        // Check again in case another thread snakes us.
+        auto it = plans.find(key);
+        if (it == plans.end()) {
+            plan = make_plan();
+            plans[key] = plan;
+        }
+        else {
+            plan = it->second;
+        }
+    }
+    fftwf_execute_dft(plan, src, dst);
+}
+
+
+static
+plan_val_t* pval_cast( const IDFT::complex_t * p)
+{ 
+    return const_cast<plan_val_t*>( reinterpret_cast<const plan_val_t*>(p) ); 
+}
+
+
+void Aux::FftwDFT::fwd1d(const complex_t* in, complex_t* out, int stride) const
+{
+    static std::shared_mutex mutex;
+    static plan_map_t plans;
+    static const int dir = FFTW_FORWARD;
+    auto src = pval_cast(in);
+    auto dst = pval_cast(out);
+    doit(mutex, plans, dir, src, dst, stride, 0, [&]( ) {
+        return fftwf_plan_dft_1d(stride, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
+    });
+}
+void Aux::FftwDFT::inv1d(const complex_t* in, complex_t* out, int stride) const
+{
+    static std::shared_mutex mutex;
+    static plan_map_t plans;
+    static const int dir = FFTW_BACKWARD;
+    auto src = pval_cast(in);
+    auto dst = pval_cast(out);
+    doit(mutex, plans, dir, src, dst, stride, 0, [&]( ) {
+        return fftwf_plan_dft_1d(stride, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
+    });
+}
+
+
+void Aux::FftwDFT::fwd2d(const complex_t* in, complex_t* out, int stride, int nstrides) const
+{
+    static std::shared_mutex mutex;
+    static plan_map_t plans;
+    static const int dir = FFTW_FORWARD;
+    auto src = pval_cast(in);
+    auto dst = pval_cast(out);
+    doit(mutex, plans, dir, src, dst, stride, nstrides, [&]( ) {
+        return fftwf_plan_dft_2d(stride, nstrides, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
+    });
+}
+
+
+void Aux::FftwDFT::inv2d(const complex_t* in, complex_t* out, int stride, int nstrides) const
+{
+    static std::shared_mutex mutex;
+    static plan_map_t plans;
+    static const int dir = FFTW_BACKWARD;
+    auto src = pval_cast(in);
+    auto dst = pval_cast(out);
+    doit(mutex, plans, dir, src, dst, stride, nstrides, [&]( ) {
+        return fftwf_plan_dft_2d(stride, nstrides, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
+    });
+}
diff --git a/iface/README.org b/iface/README.org
index 37e27b412..cf76f4926 100644
--- a/iface/README.org
+++ b/iface/README.org
@@ -25,3 +25,62 @@ the overall WCT dependency tree.  Discussion is warranted in these cases.
 
 See the user manual for more info.  https://wirecell.bnl.gov/
 
+* Interfaces
+
+** IDFT
+
+The ~IDFT~ class provides interface to methods to perform discrete
+Fourier transforms on arrays of complex single precision floating
+point values.
+
+The interface defines a number of methods which take a general naming
+convention like:
+#+begin_example
+void <direction><domain>(...);
+#+end_example
+
+The "direction" of the transform is one of
+
+- fwd :: the DFT is from interval to frequency, no normalization.
+- inv :: the DFT is from frequency to interval, 1/n normalization.
+ 
+The "domain" determines the dimension of array and how it is transformed
+
+- 1d :: a 1D array is transformed
+- 1b :: a batch of equal-length 1D arrays are transformed
+- 2d :: a 2D array is transformed (along both dimensions)
+
+The shape of 2D arrays (~1b~ or ~2d~ methods) are given in terms of two
+numbers: ~stride~ and ~nstrides~.  The number ~stride~ counts the number of
+contiguous array elements along one dimension and ~nstrides~ counts the
+number non-contiguous elements logically along the opposite dimension.
+In the case of "row-major" aka "C" memory ordering of 2D arrays, the
+number ~stride~ counts the number of elements in one "row" and ~nstrides~
+counts the number of rows, aka, the number of elements in one column.
+
+The ~1b~ transforms operate along a contiguous array of length ~stride~.
+By default, these transforms are implemented in terms of ~nstrides~
+calls to the ~1d~ DFT interface method.  The implementation may override
+the ~1b~ default methods for example to exploit some kind of "batch
+optimization". 
+
+*** Limitations
+
+- The potential speed up when the input to a forward or output from
+  reverse is real valued is not possible to implement with ~IDFT~.  It
+  requires the caller to take particular care in array sizes and would
+  double the number of methods.
+
+- To satisfy the low-level pointer to memory interface from higher
+  level objects see the ~Waveform.h~ and ~Array.h~ headers in
+  ~WireCellUtil~.  In particular, see functions there to lift real to
+  complex or perform memory transforms.
+
+- Interface to higher order transforms, such as convolutions, are not
+  provided.  See ~Aux::DFT~ for implementations in terms of an ~IDFT~.
+
+** ...
+
+Any interfaces not listed above, please see their header file in
+[[file:inc/WireCellIface/][inc/WireCellIface/]] for more information.
+
diff --git a/iface/inc/WireCellIface/IDFT.h b/iface/inc/WireCellIface/IDFT.h
new file mode 100644
index 000000000..dd1d39e8c
--- /dev/null
+++ b/iface/inc/WireCellIface/IDFT.h
@@ -0,0 +1,56 @@
+/** 
+    Interface to perform discrete single-precision Fourier transforms.
+*/
+
+#ifndef WIRECELL_IDFT
+#define WIRECELL_IDFT
+
+#include "WireCellUtil/IComponent.h"
+#include <complex>
+
+namespace WireCell {
+
+    class IDFT  : public IComponent<IDFT> {
+      public:
+        virtual ~IDFT();
+
+        /// The type for the signal in each bin.
+        using scalar_t = float;
+
+        /// The type for the spectrum in each bin.
+        using complex_t = std::complex<scalar_t>;
+
+        // 1D 
+
+        virtual 
+        void fwd1d(const complex_t* in, complex_t* out,
+                   int stride) const = 0;
+
+        virtual 
+        void inv1d(const complex_t* in, complex_t* out,
+                   int stride) const = 0;
+
+        // batched 1D ("1b")
+
+        virtual 
+        void fwd1b(const complex_t* in, complex_t* out,
+                   int stride, int nstrides) const;
+        virtual 
+        void inv1b(const complex_t* in, complex_t* out,
+                   int stride, int nstrides) const;
+
+
+        // 2D, transform both dimensions
+
+        virtual 
+        void fwd2d(const complex_t* in, complex_t* out,
+                   int stride, int nstrides) const = 0;
+        virtual 
+        void inv2d(const complex_t* in, complex_t* out,
+                   int stride, int nstrides) const = 0;
+
+     };
+}
+
+
+#endif
diff --git a/iface/src/IDFT.cxx b/iface/src/IDFT.cxx
new file mode 100644
index 000000000..2f9ee3543
--- /dev/null
+++ b/iface/src/IDFT.cxx
@@ -0,0 +1,25 @@
+#include "WireCellIface/IDFT.h"
+
+using namespace WireCell;
+
+IDFT::~IDFT() {}
+
+// Trivial default "batched" implementations.  If your concrete
+// implementation provides some kind of "batch optimization", such as
+// with some GPU FFTs, override these methods!
+
+void IDFT::fwd1b(const complex_t* in, complex_t* out,
+                 int stride, int nstrides) const
+{
+    for (int istride=0; istride<nstrides; ++istride) {
+        fwd1d(in+istride*stride, out+istride*stride, stride);
+    }
+}
+
+void IDFT::inv1b(const complex_t* in, complex_t* out,
+                 int stride, int nstrides) const
+{
+    for (int istride=0; istride<nstrides; ++istride) {
+        inv1d(in+istride*stride, out+istride*stride, stride);
+    }
+}
diff --git a/util/inc/WireCellUtil/Waveform.h b/util/inc/WireCellUtil/Waveform.h
index af7de262e..7240ba7b6 100644
--- a/util/inc/WireCellUtil/Waveform.h
+++ b/util/inc/WireCellUtil/Waveform.h
@@ -114,6 +114,10 @@ namespace WireCell {
         realseq_t magnitude(const compseq_t& seq);
         /// Return the phase or arg part of the sequence
         realseq_t phase(const compseq_t& seq);
+        /// Uplift a real sequence to a complex one (with zero imaginary parts)
+        compseq_t complex(const realseq_t& real);
+        /// Pack individual real/imag parts into complex sequence
+        compseq_t complex(const realseq_t& real, const realseq_t& imag);
 
         /// Increase (shift) sequence values by scalar
         template <typename Val>
diff --git a/util/src/Waveform.cxx b/util/src/Waveform.cxx
index 6cb356f91..21ce70fa3 100644
--- a/util/src/Waveform.cxx
+++ b/util/src/Waveform.cxx
@@ -69,6 +69,22 @@ Waveform::realseq_t WireCell::Waveform::phase(const Waveform::compseq_t& seq)
     return c2r(seq, [](Waveform::complex_t c) { return std::arg(c); });
 }
 
+
+Waveform::compseq_t Waveform::complex(const Waveform::realseq_t& real)
+{
+    Waveform::realseq_t imag(real.size(), 0);
+    return Waveform::complex(real, imag);
+}
+
+Waveform::compseq_t Waveform::complex(const Waveform::realseq_t& real, const Waveform::realseq_t& imag)
+{
+    Waveform::compseq_t ret(real.size());
+    std::transform(real.begin(), real.end(), imag.begin(), ret.begin(),
+                   [](real_t re, real_t im) { return Waveform::complex_t(re,im); } );
+    return ret;
+}
+
+
 Waveform::real_t WireCell::Waveform::median(Waveform::realseq_t& wave) { return percentile(wave, 0.5); }
 
 Waveform::real_t WireCell::Waveform::median_binned(Waveform::realseq_t& wave) { return percentile_binned(wave, 0.5); }

From 59be25c7eda82233a7672748fefc3c4d059be833 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 2 Nov 2021 12:10:17 -0400
Subject: [PATCH 02/46] Tell Boost to shut up with the internal deprecation
 warnings

---
 util/inc/WireCellUtil/IndexedGraph.h | 12 ++++++++++++
 1 file changed, 12 insertions(+)

diff --git a/util/inc/WireCellUtil/IndexedGraph.h b/util/inc/WireCellUtil/IndexedGraph.h
index 6c6eb54d3..35c8513ed 100644
--- a/util/inc/WireCellUtil/IndexedGraph.h
+++ b/util/inc/WireCellUtil/IndexedGraph.h
@@ -13,6 +13,18 @@
 #ifndef WIRECELL_INDEXEDGRAPH
 #define WIRECELL_INDEXEDGRAPH
 
+// fixme: watchme: Boost started to deprecate some internal header
+// inclusion which is not, as best as I can tell, any of our problem.
+// The message is:
+//
+// ../../../../../opt/boost-1-76-0/include/boost/config/pragma_message.hpp:24:34: note: ‘#pragma message: This header is deprecated. Use <iterator> instead.’
+//
+//  This arises from a deeply nested #include well beyond anything
+//  which is obvious here.
+//
+//  If/when this is cleaned up in Boost, remove this comment and the
+//  next line.
+#define BOOST_ALLOW_DEPRECATED_HEADERS 1
 #include <boost/graph/connected_components.hpp>
 #include <boost/graph/graph_traits.hpp>
 #include <boost/graph/adjacency_list.hpp>

From a9787bb9d858c2665429b2ae095576097cbade8f Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 2 Nov 2021 12:50:57 -0400
Subject: [PATCH 03/46] Tell Boost to shut up with the internal deprecation
 warnings

---
 util/inc/WireCellUtil/String.h | 12 ++++++++++++
 1 file changed, 12 insertions(+)

diff --git a/util/inc/WireCellUtil/String.h b/util/inc/WireCellUtil/String.h
index ac06e6eb1..d065a5964 100644
--- a/util/inc/WireCellUtil/String.h
+++ b/util/inc/WireCellUtil/String.h
@@ -1,6 +1,18 @@
 #ifndef WIRECELLUTIL_STRING
 #define WIRECELLUTIL_STRING
 
+// fixme: watchme: Boost started to deprecate some internal header
+// inclusion which is not, as best as I can tell, any of our problem.
+// The message is:
+//
+// ../../../../../opt/boost-1-76-0/include/boost/config/pragma_message.hpp:24:34: note: ‘#pragma message: This header is deprecated. Use <iterator> instead.’
+//
+//  This arises from a deeply nested #include well beyond anything
+//  which is obvious here.
+//
+//  If/when this is cleaned up in Boost, remove this comment and the
+//  next line.
+#define BOOST_ALLOW_DEPRECATED_HEADERS 1
 #include <boost/algorithm/string.hpp>
 #include <boost/format.hpp>
 

From 08815ba37658625f40c46c2b2f2a605466a12d95 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 2 Nov 2021 12:51:22 -0400
Subject: [PATCH 04/46] Add stack trace to exception what()

---
 util/inc/WireCellUtil/Exceptions.h | 23 +++++++++++++++++++++--
 util/test/test_exceptions.cxx      |  3 ++-
 2 files changed, 23 insertions(+), 3 deletions(-)

diff --git a/util/inc/WireCellUtil/Exceptions.h b/util/inc/WireCellUtil/Exceptions.h
index 955ab62c9..54feb39cb 100644
--- a/util/inc/WireCellUtil/Exceptions.h
+++ b/util/inc/WireCellUtil/Exceptions.h
@@ -19,17 +19,36 @@
 #define WIRECELL_EXCEPTIONS
 
 #include <boost/exception/all.hpp>
+#include <boost/stacktrace.hpp>
 #include <exception>
 #include <string>
 
-#define THROW(e) BOOST_THROW_EXCEPTION(e)
+using stack_traced_t = boost::error_info<struct tag_stacktrace, boost::stacktrace::stacktrace>;
+// template <class E>
+// void throw_with_trace(const E& e) {
+//     BOOST_THROW_EXCEPTION(boost::enable_error_info(e) << stack_traced_t(boost::stacktrace::stacktrace()));
+// }
+// #define THROW(e) throw_with_trace(e)
+#define THROW(e) BOOST_THROW_EXCEPTION(boost::enable_error_info(e) << stack_traced_t(boost::stacktrace::stacktrace()))
+//#define THROW(e) BOOST_THROW_EXCEPTION(e)
 #define errstr(e) boost::diagnostic_information(e)
 
+
 namespace WireCell {
 
+    // Get the stacktrace as an object.  You must test for non-nullptr.
+    // Or, just rely on e.what().
+    inline
+    const boost::stacktrace::stacktrace* stacktrace(const std::exception& e) {
+        return boost::get_error_info<stack_traced_t>(e);
+    }
+
+
     /// The base wire cell exception.
     struct Exception : virtual public std::exception, virtual boost::exception {
-        char const *what() const throw() { return diagnostic_information_what(*this); }
+        char const *what() const throw() {
+            return diagnostic_information_what(*this);
+        }
     };
 
     /// Thrown when a wrong value has been encountered.
diff --git a/util/test/test_exceptions.cxx b/util/test/test_exceptions.cxx
index 11d4553fb..a79b44321 100644
--- a/util/test/test_exceptions.cxx
+++ b/util/test/test_exceptions.cxx
@@ -22,6 +22,7 @@ int main()
         THROW(ValueError() << errmsg{format("some error with value=%d msg=\"%s\"", value, omg)});
     }
     catch (ValueError& e) {
-        cerr << "caught ValueError: " << errstr(e) << endl;
+        cerr << "Caught:\n";
+        cerr << e.what() << "\n";
     }
 }

From a7b6f97bb91066d9a2fd42e3d48859e1776a3bde Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 2 Nov 2021 12:52:11 -0400
Subject: [PATCH 05/46] Throw instead of returning garbage on garbage input.

This can only be an improvement as the garbage return value was being ignored by all callers.
---
 util/src/Waveform.cxx      |  5 ++--
 util/test/test_issue24.cxx | 55 +++++++++++++++++++++++++++++++++++---
 2 files changed, 54 insertions(+), 6 deletions(-)

diff --git a/util/src/Waveform.cxx b/util/src/Waveform.cxx
index 21ce70fa3..7817740e5 100644
--- a/util/src/Waveform.cxx
+++ b/util/src/Waveform.cxx
@@ -1,4 +1,5 @@
 #include "WireCellUtil/Waveform.h"
+#include "WireCellUtil/Exceptions.h"
 
 #include <algorithm>
 
@@ -92,11 +93,11 @@ Waveform::real_t WireCell::Waveform::median_binned(Waveform::realseq_t& wave) {
 Waveform::real_t WireCell::Waveform::percentile(Waveform::realseq_t& wave, real_t percentage)
 {
     if (percentage < 0.0 or percentage > 1.0) {
-        return -9999;
+        THROW(ValueError() << errmsg{"percentage out of range"});
     }
     const size_t siz = wave.size();
     if (siz == 0) {
-        return -9999;
+        THROW(ValueError() << errmsg{"empty waveform"});
     }
     if (siz == 1) {
         return wave[0];
diff --git a/util/test/test_issue24.cxx b/util/test/test_issue24.cxx
index 7f67778be..d7ce8c9f5 100644
--- a/util/test/test_issue24.cxx
+++ b/util/test/test_issue24.cxx
@@ -1,25 +1,72 @@
 #include "WireCellUtil/Waveform.h"
+#include "WireCellUtil/Exceptions.h"
+
 #include <iostream>
 
 using namespace std;
 
 using namespace WireCell::Waveform;
+using namespace WireCell;
 
 int main()
 {
     int nsamples = 10;
-    while (nsamples >= 0) {
+    while (nsamples > 0) {
         realseq_t wave(nsamples, 0);
         median(wave);
         --nsamples;
     }
 
+    cerr << "Testing error handling\n";
     realseq_t wave;
-    assert(-9999 == median(wave));
+    bool okay = false;
+    try {
+        median(wave);
+    }
+    catch (ValueError& err) {
+        okay = true;
+        cerr << "Caught:\n" << err.what() << "\nOKAY\n";
+    }
+    catch (std::exception& err) {
+        cerr << "Why am I here?\n";
+        cerr << err.what() << "\n";
+    }
+    if (!okay) {
+        cerr << "median of empty wave should throw\n";
+    }
+    assert(okay);
+    cerr << "thrown and caught empty waveform\n";
+
     wave.push_back(6.9);
     wave.push_back(9.6);
-    assert(-9999 == percentile(wave, -0.1));
-    assert(-9999 == percentile(wave, 1.1));
+    okay = false;
+    try {
+        percentile(wave, -0.1);
+    }
+    catch (ValueError& err) {
+        okay = true;
+        cerr << "Caught:\n" << err.what() << "\nOKAY\n";
+    }
+    if (!okay) {
+        cerr << "median under percentage should throw\n";
+    }
+    assert(okay);
+    cerr << "thrown and caught median under percentage\n";
+    
+    okay = false;
+    try {
+        percentile(wave, 1.1);
+    }
+    catch (ValueError& err) {
+        okay = true;
+        cerr << "Caught:\n" << err.what() << "\nOKAY\n";
+    }
+    if (!okay) {
+        cerr << "median over percentage should throw\n";
+    }
+    assert(okay);
+    cerr << "thrown and caught median over percentage\n";
+
     cerr << median(wave) << endl;
     assert(std::abs(9.6 - median(wave)) < 0.001);
     wave.push_back(0.0);

From dd4dffb55c7f922d1cdc0e26292135affe312cfb Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 2 Nov 2021 16:04:08 -0400
Subject: [PATCH 06/46] Start on higher-level dft functions

---
 aux/inc/WireCellAux/DftTools.h   |  79 ++++++++++++++++++++
 aux/inc/WireCellAux/FftwDFT.h    |   8 +-
 aux/src/DftTools.cxx             |  82 +++++++++++++++++++++
 aux/src/FftwDFT.cxx              |  14 ++++
 aux/test/test_dfttools.cxx       |  28 +++++++
 aux/test/test_idft.cxx           | 122 +++++++++++++++++++++++++++++++
 util/inc/WireCellUtil/Waveform.h |   3 +-
 util/test/test_complex.cxx       |  36 +++++++++
 8 files changed, 367 insertions(+), 5 deletions(-)
 create mode 100644 aux/inc/WireCellAux/DftTools.h
 create mode 100644 aux/src/DftTools.cxx
 create mode 100644 aux/test/test_dfttools.cxx
 create mode 100644 aux/test/test_idft.cxx
 create mode 100644 util/test/test_complex.cxx

diff --git a/aux/inc/WireCellAux/DftTools.h b/aux/inc/WireCellAux/DftTools.h
new file mode 100644
index 000000000..24e097a43
--- /dev/null
+++ b/aux/inc/WireCellAux/DftTools.h
@@ -0,0 +1,79 @@
+/**
+   High level functions related to DFTs.
+
+   Most take an IDFT::pointer to a DFT implementation and return an
+   allocated result.  Use IDFT directly to control allocation.
+
+   There are std::vector and Eigen array functions.
+
+   Abbreviations:
+
+   - IS is interval space aka time / distance
+   - FS is frequency space aka frequency / periodicity 
+
+   Price to pay for simple API is a lack of optimizations:
+
+   - When a real valued array is invovled, all arrays are full size.
+     That is, no half-size optimization will be exposed to the caller.
+
+   - These functions tend to make more copies than may be needed if
+     IDFT is called directly.  In addition to real/complex conversion,
+     using std::vector or Eigen array instead of raw memory leads to
+     more copies.
+ */
+
+#ifndef WIRECELL_AUX_DFTTOOLS
+#define WIRECELL_AUX_DFTTOOLS
+
+#include "WireCellIface/IDFT.h"
+#include <vector>
+#include <Eigen/Core>
+
+namespace WireCell::Aux {
+
+    using real_t = IDFT::scalar_t;
+    using complex_t = IDFT::complex_t;
+
+    // std::vector based functions
+
+    using realvec_t = std::vector<real_t>;
+    using compvec_t = std::vector<complex_t>;
+
+    // 1D with vectors
+
+    // Transform a real IS, return same size FS.
+    compvec_t dft(IDFT::pointer dft, const realvec_t& seq);
+        
+    // Transform complex FS to IS and return real part
+    realvec_t idft(IDFT::pointer dft, const compvec_t& spec);
+
+    compvec_t r2c(const realvec_t& r);
+    realvec_t c2r(const compvec_t& c);
+
+
+    // Eigen array based functions
+
+    /// Real 1D array
+    using array_xf = Eigen::ArrayXf;
+
+    /// Complex 1D array
+    using array_xc = Eigen::ArrayXcf;
+
+    /// A real, 2D array
+    using array_xxf = Eigen::ArrayXXf;
+
+    /// A complex, 2D array
+    using array_xxc = Eigen::ArrayXXcf;
+    
+    // 2D with Eigen arrays
+
+    // Transform a real IS, return same size FS.
+    array_xxc dft(IDFT::pointer dft, const array_xxf& arr);
+
+    // Transform complex FS to IS and return real part
+    array_xxf idft(IDFT::pointer dft, const array_xxc& arr);
+
+
+}
+
+#endif
diff --git a/aux/inc/WireCellAux/FftwDFT.h b/aux/inc/WireCellAux/FftwDFT.h
index ad265eef7..62cea9a84 100644
--- a/aux/inc/WireCellAux/FftwDFT.h
+++ b/aux/inc/WireCellAux/FftwDFT.h
@@ -18,11 +18,11 @@ namespace WireCell::Aux {
 
         virtual 
         void fwd1d(const complex_t* in, complex_t* out,
-                   int stride) const = 0;
+                   int stride) const;
 
         virtual 
         void inv1d(const complex_t* in, complex_t* out,
-                   int stride) const = 0;
+                   int stride) const;
 
         // batched 1D ("1b") - rely on base implementation
 
@@ -30,10 +30,10 @@ namespace WireCell::Aux {
 
         virtual 
         void fwd2d(const complex_t* in, complex_t* out,
-                   int stride, int nstrides) const = 0;
+                   int stride, int nstrides) const;
         virtual 
         void inv2d(const complex_t* in, complex_t* out,
-                   int stride, int nstrides) const = 0;
+                   int stride, int nstrides) const;
 
 
     };
diff --git a/aux/src/DftTools.cxx b/aux/src/DftTools.cxx
new file mode 100644
index 000000000..b7ec12cb5
--- /dev/null
+++ b/aux/src/DftTools.cxx
@@ -0,0 +1,82 @@
+#include "WireCellAux/DftTools.h"
+
+using namespace WireCell;
+using namespace WireCell::Aux;
+
+compvec_t Aux::r2c(const realvec_t& r)
+{
+    compvec_t cret(r.size());
+    std::transform(r.begin(), r.end(), cret.begin(),
+                   [](const real_t& r) { return complex_t(r, 0); });
+    return cret;
+}
+realvec_t Aux::c2r(const compvec_t& c)
+{
+    realvec_t rret(c.size());
+    std::transform(c.begin(), c.end(), rret.begin(),
+                   [](const complex_t& c) { return std::real(c); });
+    return rret;
+}
+
+// Transform a real IS, return same size FS.
+compvec_t Aux::dft(IDFT::pointer dft, const realvec_t& seq)
+{
+    compvec_t cseq = Aux::r2c(seq);
+    compvec_t cret(cseq.size());
+    dft->fwd1d(cseq.data(), cret.data(), cret.size());
+    return cret;
+}
+        
+// Transform complex FS to IS and return real part
+realvec_t Aux::idft(IDFT::pointer dft, const compvec_t& spec)
+{
+    compvec_t cret(spec.size());
+    dft->inv1d(spec.data(), cret.data(), cret.size());
+    return Aux::c2r(cret);
+}
+
+using array_xxf_rm = Eigen::Array<real_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
+using array_xxc_rm = Eigen::Array<complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
+
+
+// Transform a real IS, return same size FS.
+array_xxc Aux::dft(IDFT::pointer trans, const array_xxf& arr)
+{
+    int stride = arr.rows();
+    int nstrides = arr.cols();
+    array_xxc ret(stride, nstrides);
+
+    if (!arr.IsRowMajor) {
+        stride = arr.cols();
+        nstrides = arr.rows();
+    }
+
+    size_t size = stride*nstrides;
+    compvec_t carr(size);
+    std::transform(arr.data(), arr.data()+size, carr.begin(),
+                   [](const real_t& r) { return complex_t(r,0); });
+    
+    trans->fwd2d(carr.data(), ret.data(), stride, nstrides);
+    return ret;
+}
+
+// Transform complex FS to IS and return real part
+array_xxf Aux::idft(IDFT::pointer trans, const array_xxc& arr)
+{
+    int stride = arr.rows();
+    int nstrides = arr.cols();
+    array_xxf ret(stride, nstrides);
+
+    if (!arr.IsRowMajor) {
+        stride = arr.cols();
+        nstrides = arr.rows();
+    }
+
+    size_t size = stride*nstrides;
+    compvec_t cret(size);
+    trans->inv2d(arr.data(), cret.data(), stride, nstrides);
+
+    std::transform(cret.begin(), cret.end(), ret.data(),
+                   [](const complex_t& c) { return std::real(c); });
+    return ret;
+}
diff --git a/aux/src/FftwDFT.cxx b/aux/src/FftwDFT.cxx
index 85f6b0820..2a655f5d6 100644
--- a/aux/src/FftwDFT.cxx
+++ b/aux/src/FftwDFT.cxx
@@ -1,9 +1,13 @@
 #include "WireCellAux/FftwDFT.h"
+#include "WireCellUtil/NamedFactory.h"
+
 #include <fftw3.h>
 #include <mutex>
 #include <shared_mutex>
 #include <unordered_map>
 
+WIRECELL_FACTORY(FftwDFT, WireCell::Aux::FftwDFT, WireCell::IDFT)
+
 
 using namespace WireCell;
 
@@ -33,6 +37,8 @@ plan_type get_plan(std::shared_mutex& mutex, plan_map_t& plans, plan_key_t key)
 }
 
 
+// #include <iostream>             // debugging
+
 template<typename planner_function>
 void doit(std::shared_mutex& mutex, plan_map_t& plans, 
                 int fwdrev, plan_val_t* src, plan_val_t* dst, int stride, int nstrides,
@@ -45,6 +51,7 @@ void doit(std::shared_mutex& mutex, plan_map_t& plans,
         // Check again in case another thread snakes us.
         auto it = plans.find(key);
         if (it == plans.end()) {
+            //std::cerr << "make plan for " << key << std::endl;
             plan = make_plan();
             plans[key] = plan;
         }
@@ -111,3 +118,10 @@ void Aux::FftwDFT::inv2d(const complex_t* in, complex_t* out, int stride, int ns
         return fftwf_plan_dft_2d(stride, nstrides, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
     });
 }
+Aux::FftwDFT::FftwDFT()
+{
+}
+Aux::FftwDFT::~FftwDFT()
+{
+}
+
diff --git a/aux/test/test_dfttools.cxx b/aux/test/test_dfttools.cxx
new file mode 100644
index 000000000..0ef2eaf22
--- /dev/null
+++ b/aux/test/test_dfttools.cxx
@@ -0,0 +1,28 @@
+#include "WireCellAux/DftTools.h"
+#include "WireCellAux/FftwDFT.h"
+
+#include <iostream>
+#include <memory>
+
+using namespace WireCell;
+using namespace WireCell::Aux;
+
+void test_1d_imp(IDFT::pointer trans)
+{
+    realvec_t rimp(64, 0);
+    rimp[1] = 1.0;
+    auto cimp = dft(trans, rimp);
+    for (auto c : cimp) {
+        std::cerr << c << " ";
+    }
+    std::cerr << "\n";
+}
+
+int main()
+{
+    auto trans = std::make_shared<FftwDFT>();
+
+    test_1d_imp(trans);
+
+    return 0;
+}
diff --git a/aux/test/test_idft.cxx b/aux/test/test_idft.cxx
new file mode 100644
index 000000000..97f85b14d
--- /dev/null
+++ b/aux/test/test_idft.cxx
@@ -0,0 +1,122 @@
+// Test IDFT implementations.
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/Waveform.h"
+#include "WireCellUtil/PluginManager.h"
+#include "WireCellIface/IConfigurable.h"
+#include "WireCellIface/IDFT.h"
+
+#include <chrono>
+#include <vector>
+#include <thread>
+#include <iostream>
+
+using namespace WireCell;
+
+
+static
+void test_1d_zero(IDFT::pointer dft, int size = 1024)
+{
+    std::vector<IDFT::complex_t> inter(size,0), freq(size,0);
+
+    dft->fwd1d(inter.data(), freq.data(), inter.size());
+    dft->inv1d(freq.data(), inter.data(), freq.size());
+
+    auto tot = Waveform::sum(inter);
+    assert(std::real(tot) == 0);
+}
+static
+void test_2d_zero(IDFT::pointer dft, int size = 1024)
+{
+    int stride=size, nstrides=size;
+    std::vector<IDFT::complex_t> inter(stride*nstrides,0);
+    std::vector<IDFT::complex_t> freq(stride*nstrides,0);
+
+    dft->fwd2d(inter.data(), freq.data(), stride, nstrides);
+    dft->inv2d(freq.data(), inter.data(), stride, nstrides);
+
+    auto tot = Waveform::sum(inter);
+    assert(std::real(tot) == 0);
+}
+
+void fwdrev(IDFT::pointer dft, int id, int ntimes, int size)
+{
+    int stride=size, nstrides=size;
+    std::vector<IDFT::complex_t> inter(stride*nstrides,0);
+    std::vector<IDFT::complex_t> freq(stride*nstrides,0);
+
+    // std::cerr << "running " << id << std::endl;
+
+    while (ntimes) {
+        //std::cerr << ntimes << "\n";
+        dft->fwd2d(inter.data(), freq.data(), stride, nstrides);
+        dft->inv2d(freq.data(), inter.data(), stride, nstrides);
+
+        --ntimes;        
+        auto tot = Waveform::sum(inter);
+        assert(std::real(tot) == 0);
+    }
+    //std::cerr << "finished " << id << std::endl;
+}
+
+static
+void test_2d_threads(IDFT::pointer dft, int nthreads, int nloops, int size = 1024)
+{
+    using namespace std::chrono;
+
+    steady_clock::time_point t1 = steady_clock::now();
+
+    std::vector<std::thread> workers;
+
+    //std::cerr << "Starting workers\n";
+    for (int ind=0; ind<nthreads; ++ind) {
+        workers.emplace_back(fwdrev, dft, ind, nloops, size);
+    }
+    //std::cerr << "Waiting for workers\n";
+    for (auto& worker : workers) {
+        if (worker.joinable()) {
+            worker.join();
+        }
+    }
+    steady_clock::time_point t2 = steady_clock::now();
+    duration<double> dt1 = duration_cast<duration<double>>(t2 - t1);
+    std::cerr << "ndfts: " << nthreads*nloops
+              << " " << nthreads << " " << nloops
+              << " " << dt1.count() << std::endl;
+}
+
+int main(int argc, char* argv[])
+{
+    // fixme, add CLI parsing to add plugins, config and name another
+    // dft.  For now, just use the one in aux.
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+    std::string dft_tn = "FftwDFT";
+
+    // creates
+    auto idft = Factory::lookup_tn<IDFT>(dft_tn);
+    assert(idft);
+    {                          // configure before use if configurable
+        auto icfg = Factory::find_maybe_tn<IConfigurable>(dft_tn);
+        if (icfg) {
+            auto cfg = icfg->default_configuration();
+            icfg->configure(cfg);
+        }
+    }
+
+    test_1d_zero(idft);
+    test_2d_zero(idft);
+
+    std::vector<int> sizes = {128,256,512,1024};
+    for (auto size : sizes) {
+        int ndouble=3, ntot=2*16384/size;
+        while (ndouble) {
+            int nthread = 1<<ndouble;
+            int nloop = ntot/nthread;
+            --ndouble;
+            std::cerr << "size=" << size << " nthread=" << nthread << " nloop=" << nloop << "\n";
+            test_2d_threads(idft, nthread, nloop, size);
+        }
+    }
+
+    return 0;
+}
diff --git a/util/inc/WireCellUtil/Waveform.h b/util/inc/WireCellUtil/Waveform.h
index 7240ba7b6..f2ed89cc0 100644
--- a/util/inc/WireCellUtil/Waveform.h
+++ b/util/inc/WireCellUtil/Waveform.h
@@ -9,7 +9,8 @@
 #include <algorithm>
 #include <string>
 
-// for FFT
+// FIXME: remove the hard-wired Eigen::FFT related in favor of dynamic
+// DFT with Aux/DftTools.h.
 #include <Eigen/Core>
 #include <unsupported/Eigen/FFT>
 
diff --git a/util/test/test_complex.cxx b/util/test/test_complex.cxx
new file mode 100644
index 000000000..877138020
--- /dev/null
+++ b/util/test/test_complex.cxx
@@ -0,0 +1,36 @@
+#include <complex>
+#include <vector>
+#include <iostream>
+
+int main()
+{
+    // note: this compiles but doesn't do what you may expect.
+    // complex<double> numbers are a 2-array of doubles: [r,i] so the
+    // reinterpret_cast from complex to double gives an "interleaved"
+    // array of [r0,i0,r1,i1].  Likewise from double to complex gives
+    // a "complex" number of [r0 ,r1].
+
+    using complex_t = std::complex<double>;
+    using cvec = std::vector<complex_t>;
+    using dvec = std::vector<double>;
+
+    cvec c1{{0,0}, {1,1}};
+    dvec d1={0,1};
+
+    complex_t* c2 = reinterpret_cast<complex_t*>(d1.data());
+    cvec c3(c2, c2+2);
+
+    double* d2 = reinterpret_cast<double*>(c1.data());
+    dvec d3(d2, d2+2);
+
+    for (auto c : c3) {
+        std::cerr << c << " ";
+    }
+    std::cerr << "\n";
+    for (auto d : d3) {
+        std::cerr << d << " ";
+    }
+    std::cerr << "\n";
+    
+    return 0;
+}

From dbcbe9bf681adf836c3adec033162e36b0d95822 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Fri, 5 Nov 2021 18:33:06 -0400
Subject: [PATCH 07/46] Allow to optionally provide data and metadata in
 constructor

---
 aux/inc/WireCellAux/SimpleTensor.h | 22 ++++++++++++++++++----
 1 file changed, 18 insertions(+), 4 deletions(-)

diff --git a/aux/inc/WireCellAux/SimpleTensor.h b/aux/inc/WireCellAux/SimpleTensor.h
index 56c3ab905..7b267bdbe 100644
--- a/aux/inc/WireCellAux/SimpleTensor.h
+++ b/aux/inc/WireCellAux/SimpleTensor.h
@@ -2,7 +2,9 @@
 #define WIRECELL_AUX_SIMPLETENSOR
 
 #include "WireCellIface/ITensor.h"
+
 #include <boost/multi_array.hpp>
+#include <cstring>
 
 namespace WireCell {
 
@@ -13,14 +15,26 @@ namespace WireCell {
            public:
             typedef ElementType element_t;
 
-            SimpleTensor(const shape_t& shape)
+            // Create simple tensor, allocating space for data.  If
+            // data given it must have at least as many elements as
+            // implied by shape and that span will be copied into
+            // allocated memory.
+            SimpleTensor(const shape_t& shape,
+                         const element_t* data=nullptr,
+                         const Configuration& md = Configuration())
             {
                 size_t nbytes = element_size();
-                for (const auto& s : shape) {
+                m_shape = shape;
+                for (const auto& s : m_shape) {
                     nbytes *= s;
                 }
-                m_store.resize(nbytes);
-                m_shape = shape;
+                if (data) {
+                    const std::byte* bytes = reinterpret_cast<const std::byte*>(data);
+                    m_store.assign(bytes, bytes+nbytes);
+                }
+                else {
+                    m_store.resize(nbytes);
+                }
             }
             virtual ~SimpleTensor() {}
 

From 2ffbb84e97aeaaeebf3c0a9d2c037864136cded7 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Fri, 5 Nov 2021 18:33:23 -0400
Subject: [PATCH 08/46] More work toward DFT as a service

---
 aux/inc/WireCellAux/DftTools.h    |  80 ++++++----------
 aux/inc/WireCellAux/FftwDFT.h     |   4 +-
 aux/inc/WireCellAux/TensorTools.h |  77 +++++++++++++++
 aux/src/DftTools.cxx              | 103 ++++++++------------
 aux/src/FftwDFT.cxx               |  25 +++--
 aux/test/test_dfttools.cxx        | 103 ++++++++++++++++++--
 aux/test/test_idft.cxx            |   8 +-
 aux/test/test_tensor_tools.cxx    | 102 ++++++++++++++++++++
 iface/inc/WireCellIface/IDFT.h    |  22 ++++-
 iface/inc/WireCellIface/ITensor.h |   7 +-
 iface/src/IDFT.cxx                |   4 +-
 util/test/test_eigen_cast.cxx     |  45 +++++++++
 util/test/test_eigen_rowcol.cxx   | 150 ++++++++++++++++++++++++++++++
 13 files changed, 590 insertions(+), 140 deletions(-)
 create mode 100644 aux/inc/WireCellAux/TensorTools.h
 create mode 100644 aux/test/test_tensor_tools.cxx
 create mode 100644 util/test/test_eigen_cast.cxx
 create mode 100644 util/test/test_eigen_rowcol.cxx

diff --git a/aux/inc/WireCellAux/DftTools.h b/aux/inc/WireCellAux/DftTools.h
index 24e097a43..10f2d8cbf 100644
--- a/aux/inc/WireCellAux/DftTools.h
+++ b/aux/inc/WireCellAux/DftTools.h
@@ -1,25 +1,6 @@
 /**
-   High level functions related to DFTs.
-
-   Most take an IDFT::pointer to a DFT implementation and return an
-   allocated result.  Use IDFT directly to control allocation.
-
-   There are std::vector and Eigen array functions.
-
-   Abbreviations:
-
-   - IS is interval space aka time / distance
-   - FS is frequency space aka frequency / periodicity 
-
-   Price to pay for simple API is a lack of optimizations:
-
-   - When a real valued array is invovled, all arrays are full size.
-     That is, no half-size optimization will be exposed to the caller.
-
-   - These functions tend to make more copies than may be needed if
-     IDFT is called directly.  In addition to real/complex conversion,
-     using std::vector or Eigen array instead of raw memory leads to
-     more copies.
+   This provides std::vector and Eigen::Array typed interface to an
+   IDFT.
  */
 
 #ifndef WIRECELL_AUX_DFTTOOLS
@@ -31,47 +12,46 @@
 
 namespace WireCell::Aux {
 
-    using real_t = IDFT::scalar_t;
     using complex_t = IDFT::complex_t;
 
     // std::vector based functions
 
-    using realvec_t = std::vector<real_t>;
-    using compvec_t = std::vector<complex_t>;
+    using dft_vector_t = std::vector<complex_t>;
 
     // 1D with vectors
 
-    // Transform a real IS, return same size FS.
-    compvec_t dft(IDFT::pointer dft, const realvec_t& seq);
-        
-    // Transform complex FS to IS and return real part
-    realvec_t idft(IDFT::pointer dft, const compvec_t& spec);
-
-    compvec_t r2c(const realvec_t& r);
-    realvec_t c2r(const compvec_t& c);
+    inline dft_vector_t fwd(IDFT::pointer dft, const dft_vector_t& seq)
+    {
+        dft_vector_t ret(seq.size());
+        dft->fwd1d(seq.data(), ret.data(), ret.size());
+        return ret;
+    }
 
+    inline dft_vector_t inv(IDFT::pointer dft, const dft_vector_t& spec)
+    {
+        dft_vector_t ret(spec.size());
+        dft->inv1d(spec.data(), ret.data(), ret.size());
+        return ret;
+    }
 
     // Eigen array based functions
 
-    /// Real 1D array
-    using array_xf = Eigen::ArrayXf;
-
-    /// Complex 1D array
-    using array_xc = Eigen::ArrayXcf;
-
-    /// A real, 2D array
-    using array_xxf = Eigen::ArrayXXf;
-
-    /// A complex, 2D array
-    using array_xxc = Eigen::ArrayXXcf;
+    /// A complex, 2D array.  Use Array::cast<type>() if you need to
+    /// convert to/from real.
+    using dft_array_t = Eigen::ArrayXXcf;
     
-    // 2D with Eigen arrays
-
-    // Transform a real IS, return same size FS.
-    array_xxc dft(IDFT::pointer dft, const array_xxf& arr);
-
-    // Transform complex FS to IS and return real part
-    array_xxf idft(IDFT::pointer dft, const array_xxc& arr);
+    // 2D with Eigen arrays.  Use eg arr.cast<complex_>() to provde
+    // from real or arr.cast<float>() to convert result to real.
+
+    // Transform both dimesions.
+    dft_array_t fwd(IDFT::pointer dft, const dft_array_t& arr);
+    dft_array_t inv(IDFT::pointer dft, const dft_array_t& arr);
+
+    // Transform one dimesions.  For example axis=0 transforms each
+    // logical row of the Eigen array so that column=0 of each row
+    // would hold the frequency=0 component of each row's spectrum.  
+    // array_xxc fwd(IDFT::pointer dft, const array_xxc& arr, int axis);
+    // array_xxc inv(IDFT::pointer dft, const array_xxc& arr, int axis);
 
 
 }
diff --git a/aux/inc/WireCellAux/FftwDFT.h b/aux/inc/WireCellAux/FftwDFT.h
index 62cea9a84..365190f0c 100644
--- a/aux/inc/WireCellAux/FftwDFT.h
+++ b/aux/inc/WireCellAux/FftwDFT.h
@@ -30,10 +30,10 @@ namespace WireCell::Aux {
 
         virtual 
         void fwd2d(const complex_t* in, complex_t* out,
-                   int stride, int nstrides) const;
+                   int nstrides, int stride) const;
         virtual 
         void inv2d(const complex_t* in, complex_t* out,
-                   int stride, int nstrides) const;
+                   int nstrides, int stride) const;
 
 
     };
diff --git a/aux/inc/WireCellAux/TensorTools.h b/aux/inc/WireCellAux/TensorTools.h
new file mode 100644
index 000000000..6765b457e
--- /dev/null
+++ b/aux/inc/WireCellAux/TensorTools.h
@@ -0,0 +1,77 @@
+#ifndef WIRECELL_AUX_TENSORTOOLS
+#define WIRECELL_AUX_TENSORTOOLS
+
+#include "WireCellIface/ITensor.h"
+#include "WireCellIface/IDFT.h"
+#include "WireCellUtil/Exceptions.h"
+
+#include <Eigen/Core>
+#include <complex>
+
+namespace WireCell::Aux {
+
+    bool is_row_major(const ITensor::pointer& ten) {
+        if (ten->order().empty() or ten->order()[0] == 1) {
+            return true;
+        }
+        return false;
+    }
+
+    template<typename scalar_t>
+    bool is_type(const ITensor::pointer& ten) {
+        return (ten->element_type() == typeid(scalar_t));
+    }
+
+
+    // Extract the underlying data array from the tensor as a vector.
+    // Caution: this ignores storage order hints and 1D or 2D will be
+    // flattened assuming C-ordering, aka row-major (if 2D).  It
+    // throws ValueError on type mismatch.
+    template<typename element_type>
+    std::vector<element_type> asvec(const ITensor::pointer& ten)
+    {
+        if (ten->element_type() != typeid(element_type)) {
+            THROW(ValueError() << errmsg{"element type mismatch"});
+        }
+        const element_type* data = (const element_type*)ten->data();
+        const size_t nelems = ten->size()/sizeof(element_type);
+        return std::vector<element_type>(data, data+nelems);
+    }
+    
+    // Extract the tensor data as an Eigen array.
+    template<typename element_type>
+    Eigen::Array<element_type, Eigen::Dynamic, Eigen::Dynamic> // this default is column-wise
+    asarray(const ITensor::pointer& tens)
+    {
+        if (tens->element_type() != typeid(element_type)) {
+            THROW(ValueError() << errmsg{"element type mismatch"});
+        }
+        using ROWM = Eigen::Array<element_type, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
+        using COLM = Eigen::Array<element_type, Eigen::Dynamic, Eigen::Dynamic, Eigen::ColMajor>;
+
+        auto shape = tens->shape();
+        int nrows, ncols;
+        if (shape.size() == 1) {
+            nrows = 1;
+            ncols = shape[0];
+        }
+        else {
+            nrows = shape[0];
+            ncols = shape[1];
+        }
+
+        // Eigen::Map is a non-const view of data but a copy happens
+        // on return.  We need to temporarily break const correctness.
+        const element_type* cdata = reinterpret_cast<const element_type*>(tens->data());
+        element_type* mdata = const_cast<element_type*>(cdata);
+
+        if (is_row_major(tens)) {
+            return Eigen::Map<ROWM>(mdata, nrows, ncols);
+        }
+        // column-major
+        return Eigen::Map<COLM>(mdata, nrows, ncols);
+    }
+
+}
+
+#endif
diff --git a/aux/src/DftTools.cxx b/aux/src/DftTools.cxx
index b7ec12cb5..5ef53e166 100644
--- a/aux/src/DftTools.cxx
+++ b/aux/src/DftTools.cxx
@@ -3,80 +3,55 @@
 using namespace WireCell;
 using namespace WireCell::Aux;
 
-compvec_t Aux::r2c(const realvec_t& r)
-{
-    compvec_t cret(r.size());
-    std::transform(r.begin(), r.end(), cret.begin(),
-                   [](const real_t& r) { return complex_t(r, 0); });
-    return cret;
-}
-realvec_t Aux::c2r(const compvec_t& c)
-{
-    realvec_t rret(c.size());
-    std::transform(c.begin(), c.end(), rret.begin(),
-                   [](const complex_t& c) { return std::real(c); });
-    return rret;
-}
-
-// Transform a real IS, return same size FS.
-compvec_t Aux::dft(IDFT::pointer dft, const realvec_t& seq)
-{
-    compvec_t cseq = Aux::r2c(seq);
-    compvec_t cret(cseq.size());
-    dft->fwd1d(cseq.data(), cret.data(), cret.size());
-    return cret;
-}
-        
-// Transform complex FS to IS and return real part
-realvec_t Aux::idft(IDFT::pointer dft, const compvec_t& spec)
-{
-    compvec_t cret(spec.size());
-    dft->inv1d(spec.data(), cret.data(), cret.size());
-    return Aux::c2r(cret);
-}
-
-using array_xxf_rm = Eigen::Array<real_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
-using array_xxc_rm = Eigen::Array<complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
-
-
-// Transform a real IS, return same size FS.
-array_xxc Aux::dft(IDFT::pointer trans, const array_xxf& arr)
+/*
+  Big fat warning to future me: Passing by reference means the input
+  array may carry the .IsRowMajor optimization for implementing
+  transpose().  An extra copy would remove that complication but this
+  interface tries to keep it.
+ */
+
+using ROWM = Eigen::Array<Aux::complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
+using COLM = Eigen::Array<Aux::complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::ColMajor>;
+
+template<typename trans>
+Aux::dft_array_t doit(const Aux::dft_array_t& arr, trans func)
 {
+    // Nominally, memory is in column-major order
+    const Aux::complex_t* in_data = arr.data();
     int stride = arr.rows();
     int nstrides = arr.cols();
-    array_xxc ret(stride, nstrides);
 
-    if (!arr.IsRowMajor) {
+    // except when it isn't
+    bool flipped = arr.IsRowMajor;
+    if (flipped) {
         stride = arr.cols();
         nstrides = arr.rows();
     }
 
-    size_t size = stride*nstrides;
-    compvec_t carr(size);
-    std::transform(arr.data(), arr.data()+size, carr.begin(),
-                   [](const real_t& r) { return complex_t(r,0); });
-    
-    trans->fwd2d(carr.data(), ret.data(), stride, nstrides);
-    return ret;
-}
-
-// Transform complex FS to IS and return real part
-array_xxf Aux::idft(IDFT::pointer trans, const array_xxc& arr)
-{
-    int stride = arr.rows();
-    int nstrides = arr.cols();
-    array_xxf ret(stride, nstrides);
+    Aux::dft_vector_t out_vec(nstrides*stride);
+    func(in_data, out_vec.data(), nstrides, stride);
 
-    if (!arr.IsRowMajor) {
-        stride = arr.cols();
-        nstrides = arr.rows();
+    if (flipped) {
+        return Eigen::Map<ROWM>(out_vec.data(), arr.rows(), arr.cols());
     }
+    return Eigen::Map<COLM>(out_vec.data(), arr.rows(), arr.cols());
+
+}
 
-    size_t size = stride*nstrides;
-    compvec_t cret(size);
-    trans->inv2d(arr.data(), cret.data(), stride, nstrides);
+Aux::dft_array_t Aux::fwd(IDFT::pointer dft, const Aux::dft_array_t& arr)
+{
+    return doit(arr, [&](const complex_t* in_data,
+                         complex_t* out_data,
+                         int nstrides, int stride) {
+        dft->fwd2d(in_data, out_data, nstrides, stride);
+    });
+}
 
-    std::transform(cret.begin(), cret.end(), ret.data(),
-                   [](const complex_t& c) { return std::real(c); });
-    return ret;
+Aux::dft_array_t Aux::inv(IDFT::pointer dft, const Aux::dft_array_t& arr)
+{
+    return doit(arr, [&](const complex_t* in_data,
+                         complex_t* out_data,
+                         int nstrides, int stride) {
+        dft->inv2d(in_data, out_data, nstrides, stride);
+    });
 }
diff --git a/aux/src/FftwDFT.cxx b/aux/src/FftwDFT.cxx
index 2a655f5d6..f4a214760 100644
--- a/aux/src/FftwDFT.cxx
+++ b/aux/src/FftwDFT.cxx
@@ -41,7 +41,7 @@ plan_type get_plan(std::shared_mutex& mutex, plan_map_t& plans, plan_key_t key)
 
 template<typename planner_function>
 void doit(std::shared_mutex& mutex, plan_map_t& plans, 
-                int fwdrev, plan_val_t* src, plan_val_t* dst, int stride, int nstrides,
+                int fwdrev, plan_val_t* src, plan_val_t* dst, int nstrides, int stride,
                 planner_function make_plan)
 {
     auto key = make_key(fwdrev == FFTW_BACKWARD, src, dst, stride, nstrides);
@@ -77,7 +77,7 @@ void Aux::FftwDFT::fwd1d(const complex_t* in, complex_t* out, int stride) const
     static const int dir = FFTW_FORWARD;
     auto src = pval_cast(in);
     auto dst = pval_cast(out);
-    doit(mutex, plans, dir, src, dst, stride, 0, [&]( ) {
+    doit(mutex, plans, dir, src, dst, 0, stride, [&]( ) {
         return fftwf_plan_dft_1d(stride, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
     });
 }
@@ -88,35 +88,46 @@ void Aux::FftwDFT::inv1d(const complex_t* in, complex_t* out, int stride) const
     static const int dir = FFTW_BACKWARD;
     auto src = pval_cast(in);
     auto dst = pval_cast(out);
-    doit(mutex, plans, dir, src, dst, stride, 0, [&]( ) {
+    doit(mutex, plans, dir, src, dst, 0, stride, [&]( ) {
         return fftwf_plan_dft_1d(stride, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
     });
+
+    // reverse normalization
+    for (int ind=0; ind<stride; ++ind) {
+        out[ind] /= stride;
+    }
 }
 
 
-void Aux::FftwDFT::fwd2d(const complex_t* in, complex_t* out, int stride, int nstrides) const
+void Aux::FftwDFT::fwd2d(const complex_t* in, complex_t* out, int nstrides, int stride) const
 {
     static std::shared_mutex mutex;
     static plan_map_t plans;
     static const int dir = FFTW_FORWARD;
     auto src = pval_cast(in);
     auto dst = pval_cast(out);
-    doit(mutex, plans, dir, src, dst, stride, nstrides, [&]( ) {
+    doit(mutex, plans, dir, src, dst, nstrides, stride, [&]( ) {
         return fftwf_plan_dft_2d(stride, nstrides, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
     });
 }
 
 
-void Aux::FftwDFT::inv2d(const complex_t* in, complex_t* out, int stride, int nstrides) const
+void Aux::FftwDFT::inv2d(const complex_t* in, complex_t* out, int nstrides, int stride) const
 {
     static std::shared_mutex mutex;
     static plan_map_t plans;
     static const int dir = FFTW_BACKWARD;
     auto src = pval_cast(in);
     auto dst = pval_cast(out);
-    doit(mutex, plans, dir, src, dst, stride, nstrides, [&]( ) {
+    doit(mutex, plans, dir, src, dst, nstrides, stride, [&]( ) {
         return fftwf_plan_dft_2d(stride, nstrides, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
     });
+
+    // reverse normalization
+    const int ntot = stride*nstrides;
+    for (int ind=0; ind<ntot; ++ind) {
+        out[ind] /= ntot;
+    }
 }
 Aux::FftwDFT::FftwDFT()
 {
diff --git a/aux/test/test_dfttools.cxx b/aux/test/test_dfttools.cxx
index 0ef2eaf22..c5bf85930 100644
--- a/aux/test/test_dfttools.cxx
+++ b/aux/test/test_dfttools.cxx
@@ -1,28 +1,119 @@
 #include "WireCellAux/DftTools.h"
 #include "WireCellAux/FftwDFT.h"
+#include "WireCellUtil/Waveform.h"
 
 #include <iostream>
 #include <memory>
 
 using namespace WireCell;
-using namespace WireCell::Aux;
 
-void test_1d_imp(IDFT::pointer trans)
+using real_t = float;
+using RV = std::vector<real_t>;
+using complex_t = std::complex<real_t>;
+using CV = std::vector<complex_t>;
+
+void test_1d(IDFT::pointer dft)
 {
-    realvec_t rimp(64, 0);
+    RV rimp(64, 0);
     rimp[1] = 1.0;
-    auto cimp = dft(trans, rimp);
+
+    auto cimp = Aux::fwd(dft, Waveform::complex(rimp));
     for (auto c : cimp) {
         std::cerr << c << " ";
     }
     std::cerr << "\n";
+
+    RV rimp2 = Waveform::real(Aux::inv(dft, cimp));
+    for (auto r : rimp2) {
+        std::cerr << r << " ";
+    }
+    std::cerr << "\n";
+    for (int ind=0; ind<64; ++ind) {
+        if (ind == 1) {
+            assert(std::abs(rimp2[ind]-1.0) < 1e-6);
+            continue;
+        }
+        assert(std::abs(rimp2[ind]) < 1e-6);
+    }
+}
+
+using FA = Eigen::Array<float, Eigen::Dynamic, Eigen::Dynamic>;
+
+void test_2d(IDFT::pointer dft)
+{
+    const int nrows=16;
+    const int ncols=8;
+    FA r = FA::Zero(nrows, ncols);
+    r(10,1) = 1.0;
+    std::cerr << r << std::endl;
+    auto c = Aux::fwd(dft, r.cast<complex_t>());
+    std::cerr << c << std::endl;
+    FA r2 = Aux::inv(dft, c).real();
+    std::cerr << r2 << std::endl;
+    for (int irow=0; irow<nrows; ++irow) {
+        for (int icol=0; icol<ncols; ++icol) {
+            if (irow==10 and icol==1) {
+                assert(std::abs(r2(irow, icol)-1.0) < 1e-6);
+                continue;
+            }
+            assert(std::abs(r2(irow, icol)) < 1e-6);    
+        }
+    }
+}
+
+template<typename array_type>
+void dump(std::string name, const array_type& arr)
+{
+    std::cerr << name << ":(" << arr.rows() << "," << arr.cols() << ") row-major:" << arr.IsRowMajor << "\n";
+}
+
+void test_2d_transpose(IDFT::pointer dft)
+{
+    const int nrows=16;
+    const int ncols=8;
+
+    FA r = FA::Zero(nrows, ncols); // shape:(16,8)
+    dump("r", r);
+
+    // do not remove the auto in this next line
+    auto rt = r.transpose();    // shape:(8,16)
+    dump("rt", rt);
+    rt(1,10) = 1.0;
+
+    auto c = Aux::fwd(dft, rt.cast<complex_t>());
+    dump("c", c);
+
+    auto r2 = Aux::inv(dft, c).real();
+    dump("r2",r2);
+
+    // transpose access
+    const int nrowst = r2.rows();
+    const int ncolst = r2.cols();
+
+    for (int irow=0; irow<nrowst; ++irow) {
+        for (int icol=0; icol<ncolst; ++icol) {
+            float val = rt(irow, icol);
+            float val2 = r2(irow, icol); // access with transposed indices
+            std::cerr << "(" << irow << ","<< icol << "):" << val << " ? " << val2 << "\n";
+            if (irow==1 and icol==10) {
+                assert(std::abs(val-1.0) < 1e-6);
+                continue;
+            }
+            assert(std::abs(val) < 1e-6);    
+        }
+        std::cerr << "\n";
+    }
+
+    
 }
 
 int main()
 {
-    auto trans = std::make_shared<FftwDFT>();
+    auto dft = std::make_shared<Aux::FftwDFT>();
 
-    test_1d_imp(trans);
+    test_1d(dft);
+    test_2d(dft);
+    test_2d_transpose(dft);
 
     return 0;
 }
diff --git a/aux/test/test_idft.cxx b/aux/test/test_idft.cxx
index 97f85b14d..73bc95df2 100644
--- a/aux/test/test_idft.cxx
+++ b/aux/test/test_idft.cxx
@@ -31,8 +31,8 @@ void test_2d_zero(IDFT::pointer dft, int size = 1024)
     std::vector<IDFT::complex_t> inter(stride*nstrides,0);
     std::vector<IDFT::complex_t> freq(stride*nstrides,0);
 
-    dft->fwd2d(inter.data(), freq.data(), stride, nstrides);
-    dft->inv2d(freq.data(), inter.data(), stride, nstrides);
+    dft->fwd2d(inter.data(), freq.data(), nstrides, stride);
+    dft->inv2d(freq.data(), inter.data(), nstrides, stride);
 
     auto tot = Waveform::sum(inter);
     assert(std::real(tot) == 0);
@@ -48,8 +48,8 @@ void fwdrev(IDFT::pointer dft, int id, int ntimes, int size)
 
     while (ntimes) {
         //std::cerr << ntimes << "\n";
-        dft->fwd2d(inter.data(), freq.data(), stride, nstrides);
-        dft->inv2d(freq.data(), inter.data(), stride, nstrides);
+        dft->fwd2d(inter.data(), freq.data(), nstrides, stride);
+        dft->inv2d(freq.data(), inter.data(), nstrides, stride);
 
         --ntimes;        
         auto tot = Waveform::sum(inter);
diff --git a/aux/test/test_tensor_tools.cxx b/aux/test/test_tensor_tools.cxx
new file mode 100644
index 000000000..933a777e7
--- /dev/null
+++ b/aux/test/test_tensor_tools.cxx
@@ -0,0 +1,102 @@
+#include "WireCellAux/TensorTools.h"
+#include "WireCellAux/SimpleTensor.h"
+
+
+#include <complex>
+#include <vector>
+
+using real_t = float;
+using RV = std::vector<real_t>;
+using complex_t = std::complex<real_t>;
+using CV = std::vector<complex_t>;
+using RT = WireCell::Aux::SimpleTensor<real_t>;
+using CT = WireCell::Aux::SimpleTensor<complex_t>;
+
+// test fodder
+const RV real_vector{0,1,2,3,4,5};
+const RV real_vector_cw{0,3,1,4,2,5};
+const CV complex_vector{{0,0},{1,1},{2,2},{3,3},{4,4},{5,5}};
+const WireCell::ITensor::shape_t shape{2,3};
+
+using namespace WireCell;
+
+void test_is_type()
+{
+    auto rt = std::make_shared<RT>(shape, real_vector.data());
+    assert (Aux::is_type<real_t>(rt));
+    assert (!Aux::is_type<complex_t>(rt));
+}
+
+void test_is_row_major()
+{
+    // ST actually does not let us do anything but C-order/row-major
+    auto rm = std::make_shared<RT>(shape, real_vector.data());
+    assert(Aux::is_row_major(rm));
+}
+
+template<typename VectorType>
+void assert_equal(const VectorType& v1, const VectorType& v2)
+{
+    assert(v1.size() == v2.size());
+    for (size_t ind=0; ind<v1.size(); ++ind) {
+        assert(v1[ind] == v2[ind]);
+    }
+}
+
+// asvec 1) match type, 2) type mismatch
+void test_asvec()
+{
+    auto rt = std::make_shared<RT>(shape, real_vector.data());
+    auto ct = std::make_shared<CT>(shape, complex_vector.data());
+    auto got_rt = Aux::asvec<real_t>(rt);
+    auto got_ct = Aux::asvec<complex_t>(ct);
+    assert_equal(real_vector, got_rt);
+    assert_equal(complex_vector, got_ct);
+
+    try {
+        auto oops = Aux::asvec<complex_t>(rt);
+    }
+    catch (ValueError& err) {
+    }
+}
+
+void test_asarray()
+{
+    // as array 2x2: (1d,2d) x (rw,cw)
+
+    // make mutable copy to test that TT returns a copy
+    RV my_vec(real_vector.begin(), real_vector.end());
+
+    // test 2d
+    auto rt = std::make_shared<RT>(shape, my_vec.data());
+    auto ra = Aux::asarray<real_t>(rt);
+    auto shape = rt->shape();
+    for (size_t irow = 0; irow < shape[0]; ++irow) {
+        for (size_t icol = 0; icol < shape[1]; ++icol) {        
+            assert(ra(irow, icol) == my_vec[irow*shape[1] + icol]);
+        }
+    }
+
+    // test 1d
+    const WireCell::ITensor::shape_t shape1d{6,};
+    auto rt1d = std::make_shared<RT>(shape1d, my_vec.data());
+    auto ra1d = Aux::asarray<real_t>(rt1d);
+    for (size_t ind = 0; ind < shape[0]; ++ind) {        
+        assert(ra1d(ind) == my_vec[ind]);
+    }
+
+    // Assure the internal use of Eigen::Map leads to a copy on return
+    my_vec[0] = 42;
+    assert(ra(0,0) == 0);
+    assert(ra1d(0) == 0);
+}
+
+int main()
+{
+    test_is_type();
+    test_is_row_major();
+    test_asvec();
+    test_asarray();
+
+    return 0;
+}
diff --git a/iface/inc/WireCellIface/IDFT.h b/iface/inc/WireCellIface/IDFT.h
index dd1d39e8c..448c04858 100644
--- a/iface/inc/WireCellIface/IDFT.h
+++ b/iface/inc/WireCellIface/IDFT.h
@@ -1,5 +1,19 @@
 /** 
     Interface to perform discrete single-precision Fourier transforms.
+
+    Note, implementations MUST NOT normalize forward transforms and
+    MUST normalize reverse/inverse transforms by 1/n where n is the
+    number of elements in the 1D array being reverse transformed.
+
+    The number "stride" describes how many elements of the array are
+    contiguous.  For "C-order" aka row-major ordering of 2D arrays,
+    stride is the size of a row, aka number of columns.
+
+    The number "nstrides" describe how many arrays of length "stride"
+    are placed end-to-end in the memory.  For "C-order" aka row-major
+    ordering of 2D arrays, the "nstrides" counts the size of the
+    columns, aka the number of rows.  With this ordering, the
+    (nstrides, stride) pair maps to the usual (nrows, ncols).
 */
 
 #ifndef WIRECELL_IDFT
@@ -34,20 +48,20 @@ namespace WireCell {
 
         virtual 
         void fwd1b(const complex_t* in, complex_t* out,
-                   int stride, int nstrides) const;
+                   int nstrides, int stride) const;
         virtual 
         void inv1b(const complex_t* in, complex_t* out,
-                   int stride, int nstrides) const;
+                   int nstrides, int stride) const;
 
 
         // 2D, transform both dimensions
 
         virtual 
         void fwd2d(const complex_t* in, complex_t* out,
-                   int stride, int nstrides) const = 0;
+                   int nstrides, int stride) const = 0;
         virtual 
         void inv2d(const complex_t* in, complex_t* out,
-                   int stride, int nstrides) const = 0;
+                   int nstrides, int stride) const = 0;
 
      };
 }
diff --git a/iface/inc/WireCellIface/ITensor.h b/iface/inc/WireCellIface/ITensor.h
index 5154b68fd..23bf52964 100644
--- a/iface/inc/WireCellIface/ITensor.h
+++ b/iface/inc/WireCellIface/ITensor.h
@@ -19,7 +19,12 @@ namespace WireCell {
        public:
         /// Shape gives size of each dimension.  Size of shape give Ndim.
         typedef std::vector<size_t> shape_t;
-        /// Storage order.  Empty implies C order.
+        /// Storage order.  Empty implies C order.  If non-empty the
+        /// vector holds the "majority" of the dimension.  C-order
+        /// implies a vector of {1,0} which means if the array is
+        /// accessed as array[a][b] then "b" is most major and "a" is
+        /// next most major.  Ie, row-major.  A fortran order would be
+        /// given as {0,1}.
         typedef std::vector<size_t> order_t;
 
         /// The type of the element.
diff --git a/iface/src/IDFT.cxx b/iface/src/IDFT.cxx
index 2f9ee3543..c0a62655c 100644
--- a/iface/src/IDFT.cxx
+++ b/iface/src/IDFT.cxx
@@ -9,7 +9,7 @@ IDFT::~IDFT() {}
 // with some GPU FFTs, override these methods!
 
 void IDFT::fwd1b(const complex_t* in, complex_t* out,
-                 int stride, int nstrides) const
+                 int nstrides, int stride) const
 {
     for (int istride=0; istride<nstrides; ++istride) {
         fwd1d(in+istride*stride, out+istride*stride, stride);
@@ -17,7 +17,7 @@ void IDFT::fwd1b(const complex_t* in, complex_t* out,
 }
 
 void IDFT::inv1b(const complex_t* in, complex_t* out,
-                 int stride, int nstrides) const
+                 int nstrides, int stride) const
 {
     for (int istride=0; istride<nstrides; ++istride) {
         inv1d(in+istride*stride, out+istride*stride, stride);
diff --git a/util/test/test_eigen_cast.cxx b/util/test/test_eigen_cast.cxx
new file mode 100644
index 000000000..8f9657ef7
--- /dev/null
+++ b/util/test/test_eigen_cast.cxx
@@ -0,0 +1,45 @@
+#include "Eigen/Core"
+
+#include <vector>
+#include <iostream>
+#include <complex>
+
+using real_t = float;
+using RV = std::vector<real_t>;
+using complex_t = std::complex<real_t>;
+using CV = std::vector<complex_t>;
+const RV real_vector{0,1,2,3,4,5};
+const RV real_vector_cw{0,3,1,4,2,5};
+const CV complex_vector{{0,0},{1,10},{2,20},{3,30},{4,40},{5,50}};
+
+using RA = Eigen::Array<real_t, Eigen::Dynamic, Eigen::Dynamic>;
+using RARM = Eigen::Array<real_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
+using CA = Eigen::Array<complex_t, Eigen::Dynamic, Eigen::Dynamic>;
+using CARM = Eigen::Array<complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
+
+int main()
+{
+    RA ra = Eigen::Map<RARM>((real_t*)real_vector.data(), 2, 3);
+    CA ca = Eigen::Map<CARM>((complex_t*)complex_vector.data(), 2, 3);
+
+    CA ra2c = ra.cast<complex_t>();
+    RA ca2r = ca.real();
+
+    for (int irow = 0; irow<2; ++irow) {
+        for (int icol = 0; icol<3; ++icol) {
+            int ind = irow*3 + icol;
+            complex_t c = ra2c(irow, icol);
+            real_t r = c.real();
+            real_t r2 = ca2r(irow, icol);
+            real_t rwant = real_vector[ind];
+            complex_t cwant = complex_vector[ind];
+
+            std::cerr << ind << ": c=" << c  << " r=" << r << " r2=" << r2 << " rwant=" << rwant << " cwant=" << cwant << "\n";
+            assert(c.imag() == 0.0);
+            assert(r==rwant);
+            assert(r2==rwant);
+
+        }
+    }
+    return 0;
+}
diff --git a/util/test/test_eigen_rowcol.cxx b/util/test/test_eigen_rowcol.cxx
new file mode 100644
index 000000000..aec1fd763
--- /dev/null
+++ b/util/test/test_eigen_rowcol.cxx
@@ -0,0 +1,150 @@
+#include <Eigen/Core>
+#include <iostream>
+
+using DEFM = Eigen::Array<float, Eigen::Dynamic, Eigen::Dynamic>; // should be ColMajor
+using COLM = Eigen::Array<float, Eigen::Dynamic, Eigen::Dynamic, Eigen::ColMajor>;
+using ROWM = Eigen::Array<float, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
+
+COLM get_mapped_cw()
+{
+    std::vector<float> col_major{11,21,12,22,13,23};
+    Eigen::Map<COLM> ret(col_major.data(), 2,3);
+    return ret;
+}
+ROWM get_mapped_rw()
+{
+    std::vector<float> row_major{11, 12, 13, 21, 22, 23};
+    Eigen::Map<ROWM> ret(row_major.data(), 2,3);
+    return ret;
+}
+    
+
+COLM get_colwise()
+{
+    COLM ret(2,3);
+    for (int major=0; major<2; ++major) {
+        for (int minor=0; minor<3; ++minor) {
+            ret(major,minor) = (major+1)*10 + minor+1;
+        }
+    }
+    return ret;
+}
+ROWM get_rowwise()
+{
+    ROWM ret(2,3);
+    for (int major=0; major<2; ++major) {
+        for (int minor=0; minor<3; ++minor) {
+            ret(major,minor) = (major+1)*10 + minor+1;
+        }
+    }
+    return ret;
+}
+
+void dump_def(DEFM arr)
+{
+    std::cout << "DEFM" << "("<<arr.rows()<<","<<arr.cols()<<")\n" << arr << "\n";
+    for (int major=0; major<2; ++major) {
+        for (int minor=0; minor<3; ++minor) {
+            std::cout << arr(major,minor)
+                      << "=" << arr.data()[minor*2+major] << " ";
+        }
+    }
+    std::cout << "\n";
+}
+void dump_cw(COLM arr)
+{
+    std::cout << "COLM" << "("<<arr.rows()<<","<<arr.cols()<<")\n" << arr << "\n";
+    for (int major=0; major<2; ++major) {
+        for (int minor=0; minor<3; ++minor) {
+            std::cout << arr(major,minor)
+                      << "=" << arr.data()[minor*2+major] << " ";
+        }
+    }
+    std::cout << "\n";
+}
+void dump_rw(ROWM arr)
+{
+    std::cout << "ROWM" << "("<<arr.rows()<<","<<arr.cols()<<")\n" << arr << "\n";
+    for (int major=0; major<2; ++major) {
+        for (int minor=0; minor<3; ++minor) {
+            std::cout << arr(major,minor)
+                      << "=" << arr.data()[major*3+minor] << " ";
+        }
+    }
+    std::cout << "\n";
+}
+
+void dump_data(const COLM& arr)
+{
+    std::cout << "COLM:";
+    const int size = arr.rows() * arr.cols();
+    for (int ind=0; ind<size; ++ind) {
+        std::cout << arr(ind) << " ";
+    }
+    std::cout << std::endl;
+}
+void dump_data(float* data, int size=6)
+{
+    std::cout << "data:";
+    for (int ind=0; ind<size; ++ind) {
+        std::cout << data[ind] << " ";
+    }
+    std::cout << std::endl;
+}
+
+int main()
+{
+    std::cout << "mapped-cw:\n";
+    dump_def(get_mapped_cw());
+    dump_cw(get_mapped_cw());
+    dump_rw(get_mapped_cw());
+    std::cout << "mapped-rw:\n";
+    dump_def(get_mapped_rw());
+    dump_cw(get_mapped_rw());
+    dump_rw(get_mapped_rw());
+
+    std::cout << "column-wise:\n";
+    dump_def(get_colwise());
+    dump_cw(get_colwise());
+    dump_rw(get_colwise());
+    std::cout << "row-wise:\n";
+    dump_def(get_rowwise());
+    dump_cw(get_rowwise());
+    dump_rw(get_rowwise());
+
+    auto cw = get_colwise();
+    std::cout << "cw is row-major:" << cw.IsRowMajor << "\n";
+    dump_data(cw);
+    dump_data(cw.data());
+
+    auto cat = cw.transpose();
+    std::cout << "cat is row-major:" << cat.IsRowMajor << "\n";
+    dump_data(cat);
+    dump_data(cat.data());
+
+    COLM cct = cw.transpose();
+    std::cout << "cct is row-major:" << cct.IsRowMajor << "\n";
+    dump_data(cct);
+    dump_data(cct.data());
+
+
+}
+/*
+  conclusions: 
+
+  - default is indeed column-wise storage order
+
+  - a copy between ROWM and COLM transforms the underlying data.
+
+  - indices given via the callable operator are invariant.
+
+  - transpose:
+
+    - a transpose() returns same array with IsRowMajor toggled.
+
+    - a IsRowMajor COLM copied to a COLM applies the transpose to the
+      data.
+
+    - access via indicies is always as expected but .data() order
+      interpretation must check C++ type against IsRowMajor!
+ */

From c248bab3e9d5913cf0463f2be637211ce01ad2aa Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 8 Nov 2021 16:31:54 -0500
Subject: [PATCH 09/46] Elaborate on comments

---
 iface/inc/WireCellIface/ITensor.h | 16 +++++++++++++---
 1 file changed, 13 insertions(+), 3 deletions(-)

diff --git a/iface/inc/WireCellIface/ITensor.h b/iface/inc/WireCellIface/ITensor.h
index 23bf52964..d1cbf6adb 100644
--- a/iface/inc/WireCellIface/ITensor.h
+++ b/iface/inc/WireCellIface/ITensor.h
@@ -19,12 +19,22 @@ namespace WireCell {
        public:
         /// Shape gives size of each dimension.  Size of shape give Ndim.
         typedef std::vector<size_t> shape_t;
+
         /// Storage order.  Empty implies C order.  If non-empty the
         /// vector holds the "majority" of the dimension.  C-order
         /// implies a vector of {1,0} which means if the array is
-        /// accessed as array[a][b] then "b" is most major and "a" is
-        /// next most major.  Ie, row-major.  A fortran order would be
-        /// given as {0,1}.
+        /// accessed as array[a][b] "axis" 0 (indexed by "a") is the
+        /// "major index" and "axis" 1 (indexed by "b") is the "minor
+        /// index".  It is thus "row-major" ordering as the major
+        /// index counts rows.  An array in fortran-order
+        /// (column-major order) would be given as {0,1}.
+        ///
+        /// A note as this can be confusing: The "logical" rows and
+        /// columns, eg when used in an Eigen array are independent
+        /// from memory order.  An Eigen array is always indexed as
+        /// arr(r,c).  Storage order only matters when, well, you
+        /// access the array storage such as from Eigen array's
+        /// .data() method - and indeed ITensor::data().
         typedef std::vector<size_t> order_t;
 
         /// The type of the element.

From cd3369d3385300e58f88de3e6388348fd5ac697e Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 8 Nov 2021 16:31:58 -0500
Subject: [PATCH 10/46] Flesh out and test DftTools interface

---
 aux/inc/WireCellAux/DftTools.h | 20 +++++++++---
 aux/src/DftTools.cxx           | 58 ++++++++++++++++++++++++++++++++++
 aux/test/test_dfttools.cxx     | 35 +++++++++++++++++++-
 3 files changed, 107 insertions(+), 6 deletions(-)

diff --git a/aux/inc/WireCellAux/DftTools.h b/aux/inc/WireCellAux/DftTools.h
index 10f2d8cbf..bf4894291 100644
--- a/aux/inc/WireCellAux/DftTools.h
+++ b/aux/inc/WireCellAux/DftTools.h
@@ -47,11 +47,21 @@ namespace WireCell::Aux {
     dft_array_t fwd(IDFT::pointer dft, const dft_array_t& arr);
     dft_array_t inv(IDFT::pointer dft, const dft_array_t& arr);
 
-    // Transform one dimesions.  For example axis=0 transforms each
-    // logical row of the Eigen array so that column=0 of each row
-    // would hold the frequency=0 component of each row's spectrum.  
-    // array_xxc fwd(IDFT::pointer dft, const array_xxc& arr, int axis);
-    // array_xxc inv(IDFT::pointer dft, const array_xxc& arr, int axis);
+    // Transform a 2D array along one axis.
+    //
+    // The axis identifies the logical array "dimension" over which
+    // the transform is applied.  For example, axis=1 means the
+    // transforms are applied along columns (ie, on a per-row basis).
+    // Note: this is the same convention as held by numpy.fft.
+    //
+    // The axis is interpreted in the "logical" sense Eigen arrays
+    // indexed as array(irow, icol).  Ie, the dimension traversing
+    // rows is axis 0 and the dimension traversing columns is axis 1.
+    // Note: internal storage order of an Eigen array may differ from
+    // the logical order and indeed that of the array template type
+    // order.  Neither is pertinent in setting the axis.
+    dft_array_t fwd(IDFT::pointer dft, const dft_array_t& arr, int axis);
+    dft_array_t inv(IDFT::pointer dft, const dft_array_t& arr, int axis);
 
 
 }
diff --git a/aux/src/DftTools.cxx b/aux/src/DftTools.cxx
index 5ef53e166..7297d8806 100644
--- a/aux/src/DftTools.cxx
+++ b/aux/src/DftTools.cxx
@@ -55,3 +55,61 @@ Aux::dft_array_t Aux::inv(IDFT::pointer dft, const Aux::dft_array_t& arr)
         dft->inv2d(in_data, out_data, nstrides, stride);
     });
 }
+
+#include <iostream> // debug
+
+template<typename trans>
+Aux::dft_array_t doit1b(const Aux::dft_array_t& arr, int axis, trans func)
+{
+    // We must provide a flat array with storage order such with
+    // logical axis-major ordering.
+    const Aux::complex_t* in_data = arr.data();
+    const int nrows = arr.rows(); // "logical"
+    const int ncols = arr.cols(); // shape
+
+    std::cerr << "nrows="<<nrows<<", ncols="<<ncols
+              << ", axis="<<axis<<", IsRowMajor:"<<arr.IsRowMajor<<"\n";
+
+    // If storage order matches "axis-major"
+    if ( (axis == 1 and arr.IsRowMajor)
+         or
+         (axis == 0 and not arr.IsRowMajor) ) {
+        Aux::dft_vector_t out_vec(nrows*ncols);
+        func(in_data, out_vec.data(), ncols, nrows);
+        if (arr.IsRowMajor) {
+            // note, returning makes a copy and will perform an actual
+            // storage order transpose.
+            return Eigen::Map<ROWM>(out_vec.data(), nrows, ncols);
+        }
+        return Eigen::Map<COLM>(out_vec.data(), nrows, ncols);
+    }
+    
+    // Either we have row-major and want column-major storage order or
+    // vice versa.
+
+    // Here, we must copy and not use "auto" to get actual storage
+    // order transpose and avoid the IsRowMajor flip optimization.
+    COLM flipped = arr.transpose();
+    COLM got = doit1b(flipped, (axis+1)%2, func);
+    return got.transpose();
+}
+
+Aux::dft_array_t Aux::fwd(IDFT::pointer dft, const Aux::dft_array_t& arr, int axis)
+{
+    return doit1b(arr, axis,
+                  [&](const complex_t* in_data,
+                      complex_t* out_data,
+                      int nstrides, int stride) {
+        dft->fwd1b(in_data, out_data, nstrides, stride);
+    });
+}
+
+Aux::dft_array_t Aux::inv(IDFT::pointer dft, const Aux::dft_array_t& arr, int axis)
+{
+    return doit1b(arr, axis,
+                  [&](const complex_t* in_data,
+                      complex_t* out_data,
+                      int nstrides, int stride) {
+        dft->inv1b(in_data, out_data, nstrides, stride);
+    });
+}
diff --git a/aux/test/test_dfttools.cxx b/aux/test/test_dfttools.cxx
index c5bf85930..e506da80f 100644
--- a/aux/test/test_dfttools.cxx
+++ b/aux/test/test_dfttools.cxx
@@ -107,6 +107,36 @@ void test_2d_transpose(IDFT::pointer dft)
     
 }
 
+void test_1b(IDFT::pointer dft, int axis)
+{
+    const int nrows=8; 
+    const int ncols=4;
+    FA r = FA::Zero(nrows, ncols);
+    r(6,1) = 1.0;
+    dump("impulse", r);
+    std::cerr << r << std::endl;
+    auto c = Aux::fwd(dft, r.cast<complex_t>(), axis);
+    dump("spectra", c);
+    if (axis==0) {
+        
+    }
+    std::cerr << c << std::endl;
+}
+void test_1bt(IDFT::pointer dft, int axis)
+{
+    const int nrows=8; 
+    const int ncols=4;
+    FA r = FA::Zero(nrows, ncols);
+    r(6,1) = 1.0;
+    auto rc = r.cast<complex_t>();
+    auto rct = rc.transpose();
+    dump("impulse.T", rct);
+    std::cerr << rct << std::endl;
+    auto c = Aux::fwd(dft, rct, axis);
+    dump("spectra", c);
+    std::cerr << c << std::endl;
+}
+
 int main()
 {
     auto dft = std::make_shared<Aux::FftwDFT>();
@@ -114,6 +144,9 @@ int main()
     test_1d(dft);
     test_2d(dft);
     test_2d_transpose(dft);
-
+    test_1b(dft, 0);
+    test_1b(dft, 1);
+    test_1bt(dft, 0);
+    test_1bt(dft, 1);
     return 0;
 }

From a83cba82e38e6e8bcfc579e35c64ffbcfc0afa6e Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 15 Nov 2021 16:00:39 -0500
Subject: [PATCH 11/46] Add axis, transpose, tests

---
 aux/inc/WireCellAux/DftTools.h |   2 +-
 aux/inc/WireCellAux/FftwDFT.h  |  31 +++--
 aux/src/DftTools.cxx           |  62 ++++++----
 aux/src/FftwDFT.cxx            | 209 ++++++++++++++++++++++++++++-----
 aux/test/test_idft.cxx         | 155 +++++++++++++++++++++++-
 iface/inc/WireCellIface/IDFT.h | 123 ++++++++++++++-----
 iface/src/IDFT.cxx             |  84 +++++++++++--
 7 files changed, 564 insertions(+), 102 deletions(-)

diff --git a/aux/inc/WireCellAux/DftTools.h b/aux/inc/WireCellAux/DftTools.h
index bf4894291..20272bc3f 100644
--- a/aux/inc/WireCellAux/DftTools.h
+++ b/aux/inc/WireCellAux/DftTools.h
@@ -41,7 +41,7 @@ namespace WireCell::Aux {
     using dft_array_t = Eigen::ArrayXXcf;
     
     // 2D with Eigen arrays.  Use eg arr.cast<complex_>() to provde
-    // from real or arr.cast<float>() to convert result to real.
+    // from real or arr.real()() to convert result to real.
 
     // Transform both dimesions.
     dft_array_t fwd(IDFT::pointer dft, const dft_array_t& arr);
diff --git a/aux/inc/WireCellAux/FftwDFT.h b/aux/inc/WireCellAux/FftwDFT.h
index 365190f0c..f26b5bcf9 100644
--- a/aux/inc/WireCellAux/FftwDFT.h
+++ b/aux/inc/WireCellAux/FftwDFT.h
@@ -6,7 +6,12 @@
 namespace WireCell::Aux {
 
     /** 
-        FftwDFT provides IDFT based on FFTW3.        
+        The FftwDFT component provides IDFT based on FFTW3.
+
+        All instances share a common thread-safe plan cache.  There is
+        no benefit to using more than one instance in a process.
+
+        See IDFT.h for important comments.
     */
     class FftwDFT : public IDFT {
       public:
@@ -18,23 +23,33 @@ namespace WireCell::Aux {
 
         virtual 
         void fwd1d(const complex_t* in, complex_t* out,
-                   int stride) const;
+                   int size) const;
 
         virtual 
         void inv1d(const complex_t* in, complex_t* out,
-                   int stride) const;
+                   int size) const;
 
-        // batched 1D ("1b") - rely on base implementation
+        virtual 
+        void fwd1b(const complex_t* in, complex_t* out,
+                   int nrows, int ncols, int axis) const;
 
-        // 2d
+        virtual 
+        void inv1b(const complex_t* in, complex_t* out,
+                   int nrows, int ncols, int axis) const;
 
         virtual 
         void fwd2d(const complex_t* in, complex_t* out,
-                   int nstrides, int stride) const;
+                   int nrows, int ncols) const;
         virtual 
         void inv2d(const complex_t* in, complex_t* out,
-                   int nstrides, int stride) const;
-
+                   int nrows, int ncols) const;
+
+        virtual
+        void transpose(const scalar_t* in, scalar_t* out,
+                       int nrows, int ncols) const;
+        virtual
+        void transpose(const complex_t* in, complex_t* out,
+                       int nrows, int ncols) const;
 
     };
 }
diff --git a/aux/src/DftTools.cxx b/aux/src/DftTools.cxx
index 7297d8806..905cbcfa2 100644
--- a/aux/src/DftTools.cxx
+++ b/aux/src/DftTools.cxx
@@ -16,20 +16,20 @@ using COLM = Eigen::Array<Aux::complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen:
 template<typename trans>
 Aux::dft_array_t doit(const Aux::dft_array_t& arr, trans func)
 {
-    // Nominally, memory is in column-major order
+    // Nominally, eigen storage memory is in column-major order
     const Aux::complex_t* in_data = arr.data();
-    int stride = arr.rows();
-    int nstrides = arr.cols();
+    int ncols = arr.rows();
+    int nrows = arr.cols();
 
     // except when it isn't
     bool flipped = arr.IsRowMajor;
     if (flipped) {
-        stride = arr.cols();
-        nstrides = arr.rows();
+        ncols = arr.cols();
+        nrows = arr.rows();
     }
 
-    Aux::dft_vector_t out_vec(nstrides*stride);
-    func(in_data, out_vec.data(), nstrides, stride);
+    Aux::dft_vector_t out_vec(nrows*ncols);
+    func(in_data, out_vec.data(), nrows, ncols);
 
     if (flipped) {
         return Eigen::Map<ROWM>(out_vec.data(), arr.rows(), arr.cols());
@@ -42,8 +42,8 @@ Aux::dft_array_t Aux::fwd(IDFT::pointer dft, const Aux::dft_array_t& arr)
 {
     return doit(arr, [&](const complex_t* in_data,
                          complex_t* out_data,
-                         int nstrides, int stride) {
-        dft->fwd2d(in_data, out_data, nstrides, stride);
+                         int nrows, int ncols) {
+        dft->fwd2d(in_data, out_data, nrows, ncols);
     });
 }
 
@@ -51,8 +51,8 @@ Aux::dft_array_t Aux::inv(IDFT::pointer dft, const Aux::dft_array_t& arr)
 {
     return doit(arr, [&](const complex_t* in_data,
                          complex_t* out_data,
-                         int nstrides, int stride) {
-        dft->inv2d(in_data, out_data, nstrides, stride);
+                         int nrows, int ncols) {
+        dft->inv2d(in_data, out_data, nrows, ncols);
     });
 }
 
@@ -94,22 +94,38 @@ Aux::dft_array_t doit1b(const Aux::dft_array_t& arr, int axis, trans func)
     return got.transpose();
 }
 
+// Implementation notes for fwd()/inv():
+//
+// - We make an initial copy to get rid of any potential IsRowMajor
+//   optimization/confusion over storage order.  This suffers a copy
+//   but we need to allocate return anyways.
+//
+// - We then have column-wise storage order but IDFT assumes row-wise
+// - so we reverse (nrows, ncols) and meaning of axis.
+
 Aux::dft_array_t Aux::fwd(IDFT::pointer dft, const Aux::dft_array_t& arr, int axis)
 {
-    return doit1b(arr, axis,
-                  [&](const complex_t* in_data,
-                      complex_t* out_data,
-                      int nstrides, int stride) {
-        dft->fwd1b(in_data, out_data, nstrides, stride);
-    });
+    Aux::dft_array_t ret = arr; 
+    dft->fwd1b(ret.data(), ret.data(), ret.cols(), ret.rows(), !axis);
+    return ret;
+
+    // return doit1b(arr, axis,
+    //               [&](const complex_t* in_data,
+    //                   complex_t* out_data,
+    //                   int nrows, int ncols) {
+    //     dft->fwd1b(in_data, out_data, nrows, ncols);
+    // });
 }
 
 Aux::dft_array_t Aux::inv(IDFT::pointer dft, const Aux::dft_array_t& arr, int axis)
 {
-    return doit1b(arr, axis,
-                  [&](const complex_t* in_data,
-                      complex_t* out_data,
-                      int nstrides, int stride) {
-        dft->inv1b(in_data, out_data, nstrides, stride);
-    });
+    Aux::dft_array_t ret = arr; 
+    dft->inv1b(ret.data(), ret.data(), ret.cols(), ret.rows(), !axis);
+    return ret;
+    // return doit1b(arr, axis,
+    //               [&](const complex_t* in_data,
+    //                   complex_t* out_data,
+    //                   int nrows, int ncols) {
+    //     dft->inv1b(in_data, out_data, nrows, ncols);
+    // });
 }
diff --git a/aux/src/FftwDFT.cxx b/aux/src/FftwDFT.cxx
index f4a214760..1289b8f99 100644
--- a/aux/src/FftwDFT.cxx
+++ b/aux/src/FftwDFT.cxx
@@ -16,15 +16,25 @@ using plan_type = fftwf_plan;
 using plan_map_t = std::unordered_map<plan_key_t, plan_type>;
 using plan_val_t = fftwf_complex;
 
+// Make a key by which a plan is known.  dir should be FFTW_FORWARD or
+// FFTW_BACKWARD and "axis" is -1 for all or in {0,1} for one of 2D.
+// For 1D, use the default axis=-1.
+//
+// Imp note: The key is slightly over-specified as we keep one
+// independent cache for each of the six methods.  The "dir" is
+// thus redundant.
 static
-plan_key_t make_key(bool inverse, const void * src, void * dst, int n0, int n1)
+plan_key_t make_key(const void * src, void * dst, int nrows, int ncols, int dir, int axis=-1)
 {
+    ++axis;                     // need three positive values, default is both axis 
+    bool inverse = dir == FFTW_BACKWARD;
     bool inplace = (dst==src);
     bool aligned = ( (reinterpret_cast<size_t>(src)&15) | (reinterpret_cast<size_t>(dst)&15) ) == 0;
-    int64_t key = ( ( (((int64_t)n0) << 30)|(n1<<3 ) | (inverse<<2) | (inplace<<1) | aligned ) << 1 ) + 1;
+    int64_t key = ( ( (((int64_t)nrows) << 32)| (ncols<<5 ) | (axis<<3) | (inverse<<2) | (inplace<<1) | aligned ) << 1 ) + 1;
     return key;
 }
 
+// Look up a plan by key or return NULL
 static
 plan_type get_plan(std::shared_mutex& mutex, plan_map_t& plans, plan_key_t key)
 {
@@ -39,12 +49,16 @@ plan_type get_plan(std::shared_mutex& mutex, plan_map_t& plans, plan_key_t key)
 
 // #include <iostream>             // debugging
 
-template<typename planner_function>
-void doit(std::shared_mutex& mutex, plan_map_t& plans, 
-                int fwdrev, plan_val_t* src, plan_val_t* dst, int nstrides, int stride,
-                planner_function make_plan)
+using planner_function = std::function<plan_type()>;
+
+// This wraps plan lookup, possible plan creation and subsequent plan
+// execution so that we get thread-safe plan caching.
+template<typename ValueType>
+void doit(std::shared_mutex& mutex, plan_map_t& plans, plan_key_t key,
+          ValueType* src, ValueType* dst,
+          planner_function make_plan,
+          std::function<void(const plan_type, ValueType*, ValueType*)> exec_plan)
 {
-    auto key = make_key(fwdrev == FFTW_BACKWARD, src, dst, stride, nstrides);
     auto plan = get_plan(mutex, plans, key);
     if (!plan) {
         std::unique_lock lock(mutex);
@@ -59,7 +73,8 @@ void doit(std::shared_mutex& mutex, plan_map_t& plans,
             plan = it->second;
         }
     }
-    fftwf_execute_dft(plan, src, dst);
+    //fftwf_execute_dft(plan, src, dst);
+    exec_plan(plan, src, dst);
 }
 
 
@@ -70,65 +85,203 @@ plan_val_t* pval_cast( const IDFT::complex_t * p)
 }
 
 
-void Aux::FftwDFT::fwd1d(const complex_t* in, complex_t* out, int stride) const
+void Aux::FftwDFT::fwd1d(const complex_t* in, complex_t* out, int ncols) const
 {
     static std::shared_mutex mutex;
     static plan_map_t plans;
     static const int dir = FFTW_FORWARD;
     auto src = pval_cast(in);
     auto dst = pval_cast(out);
-    doit(mutex, plans, dir, src, dst, 0, stride, [&]( ) {
-        return fftwf_plan_dft_1d(stride, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
-    });
+    auto key = make_key(src, dst, 1, ncols, dir);
+    doit<plan_val_t>(mutex, plans, key, src, dst, [&]( ) {
+        return fftwf_plan_dft_1d(ncols, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
+    }, fftwf_execute_dft);
 }
-void Aux::FftwDFT::inv1d(const complex_t* in, complex_t* out, int stride) const
+void Aux::FftwDFT::inv1d(const complex_t* in, complex_t* out, int ncols) const
 {
     static std::shared_mutex mutex;
     static plan_map_t plans;
     static const int dir = FFTW_BACKWARD;
     auto src = pval_cast(in);
     auto dst = pval_cast(out);
-    doit(mutex, plans, dir, src, dst, 0, stride, [&]( ) {
-        return fftwf_plan_dft_1d(stride, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
-    });
+    auto key = make_key(src, dst, 1, ncols, dir);
 
-    // reverse normalization
-    for (int ind=0; ind<stride; ++ind) {
-        out[ind] /= stride;
+    doit<plan_val_t>(mutex, plans, key, src, dst, [&]( ) {
+        return fftwf_plan_dft_1d(ncols, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
+    }, fftwf_execute_dft);
+
+    // Apply 1/n normalization
+    for (int ind=0; ind<ncols; ++ind) {
+        out[ind] /= ncols;
+    }
+}
+
+
+fftwf_plan plan_1b(fftwf_complex *in, fftwf_complex *out,
+                   int nrows, int ncols, int sign, int axis)
+{
+    // (r,c) element at in + r*stride + c*dist
+
+    const int rank = 1;         // dimension of transform
+    int n = ncols;              // along rows
+    int howmany = nrows;
+    int stride = 1;
+    int dist = ncols;
+    if (axis == 0) {            // along columns
+        n = nrows;
+        howmany = ncols;
+        stride = ncols;
+        dist = 1;
+    }
+    int *inembed=&n, *onembed=&n;
+
+    unsigned int flags =  FFTW_ESTIMATE|FFTW_PRESERVE_INPUT;
+
+    return fftwf_plan_many_dft(rank, &n, howmany,
+                               in, inembed,
+                               stride, dist,
+                               out, onembed,
+                               stride, dist,
+                               sign, flags);
+}
+
+
+void Aux::FftwDFT::fwd1b(const complex_t* in, complex_t* out, int nrows, int ncols, int axis) const
+{
+    static std::shared_mutex mutex;
+    static plan_map_t plans;
+    static const int dir = FFTW_FORWARD;
+    auto src = pval_cast(in);
+    auto dst = pval_cast(out);
+    auto key = make_key(src, dst, nrows, ncols, dir, axis);
+
+    doit<plan_val_t>(mutex, plans, key, src, dst, [&]( ) {
+        return plan_1b(src, dst, nrows, ncols, dir, axis);
+    }, fftwf_execute_dft);
+}
+
+
+void Aux::FftwDFT::inv1b(const complex_t* in, complex_t* out, int nrows, int ncols, int axis) const
+{
+    static std::shared_mutex mutex;
+    static plan_map_t plans;
+    static const int dir = FFTW_BACKWARD;
+    auto src = pval_cast(in);
+    auto dst = pval_cast(out);
+    auto key = make_key(src, dst, nrows, ncols, dir, axis);
+
+    doit<plan_val_t>(mutex, plans, key, src, dst, [&]( ) {
+        return plan_1b(src, dst, nrows, ncols, dir, axis);
+    }, fftwf_execute_dft);
+
+    // 1/n normalization
+    const int norm = axis ? ncols : nrows;
+    const int ntot = ncols*nrows;
+    for (int ind=0; ind<ntot; ++ind) {
+        out[ind] /= norm;
     }
 }
 
 
-void Aux::FftwDFT::fwd2d(const complex_t* in, complex_t* out, int nstrides, int stride) const
+void Aux::FftwDFT::fwd2d(const complex_t* in, complex_t* out, int nrows, int ncols) const
 {
     static std::shared_mutex mutex;
     static plan_map_t plans;
     static const int dir = FFTW_FORWARD;
     auto src = pval_cast(in);
     auto dst = pval_cast(out);
-    doit(mutex, plans, dir, src, dst, nstrides, stride, [&]( ) {
-        return fftwf_plan_dft_2d(stride, nstrides, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
-    });
+    auto key = make_key(src, dst, nrows, ncols, dir);
+    doit<plan_val_t>(mutex, plans, key, src, dst, [&]( ) {
+        return fftwf_plan_dft_2d(ncols, nrows, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
+    }, fftwf_execute_dft);
 }
 
 
-void Aux::FftwDFT::inv2d(const complex_t* in, complex_t* out, int nstrides, int stride) const
+void Aux::FftwDFT::inv2d(const complex_t* in, complex_t* out, int nrows, int ncols) const
 {
     static std::shared_mutex mutex;
     static plan_map_t plans;
     static const int dir = FFTW_BACKWARD;
     auto src = pval_cast(in);
     auto dst = pval_cast(out);
-    doit(mutex, plans, dir, src, dst, nstrides, stride, [&]( ) {
-        return fftwf_plan_dft_2d(stride, nstrides, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
-    });
+    auto key = make_key(src, dst, nrows, ncols, dir);
+    doit<plan_val_t>(mutex, plans, key, src, dst, [&]( ) {
+        return fftwf_plan_dft_2d(ncols, nrows, src, dst, dir, FFTW_ESTIMATE|FFTW_PRESERVE_INPUT);
+    }, fftwf_execute_dft);
 
     // reverse normalization
-    const int ntot = stride*nstrides;
+    const int ntot = ncols*nrows;
     for (int ind=0; ind<ntot; ++ind) {
         out[ind] /= ntot;
     }
 }
+
+
+// based on example from fftw3 faq
+static
+plan_type transpose_plan_complex(plan_val_t *in, plan_val_t *out, int rows, int cols)
+{
+    const unsigned flags = FFTW_ESTIMATE; /* other flags are possible */
+    fftw_iodim howmany_dims[2];
+
+    howmany_dims[0].n  = rows;
+    howmany_dims[0].is = cols;
+    howmany_dims[0].os = 1;
+
+    howmany_dims[1].n  = cols;
+    howmany_dims[1].is = 1;
+    howmany_dims[1].os = rows;
+
+    return fftwf_plan_guru_dft(/*rank=*/ 0, /*dims=*/ NULL,
+                               /*howmany_rank=*/ 2, howmany_dims,
+                               in, out, /*sign=*/ 0, flags);
+}
+void Aux::FftwDFT::transpose(const complex_t* in, complex_t* out,
+                             int nrows, int ncols) const
+{
+    static std::shared_mutex mutex;
+    static plan_map_t plans;
+    static const int dir = 0;
+    auto src = pval_cast(in);
+    auto dst = pval_cast(out);
+    auto key = make_key(src, dst, nrows, ncols, dir);
+    doit<plan_val_t>(mutex, plans, key, src, dst, [&]( ) {
+        return transpose_plan_complex(src, dst, nrows, ncols);
+    }, fftwf_execute_dft);
+}
+
+static
+plan_type transpose_plan_real(float *in, float *out, int rows, int cols)
+{
+    const unsigned flags = FFTW_ESTIMATE; /* other flags are possible */
+    fftw_iodim howmany_dims[2];
+
+    howmany_dims[0].n  = rows;
+    howmany_dims[0].is = cols;
+    howmany_dims[0].os = 1;
+
+    howmany_dims[1].n  = cols;
+    howmany_dims[1].is = 1;
+    howmany_dims[1].os = rows;
+
+    return fftwf_plan_guru_r2r(/*rank=*/ 0, /*dims=*/ NULL,
+                               /*howmany_rank=*/ 2, howmany_dims,
+                               in, out, /*kind=*/ NULL, flags);
+}
+void Aux::FftwDFT::transpose(const scalar_t* in, scalar_t* out,
+                             int nrows, int ncols) const
+{
+    static std::shared_mutex mutex;
+    static plan_map_t plans;
+    static const int dir = 0;
+    auto src = const_cast<scalar_t*>(in);
+    auto dst = out;
+    auto key = make_key(src, dst, nrows, ncols, dir);
+    doit<float>(mutex, plans, key, src, dst, [&]( ) {
+        return transpose_plan_real(src, dst, nrows, ncols);
+    }, fftwf_execute_r2r);
+}
+
 Aux::FftwDFT::FftwDFT()
 {
 }
diff --git a/aux/test/test_idft.cxx b/aux/test/test_idft.cxx
index 73bc95df2..cfd109a8b 100644
--- a/aux/test/test_idft.cxx
+++ b/aux/test/test_idft.cxx
@@ -8,10 +8,36 @@
 #include <chrono>
 #include <vector>
 #include <thread>
+#include <numeric>
 #include <iostream>
 
 using namespace WireCell;
 
+const float eps = 1e-8;
+
+static void assert_impulse_at_index(const std::vector<IDFT::complex_t>& vec, size_t index=0)
+{
+    const size_t size = vec.size();
+    auto tot = Waveform::sum(vec);
+    assert(std::abs(std::real(tot) - 1.0) < eps);
+    assert(std::abs(std::real(vec[index]) - 1.0) < eps);
+    assert(std::abs(std::imag(tot))  < eps);
+    assert(std::abs(std::imag(vec[index])) < eps);
+    for (size_t ind=0; ind<size; ++ind) {
+        if (ind == index) continue;
+        assert(std::abs(std::real(vec[ind])) < eps);
+        assert(std::abs(std::imag(vec[ind])) < eps);
+    }
+}
+static void assert_flat_value(const std::vector<IDFT::complex_t>& vec, IDFT::scalar_t val = 1.0)
+{
+    const auto size = vec.size();
+    auto tot = Waveform::sum(vec);
+    assert(std::abs(std::abs(tot) - val*size) < eps);
+    for (const auto& v : vec) {
+        assert(std::abs(std::abs(v) - val) < eps);
+    }
+}
 
 static
 void test_1d_zero(IDFT::pointer dft, int size = 1024)
@@ -19,11 +45,25 @@ void test_1d_zero(IDFT::pointer dft, int size = 1024)
     std::vector<IDFT::complex_t> inter(size,0), freq(size,0);
 
     dft->fwd1d(inter.data(), freq.data(), inter.size());
+    assert_flat_value(freq, 0);
     dft->inv1d(freq.data(), inter.data(), freq.size());
+    assert_flat_value(inter, 0);
+}
+static
+void test_1d_impulse(IDFT::pointer dft, int size=1024)
+{
+    std::vector<IDFT::complex_t> inter(size,0), freq(size,0), back(size,0);
+    inter[0] = 1.0;
+
+    dft->fwd1d(inter.data(), freq.data(), freq.size());
+    assert_flat_value(freq);
 
-    auto tot = Waveform::sum(inter);
-    assert(std::real(tot) == 0);
+    dft->inv1d(freq.data(), back.data(), back.size());
+    assert_impulse_at_index(back);
 }
+
+
+
 static
 void test_2d_zero(IDFT::pointer dft, int size = 1024)
 {
@@ -32,10 +72,71 @@ void test_2d_zero(IDFT::pointer dft, int size = 1024)
     std::vector<IDFT::complex_t> freq(stride*nstrides,0);
 
     dft->fwd2d(inter.data(), freq.data(), nstrides, stride);
+    assert_flat_value(inter, 0);
     dft->inv2d(freq.data(), inter.data(), nstrides, stride);
+    assert_flat_value(freq, 0);
+}
+static
+void test_2d_impulse(IDFT::pointer dft, int nrows=128, int ncols=128)
+{
+    const int size = nrows*ncols;
+    std::vector<IDFT::complex_t> inter(size,0), freq(size,0), back(size,0);
+    inter[0] = 1.0;
+    dft->fwd2d(inter.data(), freq.data(), nrows, ncols);
+    assert_flat_value(freq);
+
+    dft->inv2d(freq.data(), back.data(), nrows, ncols);
+    assert_impulse_at_index(back);
+
+}
+
+
+static void assert_on_axis(const std::vector<IDFT::complex_t>& freq,
+                           int axis, int nrows=128, int ncols=128)
+{
+    for (int irow=0; irow<nrows; ++irow) {
+        for (int icol=0; icol<ncols; ++icol) {
+            int ind = irow*ncols + icol;
+            auto val = std::abs(freq[ind]);
+            if (axis) {
+                if (irow==0) {
+                    assert(std::abs(val - 1.0) < eps);
+                }
+                else {
+                    assert(val < eps);
+                }
+            }
+            else {
+                if (icol==0) {
+                    assert(std::abs(val - 1.0) < eps);
+                }
+                else {
+                    assert(val < eps);
+                }
+            }
+        }
+    }
+}
+
+void test_1b_impulse(IDFT::pointer dft, int axis, int nrows=128, int ncols=128)
+{
+    const int size = nrows*ncols;
+
+    std::vector<IDFT::complex_t> inter(size,0), freq(size,0), back(size,0);
+    inter[0] = 1.0;
+    dft->fwd1b(inter.data(), freq.data(), nrows, ncols, axis);
+    assert_on_axis(freq, axis, nrows, ncols);
+    dft->inv1b(freq.data(), back.data(), nrows, ncols, axis);
+    assert_impulse_at_index(back, 0);
 
-    auto tot = Waveform::sum(inter);
-    assert(std::real(tot) == 0);
+    std::vector<IDFT::complex_t> inplace(size,0);
+    inplace[0] = 1.0;
+    dft->fwd1b(inplace.data(), inplace.data(), nrows, ncols, axis);
+    assert_on_axis(inplace, axis, nrows, ncols);
+
+    std::vector<IDFT::complex_t> inback(inplace.begin(), inplace.end());
+    dft->inv1b(inback.data(), inback.data(), nrows, ncols, axis);
+    assert_impulse_at_index(inback, 0);
 }
 
 void fwdrev(IDFT::pointer dft, int id, int ntimes, int size)
@@ -84,6 +185,42 @@ void test_2d_threads(IDFT::pointer dft, int nthreads, int nloops, int size = 102
               << " " << dt1.count() << std::endl;
 }
 
+template<typename ValueType>
+void dump(ValueType* data, int nrows, int ncols, std::string msg="")
+{
+    std::cerr << msg << "("<<nrows<<","<<ncols<<")\n";
+    for (int irow=0; irow<nrows; ++irow) {
+        for (int icol=0; icol<ncols; ++icol) {
+            std::cerr << data[irow*ncols + icol] << " ";
+        }
+        std::cerr << "\n";
+    }
+}
+
+template<typename ValueType>
+void test_2d_transpose(IDFT::pointer dft, int nrows, int ncols)
+{
+    std::vector<ValueType> arr(nrows*ncols);
+    std::iota(arr.begin(), arr.end(), 0);
+
+    std::vector<ValueType> arr2(nrows*ncols, 0);
+    std::vector<ValueType> arr3(arr.begin(), arr.end());
+
+    dft->transpose(arr.data(), arr2.data(), nrows, ncols);
+    dft->transpose(arr3.data(), arr3.data(), nrows, ncols);
+
+    for (int irow=0; irow<nrows; ++irow) {
+        for (int icol=0; icol<ncols; ++icol) {
+            assert( arr[irow*ncols + icol] == arr2[icol*nrows + irow]);
+            assert( arr[irow*ncols + icol] == arr3[icol*nrows + irow]);
+        }
+    }
+    dump(arr.data(), nrows, ncols, "original");
+    dump(arr2.data(), ncols, nrows, "copy");
+    dump(arr3.data(), ncols, nrows, "inplace");
+
+}
+
 int main(int argc, char* argv[])
 {
     // fixme, add CLI parsing to add plugins, config and name another
@@ -104,7 +241,17 @@ int main(int argc, char* argv[])
     }
 
     test_1d_zero(idft);
+    test_1d_impulse(idft);
     test_2d_zero(idft);
+    test_2d_impulse(idft);
+
+    test_1b_impulse(idft, 0);
+    test_1b_impulse(idft, 1);
+
+    test_2d_transpose<IDFT::scalar_t>(idft, 2, 8);
+    test_2d_transpose<IDFT::scalar_t>(idft, 8, 2);
+    test_2d_transpose<IDFT::complex_t>(idft, 2, 8);
+    test_2d_transpose<IDFT::complex_t>(idft, 8, 2);
 
     std::vector<int> sizes = {128,256,512,1024};
     for (auto size : sizes) {
diff --git a/iface/inc/WireCellIface/IDFT.h b/iface/inc/WireCellIface/IDFT.h
index 448c04858..e94afb391 100644
--- a/iface/inc/WireCellIface/IDFT.h
+++ b/iface/inc/WireCellIface/IDFT.h
@@ -1,21 +1,3 @@
-/** 
-    Interface to perform discrete single-precision Fourier transforms.
-
-    Note, implementations MUST NOT normalize forward transforms and
-    MUST normalize reverse/inverse transforms by 1/n where n is the
-    number of elements in the 1D array being reverse transformed.
-
-    The number "stride" describes how many elements of the array are
-    contiguous.  For "C-order" aka row-major ordering of 2D arrays,
-    stride is the size of a row, aka number of columns.
-
-    The number "nstrides" describe how many arrays of length "stride"
-    are placed end-to-end in the memory.  For "C-order" aka row-major
-    ordering of 2D arrays, the "nstrides" counts the size of the
-    columns, aka the number of rows.  With this ordering, the
-    (nstrides, stride) pair maps to the usual (nrows, ncols).
-*/
-
 #ifndef WIRECELL_IDFT
 #define WIRECELL_IDFT
 
@@ -24,6 +6,77 @@
 
 namespace WireCell {
 
+    /** 
+        Interface to perform discrete Fourier transforms on arrays of
+        signal precision, complex floating point values.
+
+        There are 6 DFT methods which are formed as the outer product
+        of two lists:
+
+        - fwd, inv
+        - 1d, 1b, 2d
+
+        The "fwd" methods provide forward transform, no normalization.
+        The "inv" methods provide reverse/inverse transform normalized
+        by 1/size.
+
+        The 1d transforms take rank=1 / 1D arrays and perform a single
+        transform.
+
+        The 2d transforms take rank=2 / 2D arrays and perform nrows of
+        transforms along rows and ncols of transforms along columns.
+        The order over which each dimension is transformed is
+        implementation-defined (and imaterial).
+
+        The 1b transforms take rank=1 / 2D arrays and perform
+        transforms along a single dimension as determined by the value
+        of the "axis" parameter.  An axis=1 means to perform nrows
+        transforms along rows.  Note, this is the same convention
+        followed by numpy.fft functions.
+
+        There is also a special rank=0 DFT on rank=2 arrays which is
+        more commonly known as a "matrix transpose".
+
+        Requirements on implementations:
+
+        - Forward transforms SHALL NOT apply normalization.
+
+        - Reverse transforms SHALL apply 1/n normalization.
+
+        - The arrays SHALL be assumed to follow C-ordering aka
+          row-major storage order.
+      
+        - Transform methods SHALL allow the input and output array
+          pointers to be identical.
+
+        - The IDFT interface provides 1b methods implemented in terms
+          of 1d calls and a implementation MAY override these (for
+          example, if implementation can exploit batch optimization).
+
+        - Implementation SHALL allow safe concurrent calls to methods
+          by different threads of execution.
+
+        Requirement on callers.
+
+        - Input and output arrays SHALL be pre-allocated and be sized
+          at least as large as indicated by accompanying size arguments.
+
+        - Input and output arrays MUST either be non-overlapping in
+          memory or MUST be identical.
+
+        Notes: 
+
+        - All arrays are of type single precision complex floating
+          point.  Functions and methods to easily convert between the
+          two exist.
+
+        - Eigen arrays are column-wise by default and so their
+          arr.data() method can not directly supply input to this
+          interface.  Likewise, use of arr.transpose().data() may run
+          afowl of Eigen's IsRowMajor optimization flag.  Copy your
+          default array in a Eigen::RowMajor array first or use IDFT
+          via Aux::DftTools functions.
+    */
     class IDFT  : public IComponent<IDFT> {
       public:
         virtual ~IDFT();
@@ -34,35 +87,43 @@ namespace WireCell {
         /// The type for the spectrum in each bin.
         using complex_t = std::complex<scalar_t>;
 
-        // 1D 
+        // 1d 
 
         virtual 
-        void fwd1d(const complex_t* in, complex_t* out,
-                   int stride) const = 0;
+        void fwd1d(const complex_t* in, complex_t* out, int size) const = 0;
 
         virtual 
-        void inv1d(const complex_t* in, complex_t* out,
-                   int stride) const = 0;
+        void inv1d(const complex_t* in, complex_t* out, int size) const = 0;
 
-        // batched 1D ("1b")
+        // 1b
 
         virtual 
         void fwd1b(const complex_t* in, complex_t* out,
-                   int nstrides, int stride) const;
+                   int nrows, int ncols, int axis) const;
+
         virtual 
         void inv1b(const complex_t* in, complex_t* out,
-                   int nstrides, int stride) const;
-
+                   int nrows, int ncols, int axis) const;
 
-        // 2D, transform both dimensions
+        // 2d
 
         virtual 
         void fwd2d(const complex_t* in, complex_t* out,
-                   int nstrides, int stride) const = 0;
+                   int nrows, int ncols) const = 0;
         virtual 
         void inv2d(const complex_t* in, complex_t* out,
-                   int nstrides, int stride) const = 0;
-
+                   int nrows, int ncols) const = 0;
+
+
+        // Fill "out" with the transpose of "in", may be in-place.
+        // The nrows/ncols refers to the shape of the input.
+        virtual
+        void transpose(const scalar_t* in, scalar_t* out,
+                       int nrows, int ncols) const;
+        virtual
+        void transpose(const complex_t* in, complex_t* out,
+                       int nrows, int ncols) const;
+        
      };
 }
 
diff --git a/iface/src/IDFT.cxx b/iface/src/IDFT.cxx
index c0a62655c..58b1d335b 100644
--- a/iface/src/IDFT.cxx
+++ b/iface/src/IDFT.cxx
@@ -1,25 +1,95 @@
 #include "WireCellIface/IDFT.h"
 
+#include <vector>
+#include <utility>              // std::swap since c++11
+
 using namespace WireCell;
 
 IDFT::~IDFT() {}
 
 // Trivial default "batched" implementations.  If your concrete
 // implementation provides some kind of "batch optimization", such as
-// with some GPU FFTs, override these methods!
+// with FFTW3's advanced interface or with some GPU FFT library,
+// override these dumb methods for the win.
 
 void IDFT::fwd1b(const complex_t* in, complex_t* out,
-                 int nstrides, int stride) const
+                 int nrows, int ncols, int axis) const
 {
-    for (int istride=0; istride<nstrides; ++istride) {
-        fwd1d(in+istride*stride, out+istride*stride, stride);
+    if (axis) { 
+        for (int irow=0; irow<nrows; ++irow) {
+            fwd1d(in+irow*ncols, out+irow*ncols, ncols);
+        }
+    }
+    else {
+        this->transpose(in, out, nrows, ncols);
+        this->fwd1b(out, out, ncols, nrows, 1);
+        this->transpose(out, out, ncols, nrows);
     }
 }
 
 void IDFT::inv1b(const complex_t* in, complex_t* out,
-                 int nstrides, int stride) const
+                 int nrows, int ncols, int axis) const
 {
-    for (int istride=0; istride<nstrides; ++istride) {
-        inv1d(in+istride*stride, out+istride*stride, stride);
+    if (axis) { 
+        for (int irow=0; irow<nrows; ++irow) {
+            inv1d(in+irow*ncols, out+irow*ncols, ncols);
+        }
+    }
+    else {
+        this->transpose(in, out, nrows, ncols);
+        this->inv1b(out, out, ncols, nrows, 1);
+        this->transpose(out, out, ncols, nrows);
     }
 }
+
+// Trivial default transpose.  Implementations, please override if you
+// can offer something faster.
+
+template<typename ValueType>
+void transpose_type(const ValueType* in, ValueType* out,
+                    int nrows, int ncols) 
+{
+    if (in != out) {
+        for (int irow=0; irow<nrows; ++irow) {
+            for (int icol=0; icol<ncols; ++icol) {
+                out[icol*nrows + irow] = in[irow*ncols + icol];
+            }
+        }
+        return;
+    }
+    
+    // inplace adapated from https://stackoverflow.com/a/9320349 which
+    // comes from
+    // https://en.wikipedia.org/wiki/In-place_matrix_transposition#Non-square_matrices:_Following_the_cycles
+
+    const int n = nrows;
+    const int size = nrows*ncols;
+    const int mn1 = (size - 1);
+    std::vector<bool> visited(size);
+    ValueType* first = out + size;
+    const ValueType* last = first + size;
+    ValueType* cycle = out;
+    while (++cycle != last) {
+        if (visited[cycle - first])
+            continue;
+        int a = cycle - first;
+        do  {
+            a = a == mn1 ? mn1 : (n * a) % mn1;
+            std::swap(*(first + a), *cycle);
+            visited[a] = true;
+        } while ((first + a) != cycle);
+    }
+
+}
+
+
+void IDFT::transpose(const IDFT::scalar_t* in, IDFT::scalar_t* out,
+                     int nrows, int ncols) const
+{
+    transpose_type(in, out, nrows, ncols);
+}
+void IDFT::transpose(const IDFT::complex_t* in, IDFT::complex_t* out,
+                     int nrows, int ncols) const
+{
+    transpose_type(in, out, nrows, ncols);
+}

From e8e0625bff7284fcfe93d7cdbfca00c852f410a6 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 16 Nov 2021 11:47:00 -0500
Subject: [PATCH 12/46] Improve tests

---
 aux/test/test_dfttools.cxx | 131 ++++++++++++++++---------------------
 aux/test/test_idft.cxx     |  28 +-------
 2 files changed, 58 insertions(+), 101 deletions(-)

diff --git a/aux/test/test_dfttools.cxx b/aux/test/test_dfttools.cxx
index e506da80f..3ee006a92 100644
--- a/aux/test/test_dfttools.cxx
+++ b/aux/test/test_dfttools.cxx
@@ -1,3 +1,5 @@
+#include "aux_test_dft_helpers.h"
+
 #include "WireCellAux/DftTools.h"
 #include "WireCellAux/FftwDFT.h"
 #include "WireCellUtil/Waveform.h"
@@ -6,79 +8,67 @@
 #include <memory>
 
 using namespace WireCell;
+using namespace WireCell::Aux::Test;
 
 using real_t = float;
 using RV = std::vector<real_t>;
 using complex_t = std::complex<real_t>;
 using CV = std::vector<complex_t>;
 
-void test_1d(IDFT::pointer dft)
+void test_1d_impulse(IDFT::pointer dft, int size = 64)
 {
-    RV rimp(64, 0);
-    rimp[1] = 1.0;
+    RV rimp(size, 0);
+    rimp[0] = 1.0;
 
     auto cimp = Aux::fwd(dft, Waveform::complex(rimp));
-    for (auto c : cimp) {
-        std::cerr << c << " ";
-    }
-    std::cerr << "\n";
+    assert_flat_value(cimp.data(), cimp.size());
 
     RV rimp2 = Waveform::real(Aux::inv(dft, cimp));
-    for (auto r : rimp2) {
-        std::cerr << r << " ";
-    }
-    std::cerr << "\n";
-    for (int ind=0; ind<64; ++ind) {
-        if (ind == 1) {
-            assert(std::abs(rimp2[ind]-1.0) < 1e-6);
-            continue;
-        }
-        assert(std::abs(rimp2[ind]) < 1e-6);
-    }
+    assert_impulse_at_index(rimp2.data(), rimp2.size());
 }
 
-using FA = Eigen::Array<float, Eigen::Dynamic, Eigen::Dynamic>;
+using FA = Eigen::Array<real_t, Eigen::Dynamic, Eigen::Dynamic>;
+using CA = Eigen::Array<complex_t, Eigen::Dynamic, Eigen::Dynamic>;
+using FARM = Eigen::Array<real_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
+using CARM = Eigen::Array<complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
 
-void test_2d(IDFT::pointer dft)
+void test_2d_impulse(IDFT::pointer dft, int nrows=16, int ncols=8)
 {
-    const int nrows=16;
-    const int ncols=8;
+    const size_t size = nrows*ncols;
     FA r = FA::Zero(nrows, ncols);
-    r(10,1) = 1.0;
-    std::cerr << r << std::endl;
-    auto c = Aux::fwd(dft, r.cast<complex_t>());
-    std::cerr << c << std::endl;
-    FA r2 = Aux::inv(dft, c).real();
-    std::cerr << r2 << std::endl;
-    for (int irow=0; irow<nrows; ++irow) {
-        for (int icol=0; icol<ncols; ++icol) {
-            if (irow==10 and icol==1) {
-                assert(std::abs(r2(irow, icol)-1.0) < 1e-6);
-                continue;
-            }
-            assert(std::abs(r2(irow, icol)) < 1e-6);    
-        }
-    }
-}
+    r(0,0) = 1.0;
+    dump("r", r);
+    assert_impulse_at_index(r.data(), size);
 
-template<typename array_type>
-void dump(std::string name, const array_type& arr)
-{
-    std::cerr << name << ":(" << arr.rows() << "," << arr.cols() << ") row-major:" << arr.IsRowMajor << "\n";
+    CA rc = r.cast<complex_t>();
+    dump("rc", rc);
+    assert_impulse_at_index(rc.data(), size);
+
+    CA c = Aux::fwd(dft, rc);
+    dump("c", c);
+    assert_flat_value(c.data(), size);
+
+    FA r2 = Aux::inv(dft, c).real();
+    dump("r2", r2);
+    assert_impulse_at_index(r2.data(), size);
 }
 
-void test_2d_transpose(IDFT::pointer dft)
+void test_2d_eigen_transpose(IDFT::pointer dft)
 {
     const int nrows=16;
     const int ncols=8;
 
+    // where the impulse lives (off axis)
+    const int imp_row = 1;
+    const int imp_col = 10;
+
     FA r = FA::Zero(nrows, ncols); // shape:(16,8)
     dump("r", r);
 
     // do not remove the auto in this next line
     auto rt = r.transpose();    // shape:(8,16)
     dump("rt", rt);
-    rt(1,10) = 1.0;
+    rt(imp_row, imp_col) = 1.0;
 
     auto c = Aux::fwd(dft, rt.cast<complex_t>());
     dump("c", c);
@@ -95,7 +85,7 @@ void test_2d_transpose(IDFT::pointer dft)
             float val = rt(irow, icol);
             float val2 = r2(irow, icol); // access with transposed indices
             std::cerr << "(" << irow << ","<< icol << "):" << val << " ? " << val2 << "\n";
-            if (irow==1 and icol==10) {
+            if (irow==imp_row and icol==imp_col) {
                 assert(std::abs(val-1.0) < 1e-6);
                 continue;
             }
@@ -103,50 +93,41 @@ void test_2d_transpose(IDFT::pointer dft)
         }
         std::cerr << "\n";
     }
-
-    
 }
 
-void test_1b(IDFT::pointer dft, int axis)
+void test_1b(IDFT::pointer dft, int axis, int nrows=8, int ncols=4)
 {
-    const int nrows=8; 
-    const int ncols=4;
     FA r = FA::Zero(nrows, ncols);
-    r(6,1) = 1.0;
+    r(0,0) = 1.0;
     dump("impulse", r);
-    std::cerr << r << std::endl;
-    auto c = Aux::fwd(dft, r.cast<complex_t>(), axis);
-    dump("spectra", c);
-    if (axis==0) {
-        
-    }
-    std::cerr << c << std::endl;
-}
-void test_1bt(IDFT::pointer dft, int axis)
-{
-    const int nrows=8; 
-    const int ncols=4;
-    FA r = FA::Zero(nrows, ncols);
-    r(6,1) = 1.0;
-    auto rc = r.cast<complex_t>();
-    auto rct = rc.transpose();
-    dump("impulse.T", rct);
-    std::cerr << rct << std::endl;
-    auto c = Aux::fwd(dft, rct, axis);
+    CA c = Aux::fwd(dft, r.cast<complex_t>(), axis);
+
     dump("spectra", c);
     std::cerr << c << std::endl;
+
+    if (axis) {                 // transform along rows
+        CA ct = c.transpose();      // convert to along columns (native Eigen storage order)
+        c = ct;
+        std::swap(nrows, ncols);
+        dump("transpose", c);
+        std::cerr << c << std::endl;
+    }
+
+    // first column has flat abs value of 1.0.
+    assert_flat_value(c.data(), nrows, complex_t(1,0)); 
+    // rest should be flat, zero value
+    assert_flat_value(c.data()+nrows, nrows*ncols - nrows, complex_t(0,0)); 
+
 }
 
 int main()
 {
     auto dft = std::make_shared<Aux::FftwDFT>();
 
-    test_1d(dft);
-    test_2d(dft);
-    test_2d_transpose(dft);
+    test_1d_impulse(dft);
+    test_2d_impulse(dft);
+    test_2d_eigen_transpose(dft);
     test_1b(dft, 0);
     test_1b(dft, 1);
-    test_1bt(dft, 0);
-    test_1bt(dft, 1);
     return 0;
 }
diff --git a/aux/test/test_idft.cxx b/aux/test/test_idft.cxx
index cfd109a8b..babc5ed9d 100644
--- a/aux/test/test_idft.cxx
+++ b/aux/test/test_idft.cxx
@@ -3,7 +3,8 @@
 #include "WireCellUtil/Waveform.h"
 #include "WireCellUtil/PluginManager.h"
 #include "WireCellIface/IConfigurable.h"
-#include "WireCellIface/IDFT.h"
+
+#include "aux_test_dft_helpers.h"
 
 #include <chrono>
 #include <vector>
@@ -13,31 +14,6 @@
 
 using namespace WireCell;
 
-const float eps = 1e-8;
-
-static void assert_impulse_at_index(const std::vector<IDFT::complex_t>& vec, size_t index=0)
-{
-    const size_t size = vec.size();
-    auto tot = Waveform::sum(vec);
-    assert(std::abs(std::real(tot) - 1.0) < eps);
-    assert(std::abs(std::real(vec[index]) - 1.0) < eps);
-    assert(std::abs(std::imag(tot))  < eps);
-    assert(std::abs(std::imag(vec[index])) < eps);
-    for (size_t ind=0; ind<size; ++ind) {
-        if (ind == index) continue;
-        assert(std::abs(std::real(vec[ind])) < eps);
-        assert(std::abs(std::imag(vec[ind])) < eps);
-    }
-}
-static void assert_flat_value(const std::vector<IDFT::complex_t>& vec, IDFT::scalar_t val = 1.0)
-{
-    const auto size = vec.size();
-    auto tot = Waveform::sum(vec);
-    assert(std::abs(std::abs(tot) - val*size) < eps);
-    for (const auto& v : vec) {
-        assert(std::abs(std::abs(v) - val) < eps);
-    }
-}
 
 static
 void test_1d_zero(IDFT::pointer dft, int size = 1024)

From 28d9ec9129fb7f816e2c87cf55d769b25b995281 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 16 Nov 2021 12:11:59 -0500
Subject: [PATCH 13/46] More testing

---
 aux/test/aux_test_dft_helpers.h | 119 ++++++++++++++++++++++++++++++++
 aux/test/test_dfttools.cxx      |  15 ++--
 aux/test/test_idft.cxx          |  34 +++------
 3 files changed, 136 insertions(+), 32 deletions(-)
 create mode 100644 aux/test/aux_test_dft_helpers.h

diff --git a/aux/test/aux_test_dft_helpers.h b/aux/test/aux_test_dft_helpers.h
new file mode 100644
index 000000000..c4b12e012
--- /dev/null
+++ b/aux/test/aux_test_dft_helpers.h
@@ -0,0 +1,119 @@
+// This is only for sharing some common code betweeen different
+// aux/test/*.cxx tests.  Not for "real" use.
+
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/PluginManager.h"
+#include "WireCellUtil/Exceptions.h"
+
+#include "WireCellIface/IConfigurable.h"
+#include "WireCellIface/IDFT.h"
+
+#include <cassert>
+#include <iostream>
+
+namespace WireCell::Aux::Test {
+
+
+    // fixme: add support for config
+    IDFT::pointer make_dft(const std::string& tn="FftwDFT",
+                           const std::string& pi="WireCellAux")
+    {
+        PluginManager& pm = PluginManager::instance();
+        pm.add(pi);
+        
+        // create first
+        auto idft = Factory::lookup_tn<IDFT>(tn);
+        assert(idft);
+        // configure before use if configurable
+        auto icfg = Factory::find_maybe_tn<IConfigurable>(tn);
+        if (icfg) {
+            auto cfg = icfg->default_configuration();
+            icfg->configure(cfg);
+        }
+        return idft;
+    }
+    IDFT::pointer make_dft_args(int argc, char* argv[]) 
+    {
+        std::string dft_tn="FftwDFT";
+        std::string dft_pi="WireCellAux";
+        if (argc > 1) dft_tn = argv[1];
+        if (argc > 2) dft_pi = argv[2];
+        return make_dft(dft_tn, dft_pi);
+    }
+
+    const double default_eps = 1e-8;
+    const std::complex<float> czero = 0.0;
+    const std::complex<float> cone = 1.0;
+
+    void assert_small(double val, double eps = default_eps) {
+        if (val < eps) {
+            return;
+        }
+        std::stringstream ss;
+        ss << "value " << val << " >= " << eps;
+        std::cerr << ss.str() << std::endl;
+        THROW(WireCell::ValueError() << errmsg{ss.str()});
+    }
+
+    // Assert the array has only value val at index and near zero elsewhere
+    template <typename ValueType>
+    void assert_impulse_at_index(const ValueType* vec, size_t size,
+                                 size_t index=0, ValueType val = 1.0)
+    {
+        ValueType tot = 0;
+        for (size_t ind=0; ind<size; ++ind) {
+            auto v = vec[ind];
+            if (ind == index) {
+                v -= val;
+            }
+            tot += v;
+            assert_small(std::abs(v));
+        }
+        assert_small(std::abs(tot));
+    }
+
+    // Same as above but with pass by vector 
+    template <typename VectorType>
+    void assert_impulse_at_index(const VectorType& vec, 
+                                 size_t index=0, const typename VectorType::value_type& val = 1.0)
+    {
+        assert_impulse_at_index(vec.data(), vec.size(), index, val);
+    }
+
+    // Assert all values in array are near given val
+    template <typename ValueType>
+    void assert_flat_value(const ValueType* vec, size_t size, ValueType val = 1.0)
+    {
+        ValueType tot = 0;
+        for (size_t ind=0; ind<size; ++ind) {
+            auto v = vec[ind];
+            tot += v;
+            assert_small(std::abs(v - val));
+        }
+        assert_small(std::abs(std::abs(tot) - std::abs(val)*size));
+    }
+
+    // As above but pass by vector
+    template <typename VectorType>
+    void assert_flat_value(const VectorType& vec, const typename VectorType::value_type& val = 1.0)
+    {
+        assert_flat_value(vec.data(), vec.size(), val);
+    }
+
+    // Print eigen array
+    template<typename array_type>
+    void dump(std::string name, const array_type& arr)
+    {
+        std::cerr << name << ":(" << arr.rows() << "," << arr.cols() << ") row-major:" << arr.IsRowMajor << "\n";
+    }
+
+
+    // Like std::iota, but dummer
+    template<typename ValueType>
+    void iota(ValueType* vec, size_t size, ValueType start = 0)
+    {
+        for (size_t ind=0; ind<size; ++ind) {
+            vec[ind] = start++;
+        }
+    }
+}
diff --git a/aux/test/test_dfttools.cxx b/aux/test/test_dfttools.cxx
index 3ee006a92..cc4b43157 100644
--- a/aux/test/test_dfttools.cxx
+++ b/aux/test/test_dfttools.cxx
@@ -120,14 +120,15 @@ void test_1b(IDFT::pointer dft, int axis, int nrows=8, int ncols=4)
 
 }
 
-int main()
+int main(int argc, char* argv[])
 {
-    auto dft = std::make_shared<Aux::FftwDFT>();
+    auto idft = make_dft_args(argc, argv);
+
+    test_1d_impulse(idft);
+    test_2d_impulse(idft);
+    test_2d_eigen_transpose(idft);
+    test_1b(idft, 0);
+    test_1b(idft, 1);
 
-    test_1d_impulse(dft);
-    test_2d_impulse(dft);
-    test_2d_eigen_transpose(dft);
-    test_1b(dft, 0);
-    test_1b(dft, 1);
     return 0;
 }
diff --git a/aux/test/test_idft.cxx b/aux/test/test_idft.cxx
index babc5ed9d..1b47646b8 100644
--- a/aux/test/test_idft.cxx
+++ b/aux/test/test_idft.cxx
@@ -1,8 +1,5 @@
 // Test IDFT implementations.
-#include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/Waveform.h"
-#include "WireCellUtil/PluginManager.h"
-#include "WireCellIface/IConfigurable.h"
 
 #include "aux_test_dft_helpers.h"
 
@@ -13,6 +10,7 @@
 #include <iostream>
 
 using namespace WireCell;
+using namespace WireCell::Aux::Test;
 
 
 static
@@ -21,9 +19,9 @@ void test_1d_zero(IDFT::pointer dft, int size = 1024)
     std::vector<IDFT::complex_t> inter(size,0), freq(size,0);
 
     dft->fwd1d(inter.data(), freq.data(), inter.size());
-    assert_flat_value(freq, 0);
+    assert_flat_value(freq, czero);
     dft->inv1d(freq.data(), inter.data(), freq.size());
-    assert_flat_value(inter, 0);
+    assert_flat_value(inter, czero); 
 }
 static
 void test_1d_impulse(IDFT::pointer dft, int size=1024)
@@ -76,18 +74,18 @@ static void assert_on_axis(const std::vector<IDFT::complex_t>& freq,
             auto val = std::abs(freq[ind]);
             if (axis) {
                 if (irow==0) {
-                    assert(std::abs(val - 1.0) < eps);
+                    assert_small(std::abs(val - 1.0));
                 }
                 else {
-                    assert(val < eps);
+                    assert_small(val);
                 }
             }
             else {
                 if (icol==0) {
-                    assert(std::abs(val - 1.0) < eps);
+                    assert_small(std::abs(val - 1.0));
                 }
                 else {
-                    assert(val < eps);
+                    assert_small(val);
                 }
             }
         }
@@ -197,24 +195,10 @@ void test_2d_transpose(IDFT::pointer dft, int nrows, int ncols)
 
 }
 
+
 int main(int argc, char* argv[])
 {
-    // fixme, add CLI parsing to add plugins, config and name another
-    // dft.  For now, just use the one in aux.
-    PluginManager& pm = PluginManager::instance();
-    pm.add("WireCellAux");
-    std::string dft_tn = "FftwDFT";
-
-    // creates
-    auto idft = Factory::lookup_tn<IDFT>(dft_tn);
-    assert(idft);
-    {                          // configure before use if configurable
-        auto icfg = Factory::find_maybe_tn<IConfigurable>(dft_tn);
-        if (icfg) {
-            auto cfg = icfg->default_configuration();
-            icfg->configure(cfg);
-        }
-    }
+    auto idft = make_dft_args(argc, argv);
 
     test_1d_zero(idft);
     test_1d_impulse(idft);

From c798cd4ba874353f64efb0a061e87f8ea7116e45 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 16 Nov 2021 15:03:45 -0500
Subject: [PATCH 14/46] Make a semaphore interface and implement with what is
 in util

---
 aux/inc/WireCellAux/Semaphore.h      | 34 +++++++++++++++++++
 aux/src/Semaphore.cxx                | 51 ++++++++++++++++++++++++++++
 iface/inc/WireCellIface/ISemaphore.h | 31 +++++++++++++++++
 iface/src/IfaceDesctructors.cxx      |  2 ++
 4 files changed, 118 insertions(+)
 create mode 100644 aux/inc/WireCellAux/Semaphore.h
 create mode 100644 aux/src/Semaphore.cxx
 create mode 100644 iface/inc/WireCellIface/ISemaphore.h

diff --git a/aux/inc/WireCellAux/Semaphore.h b/aux/inc/WireCellAux/Semaphore.h
new file mode 100644
index 000000000..1385bf51d
--- /dev/null
+++ b/aux/inc/WireCellAux/Semaphore.h
@@ -0,0 +1,34 @@
+/** Implement a semaphore component interace. */
+
+#ifndef WIRECELLAUX_SEMAPHORE
+#define WIRECELLAUX_SEMAPHORE
+
+#include "WireCellIface/IConfigurable.h"
+#include "WireCellIface/ISemaphore.h"
+#include "WireCellUtil/Semaphore.h"
+
+
+namespace WireCell::Aux {
+    class Semaphore : public ISemaphore,
+                      public IConfigurable
+    {
+      public:
+        Semaphore();
+        virtual ~Semaphore();
+
+        // IConfigurable interface
+        virtual void configure(const WireCell::Configuration& config);
+        virtual WireCell::Configuration default_configuration() const;
+
+        // ISemaphore
+        virtual void acquire() const;
+        virtual void release() const;
+
+      private:
+
+        mutable FastSemaphore m_sem;
+
+    };
+}  // namespace WireCell::Pytorch
+
+#endif  // WIRECELLPYTORCH_TORCHSERVICE
diff --git a/aux/src/Semaphore.cxx b/aux/src/Semaphore.cxx
new file mode 100644
index 000000000..d76999837
--- /dev/null
+++ b/aux/src/Semaphore.cxx
@@ -0,0 +1,51 @@
+#include "WireCellAux/Semaphore.h"
+
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/Semaphore.h"
+
+WIRECELL_FACTORY(Semaphore, 
+                 WireCell::Aux::Semaphore,
+                 WireCell::ISemaphore,
+                 WireCell::IConfigurable)
+
+using namespace WireCell;
+
+Aux::Semaphore::Semaphore()
+    : m_sem(0)
+{
+}
+Aux::Semaphore::~Semaphore()
+{
+}
+
+WireCell::Configuration Aux::Semaphore::default_configuration() const
+{
+    Configuration cfg;
+
+    // The maximum allowed number concurrent calls to forward().  A
+    // value of unity means all calls will be serialized.  When made
+    // smaller than the number of threads, the difference gives the
+    // number of threads that may block on the semaphore.
+    cfg["concurrency"] = 1;
+
+    return cfg;
+}
+
+void Aux::Semaphore::configure(const WireCell::Configuration& cfg)
+{
+    auto count = get<int>(cfg, "concurrency", 1);
+    if (count < 1 ) {
+        count = 1;
+    }
+    m_sem.set_count(count);
+}
+
+void Aux::Semaphore::acquire() const
+{
+    m_sem.acquire();
+}
+
+void Aux::Semaphore::release() const
+{
+    m_sem.release();
+}
diff --git a/iface/inc/WireCellIface/ISemaphore.h b/iface/inc/WireCellIface/ISemaphore.h
new file mode 100644
index 000000000..99a55396d
--- /dev/null
+++ b/iface/inc/WireCellIface/ISemaphore.h
@@ -0,0 +1,31 @@
+/** An interface to the semaphore pattern */
+
+#ifndef WIRECELL_ISEMAPHORE
+#define WIRECELL_ISEMAPHORE
+
+#include "WireCellUtil/IComponent.h"
+
+namespace WireCell {
+    class ISemaphore : public IComponent<ISemaphore> {
+      public:
+        virtual ~ISemaphore();
+
+        /// Block until available spot to hold the semaphore is
+        /// available.
+        virtual void acquire() const = 0;
+
+        /// Release hold on the semaphore
+        virtual void release() const = 0;
+
+        /// Use Construct a Context on a semaphore in a local scope to
+        /// automate release
+        struct Context {
+            ISemaphore::pointer sem;
+            Context(ISemaphore::pointer sem) : sem(sem) { sem->acquire(); }
+            ~Context() { sem->release(); }
+        };
+
+    };
+}  // namespace WireCell
+
+#endif  // WIRECELL_ITENSORFORWARD
diff --git a/iface/src/IfaceDesctructors.cxx b/iface/src/IfaceDesctructors.cxx
index 76efb5ecd..59b1597d1 100644
--- a/iface/src/IfaceDesctructors.cxx
+++ b/iface/src/IfaceDesctructors.cxx
@@ -74,6 +74,7 @@
 #include "WireCellIface/IRandom.h"
 #include "WireCellIface/IRecombinationModel.h"
 #include "WireCellIface/IScalarFieldSink.h"
+#include "WireCellIface/ISemaphore.h"
 #include "WireCellIface/ISequence.h"
 #include "WireCellIface/ISinkNode.h"
 #include "WireCellIface/ISlice.h"
@@ -172,6 +173,7 @@ IQueuedoutNodeBase::~IQueuedoutNodeBase() {}
 IRandom::~IRandom() {}
 IRecombinationModel::~IRecombinationModel() {}
 IScalarFieldSink::~IScalarFieldSink() {}
+ISemaphore::~ISemaphore() {}
 ISinkNodeBase::~ISinkNodeBase() {}
 ISlice::~ISlice() {}
 ISliceFanout::~ISliceFanout() {}

From fc8dc584d0355aba82f460d7ac98dea11947cfa2 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 16 Nov 2021 15:04:16 -0500
Subject: [PATCH 15/46] Move common code to a 'context' mix-in, add initial
 torch imp of IDFT

---
 pytorch/inc/WireCellPytorch/DFT.h          |  62 +++++++++++
 pytorch/inc/WireCellPytorch/TorchContext.h |  62 +++++++++++
 pytorch/inc/WireCellPytorch/TorchService.h |   9 +-
 pytorch/src/DFT.cxx                        | 118 +++++++++++++++++++++
 pytorch/src/TorchContext.cxx               |  38 +++++++
 pytorch/src/TorchService.cxx               |  68 ++----------
 6 files changed, 294 insertions(+), 63 deletions(-)
 create mode 100644 pytorch/inc/WireCellPytorch/DFT.h
 create mode 100644 pytorch/inc/WireCellPytorch/TorchContext.h
 create mode 100644 pytorch/src/DFT.cxx
 create mode 100644 pytorch/src/TorchContext.cxx

diff --git a/pytorch/inc/WireCellPytorch/DFT.h b/pytorch/inc/WireCellPytorch/DFT.h
new file mode 100644
index 000000000..41e154152
--- /dev/null
+++ b/pytorch/inc/WireCellPytorch/DFT.h
@@ -0,0 +1,62 @@
+/**
+   TorchDFT provides a libtorch based implementation of IDFT.
+
+   The libtorch API is documented at:
+
+   https://pytorch.org/cppdocs/api/namespace_torch__fft.html
+ */
+
+#ifndef WIRECELL_PYTORCH_DFT
+#define WIRECELL_PYTORCH_DFT
+
+#include "WireCellIface/IDFT.h"
+#include "WireCellIface/IConfigurable.h"
+#include "WireCellPytorch/TorchContext.h"
+
+namespace WireCell::Pytorch {
+    class DFT : public IDFT,
+                public IConfigurable
+    {
+      public:
+        DFT();
+        virtual ~DFT();
+
+        // IConfigurable interface
+        virtual void configure(const WireCell::Configuration& config);
+        virtual WireCell::Configuration default_configuration() const;
+
+        // 1d 
+
+        virtual 
+        void fwd1d(const complex_t* in, complex_t* out,
+                   int size) const;
+
+        virtual 
+        void inv1d(const complex_t* in, complex_t* out,
+                   int size) const;
+
+        // batched 1D ("1b") - rely on base implementation
+        virtual 
+        void fwd1b(const complex_t* in, complex_t* out,
+                   int nrows, int ncols, int axis) const;
+        virtual 
+        void inv1b(const complex_t* in, complex_t* out,
+                   int nrows, int ncols, int axis) const;
+        
+        // 2d
+
+        virtual 
+        void fwd2d(const complex_t* in, complex_t* out,
+                   int nrows, int ncols) const;
+        virtual 
+        void inv2d(const complex_t* in, complex_t* out,
+                   int nrows, int ncols) const;
+          
+      private:
+        TorchContext m_ctx;
+
+    };
+
+}
+
+#endif
diff --git a/pytorch/inc/WireCellPytorch/TorchContext.h b/pytorch/inc/WireCellPytorch/TorchContext.h
new file mode 100644
index 000000000..66979a1c5
--- /dev/null
+++ b/pytorch/inc/WireCellPytorch/TorchContext.h
@@ -0,0 +1,62 @@
+/** A mixin class to provide a torch context
+    
+ */
+
+#include "WireCellIface/ISemaphore.h"
+#include <torch/script.h>
+
+namespace WireCell::Pytorch {
+
+    class TorchContext {
+      public:
+
+        // The "devname" is "cpu" or "gpu" or "gpuN" where N is a GPU
+        // number.  If "semname" is given, use it for semaphore,
+        // otherwise use canonically tn=Semaphore:torch-<devname>.
+        TorchContext(const std::string& devname,
+                     const std::string& semname="");
+        TorchContext();
+        ~TorchContext();
+
+        // Default constructor makes context with no device nor
+        // semaphore.  This will make the "connection" to them.
+        void connect(const std::string& devname,
+                     const std::string& semname="");
+
+        torch::Device device() const { return m_dev; }
+        std::string devname() const { return m_devname; }
+
+        bool is_gpu() const { return m_devname != "cpu"; }
+
+        // Context manager methods.  Caller should prefer using a
+        // TorchSemaphore class but if called directly, caller MUST
+        // balance an enter() with an exit().  These can and should be
+        // used in multi-thread run stage.
+        void enter() const { if (m_sem) m_sem->acquire(); }
+        void exit() const { if (m_sem) m_sem->release(); }
+
+      private:
+
+        torch::Device m_dev{torch::kCPU};
+        std::string m_devname;
+        ISemaphore::pointer m_sem;
+     };
+
+    /// Use like:
+    ///
+    /// void mymeth() {
+    ///   TorchSemaphore sem(m_ctx);
+    ///   ... more code may return/throw
+    /// } // end of scope
+    class TorchSemaphore {
+        const TorchContext& m_th;
+      public:
+        TorchSemaphore(const TorchContext& th) : m_th(th) {
+            m_th.enter();
+        }
+        ~TorchSemaphore() {
+            m_th.exit();
+        }
+    };            
+
+}
diff --git a/pytorch/inc/WireCellPytorch/TorchService.h b/pytorch/inc/WireCellPytorch/TorchService.h
index 01504724e..ca8fe4eb1 100644
--- a/pytorch/inc/WireCellPytorch/TorchService.h
+++ b/pytorch/inc/WireCellPytorch/TorchService.h
@@ -7,7 +7,7 @@
 #include "WireCellIface/ITensorForward.h"
 #include "WireCellUtil/Logging.h"
 #include "WireCellAux/Logger.h"
-#include "WireCellUtil/Semaphore.h"
+#include "WireCellPytorch/TorchContext.h"
 
 #include <torch/script.h>  // One-stop header.
 
@@ -29,15 +29,14 @@ namespace WireCell::Pytorch {
 
       private:
 
-        // Mark which device is used
-        torch::Device m_dev;
-
         // for read-only access, claim is that .forward() is thread
         // safe.  However .forward() is not const so we must make this
         // mutable.
         mutable torch::jit::script::Module m_module;
 
-        mutable FastSemaphore m_sem;
+        // Even though thread safe, we want to honor a per device
+        // semaphore to give user chance ot limit us.
+        TorchContext m_ctx;
 
     };
 }  // namespace WireCell::Pytorch
diff --git a/pytorch/src/DFT.cxx b/pytorch/src/DFT.cxx
new file mode 100644
index 000000000..cba68164e
--- /dev/null
+++ b/pytorch/src/DFT.cxx
@@ -0,0 +1,118 @@
+#include "WireCellPytorch/DFT.h"
+#include "WireCellUtil/NamedFactory.h"
+
+#include <torch/script.h>
+#include <torch/csrc/api/include/torch/fft.h>
+
+
+WIRECELL_FACTORY(FftwDFT, WireCell::Pytorch::DFT,
+                 WireCell::IDFT,
+                 WireCell::IConfigurable)
+
+using namespace WireCell;
+using namespace WireCell::Pytorch;
+
+DFT::DFT()
+{
+}
+
+DFT::~DFT()
+{
+}
+
+Configuration DFT::default_configuration() const
+{
+    Configuration cfg;
+
+    // one of: {cpu, gpu, gpuN} where "N" is a GPU number.  "gpu"
+    // alone will use GPU 0.
+    cfg["device"] = "cpu";
+    return cfg;
+}
+
+void DFT::configure(const WireCell::Configuration& cfg)
+{
+    auto dev = get<std::string>(cfg, "device", "cpu");
+    m_ctx.connect(dev);
+}
+
+
+using torch_transform = std::function<torch::Tensor(const torch::Tensor&)>;
+
+static
+void doit(const TorchContext& ctx,
+          const IDFT::complex_t* in, IDFT::complex_t* out,
+          int64_t nrows, int64_t ncols, // 1d vec should have nrows=1
+          torch_transform func)
+{
+    TorchSemaphore sem(ctx);
+    torch::NoGradGuard no_grad;
+
+    int64_t size = nrows*ncols;
+
+    auto options = torch::TensorOptions().device(ctx.device()).dtype(torch::kComplexFloat);
+
+    // 1) in->src
+    if (in != out) {            // from_blob() doesn't like const data
+        memcpy(out, in, sizeof(IDFT::complex_t)*size);
+    }
+
+    torch::Tensor src = torch::from_blob(out, {nrows, ncols}, options);
+
+    // 2) dst = func(src)
+    auto dst = func(src);
+    dst = dst.cpu();
+
+    // 3) dst->out
+    if (out != dst.data_ptr()) {
+        memcpy(out, dst.data_ptr(), sizeof(IDFT::complex_t)*size);
+    }
+        
+}
+
+
+void DFT::fwd1d(const IDFT::complex_t* in, IDFT::complex_t* out, int size) const
+{
+    doit(m_ctx, in, out, 1, size,
+         [](const torch::Tensor& src) { return torch::fft::fft(src); });
+}
+
+
+void DFT::inv1d(const IDFT::complex_t* in, IDFT::complex_t* out, int size) const
+{
+    doit(m_ctx, in, out, 1, size, // fixme: check norm
+         [](const torch::Tensor& src) { return torch::fft::ifft(src); });
+}
+
+
+void DFT::fwd1b(const IDFT::complex_t* in, IDFT::complex_t* out,
+                int nrows, int ncols, int axis) const
+{
+    doit(m_ctx, in, out, nrows, ncols, [&](const torch::Tensor& src) {
+        return torch::fft::fft2(src, torch::nullopt, {axis}); });
+}
+
+
+void DFT::inv1b(const IDFT::complex_t* in, IDFT::complex_t* out,
+                int nrows, int ncols, int axis) const
+{
+    doit(m_ctx, in, out, nrows, ncols, [&](const torch::Tensor& src) {
+        return torch::fft::ifft2(src, torch::nullopt, {axis}); });
+}       
+
+        
+void DFT::fwd2d(const IDFT::complex_t* in, IDFT::complex_t* out,
+                int nrows, int ncols) const
+{
+    doit(m_ctx, in, out, nrows, ncols,
+         [](const torch::Tensor& src) { return torch::fft::fft2(src); });
+}
+
+
+void DFT::inv2d(const IDFT::complex_t* in, IDFT::complex_t* out,
+                int nrows, int ncols) const
+{
+    doit(m_ctx, in, out, nrows, ncols,
+         [](const torch::Tensor& src) { return torch::fft::ifft2(src); });
+}
+
diff --git a/pytorch/src/TorchContext.cxx b/pytorch/src/TorchContext.cxx
new file mode 100644
index 000000000..e5de936b8
--- /dev/null
+++ b/pytorch/src/TorchContext.cxx
@@ -0,0 +1,38 @@
+#include "WireCellPytorch/TorchContext.h"
+#include "WireCellUtil/NamedFactory.h"
+
+using namespace WireCell;
+using namespace WireCell::Pytorch;
+
+TorchContext::TorchContext() {}
+TorchContext::~TorchContext() { }
+TorchContext::TorchContext(const std::string& devname,
+                           const std::string& semname)
+{
+    connect(devname, semname);
+}
+void TorchContext::connect(const std::string& devname,
+                           const std::string& semname)
+{
+    // Use almost 1/2 the memory and 3/4 the time.
+    torch::NoGradGuard no_grad;
+
+    if (devname == "cpu") {
+        m_dev = torch::Device(torch::kCPU);
+    }
+    else {
+        int devnum = 0;
+        if (devname.size() > 3) {
+            devnum = atoi(devname.substr(3).c_str());
+        }
+        m_dev = torch::Device(torch::kCUDA, devnum);
+    }
+
+    std::string s_tn = "Semaphore:torch-" + devname;
+    if (not semname.empty()) {
+        s_tn = semname;
+    }
+
+    m_sem = Factory::find_tn<ISemaphore>(s_tn);
+}
+
diff --git a/pytorch/src/TorchService.cxx b/pytorch/src/TorchService.cxx
index 76bbfe436..b78a3a8d0 100644
--- a/pytorch/src/TorchService.cxx
+++ b/pytorch/src/TorchService.cxx
@@ -14,8 +14,6 @@ using namespace WireCell;
 
 Pytorch::TorchService::TorchService()
     : Aux::Logger("TorchService", "torch")
-    , m_dev(torch::kCPU, 0)
-    , m_sem(0)
 {
 }
 
@@ -26,30 +24,17 @@ Configuration Pytorch::TorchService::default_configuration() const
     // TorchScript model
     cfg["model"] = "model.ts";
 
-    // one of: {cpu, gpu, gpucpu}.  Latter allows fail-over to cpu
-    // when there is a failure to load the model.
-    // fixme: we may want to allow user to give a GPU index number
-    // here so like eg gpu:1, gpucpu:2.  An index is not meaningful
-    // for cpu.
-    cfg["device"] = "gpucpu";      
+    // one of: {cpu, gpu, gpuN} where "N" is a GPU number.  "gpu"
+    // alone will use GPU 0.
+    cfg["device"] = "cpu";
     
-    // The maximum allowed number concurrent calls to forward().  A
-    // value of unity means all calls will be serialized.  When made
-    // smaller than the number of threads, the difference gives the
-    // number of threads that may block on the semaphore.
-    cfg["concurrency"] = 1;
-
     return cfg;
 }
 
 void Pytorch::TorchService::configure(const WireCell::Configuration& cfg)
 {
-    auto dev = get<std::string>(cfg, "device", "gpucpu");
-    auto count = get<int>(cfg, "concurrency", 1);
-    if (count < 1 ) {
-        count = 1;
-    }
-    m_sem.set_count(count);
+    auto dev = get<std::string>(cfg, "device", "cpu");
+    m_ctx.connect(dev);
 
     auto model_path = cfg["model"].asString();
     if (model_path.empty()) {
@@ -58,34 +43,10 @@ void Pytorch::TorchService::configure(const WireCell::Configuration& cfg)
     }
 
     // Use almost 1/2 the memory and 3/4 the time.
-    // but, fixme: check with Haiwng that this is okay.
     torch::NoGradGuard no_grad;
 
-    // Maybe first try to load torch script model on GPU.
-    if (dev == "gpucpu") {
-        try {
-            m_dev = torch::Device(torch::kCUDA, 0);
-            m_module = torch::jit::load(model_path, m_dev);
-            log->debug("loaded model {} to {}", model_path, dev);
-            return;
-        }
-        catch (const c10::Error& e) {
-            log->warn("failed to load model: {} to GPU will try CPU: {}",
-                      model_path, e.what());
-        }
-    }
-
-    if (dev == "cpu") {
-        m_dev = torch::Device(torch::kCPU);
-    }
-    else {
-        m_dev = torch::Device(torch::kCUDA, 0);
-    }
-
-    // from now, we either succeed or we throw
-    
     try {
-        m_module = torch::jit::load(model_path, m_dev);
+        m_module = torch::jit::load(model_path, m_ctx.device());
     }
     catch (const c10::Error& e) {
         log->critical("error loading model: {} to {}: {}",
@@ -96,19 +57,15 @@ void Pytorch::TorchService::configure(const WireCell::Configuration& cfg)
     log->debug("loaded model {} to {}", model_path, dev);
 }
 
-#include <c10/cuda/CUDACachingAllocator.h>
-
 ITensorSet::pointer Pytorch::TorchService::forward(const ITensorSet::pointer& in) const
 {
+    TorchSemaphore sem(m_ctx);
 
-    m_sem.acquire();
-
-    const bool is_gpu = ! (m_dev == torch::kCPU);
-    log->debug("running model on {}", is_gpu ? "GPU" : "CPU");
+    log->debug("running model on {}", m_ctx.devname());
 
     torch::NoGradGuard no_grad;
 
-    std::vector<torch::IValue> iival = Pytorch::from_itensor(in, is_gpu);
+    std::vector<torch::IValue> iival = Pytorch::from_itensor(in, m_ctx.is_gpu());
 
     torch::IValue oival;
     try {
@@ -116,16 +73,11 @@ ITensorSet::pointer Pytorch::TorchService::forward(const ITensorSet::pointer& in
     }
     catch (const std::runtime_error& err) {
         log->error("error running model on {}: {}",
-                   is_gpu ? "GPU" : "CPU", err.what());
-        m_sem.release();
+                   m_ctx.devname(), err.what());
         return nullptr;
     }
 
     ITensorSet::pointer ret = Pytorch::to_itensor({oival});
 
-    // maybe needs a mutex?
-    c10::cuda::CUDACachingAllocator::emptyCache();
-
-    m_sem.release();
     return ret;
 }

From 22d5ea0bd66fb447d24f21b55dc3937c994ce4c6 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Wed, 17 Nov 2021 12:30:19 -0500
Subject: [PATCH 16/46] Work out brain bugs in understanding torch tensor
 storage

---
 aux/src/Semaphore.cxx              |  2 +-
 aux/test/aux_test_dft_helpers.h    | 31 +++++++++++--
 aux/test/test_idft.cxx             | 34 ++++++++------
 aux/test/test_idft_pytorch.jsonnet |  7 +++
 iface/src/IDFT.cxx                 |  2 +-
 pytorch/src/DFT.cxx                | 22 +++++----
 pytorch/src/TorchContext.cxx       |  2 +-
 pytorch/test/test_from_blob.cxx    | 73 ++++++++++++++++++++++++++++++
 8 files changed, 146 insertions(+), 27 deletions(-)
 create mode 100644 aux/test/test_idft_pytorch.jsonnet
 create mode 100644 pytorch/test/test_from_blob.cxx

diff --git a/aux/src/Semaphore.cxx b/aux/src/Semaphore.cxx
index d76999837..841debbb7 100644
--- a/aux/src/Semaphore.cxx
+++ b/aux/src/Semaphore.cxx
@@ -11,7 +11,7 @@ WIRECELL_FACTORY(Semaphore,
 using namespace WireCell;
 
 Aux::Semaphore::Semaphore()
-    : m_sem(0)
+    : m_sem(1)
 {
 }
 Aux::Semaphore::~Semaphore()
diff --git a/aux/test/aux_test_dft_helpers.h b/aux/test/aux_test_dft_helpers.h
index c4b12e012..d83754976 100644
--- a/aux/test/aux_test_dft_helpers.h
+++ b/aux/test/aux_test_dft_helpers.h
@@ -4,6 +4,7 @@
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/PluginManager.h"
 #include "WireCellUtil/Exceptions.h"
+#include "WireCellUtil/Persist.h"
 
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IDFT.h"
@@ -16,8 +17,11 @@ namespace WireCell::Aux::Test {
 
     // fixme: add support for config
     IDFT::pointer make_dft(const std::string& tn="FftwDFT",
-                           const std::string& pi="WireCellAux")
+                           const std::string& pi="WireCellAux",
+                           Configuration cfg = Configuration())
     {
+        std::cerr << "Making DFT " << tn << " from plugin " << pi << std::endl;
+
         PluginManager& pm = PluginManager::instance();
         pm.add(pi);
         
@@ -27,8 +31,9 @@ namespace WireCell::Aux::Test {
         // configure before use if configurable
         auto icfg = Factory::find_maybe_tn<IConfigurable>(tn);
         if (icfg) {
-            auto cfg = icfg->default_configuration();
-            icfg->configure(cfg);
+            auto def_cfg = icfg->default_configuration();
+            def_cfg = update(def_cfg, cfg);
+            icfg->configure(def_cfg);
         }
         return idft;
     }
@@ -38,6 +43,26 @@ namespace WireCell::Aux::Test {
         std::string dft_pi="WireCellAux";
         if (argc > 1) dft_tn = argv[1];
         if (argc > 2) dft_pi = argv[2];
+        Configuration cfg;
+        if (argc > 3) {
+            // Either we get directly a "data" object 
+            cfg = Persist::load(argv[3]);
+            // or we go searching a list for matching type/name.
+            if (cfg.isArray()) {
+                for (auto one : cfg) {
+                    std::string tn = get<std::string>(one, "type");
+                    std::string n = get<std::string>(one, "name", "");
+                    if (not n.empty()) {
+                        tn = tn + ":" + n;
+                    }
+                    if (tn == dft_tn) {
+                        cfg = one["data"];
+                        break;
+                    }
+                }
+            }
+
+        }
         return make_dft(dft_tn, dft_pi);
     }
 
diff --git a/aux/test/test_idft.cxx b/aux/test/test_idft.cxx
index 1b47646b8..a4f337a5e 100644
--- a/aux/test/test_idft.cxx
+++ b/aux/test/test_idft.cxx
@@ -12,6 +12,17 @@
 using namespace WireCell;
 using namespace WireCell::Aux::Test;
 
+template<typename ValueType>
+void dump(ValueType* data, int nrows, int ncols, std::string msg="")
+{
+    std::cerr << msg << "("<<nrows<<","<<ncols<<")\n";
+    for (int irow=0; irow<nrows; ++irow) {
+        for (int icol=0; icol<ncols; ++icol) {
+            std::cerr << data[irow*ncols + icol] << " ";
+        }
+        std::cerr << "\n";
+    }
+}
 
 static
 void test_1d_zero(IDFT::pointer dft, int size = 1024)
@@ -95,14 +106,20 @@ static void assert_on_axis(const std::vector<IDFT::complex_t>& freq,
 void test_1b_impulse(IDFT::pointer dft, int axis, int nrows=128, int ncols=128)
 {
     const int size = nrows*ncols;
+    std::cerr << "1b impulse freq axis="<<axis << " nrows="<<nrows<<" ncols="<<ncols<<"\n";
 
     std::vector<IDFT::complex_t> inter(size,0), freq(size,0), back(size,0);
     inter[0] = 1.0;
+
     dft->fwd1b(inter.data(), freq.data(), nrows, ncols, axis);
+    dump(freq.data(), nrows, ncols, "freq");
     assert_on_axis(freq, axis, nrows, ncols);
+
     dft->inv1b(freq.data(), back.data(), nrows, ncols, axis);
+    dump(back.data(), nrows, ncols, "back");
     assert_impulse_at_index(back, 0);
 
+
     std::vector<IDFT::complex_t> inplace(size,0);
     inplace[0] = 1.0;
     dft->fwd1b(inplace.data(), inplace.data(), nrows, ncols, axis);
@@ -159,17 +176,6 @@ void test_2d_threads(IDFT::pointer dft, int nthreads, int nloops, int size = 102
               << " " << dt1.count() << std::endl;
 }
 
-template<typename ValueType>
-void dump(ValueType* data, int nrows, int ncols, std::string msg="")
-{
-    std::cerr << msg << "("<<nrows<<","<<ncols<<")\n";
-    for (int irow=0; irow<nrows; ++irow) {
-        for (int icol=0; icol<ncols; ++icol) {
-            std::cerr << data[irow*ncols + icol] << " ";
-        }
-        std::cerr << "\n";
-    }
-}
 
 template<typename ValueType>
 void test_2d_transpose(IDFT::pointer dft, int nrows, int ncols)
@@ -205,8 +211,10 @@ int main(int argc, char* argv[])
     test_2d_zero(idft);
     test_2d_impulse(idft);
 
-    test_1b_impulse(idft, 0);
-    test_1b_impulse(idft, 1);
+    test_1b_impulse(idft, 0, 2, 8);
+    test_1b_impulse(idft, 1, 2, 8);
+    test_1b_impulse(idft, 0, 8, 2);
+    test_1b_impulse(idft, 1, 8, 2);
 
     test_2d_transpose<IDFT::scalar_t>(idft, 2, 8);
     test_2d_transpose<IDFT::scalar_t>(idft, 8, 2);
diff --git a/aux/test/test_idft_pytorch.jsonnet b/aux/test/test_idft_pytorch.jsonnet
new file mode 100644
index 000000000..10e1f788a
--- /dev/null
+++ b/aux/test/test_idft_pytorch.jsonnet
@@ -0,0 +1,7 @@
+// a configuration "data" portion for TorchDFT.
+// call like:
+// ❯ ./build/aux/test_idft TorchDFT WireCellPytorch aux/test/test_idft_pytorch.jsonnet
+{
+    device: "gpu",
+}
+    
diff --git a/iface/src/IDFT.cxx b/iface/src/IDFT.cxx
index 58b1d335b..abc3d6120 100644
--- a/iface/src/IDFT.cxx
+++ b/iface/src/IDFT.cxx
@@ -66,7 +66,7 @@ void transpose_type(const ValueType* in, ValueType* out,
     const int size = nrows*ncols;
     const int mn1 = (size - 1);
     std::vector<bool> visited(size);
-    ValueType* first = out + size;
+    ValueType* first = out;
     const ValueType* last = first + size;
     ValueType* cycle = out;
     while (++cycle != last) {
diff --git a/pytorch/src/DFT.cxx b/pytorch/src/DFT.cxx
index cba68164e..052013ded 100644
--- a/pytorch/src/DFT.cxx
+++ b/pytorch/src/DFT.cxx
@@ -5,7 +5,7 @@
 #include <torch/csrc/api/include/torch/fft.h>
 
 
-WIRECELL_FACTORY(FftwDFT, WireCell::Pytorch::DFT,
+WIRECELL_FACTORY(TorchDFT, WireCell::Pytorch::DFT,
                  WireCell::IDFT,
                  WireCell::IConfigurable)
 
@@ -50,24 +50,30 @@ void doit(const TorchContext& ctx,
 
     int64_t size = nrows*ncols;
 
-    auto options = torch::TensorOptions().device(ctx.device()).dtype(torch::kComplexFloat);
+    auto dtype = torch::TensorOptions().dtype(torch::kComplexFloat);
 
     // 1) in->src
     if (in != out) {            // from_blob() doesn't like const data
         memcpy(out, in, sizeof(IDFT::complex_t)*size);
     }
 
-    torch::Tensor src = torch::from_blob(out, {nrows, ncols}, options);
+    torch::Tensor src = torch::from_blob(out, {nrows, ncols}, dtype);
 
     // 2) dst = func(src)
+    src = src.to(ctx.device());
     auto dst = func(src);
-    dst = dst.cpu();
+
+    // Making contiguous costs a copy but gets the data in row-major
+    // so the (2nd) copy next actually gives correct results.  This
+    // corrects optimizations that libtorch makes for transpose (and
+    // others) eg when our func is 1b.  Alternatively, may avoid both
+    // copies by iterating over indices but presumably (?) that is
+    // slower.  Likewise we make contiguous on the device as that is
+    // presumably (?) faster when the device is GPU.
+    dst = dst.contiguous().cpu();
 
     // 3) dst->out
-    if (out != dst.data_ptr()) {
-        memcpy(out, dst.data_ptr(), sizeof(IDFT::complex_t)*size);
-    }
-        
+    memcpy(out, dst.data_ptr(), sizeof(IDFT::complex_t)*size);
 }
 
 
diff --git a/pytorch/src/TorchContext.cxx b/pytorch/src/TorchContext.cxx
index e5de936b8..ed219f93b 100644
--- a/pytorch/src/TorchContext.cxx
+++ b/pytorch/src/TorchContext.cxx
@@ -33,6 +33,6 @@ void TorchContext::connect(const std::string& devname,
         s_tn = semname;
     }
 
-    m_sem = Factory::find_tn<ISemaphore>(s_tn);
+    m_sem = Factory::lookup_tn<ISemaphore>(s_tn);
 }
 
diff --git a/pytorch/test/test_from_blob.cxx b/pytorch/test/test_from_blob.cxx
new file mode 100644
index 000000000..b6e45e23e
--- /dev/null
+++ b/pytorch/test/test_from_blob.cxx
@@ -0,0 +1,73 @@
+#include <torch/script.h>
+#include <torch/csrc/api/include/torch/fft.h>
+
+#include <vector>
+#include <complex>
+#include <iostream>
+
+using complex_t = std::complex<float>;
+
+void dump(const std::vector<complex_t>& v, int nrows, int ncols, const std::string& msg="")
+{
+    std::cerr << msg << ": ("<<nrows<<","<<ncols<<")\n";
+    for (int irow = 0; irow<nrows; ++irow) {
+        for (int icol = 0; icol<ncols; ++icol) {
+            auto c =  v[irow*ncols + icol];
+            std::cerr<< "(" << std::real(c) << "," << std::imag(c) << ")\t";
+        }
+        std::cerr << "\n";
+    }
+}
+
+void dump(const at::Tensor& ten, const std::string& msg="")
+{
+    int nrows = ten.size(0);
+    int ncols = ten.size(1);
+    std::cerr << msg << ": ("<<nrows<<","<<ncols<<")\n"
+              << ten << "\n";
+}
+
+int main()
+{
+    const int nrows=3, ncols=8;
+    int size = nrows*ncols;
+    std::vector<complex_t> v(size, 0);
+    //std::iota(v.begin(), v.end(), 0);
+    v[ncols+2] = 1.0;
+    dump(v, nrows, ncols, "v");
+
+    // Note: gpu is almost 10x SLOWER than CPU due to kernel load time!
+    // auto device = at::Device(at::kCPU);
+    auto device = at::Device(at::kCUDA);
+
+    auto typ_options = at::TensorOptions().dtype(at::kComplexFloat);
+    // auto dev_options = typ_options.device(device);
+    
+    for (int axis = 0; axis < 2; ++ axis) {
+        at::Tensor src = at::from_blob(v.data(), {nrows, ncols}, typ_options);
+        dump(src, "src");
+
+        src = src.to(device);
+        // In pytorch dim=(0,) transforms along columns, ie follows
+        // numpy.fft convention.  Both directions work on both CPU and
+        // CUDA.
+        at::Tensor dst = torch::fft::fft2(src, {}, {axis,});
+
+        // BUT, BEWARE that the underlying storage will NOT reflect
+        // logical row-major ordering.  Indexing is as expected but
+        // memory returned by data_ptr() will reflect transpose
+        // optimizations.  At the expense of a copy the contiguous()
+        // method provides expected row-major storage order.  
+        dst = dst.contiguous().cpu();
+
+        dump(dst, "dst");
+
+        std::vector<complex_t> v2(size, 0);
+        memcpy(v2.data(), dst.data_ptr(), sizeof(complex_t)*size);
+
+        std::cerr << "axis=" << axis << " dim=" << axis
+                  << " shape=(" << src.size(0) << "," << src.size(1) << ")\n";
+        dump(v2, nrows, ncols, "dft(v)");
+    }
+    return 0;
+}

From 47e67dd12f086ea02a3066deb48320791dd77cc3 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 18 Nov 2021 08:40:10 -0500
Subject: [PATCH 17/46] Typo in plugin name fixed

---
 cfg/pgrapher/common/helpers/utils.jsonnet | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cfg/pgrapher/common/helpers/utils.jsonnet b/cfg/pgrapher/common/helpers/utils.jsonnet
index 19e31618b..08ed7781f 100644
--- a/cfg/pgrapher/common/helpers/utils.jsonnet
+++ b/cfg/pgrapher/common/helpers/utils.jsonnet
@@ -18,7 +18,7 @@ local pg = import "pgraph.jsonnet";
     
     local app_plugins = {
         'TbbFlow': ["WireCellTbb"],
-        'PGrapher': ["WireCellPgraph"],
+        'PGrapher': ["WireCellPgrapher"],
     },
 
     main(graph, app='Pgrapher', extra_plugins = []) :: 

From d90bdcc8dfe32b073765cb882499be685f7b301e Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 18 Nov 2021 08:40:23 -0500
Subject: [PATCH 18/46] Initial draft of an IDFT benchmarker

---
 aux/test/test_idft_bench.cxx | 100 +++++++++++++++++++++++++++++++++++
 1 file changed, 100 insertions(+)
 create mode 100644 aux/test/test_idft_bench.cxx

diff --git a/aux/test/test_idft_bench.cxx b/aux/test/test_idft_bench.cxx
new file mode 100644
index 000000000..01b10d91d
--- /dev/null
+++ b/aux/test/test_idft_bench.cxx
@@ -0,0 +1,100 @@
+/**
+   A simple benchmark of IDFT for payloads relevant to WCT
+ */
+
+#include "WireCellUtil/TimeKeeper.h"
+
+#include "aux_test_dft_helpers.h"
+
+#include <string>
+#include <complex>
+#include <iostream>
+
+using namespace WireCell;
+using namespace WireCell::Aux::Test;
+
+using benchmark_function = std::function<void()>;
+using complex_t = std::complex<float>;
+
+void timeit(TimeKeeper& tk, const std::string& msg, benchmark_function func)
+{
+    tk("\tINIT\t" + msg);
+    func();
+    tk("\tFINI\t" + msg);
+}
+
+// benchmarks span outer product of:
+// - in-place / out-place
+// - 1d, 1b, 2d
+// - sizes: perfect powers of 2 and with larger prime factors
+// - use repitition numbers to keep each test roughly same runtime
+
+using transform_function = std::function<void(const complex_t* in, complex_t* out)>;
+
+const int onedfull = 100'000'000;
+void doit(TimeKeeper& tk, const std::string& name, int nrows, int ncols, bool inplace, transform_function func)
+{
+    const int size = nrows*ncols;
+    const int ntimes = onedfull / size;
+    std::stringstream ss;
+    ss << "\t(" << nrows << "," << ncols << ")\t" << ntimes << "\t";
+    std::string s = ss.str();
+    
+    if (inplace) {
+        timeit(tk, s + "in-place\t" + name, [&]() {
+            std::vector<complex_t> in(size);
+            for (int count=0; count<ntimes; ++count) {
+                func(in.data(), in.data());
+            }});
+    }
+    else {
+        timeit(tk, s + "separate\t" + name, [&]() {
+            std::vector<complex_t> in(size), out(size);
+            for (int count=0; count<ntimes; ++count) {
+                func(in.data(), out.data());
+            }});
+    }
+}
+
+int main(int argc, char* argv[])
+{
+    auto idft = make_dft_args(argc, argv);
+
+    TimeKeeper tk("IDFT benchmark\t\tsize\t\tcount\toverlap\t\ttran");
+
+    int size = 10'000;
+    doit(tk, "fwd1d", 1, size, false, [&](const complex_t* in, complex_t* out) {
+        idft->fwd1d(in, out, size);
+    });
+
+    doit(tk, "inv1d", 1, size, false, [&](const complex_t* in, complex_t* out) {
+        idft->inv1d(in, out, size);
+    });
+
+    int nrows = 1000;
+    int ncols = 1000;
+    doit(tk, "fwd2d", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
+        idft->fwd2d(in, out, nrows, ncols);
+    });
+    doit(tk, "inv2d", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
+        idft->inv2d(in, out, nrows, ncols);
+    });
+
+    doit(tk, "fwd1b0", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
+        idft->fwd1b(in, out, nrows, ncols, 0);
+    });
+    doit(tk, "inv1b0", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
+        idft->inv1b(in, out, nrows, ncols, 0);
+    });
+    doit(tk, "fwd1b1", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
+        idft->fwd1b(in, out, nrows, ncols, 1);
+    });
+    doit(tk, "inv1b1", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
+        idft->inv1b(in, out, nrows, ncols, 1);
+    });
+
+
+    std::cerr << tk.summary() << std::endl;
+
+    return 0;
+}

From a46fd9a3be5f39508660583a18c26404bc2819ce Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 18 Nov 2021 13:08:40 -0500
Subject: [PATCH 19/46] Improve timing measurements

---
 aux/test/aux_test_dft_helpers.h |  86 +++++++++++++++--
 aux/test/test_idft_bench.cxx    | 158 ++++++++++++++++++--------------
 2 files changed, 165 insertions(+), 79 deletions(-)

diff --git a/aux/test/aux_test_dft_helpers.h b/aux/test/aux_test_dft_helpers.h
index d83754976..db83d0fa8 100644
--- a/aux/test/aux_test_dft_helpers.h
+++ b/aux/test/aux_test_dft_helpers.h
@@ -9,11 +9,70 @@
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IDFT.h"
 
+#include <ctime>                // std::clock
+#include <chrono>
+
+#include <string>
 #include <cassert>
+#include <fstream>
 #include <iostream>
 
+// note: likely will move in the future.
+#include "custard/nlohmann/json.hpp"
+
 namespace WireCell::Aux::Test {
 
+    using object_t = nlohmann::json;
+
+    // probably move this to util
+    struct Stopwatch {
+        using clock = std::chrono::high_resolution_clock;
+        using time_point = clock::time_point;
+        using function_type = std::function<void()>;
+
+        std::clock_t c_ini = std::clock();
+        time_point t_ini = clock::now();
+
+        object_t results;
+
+        Stopwatch(const object_t& first = object_t{}) {
+            (*this)([](){}, first);
+        }
+
+        // Run the func, add timing info to a "stopwatch" attribute of
+        // data and save data to results.  A pair of clock objects are
+        // saved, "clock" (std::clock) and "time" (std::chrono).  Each
+        // have "start" and "elapsed" which are the number of
+        // nanoseconds from creation of stopwatch and for just this
+        // job, respectively.
+        void operator()(function_type func, object_t data = object_t{})
+        {
+            auto c_now =std::clock();
+            auto t_now = clock::now();
+            func();
+            auto c_fin =std::clock();
+            auto t_fin = clock::now();
+            
+            double dc_now = 1e9 * (c_now - c_ini) / ((double) CLOCKS_PER_SEC);
+            double dc_fin = 1e9 * (c_fin - c_now) / ((double) CLOCKS_PER_SEC);
+            double dt_now = std::chrono::duration_cast<std::chrono::nanoseconds>(t_now - t_ini).count();
+            double dt_fin = std::chrono::duration_cast<std::chrono::nanoseconds>(t_fin - t_now).count();
+
+            data["stopwatch"]["clock"]["start"] = dc_now;
+            data["stopwatch"]["clock"]["elapsed"] = dc_fin;
+            data["stopwatch"]["time"]["start"] = dt_now;
+            data["stopwatch"]["time"]["elapsed"] = dt_fin;
+
+            results.push_back(data);
+        }        
+
+        void save(const std::string& jsonfile) {
+            std::ofstream fp(jsonfile.c_str());
+            fp << results.dump(4) << std::endl;
+        }
+            
+
+    };
 
     // fixme: add support for config
     IDFT::pointer make_dft(const std::string& tn="FftwDFT",
@@ -37,16 +96,23 @@ namespace WireCell::Aux::Test {
         }
         return idft;
     }
-    IDFT::pointer make_dft_args(int argc, char* argv[]) 
-    {
-        std::string dft_tn="FftwDFT";
-        std::string dft_pi="WireCellAux";
-        if (argc > 1) dft_tn = argv[1];
-        if (argc > 2) dft_pi = argv[2];
+    struct DftArgs {
+        std::string tn{"FftwDFT"};
+        std::string pi{"WireCellAux"};
+        std::string cfg_name{""};
         Configuration cfg;
+    };        
+
+    DftArgs make_dft_args(int argc, char* argv[]) 
+    {
+        DftArgs ret;
+
+        if (argc > 1) ret.tn = argv[1];
+        if (argc > 2) ret.pi = argv[2];
         if (argc > 3) {
             // Either we get directly a "data" object 
-            cfg = Persist::load(argv[3]);
+            ret.cfg_name = argv[3];
+            auto cfg = Persist::load(argv[3]);
             // or we go searching a list for matching type/name.
             if (cfg.isArray()) {
                 for (auto one : cfg) {
@@ -55,15 +121,17 @@ namespace WireCell::Aux::Test {
                     if (not n.empty()) {
                         tn = tn + ":" + n;
                     }
-                    if (tn == dft_tn) {
+                    if (tn == ret.tn) {
                         cfg = one["data"];
                         break;
                     }
                 }
             }
+            ret.cfg = cfg;
 
         }
-        return make_dft(dft_tn, dft_pi);
+        return ret;
+        //return make_dft(dft_tn, dft_pi, cfg);
     }
 
     const double default_eps = 1e-8;
diff --git a/aux/test/test_idft_bench.cxx b/aux/test/test_idft_bench.cxx
index 01b10d91d..3d223a787 100644
--- a/aux/test/test_idft_bench.cxx
+++ b/aux/test/test_idft_bench.cxx
@@ -2,26 +2,14 @@
    A simple benchmark of IDFT for payloads relevant to WCT
  */
 
-#include "WireCellUtil/TimeKeeper.h"
-
 #include "aux_test_dft_helpers.h"
 
-#include <string>
-#include <complex>
-#include <iostream>
-
 using namespace WireCell;
 using namespace WireCell::Aux::Test;
 
 using benchmark_function = std::function<void()>;
 using complex_t = std::complex<float>;
 
-void timeit(TimeKeeper& tk, const std::string& msg, benchmark_function func)
-{
-    tk("\tINIT\t" + msg);
-    func();
-    tk("\tFINI\t" + msg);
-}
 
 // benchmarks span outer product of:
 // - in-place / out-place
@@ -31,70 +19,100 @@ void timeit(TimeKeeper& tk, const std::string& msg, benchmark_function func)
 
 using transform_function = std::function<void(const complex_t* in, complex_t* out)>;
 
-const int onedfull = 100'000'000;
-void doit(TimeKeeper& tk, const std::string& name, int nrows, int ncols, bool inplace, transform_function func)
+const int nominal = 100'000'000;
+void doit(Stopwatch& sw, const std::string& name, int nrows, int ncols, transform_function func)
 {
     const int size = nrows*ncols;
-    const int ntimes = onedfull / size;
-    std::stringstream ss;
-    ss << "\t(" << nrows << "," << ncols << ")\t" << ntimes << "\t";
-    std::string s = ss.str();
-    
-    if (inplace) {
-        timeit(tk, s + "in-place\t" + name, [&]() {
-            std::vector<complex_t> in(size);
-            for (int count=0; count<ntimes; ++count) {
-                func(in.data(), in.data());
-            }});
-    }
-    else {
-        timeit(tk, s + "separate\t" + name, [&]() {
-            std::vector<complex_t> in(size), out(size);
-            for (int count=0; count<ntimes; ++count) {
-                func(in.data(), out.data());
-            }});
-    }
+    const int ntimes = std::max(1, nominal / size);
+    std::vector<complex_t> in(size), out(size);
+
+    sw([&](){func(in.data(), in.data());}, {
+            {"nrows",nrows}, {"ncols",ncols}, {"func",name}, {"ntimes",1}, {"first",true}, {"in-place",true},
+        });
+
+    sw([&](){
+        for (int count=0; count<ntimes+1; ++count) {
+            func(in.data(), in.data());
+        }}, {
+            {"nrows",nrows}, {"ncols",ncols}, {"func",name}, {"ntimes",ntimes}, {"first",false}, {"in-place",true},
+        });
+
+    sw([&](){func(in.data(), out.data());}, {
+            {"nrows",nrows}, {"ncols",ncols}, {"func",name}, {"ntimes",1}, {"first",true}, {"in-place",false},
+        });
+
+    sw([&](){
+        for (int count=0; count<ntimes+1; ++count) {
+            func(in.data(), out.data());
+        }}, {
+            {"nrows",nrows}, {"ncols",ncols}, {"func",name}, {"ntimes",ntimes}, {"first",false}, {"in-place",false},
+        });
 }
 
 int main(int argc, char* argv[])
 {
-    auto idft = make_dft_args(argc, argv);
-
-    TimeKeeper tk("IDFT benchmark\t\tsize\t\tcount\toverlap\t\ttran");
-
-    int size = 10'000;
-    doit(tk, "fwd1d", 1, size, false, [&](const complex_t* in, complex_t* out) {
-        idft->fwd1d(in, out, size);
-    });
-
-    doit(tk, "inv1d", 1, size, false, [&](const complex_t* in, complex_t* out) {
-        idft->inv1d(in, out, size);
-    });
-
-    int nrows = 1000;
-    int ncols = 1000;
-    doit(tk, "fwd2d", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
-        idft->fwd2d(in, out, nrows, ncols);
-    });
-    doit(tk, "inv2d", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
-        idft->inv2d(in, out, nrows, ncols);
-    });
-
-    doit(tk, "fwd1b0", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
-        idft->fwd1b(in, out, nrows, ncols, 0);
-    });
-    doit(tk, "inv1b0", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
-        idft->inv1b(in, out, nrows, ncols, 0);
-    });
-    doit(tk, "fwd1b1", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
-        idft->fwd1b(in, out, nrows, ncols, 1);
-    });
-    doit(tk, "inv1b1", nrows, ncols, false, [&](const complex_t* in, complex_t* out) {
-        idft->inv1b(in, out, nrows, ncols, 1);
-    });
-
-
-    std::cerr << tk.summary() << std::endl;
+    auto args = make_dft_args(argc, argv);
+    auto idft = make_dft(args.tn, args.pi, args.cfg);
+
+    Stopwatch sw({
+            {"typename",args.tn},
+            {"plugin",args.pi},
+            {"config", object_t::parse(Persist::dumps(args.cfg))}, 
+            {"config_file",args.cfg_name}});
+
+    std::string cname = args.cfg_name;
+    auto slash = cname.rfind("/");
+    if (slash != std::string::npos) {
+        cname = cname.substr(slash+1);
+    }
+    cname = cname.substr(0, cname.rfind("."));
+    std::string fname = argv[0];
+    fname += "_" + args.pi + "_" + args.tn + "_" + cname + ".json";
+    std::cerr << "writing to: " << fname << std::endl;
+    
+
+    std::vector<int> oned_sizes{500, 512, 1000, 1024, 4096, 6000, 8192, 10000, 16384};
+    for (auto size : oned_sizes) {
+        std::cerr << "1d " << size << std::endl;
+        doit(sw, "fwd1d", 1, size, [&](const complex_t* in, complex_t* out) {
+            idft->fwd1d(in, out, size);
+        });
+
+        doit(sw, "inv1d", 1, size, [&](const complex_t* in, complex_t* out) {
+            idft->inv1d(in, out, size);
+        });
+    }
+
+    // channel count from some detectors plus powers of 2
+    std::vector<int> twod_nrows{800, 960, 1024, 2048, 2400, 3456, 4096};
+    // tick count from some detectors plus powers of 2
+    std::vector<int> twod_ncols{2000, 4096, 6000, 8192, 9375, 9595, 9600, 10000, 16384};
+    for (int nrows : twod_nrows) {
+        for (int ncols : twod_ncols) {
+            std::cerr << "2d (" << nrows << "," << ncols << ")\n";
+            doit(sw, "fwd2d", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+                idft->fwd2d(in, out, nrows, ncols);
+            });
+            doit(sw, "inv2d", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+                idft->inv2d(in, out, nrows, ncols);
+            });
+
+            doit(sw, "fwd1b0", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+                idft->fwd1b(in, out, nrows, ncols, 0);
+            });
+            doit(sw, "inv1b0", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+                idft->inv1b(in, out, nrows, ncols, 0);
+            });
+            doit(sw, "fwd1b1", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+                idft->fwd1b(in, out, nrows, ncols, 1);
+            });
+            doit(sw, "inv1b1", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+                idft->inv1b(in, out, nrows, ncols, 1);
+            });
+        }
+    }
+    
+    sw.save(fname);
 
     return 0;
 }

From 3c65ffb21a0b298ea56663a423ae2200e9d3c91e Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 18 Nov 2021 14:21:47 -0500
Subject: [PATCH 20/46] Rename, too slow to run each time

---
 ...st_idft_bench.cxx => check_idft_bench.cxx} | 55 ++++++++++---------
 1 file changed, 28 insertions(+), 27 deletions(-)
 rename aux/test/{test_idft_bench.cxx => check_idft_bench.cxx} (67%)

diff --git a/aux/test/test_idft_bench.cxx b/aux/test/check_idft_bench.cxx
similarity index 67%
rename from aux/test/test_idft_bench.cxx
rename to aux/test/check_idft_bench.cxx
index 3d223a787..b7bd29100 100644
--- a/aux/test/test_idft_bench.cxx
+++ b/aux/test/check_idft_bench.cxx
@@ -24,6 +24,8 @@ void doit(Stopwatch& sw, const std::string& name, int nrows, int ncols, transfor
 {
     const int size = nrows*ncols;
     const int ntimes = std::max(1, nominal / size);
+    std::cerr << name << ": (" << nrows << "," << ncols << ") x "<<ntimes<<"\n";
+
     std::vector<complex_t> in(size), out(size);
 
     sw([&](){func(in.data(), in.data());}, {
@@ -73,7 +75,6 @@ int main(int argc, char* argv[])
 
     std::vector<int> oned_sizes{500, 512, 1000, 1024, 4096, 6000, 8192, 10000, 16384};
     for (auto size : oned_sizes) {
-        std::cerr << "1d " << size << std::endl;
         doit(sw, "fwd1d", 1, size, [&](const complex_t* in, complex_t* out) {
             idft->fwd1d(in, out, size);
         });
@@ -84,32 +85,32 @@ int main(int argc, char* argv[])
     }
 
     // channel count from some detectors plus powers of 2
-    std::vector<int> twod_nrows{800, 960, 1024, 2048, 2400, 3456, 4096};
-    // tick count from some detectors plus powers of 2
-    std::vector<int> twod_ncols{2000, 4096, 6000, 8192, 9375, 9595, 9600, 10000, 16384};
-    for (int nrows : twod_nrows) {
-        for (int ncols : twod_ncols) {
-            std::cerr << "2d (" << nrows << "," << ncols << ")\n";
-            doit(sw, "fwd2d", nrows, ncols, [&](const complex_t* in, complex_t* out) {
-                idft->fwd2d(in, out, nrows, ncols);
-            });
-            doit(sw, "inv2d", nrows, ncols, [&](const complex_t* in, complex_t* out) {
-                idft->inv2d(in, out, nrows, ncols);
-            });
-
-            doit(sw, "fwd1b0", nrows, ncols, [&](const complex_t* in, complex_t* out) {
-                idft->fwd1b(in, out, nrows, ncols, 0);
-            });
-            doit(sw, "inv1b0", nrows, ncols, [&](const complex_t* in, complex_t* out) {
-                idft->inv1b(in, out, nrows, ncols, 0);
-            });
-            doit(sw, "fwd1b1", nrows, ncols, [&](const complex_t* in, complex_t* out) {
-                idft->fwd1b(in, out, nrows, ncols, 1);
-            });
-            doit(sw, "inv1b1", nrows, ncols, [&](const complex_t* in, complex_t* out) {
-                idft->inv1b(in, out, nrows, ncols, 1);
-            });
-        }
+    std::vector<std::pair<int,int>> twod_sizes{
+        {800,6000}, {960,6000}, // protodune u/v and w 3ms
+        {2400, 9595}, {3456, 9595}, // uboone u/v daq size
+        {1024, 1024}, {2048, 2048}, {4096, 4096}, // perfect powers of 2
+    };
+    for (auto& [nrows,ncols] : twod_sizes) {
+
+        doit(sw, "fwd2d", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+            idft->fwd2d(in, out, nrows, ncols);
+        });
+        doit(sw, "inv2d", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+            idft->inv2d(in, out, nrows, ncols);
+        });
+
+        doit(sw, "fwd1b0", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+            idft->fwd1b(in, out, nrows, ncols, 0);
+        });
+        doit(sw, "inv1b0", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+            idft->inv1b(in, out, nrows, ncols, 0);
+        });
+        doit(sw, "fwd1b1", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+            idft->fwd1b(in, out, nrows, ncols, 1);
+        });
+        doit(sw, "inv1b1", nrows, ncols, [&](const complex_t* in, complex_t* out) {
+            idft->inv1b(in, out, nrows, ncols, 1);
+        });
     }
     
     sw.save(fname);

From 365c21c7fb7f93740f9ab96de1fb6dab1a4ea3f8 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Fri, 19 Nov 2021 13:44:12 -0500
Subject: [PATCH 21/46] Make this more globally accessible so test/check
 programs can use it

---
 util/inc/WireCellUtil/CLI11.hpp | 9066 +++++++++++++++++++++++++++++++
 1 file changed, 9066 insertions(+)
 create mode 100644 util/inc/WireCellUtil/CLI11.hpp

diff --git a/util/inc/WireCellUtil/CLI11.hpp b/util/inc/WireCellUtil/CLI11.hpp
new file mode 100644
index 000000000..dcb57c6c6
--- /dev/null
+++ b/util/inc/WireCellUtil/CLI11.hpp
@@ -0,0 +1,9066 @@
+// CLI11: Version 2.1.2
+// Originally designed by Henry Schreiner
+// https://github.com/CLIUtils/CLI11
+//
+// This is a standalone header file generated by MakeSingleHeader.py in CLI11/scripts
+// from: v2.1.2
+//
+// CLI11 2.1.2 Copyright (c) 2017-2021 University of Cincinnati, developed by Henry
+// Schreiner under NSF AWARD 1414736. All rights reserved.
+//
+// Redistribution and use in source and binary forms of CLI11, with or without
+// modification, are permitted provided that the following conditions are met:
+//
+// 1. Redistributions of source code must retain the above copyright notice, this
+//    list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright notice,
+//    this list of conditions and the following disclaimer in the documentation
+//    and/or other materials provided with the distribution.
+// 3. Neither the name of the copyright holder nor the names of its contributors
+//    may be used to endorse or promote products derived from this software without
+//    specific prior written permission.
+//
+// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+// ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
+// WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
+// ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
+// (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
+// LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
+// ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+// SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+#pragma once
+
+// Standard combined includes:
+#include <memory>
+#include <string>
+#include <cmath>
+#include <functional>
+#include <numeric>
+#include <map>
+#include <fstream>
+#include <tuple>
+#include <utility>
+#include <iomanip>
+#include <locale>
+#include <sstream>
+#include <algorithm>
+#include <cstdint>
+#include <iostream>
+#include <set>
+#include <type_traits>
+#include <iterator>
+#include <stdexcept>
+#include <vector>
+#include <limits>
+#include <exception>
+
+
+#define CLI11_VERSION_MAJOR 2
+#define CLI11_VERSION_MINOR 1
+#define CLI11_VERSION_PATCH 2
+#define CLI11_VERSION "2.1.2"
+
+
+
+
+// The following version macro is very similar to the one in pybind11
+#if !(defined(_MSC_VER) && __cplusplus == 199711L) && !defined(__INTEL_COMPILER)
+#if __cplusplus >= 201402L
+#define CLI11_CPP14
+#if __cplusplus >= 201703L
+#define CLI11_CPP17
+#if __cplusplus > 201703L
+#define CLI11_CPP20
+#endif
+#endif
+#endif
+#elif defined(_MSC_VER) && __cplusplus == 199711L
+// MSVC sets _MSVC_LANG rather than __cplusplus (supposedly until the standard is fully implemented)
+// Unless you use the /Zc:__cplusplus flag on Visual Studio 2017 15.7 Preview 3 or newer
+#if _MSVC_LANG >= 201402L
+#define CLI11_CPP14
+#if _MSVC_LANG > 201402L && _MSC_VER >= 1910
+#define CLI11_CPP17
+#if __MSVC_LANG > 201703L && _MSC_VER >= 1910
+#define CLI11_CPP20
+#endif
+#endif
+#endif
+#endif
+
+#if defined(CLI11_CPP14)
+#define CLI11_DEPRECATED(reason) [[deprecated(reason)]]
+#elif defined(_MSC_VER)
+#define CLI11_DEPRECATED(reason) __declspec(deprecated(reason))
+#else
+#define CLI11_DEPRECATED(reason) __attribute__((deprecated(reason)))
+#endif
+
+
+
+
+// C standard library
+// Only needed for existence checking
+#if defined CLI11_CPP17 && defined __has_include && !defined CLI11_HAS_FILESYSTEM
+#if __has_include(<filesystem>)
+// Filesystem cannot be used if targeting macOS < 10.15
+#if defined __MAC_OS_X_VERSION_MIN_REQUIRED && __MAC_OS_X_VERSION_MIN_REQUIRED < 101500
+#define CLI11_HAS_FILESYSTEM 0
+#else
+#include <filesystem>
+#if defined __cpp_lib_filesystem && __cpp_lib_filesystem >= 201703
+#if defined _GLIBCXX_RELEASE && _GLIBCXX_RELEASE >= 9
+#define CLI11_HAS_FILESYSTEM 1
+#elif defined(__GLIBCXX__)
+// if we are using gcc and Version <9 default to no filesystem
+#define CLI11_HAS_FILESYSTEM 0
+#else
+#define CLI11_HAS_FILESYSTEM 1
+#endif
+#else
+#define CLI11_HAS_FILESYSTEM 0
+#endif
+#endif
+#endif
+#endif
+
+#if defined CLI11_HAS_FILESYSTEM && CLI11_HAS_FILESYSTEM > 0
+#include <filesystem>  // NOLINT(build/include)
+#else
+#include <sys/stat.h>
+#include <sys/types.h>
+#endif
+
+
+
+namespace CLI {
+
+
+/// Include the items in this namespace to get free conversion of enums to/from streams.
+/// (This is available inside CLI as well, so CLI11 will use this without a using statement).
+namespace enums {
+
+/// output streaming for enumerations
+template <typename T, typename = typename std::enable_if<std::is_enum<T>::value>::type>
+std::ostream &operator<<(std::ostream &in, const T &item) {
+    // make sure this is out of the detail namespace otherwise it won't be found when needed
+    return in << static_cast<typename std::underlying_type<T>::type>(item);
+}
+
+}  // namespace enums
+
+/// Export to CLI namespace
+using enums::operator<<;
+
+namespace detail {
+/// a constant defining an expected max vector size defined to be a big number that could be multiplied by 4 and not
+/// produce overflow for some expected uses
+constexpr int expected_max_vector_size{1 << 29};
+// Based on http://stackoverflow.com/questions/236129/split-a-string-in-c
+/// Split a string by a delim
+inline std::vector<std::string> split(const std::string &s, char delim) {
+    std::vector<std::string> elems;
+    // Check to see if empty string, give consistent result
+    if(s.empty()) {
+        elems.emplace_back();
+    } else {
+        std::stringstream ss;
+        ss.str(s);
+        std::string item;
+        while(std::getline(ss, item, delim)) {
+            elems.push_back(item);
+        }
+    }
+    return elems;
+}
+
+/// Simple function to join a string
+template <typename T> std::string join(const T &v, std::string delim = ",") {
+    std::ostringstream s;
+    auto beg = std::begin(v);
+    auto end = std::end(v);
+    if(beg != end)
+        s << *beg++;
+    while(beg != end) {
+        s << delim << *beg++;
+    }
+    return s.str();
+}
+
+/// Simple function to join a string from processed elements
+template <typename T,
+          typename Callable,
+          typename = typename std::enable_if<!std::is_constructible<std::string, Callable>::value>::type>
+std::string join(const T &v, Callable func, std::string delim = ",") {
+    std::ostringstream s;
+    auto beg = std::begin(v);
+    auto end = std::end(v);
+    auto loc = s.tellp();
+    while(beg != end) {
+        auto nloc = s.tellp();
+        if(nloc > loc) {
+            s << delim;
+            loc = nloc;
+        }
+        s << func(*beg++);
+    }
+    return s.str();
+}
+
+/// Join a string in reverse order
+template <typename T> std::string rjoin(const T &v, std::string delim = ",") {
+    std::ostringstream s;
+    for(std::size_t start = 0; start < v.size(); start++) {
+        if(start > 0)
+            s << delim;
+        s << v[v.size() - start - 1];
+    }
+    return s.str();
+}
+
+// Based roughly on http://stackoverflow.com/questions/25829143/c-trim-whitespace-from-a-string
+
+/// Trim whitespace from left of string
+inline std::string &ltrim(std::string &str) {
+    auto it = std::find_if(str.begin(), str.end(), [](char ch) { return !std::isspace<char>(ch, std::locale()); });
+    str.erase(str.begin(), it);
+    return str;
+}
+
+/// Trim anything from left of string
+inline std::string &ltrim(std::string &str, const std::string &filter) {
+    auto it = std::find_if(str.begin(), str.end(), [&filter](char ch) { return filter.find(ch) == std::string::npos; });
+    str.erase(str.begin(), it);
+    return str;
+}
+
+/// Trim whitespace from right of string
+inline std::string &rtrim(std::string &str) {
+    auto it = std::find_if(str.rbegin(), str.rend(), [](char ch) { return !std::isspace<char>(ch, std::locale()); });
+    str.erase(it.base(), str.end());
+    return str;
+}
+
+/// Trim anything from right of string
+inline std::string &rtrim(std::string &str, const std::string &filter) {
+    auto it =
+        std::find_if(str.rbegin(), str.rend(), [&filter](char ch) { return filter.find(ch) == std::string::npos; });
+    str.erase(it.base(), str.end());
+    return str;
+}
+
+/// Trim whitespace from string
+inline std::string &trim(std::string &str) { return ltrim(rtrim(str)); }
+
+/// Trim anything from string
+inline std::string &trim(std::string &str, const std::string filter) { return ltrim(rtrim(str, filter), filter); }
+
+/// Make a copy of the string and then trim it
+inline std::string trim_copy(const std::string &str) {
+    std::string s = str;
+    return trim(s);
+}
+
+/// remove quotes at the front and back of a string either '"' or '\''
+inline std::string &remove_quotes(std::string &str) {
+    if(str.length() > 1 && (str.front() == '"' || str.front() == '\'')) {
+        if(str.front() == str.back()) {
+            str.pop_back();
+            str.erase(str.begin(), str.begin() + 1);
+        }
+    }
+    return str;
+}
+
+/// Add a leader to the beginning of all new lines (nothing is added
+/// at the start of the first line). `"; "` would be for ini files
+///
+/// Can't use Regex, or this would be a subs.
+inline std::string fix_newlines(const std::string &leader, std::string input) {
+    std::string::size_type n = 0;
+    while(n != std::string::npos && n < input.size()) {
+        n = input.find('\n', n);
+        if(n != std::string::npos) {
+            input = input.substr(0, n + 1) + leader + input.substr(n + 1);
+            n += leader.size();
+        }
+    }
+    return input;
+}
+
+/// Make a copy of the string and then trim it, any filter string can be used (any char in string is filtered)
+inline std::string trim_copy(const std::string &str, const std::string &filter) {
+    std::string s = str;
+    return trim(s, filter);
+}
+/// Print a two part "help" string
+inline std::ostream &format_help(std::ostream &out, std::string name, const std::string &description, std::size_t wid) {
+    name = "  " + name;
+    out << std::setw(static_cast<int>(wid)) << std::left << name;
+    if(!description.empty()) {
+        if(name.length() >= wid)
+            out << "\n" << std::setw(static_cast<int>(wid)) << "";
+        for(const char c : description) {
+            out.put(c);
+            if(c == '\n') {
+                out << std::setw(static_cast<int>(wid)) << "";
+            }
+        }
+    }
+    out << "\n";
+    return out;
+}
+
+/// Print subcommand aliases
+inline std::ostream &format_aliases(std::ostream &out, const std::vector<std::string> &aliases, std::size_t wid) {
+    if(!aliases.empty()) {
+        out << std::setw(static_cast<int>(wid)) << "     aliases: ";
+        bool front = true;
+        for(const auto &alias : aliases) {
+            if(!front) {
+                out << ", ";
+            } else {
+                front = false;
+            }
+            out << detail::fix_newlines("              ", alias);
+        }
+        out << "\n";
+    }
+    return out;
+}
+
+/// Verify the first character of an option
+/// - is a trigger character, ! has special meaning and new lines would just be annoying to deal with
+template <typename T> bool valid_first_char(T c) { return ((c != '-') && (c != '!') && (c != ' ') && c != '\n'); }
+
+/// Verify following characters of an option
+template <typename T> bool valid_later_char(T c) {
+    // = and : are value separators, { has special meaning for option defaults,
+    // and \n would just be annoying to deal with in many places allowing space here has too much potential for
+    // inadvertent entry errors and bugs
+    return ((c != '=') && (c != ':') && (c != '{') && (c != ' ') && c != '\n');
+}
+
+/// Verify an option/subcommand name
+inline bool valid_name_string(const std::string &str) {
+    if(str.empty() || !valid_first_char(str[0])) {
+        return false;
+    }
+    auto e = str.end();
+    for(auto c = str.begin() + 1; c != e; ++c)
+        if(!valid_later_char(*c))
+            return false;
+    return true;
+}
+
+/// Verify an app name
+inline bool valid_alias_name_string(const std::string &str) {
+    static const std::string badChars(std::string("\n") + '\0');
+    return (str.find_first_of(badChars) == std::string::npos);
+}
+
+/// check if a string is a container segment separator (empty or "%%")
+inline bool is_separator(const std::string &str) {
+    static const std::string sep("%%");
+    return (str.empty() || str == sep);
+}
+
+/// Verify that str consists of letters only
+inline bool isalpha(const std::string &str) {
+    return std::all_of(str.begin(), str.end(), [](char c) { return std::isalpha(c, std::locale()); });
+}
+
+/// Return a lower case version of a string
+inline std::string to_lower(std::string str) {
+    std::transform(std::begin(str), std::end(str), std::begin(str), [](const std::string::value_type &x) {
+        return std::tolower(x, std::locale());
+    });
+    return str;
+}
+
+/// remove underscores from a string
+inline std::string remove_underscore(std::string str) {
+    str.erase(std::remove(std::begin(str), std::end(str), '_'), std::end(str));
+    return str;
+}
+
+/// Find and replace a substring with another substring
+inline std::string find_and_replace(std::string str, std::string from, std::string to) {
+
+    std::size_t start_pos = 0;
+
+    while((start_pos = str.find(from, start_pos)) != std::string::npos) {
+        str.replace(start_pos, from.length(), to);
+        start_pos += to.length();
+    }
+
+    return str;
+}
+
+/// check if the flag definitions has possible false flags
+inline bool has_default_flag_values(const std::string &flags) {
+    return (flags.find_first_of("{!") != std::string::npos);
+}
+
+inline void remove_default_flag_values(std::string &flags) {
+    auto loc = flags.find_first_of('{', 2);
+    while(loc != std::string::npos) {
+        auto finish = flags.find_first_of("},", loc + 1);
+        if((finish != std::string::npos) && (flags[finish] == '}')) {
+            flags.erase(flags.begin() + static_cast<std::ptrdiff_t>(loc),
+                        flags.begin() + static_cast<std::ptrdiff_t>(finish) + 1);
+        }
+        loc = flags.find_first_of('{', loc + 1);
+    }
+    flags.erase(std::remove(flags.begin(), flags.end(), '!'), flags.end());
+}
+
+/// Check if a string is a member of a list of strings and optionally ignore case or ignore underscores
+inline std::ptrdiff_t find_member(std::string name,
+                                  const std::vector<std::string> names,
+                                  bool ignore_case = false,
+                                  bool ignore_underscore = false) {
+    auto it = std::end(names);
+    if(ignore_case) {
+        if(ignore_underscore) {
+            name = detail::to_lower(detail::remove_underscore(name));
+            it = std::find_if(std::begin(names), std::end(names), [&name](std::string local_name) {
+                return detail::to_lower(detail::remove_underscore(local_name)) == name;
+            });
+        } else {
+            name = detail::to_lower(name);
+            it = std::find_if(std::begin(names), std::end(names), [&name](std::string local_name) {
+                return detail::to_lower(local_name) == name;
+            });
+        }
+
+    } else if(ignore_underscore) {
+        name = detail::remove_underscore(name);
+        it = std::find_if(std::begin(names), std::end(names), [&name](std::string local_name) {
+            return detail::remove_underscore(local_name) == name;
+        });
+    } else {
+        it = std::find(std::begin(names), std::end(names), name);
+    }
+
+    return (it != std::end(names)) ? (it - std::begin(names)) : (-1);
+}
+
+/// Find a trigger string and call a modify callable function that takes the current string and starting position of the
+/// trigger and returns the position in the string to search for the next trigger string
+template <typename Callable> inline std::string find_and_modify(std::string str, std::string trigger, Callable modify) {
+    std::size_t start_pos = 0;
+    while((start_pos = str.find(trigger, start_pos)) != std::string::npos) {
+        start_pos = modify(str, start_pos);
+    }
+    return str;
+}
+
+/// Split a string '"one two" "three"' into 'one two', 'three'
+/// Quote characters can be ` ' or "
+inline std::vector<std::string> split_up(std::string str, char delimiter = '\0') {
+
+    const std::string delims("\'\"`");
+    auto find_ws = [delimiter](char ch) {
+        return (delimiter == '\0') ? (std::isspace<char>(ch, std::locale()) != 0) : (ch == delimiter);
+    };
+    trim(str);
+
+    std::vector<std::string> output;
+    bool embeddedQuote = false;
+    char keyChar = ' ';
+    while(!str.empty()) {
+        if(delims.find_first_of(str[0]) != std::string::npos) {
+            keyChar = str[0];
+            auto end = str.find_first_of(keyChar, 1);
+            while((end != std::string::npos) && (str[end - 1] == '\\')) {  // deal with escaped quotes
+                end = str.find_first_of(keyChar, end + 1);
+                embeddedQuote = true;
+            }
+            if(end != std::string::npos) {
+                output.push_back(str.substr(1, end - 1));
+                if(end + 2 < str.size()) {
+                    str = str.substr(end + 2);
+                } else {
+                    str.clear();
+                }
+
+            } else {
+                output.push_back(str.substr(1));
+                str = "";
+            }
+        } else {
+            auto it = std::find_if(std::begin(str), std::end(str), find_ws);
+            if(it != std::end(str)) {
+                std::string value = std::string(str.begin(), it);
+                output.push_back(value);
+                str = std::string(it + 1, str.end());
+            } else {
+                output.push_back(str);
+                str = "";
+            }
+        }
+        // transform any embedded quotes into the regular character
+        if(embeddedQuote) {
+            output.back() = find_and_replace(output.back(), std::string("\\") + keyChar, std::string(1, keyChar));
+            embeddedQuote = false;
+        }
+        trim(str);
+    }
+    return output;
+}
+
+/// This function detects an equal or colon followed by an escaped quote after an argument
+/// then modifies the string to replace the equality with a space.  This is needed
+/// to allow the split up function to work properly and is intended to be used with the find_and_modify function
+/// the return value is the offset+1 which is required by the find_and_modify function.
+inline std::size_t escape_detect(std::string &str, std::size_t offset) {
+    auto next = str[offset + 1];
+    if((next == '\"') || (next == '\'') || (next == '`')) {
+        auto astart = str.find_last_of("-/ \"\'`", offset - 1);
+        if(astart != std::string::npos) {
+            if(str[astart] == ((str[offset] == '=') ? '-' : '/'))
+                str[offset] = ' ';  // interpret this as a space so the split_up works properly
+        }
+    }
+    return offset + 1;
+}
+
+/// Add quotes if the string contains spaces
+inline std::string &add_quotes_if_needed(std::string &str) {
+    if((str.front() != '"' && str.front() != '\'') || str.front() != str.back()) {
+        char quote = str.find('"') < str.find('\'') ? '\'' : '"';
+        if(str.find(' ') != std::string::npos) {
+            str.insert(0, 1, quote);
+            str.append(1, quote);
+        }
+    }
+    return str;
+}
+
+}  // namespace detail
+
+
+
+
+// Use one of these on all error classes.
+// These are temporary and are undef'd at the end of this file.
+#define CLI11_ERROR_DEF(parent, name)                                                                                  \
+  protected:                                                                                                           \
+    name(std::string ename, std::string msg, int exit_code) : parent(std::move(ename), std::move(msg), exit_code) {}   \
+    name(std::string ename, std::string msg, ExitCodes exit_code)                                                      \
+        : parent(std::move(ename), std::move(msg), exit_code) {}                                                       \
+                                                                                                                       \
+  public:                                                                                                              \
+    name(std::string msg, ExitCodes exit_code) : parent(#name, std::move(msg), exit_code) {}                           \
+    name(std::string msg, int exit_code) : parent(#name, std::move(msg), exit_code) {}
+
+// This is added after the one above if a class is used directly and builds its own message
+#define CLI11_ERROR_SIMPLE(name)                                                                                       \
+    explicit name(std::string msg) : name(#name, msg, ExitCodes::name) {}
+
+/// These codes are part of every error in CLI. They can be obtained from e using e.exit_code or as a quick shortcut,
+/// int values from e.get_error_code().
+enum class ExitCodes {
+    Success = 0,
+    IncorrectConstruction = 100,
+    BadNameString,
+    OptionAlreadyAdded,
+    FileError,
+    ConversionError,
+    ValidationError,
+    RequiredError,
+    RequiresError,
+    ExcludesError,
+    ExtrasError,
+    ConfigError,
+    InvalidError,
+    HorribleError,
+    OptionNotFound,
+    ArgumentMismatch,
+    BaseClass = 127
+};
+
+// Error definitions
+
+/// @defgroup error_group Errors
+/// @brief Errors thrown by CLI11
+///
+/// These are the errors that can be thrown. Some of them, like CLI::Success, are not really errors.
+/// @{
+
+/// All errors derive from this one
+class Error : public std::runtime_error {
+    int actual_exit_code;
+    std::string error_name{"Error"};
+
+  public:
+    int get_exit_code() const { return actual_exit_code; }
+
+    std::string get_name() const { return error_name; }
+
+    Error(std::string name, std::string msg, int exit_code = static_cast<int>(ExitCodes::BaseClass))
+        : runtime_error(msg), actual_exit_code(exit_code), error_name(std::move(name)) {}
+
+    Error(std::string name, std::string msg, ExitCodes exit_code) : Error(name, msg, static_cast<int>(exit_code)) {}
+};
+
+// Note: Using Error::Error constructors does not work on GCC 4.7
+
+/// Construction errors (not in parsing)
+class ConstructionError : public Error {
+    CLI11_ERROR_DEF(Error, ConstructionError)
+};
+
+/// Thrown when an option is set to conflicting values (non-vector and multi args, for example)
+class IncorrectConstruction : public ConstructionError {
+    CLI11_ERROR_DEF(ConstructionError, IncorrectConstruction)
+    CLI11_ERROR_SIMPLE(IncorrectConstruction)
+    static IncorrectConstruction PositionalFlag(std::string name) {
+        return IncorrectConstruction(name + ": Flags cannot be positional");
+    }
+    static IncorrectConstruction Set0Opt(std::string name) {
+        return IncorrectConstruction(name + ": Cannot set 0 expected, use a flag instead");
+    }
+    static IncorrectConstruction SetFlag(std::string name) {
+        return IncorrectConstruction(name + ": Cannot set an expected number for flags");
+    }
+    static IncorrectConstruction ChangeNotVector(std::string name) {
+        return IncorrectConstruction(name + ": You can only change the expected arguments for vectors");
+    }
+    static IncorrectConstruction AfterMultiOpt(std::string name) {
+        return IncorrectConstruction(
+            name + ": You can't change expected arguments after you've changed the multi option policy!");
+    }
+    static IncorrectConstruction MissingOption(std::string name) {
+        return IncorrectConstruction("Option " + name + " is not defined");
+    }
+    static IncorrectConstruction MultiOptionPolicy(std::string name) {
+        return IncorrectConstruction(name + ": multi_option_policy only works for flags and exact value options");
+    }
+};
+
+/// Thrown on construction of a bad name
+class BadNameString : public ConstructionError {
+    CLI11_ERROR_DEF(ConstructionError, BadNameString)
+    CLI11_ERROR_SIMPLE(BadNameString)
+    static BadNameString OneCharName(std::string name) { return BadNameString("Invalid one char name: " + name); }
+    static BadNameString BadLongName(std::string name) { return BadNameString("Bad long name: " + name); }
+    static BadNameString DashesOnly(std::string name) {
+        return BadNameString("Must have a name, not just dashes: " + name);
+    }
+    static BadNameString MultiPositionalNames(std::string name) {
+        return BadNameString("Only one positional name allowed, remove: " + name);
+    }
+};
+
+/// Thrown when an option already exists
+class OptionAlreadyAdded : public ConstructionError {
+    CLI11_ERROR_DEF(ConstructionError, OptionAlreadyAdded)
+    explicit OptionAlreadyAdded(std::string name)
+        : OptionAlreadyAdded(name + " is already added", ExitCodes::OptionAlreadyAdded) {}
+    static OptionAlreadyAdded Requires(std::string name, std::string other) {
+        return OptionAlreadyAdded(name + " requires " + other, ExitCodes::OptionAlreadyAdded);
+    }
+    static OptionAlreadyAdded Excludes(std::string name, std::string other) {
+        return OptionAlreadyAdded(name + " excludes " + other, ExitCodes::OptionAlreadyAdded);
+    }
+};
+
+// Parsing errors
+
+/// Anything that can error in Parse
+class ParseError : public Error {
+    CLI11_ERROR_DEF(Error, ParseError)
+};
+
+// Not really "errors"
+
+/// This is a successful completion on parsing, supposed to exit
+class Success : public ParseError {
+    CLI11_ERROR_DEF(ParseError, Success)
+    Success() : Success("Successfully completed, should be caught and quit", ExitCodes::Success) {}
+};
+
+/// -h or --help on command line
+class CallForHelp : public Success {
+    CLI11_ERROR_DEF(Success, CallForHelp)
+    CallForHelp() : CallForHelp("This should be caught in your main function, see examples", ExitCodes::Success) {}
+};
+
+/// Usually something like --help-all on command line
+class CallForAllHelp : public Success {
+    CLI11_ERROR_DEF(Success, CallForAllHelp)
+    CallForAllHelp()
+        : CallForAllHelp("This should be caught in your main function, see examples", ExitCodes::Success) {}
+};
+
+/// -v or --version on command line
+class CallForVersion : public Success {
+    CLI11_ERROR_DEF(Success, CallForVersion)
+    CallForVersion()
+        : CallForVersion("This should be caught in your main function, see examples", ExitCodes::Success) {}
+};
+
+/// Does not output a diagnostic in CLI11_PARSE, but allows main() to return with a specific error code.
+class RuntimeError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, RuntimeError)
+    explicit RuntimeError(int exit_code = 1) : RuntimeError("Runtime error", exit_code) {}
+};
+
+/// Thrown when parsing an INI file and it is missing
+class FileError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, FileError)
+    CLI11_ERROR_SIMPLE(FileError)
+    static FileError Missing(std::string name) { return FileError(name + " was not readable (missing?)"); }
+};
+
+/// Thrown when conversion call back fails, such as when an int fails to coerce to a string
+class ConversionError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, ConversionError)
+    CLI11_ERROR_SIMPLE(ConversionError)
+    ConversionError(std::string member, std::string name)
+        : ConversionError("The value " + member + " is not an allowed value for " + name) {}
+    ConversionError(std::string name, std::vector<std::string> results)
+        : ConversionError("Could not convert: " + name + " = " + detail::join(results)) {}
+    static ConversionError TooManyInputsFlag(std::string name) {
+        return ConversionError(name + ": too many inputs for a flag");
+    }
+    static ConversionError TrueFalse(std::string name) {
+        return ConversionError(name + ": Should be true/false or a number");
+    }
+};
+
+/// Thrown when validation of results fails
+class ValidationError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, ValidationError)
+    CLI11_ERROR_SIMPLE(ValidationError)
+    explicit ValidationError(std::string name, std::string msg) : ValidationError(name + ": " + msg) {}
+};
+
+/// Thrown when a required option is missing
+class RequiredError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, RequiredError)
+    explicit RequiredError(std::string name) : RequiredError(name + " is required", ExitCodes::RequiredError) {}
+    static RequiredError Subcommand(std::size_t min_subcom) {
+        if(min_subcom == 1) {
+            return RequiredError("A subcommand");
+        }
+        return RequiredError("Requires at least " + std::to_string(min_subcom) + " subcommands",
+                             ExitCodes::RequiredError);
+    }
+    static RequiredError
+    Option(std::size_t min_option, std::size_t max_option, std::size_t used, const std::string &option_list) {
+        if((min_option == 1) && (max_option == 1) && (used == 0))
+            return RequiredError("Exactly 1 option from [" + option_list + "]");
+        if((min_option == 1) && (max_option == 1) && (used > 1)) {
+            return RequiredError("Exactly 1 option from [" + option_list + "] is required and " + std::to_string(used) +
+                                     " were given",
+                                 ExitCodes::RequiredError);
+        }
+        if((min_option == 1) && (used == 0))
+            return RequiredError("At least 1 option from [" + option_list + "]");
+        if(used < min_option) {
+            return RequiredError("Requires at least " + std::to_string(min_option) + " options used and only " +
+                                     std::to_string(used) + "were given from [" + option_list + "]",
+                                 ExitCodes::RequiredError);
+        }
+        if(max_option == 1)
+            return RequiredError("Requires at most 1 options be given from [" + option_list + "]",
+                                 ExitCodes::RequiredError);
+
+        return RequiredError("Requires at most " + std::to_string(max_option) + " options be used and " +
+                                 std::to_string(used) + "were given from [" + option_list + "]",
+                             ExitCodes::RequiredError);
+    }
+};
+
+/// Thrown when the wrong number of arguments has been received
+class ArgumentMismatch : public ParseError {
+    CLI11_ERROR_DEF(ParseError, ArgumentMismatch)
+    CLI11_ERROR_SIMPLE(ArgumentMismatch)
+    ArgumentMismatch(std::string name, int expected, std::size_t received)
+        : ArgumentMismatch(expected > 0 ? ("Expected exactly " + std::to_string(expected) + " arguments to " + name +
+                                           ", got " + std::to_string(received))
+                                        : ("Expected at least " + std::to_string(-expected) + " arguments to " + name +
+                                           ", got " + std::to_string(received)),
+                           ExitCodes::ArgumentMismatch) {}
+
+    static ArgumentMismatch AtLeast(std::string name, int num, std::size_t received) {
+        return ArgumentMismatch(name + ": At least " + std::to_string(num) + " required but received " +
+                                std::to_string(received));
+    }
+    static ArgumentMismatch AtMost(std::string name, int num, std::size_t received) {
+        return ArgumentMismatch(name + ": At Most " + std::to_string(num) + " required but received " +
+                                std::to_string(received));
+    }
+    static ArgumentMismatch TypedAtLeast(std::string name, int num, std::string type) {
+        return ArgumentMismatch(name + ": " + std::to_string(num) + " required " + type + " missing");
+    }
+    static ArgumentMismatch FlagOverride(std::string name) {
+        return ArgumentMismatch(name + " was given a disallowed flag override");
+    }
+};
+
+/// Thrown when a requires option is missing
+class RequiresError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, RequiresError)
+    RequiresError(std::string curname, std::string subname)
+        : RequiresError(curname + " requires " + subname, ExitCodes::RequiresError) {}
+};
+
+/// Thrown when an excludes option is present
+class ExcludesError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, ExcludesError)
+    ExcludesError(std::string curname, std::string subname)
+        : ExcludesError(curname + " excludes " + subname, ExitCodes::ExcludesError) {}
+};
+
+/// Thrown when too many positionals or options are found
+class ExtrasError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, ExtrasError)
+    explicit ExtrasError(std::vector<std::string> args)
+        : ExtrasError((args.size() > 1 ? "The following arguments were not expected: "
+                                       : "The following argument was not expected: ") +
+                          detail::rjoin(args, " "),
+                      ExitCodes::ExtrasError) {}
+    ExtrasError(const std::string &name, std::vector<std::string> args)
+        : ExtrasError(name,
+                      (args.size() > 1 ? "The following arguments were not expected: "
+                                       : "The following argument was not expected: ") +
+                          detail::rjoin(args, " "),
+                      ExitCodes::ExtrasError) {}
+};
+
+/// Thrown when extra values are found in an INI file
+class ConfigError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, ConfigError)
+    CLI11_ERROR_SIMPLE(ConfigError)
+    static ConfigError Extras(std::string item) { return ConfigError("INI was not able to parse " + item); }
+    static ConfigError NotConfigurable(std::string item) {
+        return ConfigError(item + ": This option is not allowed in a configuration file");
+    }
+};
+
+/// Thrown when validation fails before parsing
+class InvalidError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, InvalidError)
+    explicit InvalidError(std::string name)
+        : InvalidError(name + ": Too many positional arguments with unlimited expected args", ExitCodes::InvalidError) {
+    }
+};
+
+/// This is just a safety check to verify selection and parsing match - you should not ever see it
+/// Strings are directly added to this error, but again, it should never be seen.
+class HorribleError : public ParseError {
+    CLI11_ERROR_DEF(ParseError, HorribleError)
+    CLI11_ERROR_SIMPLE(HorribleError)
+};
+
+// After parsing
+
+/// Thrown when counting a non-existent option
+class OptionNotFound : public Error {
+    CLI11_ERROR_DEF(Error, OptionNotFound)
+    explicit OptionNotFound(std::string name) : OptionNotFound(name + " not found", ExitCodes::OptionNotFound) {}
+};
+
+#undef CLI11_ERROR_DEF
+#undef CLI11_ERROR_SIMPLE
+
+/// @}
+
+
+
+
+// Type tools
+
+// Utilities for type enabling
+namespace detail {
+// Based generally on https://rmf.io/cxx11/almost-static-if
+/// Simple empty scoped class
+enum class enabler {};
+
+/// An instance to use in EnableIf
+constexpr enabler dummy = {};
+}  // namespace detail
+
+/// A copy of enable_if_t from C++14, compatible with C++11.
+///
+/// We could check to see if C++14 is being used, but it does not hurt to redefine this
+/// (even Google does this: https://github.com/google/skia/blob/main/include/private/SkTLogic.h)
+/// It is not in the std namespace anyway, so no harm done.
+template <bool B, class T = void> using enable_if_t = typename std::enable_if<B, T>::type;
+
+/// A copy of std::void_t from C++17 (helper for C++11 and C++14)
+template <typename... Ts> struct make_void { using type = void; };
+
+/// A copy of std::void_t from C++17 - same reasoning as enable_if_t, it does not hurt to redefine
+template <typename... Ts> using void_t = typename make_void<Ts...>::type;
+
+/// A copy of std::conditional_t from C++14 - same reasoning as enable_if_t, it does not hurt to redefine
+template <bool B, class T, class F> using conditional_t = typename std::conditional<B, T, F>::type;
+
+/// Check to see if something is bool (fail check by default)
+template <typename T> struct is_bool : std::false_type {};
+
+/// Check to see if something is bool (true if actually a bool)
+template <> struct is_bool<bool> : std::true_type {};
+
+/// Check to see if something is a shared pointer
+template <typename T> struct is_shared_ptr : std::false_type {};
+
+/// Check to see if something is a shared pointer (True if really a shared pointer)
+template <typename T> struct is_shared_ptr<std::shared_ptr<T>> : std::true_type {};
+
+/// Check to see if something is a shared pointer (True if really a shared pointer)
+template <typename T> struct is_shared_ptr<const std::shared_ptr<T>> : std::true_type {};
+
+/// Check to see if something is copyable pointer
+template <typename T> struct is_copyable_ptr {
+    static bool const value = is_shared_ptr<T>::value || std::is_pointer<T>::value;
+};
+
+/// This can be specialized to override the type deduction for IsMember.
+template <typename T> struct IsMemberType { using type = T; };
+
+/// The main custom type needed here is const char * should be a string.
+template <> struct IsMemberType<const char *> { using type = std::string; };
+
+namespace detail {
+
+// These are utilities for IsMember and other transforming objects
+
+/// Handy helper to access the element_type generically. This is not part of is_copyable_ptr because it requires that
+/// pointer_traits<T> be valid.
+
+/// not a pointer
+template <typename T, typename Enable = void> struct element_type { using type = T; };
+
+template <typename T> struct element_type<T, typename std::enable_if<is_copyable_ptr<T>::value>::type> {
+    using type = typename std::pointer_traits<T>::element_type;
+};
+
+/// Combination of the element type and value type - remove pointer (including smart pointers) and get the value_type of
+/// the container
+template <typename T> struct element_value_type { using type = typename element_type<T>::type::value_type; };
+
+/// Adaptor for set-like structure: This just wraps a normal container in a few utilities that do almost nothing.
+template <typename T, typename _ = void> struct pair_adaptor : std::false_type {
+    using value_type = typename T::value_type;
+    using first_type = typename std::remove_const<value_type>::type;
+    using second_type = typename std::remove_const<value_type>::type;
+
+    /// Get the first value (really just the underlying value)
+    template <typename Q> static auto first(Q &&pair_value) -> decltype(std::forward<Q>(pair_value)) {
+        return std::forward<Q>(pair_value);
+    }
+    /// Get the second value (really just the underlying value)
+    template <typename Q> static auto second(Q &&pair_value) -> decltype(std::forward<Q>(pair_value)) {
+        return std::forward<Q>(pair_value);
+    }
+};
+
+/// Adaptor for map-like structure (true version, must have key_type and mapped_type).
+/// This wraps a mapped container in a few utilities access it in a general way.
+template <typename T>
+struct pair_adaptor<
+    T,
+    conditional_t<false, void_t<typename T::value_type::first_type, typename T::value_type::second_type>, void>>
+    : std::true_type {
+    using value_type = typename T::value_type;
+    using first_type = typename std::remove_const<typename value_type::first_type>::type;
+    using second_type = typename std::remove_const<typename value_type::second_type>::type;
+
+    /// Get the first value (really just the underlying value)
+    template <typename Q> static auto first(Q &&pair_value) -> decltype(std::get<0>(std::forward<Q>(pair_value))) {
+        return std::get<0>(std::forward<Q>(pair_value));
+    }
+    /// Get the second value (really just the underlying value)
+    template <typename Q> static auto second(Q &&pair_value) -> decltype(std::get<1>(std::forward<Q>(pair_value))) {
+        return std::get<1>(std::forward<Q>(pair_value));
+    }
+};
+
+// Warning is suppressed due to "bug" in gcc<5.0 and gcc 7.0 with c++17 enabled that generates a Wnarrowing warning
+// in the unevaluated context even if the function that was using this wasn't used.  The standard says narrowing in
+// brace initialization shouldn't be allowed but for backwards compatibility gcc allows it in some contexts.  It is a
+// little fuzzy what happens in template constructs and I think that was something GCC took a little while to work out.
+// But regardless some versions of gcc generate a warning when they shouldn't from the following code so that should be
+// suppressed
+#ifdef __GNUC__
+#pragma GCC diagnostic push
+#pragma GCC diagnostic ignored "-Wnarrowing"
+#endif
+// check for constructibility from a specific type and copy assignable used in the parse detection
+template <typename T, typename C> class is_direct_constructible {
+    template <typename TT, typename CC>
+    static auto test(int, std::true_type) -> decltype(
+// NVCC warns about narrowing conversions here
+#ifdef __CUDACC__
+#pragma diag_suppress 2361
+#endif
+        TT { std::declval<CC>() }
+#ifdef __CUDACC__
+#pragma diag_default 2361
+#endif
+        ,
+        std::is_move_assignable<TT>());
+
+    template <typename TT, typename CC> static auto test(int, std::false_type) -> std::false_type;
+
+    template <typename, typename> static auto test(...) -> std::false_type;
+
+  public:
+    static constexpr bool value = decltype(test<T, C>(0, typename std::is_constructible<T, C>::type()))::value;
+};
+#ifdef __GNUC__
+#pragma GCC diagnostic pop
+#endif
+
+// Check for output streamability
+// Based on https://stackoverflow.com/questions/22758291/how-can-i-detect-if-a-type-can-be-streamed-to-an-stdostream
+
+template <typename T, typename S = std::ostringstream> class is_ostreamable {
+    template <typename TT, typename SS>
+    static auto test(int) -> decltype(std::declval<SS &>() << std::declval<TT>(), std::true_type());
+
+    template <typename, typename> static auto test(...) -> std::false_type;
+
+  public:
+    static constexpr bool value = decltype(test<T, S>(0))::value;
+};
+
+/// Check for input streamability
+template <typename T, typename S = std::istringstream> class is_istreamable {
+    template <typename TT, typename SS>
+    static auto test(int) -> decltype(std::declval<SS &>() >> std::declval<TT &>(), std::true_type());
+
+    template <typename, typename> static auto test(...) -> std::false_type;
+
+  public:
+    static constexpr bool value = decltype(test<T, S>(0))::value;
+};
+
+/// Check for complex
+template <typename T> class is_complex {
+    template <typename TT>
+    static auto test(int) -> decltype(std::declval<TT>().real(), std::declval<TT>().imag(), std::true_type());
+
+    template <typename> static auto test(...) -> std::false_type;
+
+  public:
+    static constexpr bool value = decltype(test<T>(0))::value;
+};
+
+/// Templated operation to get a value from a stream
+template <typename T, enable_if_t<is_istreamable<T>::value, detail::enabler> = detail::dummy>
+bool from_stream(const std::string &istring, T &obj) {
+    std::istringstream is;
+    is.str(istring);
+    is >> obj;
+    return !is.fail() && !is.rdbuf()->in_avail();
+}
+
+template <typename T, enable_if_t<!is_istreamable<T>::value, detail::enabler> = detail::dummy>
+bool from_stream(const std::string & /*istring*/, T & /*obj*/) {
+    return false;
+}
+
+// check to see if an object is a mutable container (fail by default)
+template <typename T, typename _ = void> struct is_mutable_container : std::false_type {};
+
+/// type trait to test if a type is a mutable container meaning it has a value_type, it has an iterator, a clear, and
+/// end methods and an insert function.  And for our purposes we exclude std::string and types that can be constructed
+/// from a std::string
+template <typename T>
+struct is_mutable_container<
+    T,
+    conditional_t<false,
+                  void_t<typename T::value_type,
+                         decltype(std::declval<T>().end()),
+                         decltype(std::declval<T>().clear()),
+                         decltype(std::declval<T>().insert(std::declval<decltype(std::declval<T>().end())>(),
+                                                           std::declval<const typename T::value_type &>()))>,
+                  void>>
+    : public conditional_t<std::is_constructible<T, std::string>::value, std::false_type, std::true_type> {};
+
+// check to see if an object is a mutable container (fail by default)
+template <typename T, typename _ = void> struct is_readable_container : std::false_type {};
+
+/// type trait to test if a type is a container meaning it has a value_type, it has an iterator, a clear, and an end
+/// methods and an insert function.  And for our purposes we exclude std::string and types that can be constructed from
+/// a std::string
+template <typename T>
+struct is_readable_container<
+    T,
+    conditional_t<false, void_t<decltype(std::declval<T>().end()), decltype(std::declval<T>().begin())>, void>>
+    : public std::true_type {};
+
+// check to see if an object is a wrapper (fail by default)
+template <typename T, typename _ = void> struct is_wrapper : std::false_type {};
+
+// check if an object is a wrapper (it has a value_type defined)
+template <typename T>
+struct is_wrapper<T, conditional_t<false, void_t<typename T::value_type>, void>> : public std::true_type {};
+
+// Check for tuple like types, as in classes with a tuple_size type trait
+template <typename S> class is_tuple_like {
+    template <typename SS>
+    // static auto test(int)
+    //     -> decltype(std::conditional<(std::tuple_size<SS>::value > 0), std::true_type, std::false_type>::type());
+    static auto test(int) -> decltype(std::tuple_size<typename std::decay<SS>::type>::value, std::true_type{});
+    template <typename> static auto test(...) -> std::false_type;
+
+  public:
+    static constexpr bool value = decltype(test<S>(0))::value;
+};
+
+/// Convert an object to a string (directly forward if this can become a string)
+template <typename T, enable_if_t<std::is_convertible<T, std::string>::value, detail::enabler> = detail::dummy>
+auto to_string(T &&value) -> decltype(std::forward<T>(value)) {
+    return std::forward<T>(value);
+}
+
+/// Construct a string from the object
+template <typename T,
+          enable_if_t<std::is_constructible<std::string, T>::value && !std::is_convertible<T, std::string>::value,
+                      detail::enabler> = detail::dummy>
+std::string to_string(const T &value) {
+    return std::string(value);
+}
+
+/// Convert an object to a string (streaming must be supported for that type)
+template <typename T,
+          enable_if_t<!std::is_convertible<std::string, T>::value && !std::is_constructible<std::string, T>::value &&
+                          is_ostreamable<T>::value,
+                      detail::enabler> = detail::dummy>
+std::string to_string(T &&value) {
+    std::stringstream stream;
+    stream << value;
+    return stream.str();
+}
+
+/// If conversion is not supported, return an empty string (streaming is not supported for that type)
+template <typename T,
+          enable_if_t<!std::is_constructible<std::string, T>::value && !is_ostreamable<T>::value &&
+                          !is_readable_container<typename std::remove_const<T>::type>::value,
+                      detail::enabler> = detail::dummy>
+std::string to_string(T &&) {
+    return std::string{};
+}
+
+/// convert a readable container to a string
+template <typename T,
+          enable_if_t<!std::is_constructible<std::string, T>::value && !is_ostreamable<T>::value &&
+                          is_readable_container<T>::value,
+                      detail::enabler> = detail::dummy>
+std::string to_string(T &&variable) {
+    std::vector<std::string> defaults;
+    auto cval = variable.begin();
+    auto end = variable.end();
+    while(cval != end) {
+        defaults.emplace_back(CLI::detail::to_string(*cval));
+        ++cval;
+    }
+    return std::string("[" + detail::join(defaults) + "]");
+}
+
+/// special template overload
+template <typename T1,
+          typename T2,
+          typename T,
+          enable_if_t<std::is_same<T1, T2>::value, detail::enabler> = detail::dummy>
+auto checked_to_string(T &&value) -> decltype(to_string(std::forward<T>(value))) {
+    return to_string(std::forward<T>(value));
+}
+
+/// special template overload
+template <typename T1,
+          typename T2,
+          typename T,
+          enable_if_t<!std::is_same<T1, T2>::value, detail::enabler> = detail::dummy>
+std::string checked_to_string(T &&) {
+    return std::string{};
+}
+/// get a string as a convertible value for arithmetic types
+template <typename T, enable_if_t<std::is_arithmetic<T>::value, detail::enabler> = detail::dummy>
+std::string value_string(const T &value) {
+    return std::to_string(value);
+}
+/// get a string as a convertible value for enumerations
+template <typename T, enable_if_t<std::is_enum<T>::value, detail::enabler> = detail::dummy>
+std::string value_string(const T &value) {
+    return std::to_string(static_cast<typename std::underlying_type<T>::type>(value));
+}
+/// for other types just use the regular to_string function
+template <typename T,
+          enable_if_t<!std::is_enum<T>::value && !std::is_arithmetic<T>::value, detail::enabler> = detail::dummy>
+auto value_string(const T &value) -> decltype(to_string(value)) {
+    return to_string(value);
+}
+
+/// template to get the underlying value type if it exists or use a default
+template <typename T, typename def, typename Enable = void> struct wrapped_type { using type = def; };
+
+/// Type size for regular object types that do not look like a tuple
+template <typename T, typename def> struct wrapped_type<T, def, typename std::enable_if<is_wrapper<T>::value>::type> {
+    using type = typename T::value_type;
+};
+
+/// This will only trigger for actual void type
+template <typename T, typename Enable = void> struct type_count_base { static const int value{0}; };
+
+/// Type size for regular object types that do not look like a tuple
+template <typename T>
+struct type_count_base<T,
+                       typename std::enable_if<!is_tuple_like<T>::value && !is_mutable_container<T>::value &&
+                                               !std::is_void<T>::value>::type> {
+    static constexpr int value{1};
+};
+
+/// the base tuple size
+template <typename T>
+struct type_count_base<T, typename std::enable_if<is_tuple_like<T>::value && !is_mutable_container<T>::value>::type> {
+    static constexpr int value{std::tuple_size<T>::value};
+};
+
+/// Type count base for containers is the type_count_base of the individual element
+template <typename T> struct type_count_base<T, typename std::enable_if<is_mutable_container<T>::value>::type> {
+    static constexpr int value{type_count_base<typename T::value_type>::value};
+};
+
+/// Set of overloads to get the type size of an object
+
+/// forward declare the subtype_count structure
+template <typename T> struct subtype_count;
+
+/// forward declare the subtype_count_min structure
+template <typename T> struct subtype_count_min;
+
+/// This will only trigger for actual void type
+template <typename T, typename Enable = void> struct type_count { static const int value{0}; };
+
+/// Type size for regular object types that do not look like a tuple
+template <typename T>
+struct type_count<T,
+                  typename std::enable_if<!is_wrapper<T>::value && !is_tuple_like<T>::value && !is_complex<T>::value &&
+                                          !std::is_void<T>::value>::type> {
+    static constexpr int value{1};
+};
+
+/// Type size for complex since it sometimes looks like a wrapper
+template <typename T> struct type_count<T, typename std::enable_if<is_complex<T>::value>::type> {
+    static constexpr int value{2};
+};
+
+/// Type size of types that are wrappers,except complex and tuples(which can also be wrappers sometimes)
+template <typename T> struct type_count<T, typename std::enable_if<is_mutable_container<T>::value>::type> {
+    static constexpr int value{subtype_count<typename T::value_type>::value};
+};
+
+/// Type size of types that are wrappers,except containers complex and tuples(which can also be wrappers sometimes)
+template <typename T>
+struct type_count<T,
+                  typename std::enable_if<is_wrapper<T>::value && !is_complex<T>::value && !is_tuple_like<T>::value &&
+                                          !is_mutable_container<T>::value>::type> {
+    static constexpr int value{type_count<typename T::value_type>::value};
+};
+
+/// 0 if the index > tuple size
+template <typename T, std::size_t I>
+constexpr typename std::enable_if<I == type_count_base<T>::value, int>::type tuple_type_size() {
+    return 0;
+}
+
+/// Recursively generate the tuple type name
+template <typename T, std::size_t I>
+    constexpr typename std::enable_if < I<type_count_base<T>::value, int>::type tuple_type_size() {
+    return subtype_count<typename std::tuple_element<I, T>::type>::value + tuple_type_size<T, I + 1>();
+}
+
+/// Get the type size of the sum of type sizes for all the individual tuple types
+template <typename T> struct type_count<T, typename std::enable_if<is_tuple_like<T>::value>::type> {
+    static constexpr int value{tuple_type_size<T, 0>()};
+};
+
+/// definition of subtype count
+template <typename T> struct subtype_count {
+    static constexpr int value{is_mutable_container<T>::value ? expected_max_vector_size : type_count<T>::value};
+};
+
+/// This will only trigger for actual void type
+template <typename T, typename Enable = void> struct type_count_min { static const int value{0}; };
+
+/// Type size for regular object types that do not look like a tuple
+template <typename T>
+struct type_count_min<
+    T,
+    typename std::enable_if<!is_mutable_container<T>::value && !is_tuple_like<T>::value && !is_wrapper<T>::value &&
+                            !is_complex<T>::value && !std::is_void<T>::value>::type> {
+    static constexpr int value{type_count<T>::value};
+};
+
+/// Type size for complex since it sometimes looks like a wrapper
+template <typename T> struct type_count_min<T, typename std::enable_if<is_complex<T>::value>::type> {
+    static constexpr int value{1};
+};
+
+/// Type size min of types that are wrappers,except complex and tuples(which can also be wrappers sometimes)
+template <typename T>
+struct type_count_min<
+    T,
+    typename std::enable_if<is_wrapper<T>::value && !is_complex<T>::value && !is_tuple_like<T>::value>::type> {
+    static constexpr int value{subtype_count_min<typename T::value_type>::value};
+};
+
+/// 0 if the index > tuple size
+template <typename T, std::size_t I>
+constexpr typename std::enable_if<I == type_count_base<T>::value, int>::type tuple_type_size_min() {
+    return 0;
+}
+
+/// Recursively generate the tuple type name
+template <typename T, std::size_t I>
+    constexpr typename std::enable_if < I<type_count_base<T>::value, int>::type tuple_type_size_min() {
+    return subtype_count_min<typename std::tuple_element<I, T>::type>::value + tuple_type_size_min<T, I + 1>();
+}
+
+/// Get the type size of the sum of type sizes for all the individual tuple types
+template <typename T> struct type_count_min<T, typename std::enable_if<is_tuple_like<T>::value>::type> {
+    static constexpr int value{tuple_type_size_min<T, 0>()};
+};
+
+/// definition of subtype count
+template <typename T> struct subtype_count_min {
+    static constexpr int value{is_mutable_container<T>::value
+                                   ? ((type_count<T>::value < expected_max_vector_size) ? type_count<T>::value : 0)
+                                   : type_count_min<T>::value};
+};
+
+/// This will only trigger for actual void type
+template <typename T, typename Enable = void> struct expected_count { static const int value{0}; };
+
+/// For most types the number of expected items is 1
+template <typename T>
+struct expected_count<T,
+                      typename std::enable_if<!is_mutable_container<T>::value && !is_wrapper<T>::value &&
+                                              !std::is_void<T>::value>::type> {
+    static constexpr int value{1};
+};
+/// number of expected items in a vector
+template <typename T> struct expected_count<T, typename std::enable_if<is_mutable_container<T>::value>::type> {
+    static constexpr int value{expected_max_vector_size};
+};
+
+/// number of expected items in a vector
+template <typename T>
+struct expected_count<T, typename std::enable_if<!is_mutable_container<T>::value && is_wrapper<T>::value>::type> {
+    static constexpr int value{expected_count<typename T::value_type>::value};
+};
+
+// Enumeration of the different supported categorizations of objects
+enum class object_category : int {
+    char_value = 1,
+    integral_value = 2,
+    unsigned_integral = 4,
+    enumeration = 6,
+    boolean_value = 8,
+    floating_point = 10,
+    number_constructible = 12,
+    double_constructible = 14,
+    integer_constructible = 16,
+    // string like types
+    string_assignable = 23,
+    string_constructible = 24,
+    other = 45,
+    // special wrapper or container types
+    wrapper_value = 50,
+    complex_number = 60,
+    tuple_value = 70,
+    container_value = 80,
+
+};
+
+/// Set of overloads to classify an object according to type
+
+/// some type that is not otherwise recognized
+template <typename T, typename Enable = void> struct classify_object {
+    static constexpr object_category value{object_category::other};
+};
+
+/// Signed integers
+template <typename T>
+struct classify_object<
+    T,
+    typename std::enable_if<std::is_integral<T>::value && !std::is_same<T, char>::value && std::is_signed<T>::value &&
+                            !is_bool<T>::value && !std::is_enum<T>::value>::type> {
+    static constexpr object_category value{object_category::integral_value};
+};
+
+/// Unsigned integers
+template <typename T>
+struct classify_object<T,
+                       typename std::enable_if<std::is_integral<T>::value && std::is_unsigned<T>::value &&
+                                               !std::is_same<T, char>::value && !is_bool<T>::value>::type> {
+    static constexpr object_category value{object_category::unsigned_integral};
+};
+
+/// single character values
+template <typename T>
+struct classify_object<T, typename std::enable_if<std::is_same<T, char>::value && !std::is_enum<T>::value>::type> {
+    static constexpr object_category value{object_category::char_value};
+};
+
+/// Boolean values
+template <typename T> struct classify_object<T, typename std::enable_if<is_bool<T>::value>::type> {
+    static constexpr object_category value{object_category::boolean_value};
+};
+
+/// Floats
+template <typename T> struct classify_object<T, typename std::enable_if<std::is_floating_point<T>::value>::type> {
+    static constexpr object_category value{object_category::floating_point};
+};
+
+/// String and similar direct assignment
+template <typename T>
+struct classify_object<T,
+                       typename std::enable_if<!std::is_floating_point<T>::value && !std::is_integral<T>::value &&
+                                               std::is_assignable<T &, std::string>::value>::type> {
+    static constexpr object_category value{object_category::string_assignable};
+};
+
+/// String and similar constructible and copy assignment
+template <typename T>
+struct classify_object<
+    T,
+    typename std::enable_if<!std::is_floating_point<T>::value && !std::is_integral<T>::value &&
+                            !std::is_assignable<T &, std::string>::value && (type_count<T>::value == 1) &&
+                            std::is_constructible<T, std::string>::value>::type> {
+    static constexpr object_category value{object_category::string_constructible};
+};
+
+/// Enumerations
+template <typename T> struct classify_object<T, typename std::enable_if<std::is_enum<T>::value>::type> {
+    static constexpr object_category value{object_category::enumeration};
+};
+
+template <typename T> struct classify_object<T, typename std::enable_if<is_complex<T>::value>::type> {
+    static constexpr object_category value{object_category::complex_number};
+};
+
+/// Handy helper to contain a bunch of checks that rule out many common types (integers, string like, floating point,
+/// vectors, and enumerations
+template <typename T> struct uncommon_type {
+    using type = typename std::conditional<!std::is_floating_point<T>::value && !std::is_integral<T>::value &&
+                                               !std::is_assignable<T &, std::string>::value &&
+                                               !std::is_constructible<T, std::string>::value && !is_complex<T>::value &&
+                                               !is_mutable_container<T>::value && !std::is_enum<T>::value,
+                                           std::true_type,
+                                           std::false_type>::type;
+    static constexpr bool value = type::value;
+};
+
+/// wrapper type
+template <typename T>
+struct classify_object<T,
+                       typename std::enable_if<(!is_mutable_container<T>::value && is_wrapper<T>::value &&
+                                                !is_tuple_like<T>::value && uncommon_type<T>::value)>::type> {
+    static constexpr object_category value{object_category::wrapper_value};
+};
+
+/// Assignable from double or int
+template <typename T>
+struct classify_object<T,
+                       typename std::enable_if<uncommon_type<T>::value && type_count<T>::value == 1 &&
+                                               !is_wrapper<T>::value && is_direct_constructible<T, double>::value &&
+                                               is_direct_constructible<T, int>::value>::type> {
+    static constexpr object_category value{object_category::number_constructible};
+};
+
+/// Assignable from int
+template <typename T>
+struct classify_object<T,
+                       typename std::enable_if<uncommon_type<T>::value && type_count<T>::value == 1 &&
+                                               !is_wrapper<T>::value && !is_direct_constructible<T, double>::value &&
+                                               is_direct_constructible<T, int>::value>::type> {
+    static constexpr object_category value{object_category::integer_constructible};
+};
+
+/// Assignable from double
+template <typename T>
+struct classify_object<T,
+                       typename std::enable_if<uncommon_type<T>::value && type_count<T>::value == 1 &&
+                                               !is_wrapper<T>::value && is_direct_constructible<T, double>::value &&
+                                               !is_direct_constructible<T, int>::value>::type> {
+    static constexpr object_category value{object_category::double_constructible};
+};
+
+/// Tuple type
+template <typename T>
+struct classify_object<
+    T,
+    typename std::enable_if<is_tuple_like<T>::value &&
+                            ((type_count<T>::value >= 2 && !is_wrapper<T>::value) ||
+                             (uncommon_type<T>::value && !is_direct_constructible<T, double>::value &&
+                              !is_direct_constructible<T, int>::value))>::type> {
+    static constexpr object_category value{object_category::tuple_value};
+    // the condition on this class requires it be like a tuple, but on some compilers (like Xcode) tuples can be
+    // constructed from just the first element so tuples of <string, int,int> can be constructed from a string, which
+    // could lead to issues so there are two variants of the condition, the first isolates things with a type size >=2
+    // mainly to get tuples on Xcode with the exception of wrappers, the second is the main one and just separating out
+    // those cases that are caught by other object classifications
+};
+
+/// container type
+template <typename T> struct classify_object<T, typename std::enable_if<is_mutable_container<T>::value>::type> {
+    static constexpr object_category value{object_category::container_value};
+};
+
+// Type name print
+
+/// Was going to be based on
+///  http://stackoverflow.com/questions/1055452/c-get-name-of-type-in-template
+/// But this is cleaner and works better in this case
+
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::char_value, detail::enabler> = detail::dummy>
+constexpr const char *type_name() {
+    return "CHAR";
+}
+
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::integral_value ||
+                          classify_object<T>::value == object_category::integer_constructible,
+                      detail::enabler> = detail::dummy>
+constexpr const char *type_name() {
+    return "INT";
+}
+
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::unsigned_integral, detail::enabler> = detail::dummy>
+constexpr const char *type_name() {
+    return "UINT";
+}
+
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::floating_point ||
+                          classify_object<T>::value == object_category::number_constructible ||
+                          classify_object<T>::value == object_category::double_constructible,
+                      detail::enabler> = detail::dummy>
+constexpr const char *type_name() {
+    return "FLOAT";
+}
+
+/// Print name for enumeration types
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::enumeration, detail::enabler> = detail::dummy>
+constexpr const char *type_name() {
+    return "ENUM";
+}
+
+/// Print name for enumeration types
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::boolean_value, detail::enabler> = detail::dummy>
+constexpr const char *type_name() {
+    return "BOOLEAN";
+}
+
+/// Print name for enumeration types
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::complex_number, detail::enabler> = detail::dummy>
+constexpr const char *type_name() {
+    return "COMPLEX";
+}
+
+/// Print for all other types
+template <typename T,
+          enable_if_t<classify_object<T>::value >= object_category::string_assignable &&
+                          classify_object<T>::value <= object_category::other,
+                      detail::enabler> = detail::dummy>
+constexpr const char *type_name() {
+    return "TEXT";
+}
+/// typename for tuple value
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::tuple_value && type_count_base<T>::value >= 2,
+                      detail::enabler> = detail::dummy>
+std::string type_name();  // forward declaration
+
+/// Generate type name for a wrapper or container value
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::container_value ||
+                          classify_object<T>::value == object_category::wrapper_value,
+                      detail::enabler> = detail::dummy>
+std::string type_name();  // forward declaration
+
+/// Print name for single element tuple types
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::tuple_value && type_count_base<T>::value == 1,
+                      detail::enabler> = detail::dummy>
+inline std::string type_name() {
+    return type_name<typename std::decay<typename std::tuple_element<0, T>::type>::type>();
+}
+
+/// Empty string if the index > tuple size
+template <typename T, std::size_t I>
+inline typename std::enable_if<I == type_count_base<T>::value, std::string>::type tuple_name() {
+    return std::string{};
+}
+
+/// Recursively generate the tuple type name
+template <typename T, std::size_t I>
+inline typename std::enable_if<(I < type_count_base<T>::value), std::string>::type tuple_name() {
+    std::string str = std::string(type_name<typename std::decay<typename std::tuple_element<I, T>::type>::type>()) +
+                      ',' + tuple_name<T, I + 1>();
+    if(str.back() == ',')
+        str.pop_back();
+    return str;
+}
+
+/// Print type name for tuples with 2 or more elements
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::tuple_value && type_count_base<T>::value >= 2,
+                      detail::enabler>>
+inline std::string type_name() {
+    auto tname = std::string(1, '[') + tuple_name<T, 0>();
+    tname.push_back(']');
+    return tname;
+}
+
+/// get the type name for a type that has a value_type member
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::container_value ||
+                          classify_object<T>::value == object_category::wrapper_value,
+                      detail::enabler>>
+inline std::string type_name() {
+    return type_name<typename T::value_type>();
+}
+
+// Lexical cast
+
+/// Convert to an unsigned integral
+template <typename T, enable_if_t<std::is_unsigned<T>::value, detail::enabler> = detail::dummy>
+bool integral_conversion(const std::string &input, T &output) noexcept {
+    if(input.empty()) {
+        return false;
+    }
+    char *val = nullptr;
+    std::uint64_t output_ll = std::strtoull(input.c_str(), &val, 0);
+    output = static_cast<T>(output_ll);
+    return val == (input.c_str() + input.size()) && static_cast<std::uint64_t>(output) == output_ll;
+}
+
+/// Convert to a signed integral
+template <typename T, enable_if_t<std::is_signed<T>::value, detail::enabler> = detail::dummy>
+bool integral_conversion(const std::string &input, T &output) noexcept {
+    if(input.empty()) {
+        return false;
+    }
+    char *val = nullptr;
+    std::int64_t output_ll = std::strtoll(input.c_str(), &val, 0);
+    output = static_cast<T>(output_ll);
+    return val == (input.c_str() + input.size()) && static_cast<std::int64_t>(output) == output_ll;
+}
+
+/// Convert a flag into an integer value  typically binary flags
+inline std::int64_t to_flag_value(std::string val) {
+    static const std::string trueString("true");
+    static const std::string falseString("false");
+    if(val == trueString) {
+        return 1;
+    }
+    if(val == falseString) {
+        return -1;
+    }
+    val = detail::to_lower(val);
+    std::int64_t ret;
+    if(val.size() == 1) {
+        if(val[0] >= '1' && val[0] <= '9') {
+            return (static_cast<std::int64_t>(val[0]) - '0');
+        }
+        switch(val[0]) {
+        case '0':
+        case 'f':
+        case 'n':
+        case '-':
+            ret = -1;
+            break;
+        case 't':
+        case 'y':
+        case '+':
+            ret = 1;
+            break;
+        default:
+            throw std::invalid_argument("unrecognized character");
+        }
+        return ret;
+    }
+    if(val == trueString || val == "on" || val == "yes" || val == "enable") {
+        ret = 1;
+    } else if(val == falseString || val == "off" || val == "no" || val == "disable") {
+        ret = -1;
+    } else {
+        ret = std::stoll(val);
+    }
+    return ret;
+}
+
+/// Integer conversion
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::integral_value ||
+                          classify_object<T>::value == object_category::unsigned_integral,
+                      detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    return integral_conversion(input, output);
+}
+
+/// char values
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::char_value, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    if(input.size() == 1) {
+        output = static_cast<T>(input[0]);
+        return true;
+    }
+    return integral_conversion(input, output);
+}
+
+/// Boolean values
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::boolean_value, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    try {
+        auto out = to_flag_value(input);
+        output = (out > 0);
+        return true;
+    } catch(const std::invalid_argument &) {
+        return false;
+    } catch(const std::out_of_range &) {
+        // if the number is out of the range of a 64 bit value then it is still a number and for this purpose is still
+        // valid all we care about the sign
+        output = (input[0] != '-');
+        return true;
+    }
+}
+
+/// Floats
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::floating_point, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    if(input.empty()) {
+        return false;
+    }
+    char *val = nullptr;
+    auto output_ld = std::strtold(input.c_str(), &val);
+    output = static_cast<T>(output_ld);
+    return val == (input.c_str() + input.size());
+}
+
+/// complex
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::complex_number, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    using XC = typename wrapped_type<T, double>::type;
+    XC x{0.0}, y{0.0};
+    auto str1 = input;
+    bool worked = false;
+    auto nloc = str1.find_last_of("+-");
+    if(nloc != std::string::npos && nloc > 0) {
+        worked = detail::lexical_cast(str1.substr(0, nloc), x);
+        str1 = str1.substr(nloc);
+        if(str1.back() == 'i' || str1.back() == 'j')
+            str1.pop_back();
+        worked = worked && detail::lexical_cast(str1, y);
+    } else {
+        if(str1.back() == 'i' || str1.back() == 'j') {
+            str1.pop_back();
+            worked = detail::lexical_cast(str1, y);
+            x = XC{0};
+        } else {
+            worked = detail::lexical_cast(str1, x);
+            y = XC{0};
+        }
+    }
+    if(worked) {
+        output = T{x, y};
+        return worked;
+    }
+    return from_stream(input, output);
+}
+
+/// String and similar direct assignment
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::string_assignable, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    output = input;
+    return true;
+}
+
+/// String and similar constructible and copy assignment
+template <
+    typename T,
+    enable_if_t<classify_object<T>::value == object_category::string_constructible, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    output = T(input);
+    return true;
+}
+
+/// Enumerations
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::enumeration, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    typename std::underlying_type<T>::type val;
+    if(!integral_conversion(input, val)) {
+        return false;
+    }
+    output = static_cast<T>(val);
+    return true;
+}
+
+/// wrapper types
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::wrapper_value &&
+                          std::is_assignable<T &, typename T::value_type>::value,
+                      detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    typename T::value_type val;
+    if(lexical_cast(input, val)) {
+        output = val;
+        return true;
+    }
+    return from_stream(input, output);
+}
+
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::wrapper_value &&
+                          !std::is_assignable<T &, typename T::value_type>::value && std::is_assignable<T &, T>::value,
+                      detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    typename T::value_type val;
+    if(lexical_cast(input, val)) {
+        output = T{val};
+        return true;
+    }
+    return from_stream(input, output);
+}
+
+/// Assignable from double or int
+template <
+    typename T,
+    enable_if_t<classify_object<T>::value == object_category::number_constructible, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    int val;
+    if(integral_conversion(input, val)) {
+        output = T(val);
+        return true;
+    } else {
+        double dval;
+        if(lexical_cast(input, dval)) {
+            output = T{dval};
+            return true;
+        }
+    }
+    return from_stream(input, output);
+}
+
+/// Assignable from int
+template <
+    typename T,
+    enable_if_t<classify_object<T>::value == object_category::integer_constructible, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    int val;
+    if(integral_conversion(input, val)) {
+        output = T(val);
+        return true;
+    }
+    return from_stream(input, output);
+}
+
+/// Assignable from double
+template <
+    typename T,
+    enable_if_t<classify_object<T>::value == object_category::double_constructible, detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    double val;
+    if(lexical_cast(input, val)) {
+        output = T{val};
+        return true;
+    }
+    return from_stream(input, output);
+}
+
+/// Non-string convertible from an int
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::other && std::is_assignable<T &, int>::value,
+                      detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    int val;
+    if(integral_conversion(input, val)) {
+#ifdef _MSC_VER
+#pragma warning(push)
+#pragma warning(disable : 4800)
+#endif
+        // with Atomic<XX> this could produce a warning due to the conversion but if atomic gets here it is an old style
+        // so will most likely still work
+        output = val;
+#ifdef _MSC_VER
+#pragma warning(pop)
+#endif
+        return true;
+    }
+    // LCOV_EXCL_START
+    // This version of cast is only used for odd cases in an older compilers the fail over
+    // from_stream is tested elsewhere an not relevant for coverage here
+    return from_stream(input, output);
+    // LCOV_EXCL_STOP
+}
+
+/// Non-string parsable by a stream
+template <typename T,
+          enable_if_t<classify_object<T>::value == object_category::other && !std::is_assignable<T &, int>::value,
+                      detail::enabler> = detail::dummy>
+bool lexical_cast(const std::string &input, T &output) {
+    static_assert(is_istreamable<T>::value,
+                  "option object type must have a lexical cast overload or streaming input operator(>>) defined, if it "
+                  "is convertible from another type use the add_option<T, XC>(...) with XC being the known type");
+    return from_stream(input, output);
+}
+
+/// Assign a value through lexical cast operations
+/// Strings can be empty so we need to do a little different
+template <typename AssignTo,
+          typename ConvertTo,
+          enable_if_t<std::is_same<AssignTo, ConvertTo>::value &&
+                          (classify_object<AssignTo>::value == object_category::string_assignable ||
+                           classify_object<AssignTo>::value == object_category::string_constructible),
+                      detail::enabler> = detail::dummy>
+bool lexical_assign(const std::string &input, AssignTo &output) {
+    return lexical_cast(input, output);
+}
+
+/// Assign a value through lexical cast operations
+template <typename AssignTo,
+          typename ConvertTo,
+          enable_if_t<std::is_same<AssignTo, ConvertTo>::value && std::is_assignable<AssignTo &, AssignTo>::value &&
+                          classify_object<AssignTo>::value != object_category::string_assignable &&
+                          classify_object<AssignTo>::value != object_category::string_constructible,
+                      detail::enabler> = detail::dummy>
+bool lexical_assign(const std::string &input, AssignTo &output) {
+    if(input.empty()) {
+        output = AssignTo{};
+        return true;
+    }
+
+    return lexical_cast(input, output);
+}
+
+/// Assign a value through lexical cast operations
+template <typename AssignTo,
+          typename ConvertTo,
+          enable_if_t<std::is_same<AssignTo, ConvertTo>::value && !std::is_assignable<AssignTo &, AssignTo>::value &&
+                          classify_object<AssignTo>::value == object_category::wrapper_value,
+                      detail::enabler> = detail::dummy>
+bool lexical_assign(const std::string &input, AssignTo &output) {
+    if(input.empty()) {
+        typename AssignTo::value_type emptyVal{};
+        output = emptyVal;
+        return true;
+    }
+    return lexical_cast(input, output);
+}
+
+/// Assign a value through lexical cast operations for int compatible values
+/// mainly for atomic operations on some compilers
+template <typename AssignTo,
+          typename ConvertTo,
+          enable_if_t<std::is_same<AssignTo, ConvertTo>::value && !std::is_assignable<AssignTo &, AssignTo>::value &&
+                          classify_object<AssignTo>::value != object_category::wrapper_value &&
+                          std::is_assignable<AssignTo &, int>::value,
+                      detail::enabler> = detail::dummy>
+bool lexical_assign(const std::string &input, AssignTo &output) {
+    if(input.empty()) {
+        output = 0;
+        return true;
+    }
+    int val;
+    if(lexical_cast(input, val)) {
+        output = val;
+        return true;
+    }
+    return false;
+}
+
+/// Assign a value converted from a string in lexical cast to the output value directly
+template <typename AssignTo,
+          typename ConvertTo,
+          enable_if_t<!std::is_same<AssignTo, ConvertTo>::value && std::is_assignable<AssignTo &, ConvertTo &>::value,
+                      detail::enabler> = detail::dummy>
+bool lexical_assign(const std::string &input, AssignTo &output) {
+    ConvertTo val{};
+    bool parse_result = (!input.empty()) ? lexical_cast<ConvertTo>(input, val) : true;
+    if(parse_result) {
+        output = val;
+    }
+    return parse_result;
+}
+
+/// Assign a value from a lexical cast through constructing a value and move assigning it
+template <
+    typename AssignTo,
+    typename ConvertTo,
+    enable_if_t<!std::is_same<AssignTo, ConvertTo>::value && !std::is_assignable<AssignTo &, ConvertTo &>::value &&
+                    std::is_move_assignable<AssignTo>::value,
+                detail::enabler> = detail::dummy>
+bool lexical_assign(const std::string &input, AssignTo &output) {
+    ConvertTo val{};
+    bool parse_result = input.empty() ? true : lexical_cast<ConvertTo>(input, val);
+    if(parse_result) {
+        output = AssignTo(val);  // use () form of constructor to allow some implicit conversions
+    }
+    return parse_result;
+}
+
+/// primary lexical conversion operation, 1 string to 1 type of some kind
+template <typename AssignTo,
+          typename ConvertTo,
+          enable_if_t<classify_object<ConvertTo>::value <= object_category::other &&
+                          classify_object<AssignTo>::value <= object_category::wrapper_value,
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std ::string> &strings, AssignTo &output) {
+    return lexical_assign<AssignTo, ConvertTo>(strings[0], output);
+}
+
+/// Lexical conversion if there is only one element but the conversion type is for two, then call a two element
+/// constructor
+template <typename AssignTo,
+          typename ConvertTo,
+          enable_if_t<(type_count<AssignTo>::value <= 2) && expected_count<AssignTo>::value == 1 &&
+                          is_tuple_like<ConvertTo>::value && type_count_base<ConvertTo>::value == 2,
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std ::string> &strings, AssignTo &output) {
+    // the remove const is to handle pair types coming from a container
+    typename std::remove_const<typename std::tuple_element<0, ConvertTo>::type>::type v1;
+    typename std::tuple_element<1, ConvertTo>::type v2;
+    bool retval = lexical_assign<decltype(v1), decltype(v1)>(strings[0], v1);
+    if(strings.size() > 1) {
+        retval = retval && lexical_assign<decltype(v2), decltype(v2)>(strings[1], v2);
+    }
+    if(retval) {
+        output = AssignTo{v1, v2};
+    }
+    return retval;
+}
+
+/// Lexical conversion of a container types of single elements
+template <class AssignTo,
+          class ConvertTo,
+          enable_if_t<is_mutable_container<AssignTo>::value && is_mutable_container<ConvertTo>::value &&
+                          type_count<ConvertTo>::value == 1,
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std ::string> &strings, AssignTo &output) {
+    output.erase(output.begin(), output.end());
+    for(const auto &elem : strings) {
+        typename AssignTo::value_type out;
+        bool retval = lexical_assign<typename AssignTo::value_type, typename ConvertTo::value_type>(elem, out);
+        if(!retval) {
+            return false;
+        }
+        output.insert(output.end(), std::move(out));
+    }
+    return (!output.empty());
+}
+
+/// Lexical conversion for complex types
+template <class AssignTo, class ConvertTo, enable_if_t<is_complex<ConvertTo>::value, detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std::string> &strings, AssignTo &output) {
+
+    if(strings.size() >= 2 && !strings[1].empty()) {
+        using XC2 = typename wrapped_type<ConvertTo, double>::type;
+        XC2 x{0.0}, y{0.0};
+        auto str1 = strings[1];
+        if(str1.back() == 'i' || str1.back() == 'j') {
+            str1.pop_back();
+        }
+        auto worked = detail::lexical_cast(strings[0], x) && detail::lexical_cast(str1, y);
+        if(worked) {
+            output = ConvertTo{x, y};
+        }
+        return worked;
+    } else {
+        return lexical_assign<AssignTo, ConvertTo>(strings[0], output);
+    }
+}
+
+/// Conversion to a vector type using a particular single type as the conversion type
+template <class AssignTo,
+          class ConvertTo,
+          enable_if_t<is_mutable_container<AssignTo>::value && (expected_count<ConvertTo>::value == 1) &&
+                          (type_count<ConvertTo>::value == 1),
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std ::string> &strings, AssignTo &output) {
+    bool retval = true;
+    output.clear();
+    output.reserve(strings.size());
+    for(const auto &elem : strings) {
+
+        output.emplace_back();
+        retval = retval && lexical_assign<typename AssignTo::value_type, ConvertTo>(elem, output.back());
+    }
+    return (!output.empty()) && retval;
+}
+
+// forward declaration
+
+/// Lexical conversion of a container types with conversion type of two elements
+template <class AssignTo,
+          class ConvertTo,
+          enable_if_t<is_mutable_container<AssignTo>::value && is_mutable_container<ConvertTo>::value &&
+                          type_count_base<ConvertTo>::value == 2,
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(std::vector<std::string> strings, AssignTo &output);
+
+/// Lexical conversion of a vector types with type_size >2 forward declaration
+template <class AssignTo,
+          class ConvertTo,
+          enable_if_t<is_mutable_container<AssignTo>::value && is_mutable_container<ConvertTo>::value &&
+                          type_count_base<ConvertTo>::value != 2 &&
+                          ((type_count<ConvertTo>::value > 2) ||
+                           (type_count<ConvertTo>::value > type_count_base<ConvertTo>::value)),
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std::string> &strings, AssignTo &output);
+
+/// Conversion for tuples
+template <class AssignTo,
+          class ConvertTo,
+          enable_if_t<is_tuple_like<AssignTo>::value && is_tuple_like<ConvertTo>::value &&
+                          (type_count_base<ConvertTo>::value != type_count<ConvertTo>::value ||
+                           type_count<ConvertTo>::value > 2),
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std::string> &strings, AssignTo &output);  // forward declaration
+
+/// Conversion for operations where the assigned type is some class but the conversion is a mutable container or large
+/// tuple
+template <typename AssignTo,
+          typename ConvertTo,
+          enable_if_t<!is_tuple_like<AssignTo>::value && !is_mutable_container<AssignTo>::value &&
+                          classify_object<ConvertTo>::value != object_category::wrapper_value &&
+                          (is_mutable_container<ConvertTo>::value || type_count<ConvertTo>::value > 2),
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std ::string> &strings, AssignTo &output) {
+
+    if(strings.size() > 1 || (!strings.empty() && !(strings.front().empty()))) {
+        ConvertTo val;
+        auto retval = lexical_conversion<ConvertTo, ConvertTo>(strings, val);
+        output = AssignTo{val};
+        return retval;
+    }
+    output = AssignTo{};
+    return true;
+}
+
+/// function template for converting tuples if the static Index is greater than the tuple size
+template <class AssignTo, class ConvertTo, std::size_t I>
+inline typename std::enable_if<(I >= type_count_base<AssignTo>::value), bool>::type
+tuple_conversion(const std::vector<std::string> &, AssignTo &) {
+    return true;
+}
+
+/// Conversion of a tuple element where the type size ==1 and not a mutable container
+template <class AssignTo, class ConvertTo>
+inline typename std::enable_if<!is_mutable_container<ConvertTo>::value && type_count<ConvertTo>::value == 1, bool>::type
+tuple_type_conversion(std::vector<std::string> &strings, AssignTo &output) {
+    auto retval = lexical_assign<AssignTo, ConvertTo>(strings[0], output);
+    strings.erase(strings.begin());
+    return retval;
+}
+
+/// Conversion of a tuple element where the type size !=1 but the size is fixed and not a mutable container
+template <class AssignTo, class ConvertTo>
+inline typename std::enable_if<!is_mutable_container<ConvertTo>::value && (type_count<ConvertTo>::value > 1) &&
+                                   type_count<ConvertTo>::value == type_count_min<ConvertTo>::value,
+                               bool>::type
+tuple_type_conversion(std::vector<std::string> &strings, AssignTo &output) {
+    auto retval = lexical_conversion<AssignTo, ConvertTo>(strings, output);
+    strings.erase(strings.begin(), strings.begin() + type_count<ConvertTo>::value);
+    return retval;
+}
+
+/// Conversion of a tuple element where the type is a mutable container or a type with different min and max type sizes
+template <class AssignTo, class ConvertTo>
+inline typename std::enable_if<is_mutable_container<ConvertTo>::value ||
+                                   type_count<ConvertTo>::value != type_count_min<ConvertTo>::value,
+                               bool>::type
+tuple_type_conversion(std::vector<std::string> &strings, AssignTo &output) {
+
+    std::size_t index{subtype_count_min<ConvertTo>::value};
+    const std::size_t mx_count{subtype_count<ConvertTo>::value};
+    const std::size_t mx{(std::max)(mx_count, strings.size())};
+
+    while(index < mx) {
+        if(is_separator(strings[index])) {
+            break;
+        }
+        ++index;
+    }
+    bool retval = lexical_conversion<AssignTo, ConvertTo>(
+        std::vector<std::string>(strings.begin(), strings.begin() + static_cast<std::ptrdiff_t>(index)), output);
+    strings.erase(strings.begin(), strings.begin() + static_cast<std::ptrdiff_t>(index) + 1);
+    return retval;
+}
+
+/// Tuple conversion operation
+template <class AssignTo, class ConvertTo, std::size_t I>
+inline typename std::enable_if<(I < type_count_base<AssignTo>::value), bool>::type
+tuple_conversion(std::vector<std::string> strings, AssignTo &output) {
+    bool retval = true;
+    using ConvertToElement = typename std::
+        conditional<is_tuple_like<ConvertTo>::value, typename std::tuple_element<I, ConvertTo>::type, ConvertTo>::type;
+    if(!strings.empty()) {
+        retval = retval && tuple_type_conversion<typename std::tuple_element<I, AssignTo>::type, ConvertToElement>(
+                               strings, std::get<I>(output));
+    }
+    retval = retval && tuple_conversion<AssignTo, ConvertTo, I + 1>(std::move(strings), output);
+    return retval;
+}
+
+/// Lexical conversion of a container types with tuple elements of size 2
+template <class AssignTo,
+          class ConvertTo,
+          enable_if_t<is_mutable_container<AssignTo>::value && is_mutable_container<ConvertTo>::value &&
+                          type_count_base<ConvertTo>::value == 2,
+                      detail::enabler>>
+bool lexical_conversion(std::vector<std::string> strings, AssignTo &output) {
+    output.clear();
+    while(!strings.empty()) {
+
+        typename std::remove_const<typename std::tuple_element<0, typename ConvertTo::value_type>::type>::type v1;
+        typename std::tuple_element<1, typename ConvertTo::value_type>::type v2;
+        bool retval = tuple_type_conversion<decltype(v1), decltype(v1)>(strings, v1);
+        if(!strings.empty()) {
+            retval = retval && tuple_type_conversion<decltype(v2), decltype(v2)>(strings, v2);
+        }
+        if(retval) {
+            output.insert(output.end(), typename AssignTo::value_type{v1, v2});
+        } else {
+            return false;
+        }
+    }
+    return (!output.empty());
+}
+
+/// lexical conversion of tuples with type count>2 or tuples of types of some element with a type size>=2
+template <class AssignTo,
+          class ConvertTo,
+          enable_if_t<is_tuple_like<AssignTo>::value && is_tuple_like<ConvertTo>::value &&
+                          (type_count_base<ConvertTo>::value != type_count<ConvertTo>::value ||
+                           type_count<ConvertTo>::value > 2),
+                      detail::enabler>>
+bool lexical_conversion(const std::vector<std ::string> &strings, AssignTo &output) {
+    static_assert(
+        !is_tuple_like<ConvertTo>::value || type_count_base<AssignTo>::value == type_count_base<ConvertTo>::value,
+        "if the conversion type is defined as a tuple it must be the same size as the type you are converting to");
+    return tuple_conversion<AssignTo, ConvertTo, 0>(strings, output);
+}
+
+/// Lexical conversion of a vector types for everything but tuples of two elements and types of size 1
+template <class AssignTo,
+          class ConvertTo,
+          enable_if_t<is_mutable_container<AssignTo>::value && is_mutable_container<ConvertTo>::value &&
+                          type_count_base<ConvertTo>::value != 2 &&
+                          ((type_count<ConvertTo>::value > 2) ||
+                           (type_count<ConvertTo>::value > type_count_base<ConvertTo>::value)),
+                      detail::enabler>>
+bool lexical_conversion(const std::vector<std ::string> &strings, AssignTo &output) {
+    bool retval = true;
+    output.clear();
+    std::vector<std::string> temp;
+    std::size_t ii{0};
+    std::size_t icount{0};
+    std::size_t xcm{type_count<ConvertTo>::value};
+    auto ii_max = strings.size();
+    while(ii < ii_max) {
+        temp.push_back(strings[ii]);
+        ++ii;
+        ++icount;
+        if(icount == xcm || is_separator(temp.back()) || ii == ii_max) {
+            if(static_cast<int>(xcm) > type_count_min<ConvertTo>::value && is_separator(temp.back())) {
+                temp.pop_back();
+            }
+            typename AssignTo::value_type temp_out;
+            retval = retval &&
+                     lexical_conversion<typename AssignTo::value_type, typename ConvertTo::value_type>(temp, temp_out);
+            temp.clear();
+            if(!retval) {
+                return false;
+            }
+            output.insert(output.end(), std::move(temp_out));
+            icount = 0;
+        }
+    }
+    return retval;
+}
+
+/// conversion for wrapper types
+template <typename AssignTo,
+          class ConvertTo,
+          enable_if_t<classify_object<ConvertTo>::value == object_category::wrapper_value &&
+                          std::is_assignable<ConvertTo &, ConvertTo>::value,
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std::string> &strings, AssignTo &output) {
+    if(strings.empty() || strings.front().empty()) {
+        output = ConvertTo{};
+        return true;
+    }
+    typename ConvertTo::value_type val;
+    if(lexical_conversion<typename ConvertTo::value_type, typename ConvertTo::value_type>(strings, val)) {
+        output = ConvertTo{val};
+        return true;
+    }
+    return false;
+}
+
+/// conversion for wrapper types
+template <typename AssignTo,
+          class ConvertTo,
+          enable_if_t<classify_object<ConvertTo>::value == object_category::wrapper_value &&
+                          !std::is_assignable<AssignTo &, ConvertTo>::value,
+                      detail::enabler> = detail::dummy>
+bool lexical_conversion(const std::vector<std::string> &strings, AssignTo &output) {
+    using ConvertType = typename ConvertTo::value_type;
+    if(strings.empty() || strings.front().empty()) {
+        output = ConvertType{};
+        return true;
+    }
+    ConvertType val;
+    if(lexical_conversion<typename ConvertTo::value_type, typename ConvertTo::value_type>(strings, val)) {
+        output = val;
+        return true;
+    }
+    return false;
+}
+
+/// Sum a vector of flag representations
+/// The flag vector produces a series of strings in a vector,  simple true is represented by a "1",  simple false is
+/// by
+/// "-1" an if numbers are passed by some fashion they are captured as well so the function just checks for the most
+/// common true and false strings then uses stoll to convert the rest for summing
+template <typename T, enable_if_t<std::is_unsigned<T>::value, detail::enabler> = detail::dummy>
+void sum_flag_vector(const std::vector<std::string> &flags, T &output) {
+    std::int64_t count{0};
+    for(auto &flag : flags) {
+        count += detail::to_flag_value(flag);
+    }
+    output = (count > 0) ? static_cast<T>(count) : T{0};
+}
+
+/// Sum a vector of flag representations
+/// The flag vector produces a series of strings in a vector,  simple true is represented by a "1",  simple false is
+/// by
+/// "-1" an if numbers are passed by some fashion they are captured as well so the function just checks for the most
+/// common true and false strings then uses stoll to convert the rest for summing
+template <typename T, enable_if_t<std::is_signed<T>::value, detail::enabler> = detail::dummy>
+void sum_flag_vector(const std::vector<std::string> &flags, T &output) {
+    std::int64_t count{0};
+    for(auto &flag : flags) {
+        count += detail::to_flag_value(flag);
+    }
+    output = static_cast<T>(count);
+}
+
+#ifdef _MSC_VER
+#pragma warning(push)
+#pragma warning(disable : 4800)
+#endif
+// with Atomic<XX> this could produce a warning due to the conversion but if atomic gets here it is an old style so will
+// most likely still work
+
+/// Sum a vector of flag representations
+/// The flag vector produces a series of strings in a vector,  simple true is represented by a "1",  simple false is
+/// by
+/// "-1" an if numbers are passed by some fashion they are captured as well so the function just checks for the most
+/// common true and false strings then uses stoll to convert the rest for summing
+template <typename T,
+          enable_if_t<!std::is_signed<T>::value && !std::is_unsigned<T>::value, detail::enabler> = detail::dummy>
+void sum_flag_vector(const std::vector<std::string> &flags, T &output) {
+    std::int64_t count{0};
+    for(auto &flag : flags) {
+        count += detail::to_flag_value(flag);
+    }
+    std::string out = detail::to_string(count);
+    lexical_cast(out, output);
+}
+
+#ifdef _MSC_VER
+#pragma warning(pop)
+#endif
+
+}  // namespace detail
+
+
+
+namespace detail {
+
+// Returns false if not a short option. Otherwise, sets opt name and rest and returns true
+inline bool split_short(const std::string &current, std::string &name, std::string &rest) {
+    if(current.size() > 1 && current[0] == '-' && valid_first_char(current[1])) {
+        name = current.substr(1, 1);
+        rest = current.substr(2);
+        return true;
+    }
+    return false;
+}
+
+// Returns false if not a long option. Otherwise, sets opt name and other side of = and returns true
+inline bool split_long(const std::string &current, std::string &name, std::string &value) {
+    if(current.size() > 2 && current.substr(0, 2) == "--" && valid_first_char(current[2])) {
+        auto loc = current.find_first_of('=');
+        if(loc != std::string::npos) {
+            name = current.substr(2, loc - 2);
+            value = current.substr(loc + 1);
+        } else {
+            name = current.substr(2);
+            value = "";
+        }
+        return true;
+    }
+    return false;
+}
+
+// Returns false if not a windows style option. Otherwise, sets opt name and value and returns true
+inline bool split_windows_style(const std::string &current, std::string &name, std::string &value) {
+    if(current.size() > 1 && current[0] == '/' && valid_first_char(current[1])) {
+        auto loc = current.find_first_of(':');
+        if(loc != std::string::npos) {
+            name = current.substr(1, loc - 1);
+            value = current.substr(loc + 1);
+        } else {
+            name = current.substr(1);
+            value = "";
+        }
+        return true;
+    }
+    return false;
+}
+
+// Splits a string into multiple long and short names
+inline std::vector<std::string> split_names(std::string current) {
+    std::vector<std::string> output;
+    std::size_t val;
+    while((val = current.find(",")) != std::string::npos) {
+        output.push_back(trim_copy(current.substr(0, val)));
+        current = current.substr(val + 1);
+    }
+    output.push_back(trim_copy(current));
+    return output;
+}
+
+/// extract default flag values either {def} or starting with a !
+inline std::vector<std::pair<std::string, std::string>> get_default_flag_values(const std::string &str) {
+    std::vector<std::string> flags = split_names(str);
+    flags.erase(std::remove_if(flags.begin(),
+                               flags.end(),
+                               [](const std::string &name) {
+                                   return ((name.empty()) || (!(((name.find_first_of('{') != std::string::npos) &&
+                                                                 (name.back() == '}')) ||
+                                                                (name[0] == '!'))));
+                               }),
+                flags.end());
+    std::vector<std::pair<std::string, std::string>> output;
+    output.reserve(flags.size());
+    for(auto &flag : flags) {
+        auto def_start = flag.find_first_of('{');
+        std::string defval = "false";
+        if((def_start != std::string::npos) && (flag.back() == '}')) {
+            defval = flag.substr(def_start + 1);
+            defval.pop_back();
+            flag.erase(def_start, std::string::npos);
+        }
+        flag.erase(0, flag.find_first_not_of("-!"));
+        output.emplace_back(flag, defval);
+    }
+    return output;
+}
+
+/// Get a vector of short names, one of long names, and a single name
+inline std::tuple<std::vector<std::string>, std::vector<std::string>, std::string>
+get_names(const std::vector<std::string> &input) {
+
+    std::vector<std::string> short_names;
+    std::vector<std::string> long_names;
+    std::string pos_name;
+
+    for(std::string name : input) {
+        if(name.length() == 0) {
+            continue;
+        }
+        if(name.length() > 1 && name[0] == '-' && name[1] != '-') {
+            if(name.length() == 2 && valid_first_char(name[1]))
+                short_names.emplace_back(1, name[1]);
+            else
+                throw BadNameString::OneCharName(name);
+        } else if(name.length() > 2 && name.substr(0, 2) == "--") {
+            name = name.substr(2);
+            if(valid_name_string(name))
+                long_names.push_back(name);
+            else
+                throw BadNameString::BadLongName(name);
+        } else if(name == "-" || name == "--") {
+            throw BadNameString::DashesOnly(name);
+        } else {
+            if(pos_name.length() > 0)
+                throw BadNameString::MultiPositionalNames(name);
+            pos_name = name;
+        }
+    }
+
+    return std::tuple<std::vector<std::string>, std::vector<std::string>, std::string>(
+        short_names, long_names, pos_name);
+}
+
+}  // namespace detail
+
+
+
+class App;
+
+/// Holds values to load into Options
+struct ConfigItem {
+    /// This is the list of parents
+    std::vector<std::string> parents{};
+
+    /// This is the name
+    std::string name{};
+
+    /// Listing of inputs
+    std::vector<std::string> inputs{};
+
+    /// The list of parents and name joined by "."
+    std::string fullname() const {
+        std::vector<std::string> tmp = parents;
+        tmp.emplace_back(name);
+        return detail::join(tmp, ".");
+    }
+};
+
+/// This class provides a converter for configuration files.
+class Config {
+  protected:
+    std::vector<ConfigItem> items{};
+
+  public:
+    /// Convert an app into a configuration
+    virtual std::string to_config(const App *, bool, bool, std::string) const = 0;
+
+    /// Convert a configuration into an app
+    virtual std::vector<ConfigItem> from_config(std::istream &) const = 0;
+
+    /// Get a flag value
+    virtual std::string to_flag(const ConfigItem &item) const {
+        if(item.inputs.size() == 1) {
+            return item.inputs.at(0);
+        }
+        throw ConversionError::TooManyInputsFlag(item.fullname());
+    }
+
+    /// Parse a config file, throw an error (ParseError:ConfigParseError or FileError) on failure
+    std::vector<ConfigItem> from_file(const std::string &name) {
+        std::ifstream input{name};
+        if(!input.good())
+            throw FileError::Missing(name);
+
+        return from_config(input);
+    }
+
+    /// Virtual destructor
+    virtual ~Config() = default;
+};
+
+/// This converter works with INI/TOML files; to write INI files use ConfigINI
+class ConfigBase : public Config {
+  protected:
+    /// the character used for comments
+    char commentChar = '#';
+    /// the character used to start an array '\0' is a default to not use
+    char arrayStart = '[';
+    /// the character used to end an array '\0' is a default to not use
+    char arrayEnd = ']';
+    /// the character used to separate elements in an array
+    char arraySeparator = ',';
+    /// the character used separate the name from the value
+    char valueDelimiter = '=';
+    /// the character to use around strings
+    char stringQuote = '"';
+    /// the character to use around single characters
+    char characterQuote = '\'';
+    /// the maximum number of layers to allow
+    uint8_t maximumLayers{255};
+    /// the separator used to separator parent layers
+    char parentSeparatorChar{'.'};
+    /// Specify the configuration index to use for arrayed sections
+    int16_t configIndex{-1};
+    /// Specify the configuration section that should be used
+    std::string configSection{};
+
+  public:
+    std::string
+    to_config(const App * /*app*/, bool default_also, bool write_description, std::string prefix) const override;
+
+    std::vector<ConfigItem> from_config(std::istream &input) const override;
+    /// Specify the configuration for comment characters
+    ConfigBase *comment(char cchar) {
+        commentChar = cchar;
+        return this;
+    }
+    /// Specify the start and end characters for an array
+    ConfigBase *arrayBounds(char aStart, char aEnd) {
+        arrayStart = aStart;
+        arrayEnd = aEnd;
+        return this;
+    }
+    /// Specify the delimiter character for an array
+    ConfigBase *arrayDelimiter(char aSep) {
+        arraySeparator = aSep;
+        return this;
+    }
+    /// Specify the delimiter between a name and value
+    ConfigBase *valueSeparator(char vSep) {
+        valueDelimiter = vSep;
+        return this;
+    }
+    /// Specify the quote characters used around strings and characters
+    ConfigBase *quoteCharacter(char qString, char qChar) {
+        stringQuote = qString;
+        characterQuote = qChar;
+        return this;
+    }
+    /// Specify the maximum number of parents
+    ConfigBase *maxLayers(uint8_t layers) {
+        maximumLayers = layers;
+        return this;
+    }
+    /// Specify the separator to use for parent layers
+    ConfigBase *parentSeparator(char sep) {
+        parentSeparatorChar = sep;
+        return this;
+    }
+    /// get a reference to the configuration section
+    std::string &sectionRef() { return configSection; }
+    /// get the section
+    const std::string &section() const { return configSection; }
+    /// specify a particular section of the configuration file to use
+    ConfigBase *section(const std::string &sectionName) {
+        configSection = sectionName;
+        return this;
+    }
+
+    /// get a reference to the configuration index
+    int16_t &indexRef() { return configIndex; }
+    /// get the section index
+    int16_t index() const { return configIndex; }
+    /// specify a particular index in the section to use (-1) for all sections to use
+    ConfigBase *index(int16_t sectionIndex) {
+        configIndex = sectionIndex;
+        return this;
+    }
+};
+
+/// the default Config is the TOML file format
+using ConfigTOML = ConfigBase;
+
+/// ConfigINI generates a "standard" INI compliant output
+class ConfigINI : public ConfigTOML {
+
+  public:
+    ConfigINI() {
+        commentChar = ';';
+        arrayStart = '\0';
+        arrayEnd = '\0';
+        arraySeparator = ' ';
+        valueDelimiter = '=';
+    }
+};
+
+
+
+class Option;
+
+/// @defgroup validator_group Validators
+
+/// @brief Some validators that are provided
+///
+/// These are simple `std::string(const std::string&)` validators that are useful. They return
+/// a string if the validation fails. A custom struct is provided, as well, with the same user
+/// semantics, but with the ability to provide a new type name.
+/// @{
+
+///
+class Validator {
+  protected:
+    /// This is the description function, if empty the description_ will be used
+    std::function<std::string()> desc_function_{[]() { return std::string{}; }};
+
+    /// This is the base function that is to be called.
+    /// Returns a string error message if validation fails.
+    std::function<std::string(std::string &)> func_{[](std::string &) { return std::string{}; }};
+    /// The name for search purposes of the Validator
+    std::string name_{};
+    /// A Validator will only apply to an indexed value (-1 is all elements)
+    int application_index_ = -1;
+    /// Enable for Validator to allow it to be disabled if need be
+    bool active_{true};
+    /// specify that a validator should not modify the input
+    bool non_modifying_{false};
+
+  public:
+    Validator() = default;
+    /// Construct a Validator with just the description string
+    explicit Validator(std::string validator_desc) : desc_function_([validator_desc]() { return validator_desc; }) {}
+    /// Construct Validator from basic information
+    Validator(std::function<std::string(std::string &)> op, std::string validator_desc, std::string validator_name = "")
+        : desc_function_([validator_desc]() { return validator_desc; }), func_(std::move(op)),
+          name_(std::move(validator_name)) {}
+    /// Set the Validator operation function
+    Validator &operation(std::function<std::string(std::string &)> op) {
+        func_ = std::move(op);
+        return *this;
+    }
+    /// This is the required operator for a Validator - provided to help
+    /// users (CLI11 uses the member `func` directly)
+    std::string operator()(std::string &str) const {
+        std::string retstring;
+        if(active_) {
+            if(non_modifying_) {
+                std::string value = str;
+                retstring = func_(value);
+            } else {
+                retstring = func_(str);
+            }
+        }
+        return retstring;
+    }
+
+    /// This is the required operator for a Validator - provided to help
+    /// users (CLI11 uses the member `func` directly)
+    std::string operator()(const std::string &str) const {
+        std::string value = str;
+        return (active_) ? func_(value) : std::string{};
+    }
+
+    /// Specify the type string
+    Validator &description(std::string validator_desc) {
+        desc_function_ = [validator_desc]() { return validator_desc; };
+        return *this;
+    }
+    /// Specify the type string
+    Validator description(std::string validator_desc) const {
+        Validator newval(*this);
+        newval.desc_function_ = [validator_desc]() { return validator_desc; };
+        return newval;
+    }
+    /// Generate type description information for the Validator
+    std::string get_description() const {
+        if(active_) {
+            return desc_function_();
+        }
+        return std::string{};
+    }
+    /// Specify the type string
+    Validator &name(std::string validator_name) {
+        name_ = std::move(validator_name);
+        return *this;
+    }
+    /// Specify the type string
+    Validator name(std::string validator_name) const {
+        Validator newval(*this);
+        newval.name_ = std::move(validator_name);
+        return newval;
+    }
+    /// Get the name of the Validator
+    const std::string &get_name() const { return name_; }
+    /// Specify whether the Validator is active or not
+    Validator &active(bool active_val = true) {
+        active_ = active_val;
+        return *this;
+    }
+    /// Specify whether the Validator is active or not
+    Validator active(bool active_val = true) const {
+        Validator newval(*this);
+        newval.active_ = active_val;
+        return newval;
+    }
+
+    /// Specify whether the Validator can be modifying or not
+    Validator &non_modifying(bool no_modify = true) {
+        non_modifying_ = no_modify;
+        return *this;
+    }
+    /// Specify the application index of a validator
+    Validator &application_index(int app_index) {
+        application_index_ = app_index;
+        return *this;
+    }
+    /// Specify the application index of a validator
+    Validator application_index(int app_index) const {
+        Validator newval(*this);
+        newval.application_index_ = app_index;
+        return newval;
+    }
+    /// Get the current value of the application index
+    int get_application_index() const { return application_index_; }
+    /// Get a boolean if the validator is active
+    bool get_active() const { return active_; }
+
+    /// Get a boolean if the validator is allowed to modify the input returns true if it can modify the input
+    bool get_modifying() const { return !non_modifying_; }
+
+    /// Combining validators is a new validator. Type comes from left validator if function, otherwise only set if the
+    /// same.
+    Validator operator&(const Validator &other) const {
+        Validator newval;
+
+        newval._merge_description(*this, other, " AND ");
+
+        // Give references (will make a copy in lambda function)
+        const std::function<std::string(std::string & filename)> &f1 = func_;
+        const std::function<std::string(std::string & filename)> &f2 = other.func_;
+
+        newval.func_ = [f1, f2](std::string &input) {
+            std::string s1 = f1(input);
+            std::string s2 = f2(input);
+            if(!s1.empty() && !s2.empty())
+                return std::string("(") + s1 + ") AND (" + s2 + ")";
+            else
+                return s1 + s2;
+        };
+
+        newval.active_ = (active_ & other.active_);
+        newval.application_index_ = application_index_;
+        return newval;
+    }
+
+    /// Combining validators is a new validator. Type comes from left validator if function, otherwise only set if the
+    /// same.
+    Validator operator|(const Validator &other) const {
+        Validator newval;
+
+        newval._merge_description(*this, other, " OR ");
+
+        // Give references (will make a copy in lambda function)
+        const std::function<std::string(std::string &)> &f1 = func_;
+        const std::function<std::string(std::string &)> &f2 = other.func_;
+
+        newval.func_ = [f1, f2](std::string &input) {
+            std::string s1 = f1(input);
+            std::string s2 = f2(input);
+            if(s1.empty() || s2.empty())
+                return std::string();
+
+            return std::string("(") + s1 + ") OR (" + s2 + ")";
+        };
+        newval.active_ = (active_ & other.active_);
+        newval.application_index_ = application_index_;
+        return newval;
+    }
+
+    /// Create a validator that fails when a given validator succeeds
+    Validator operator!() const {
+        Validator newval;
+        const std::function<std::string()> &dfunc1 = desc_function_;
+        newval.desc_function_ = [dfunc1]() {
+            auto str = dfunc1();
+            return (!str.empty()) ? std::string("NOT ") + str : std::string{};
+        };
+        // Give references (will make a copy in lambda function)
+        const std::function<std::string(std::string & res)> &f1 = func_;
+
+        newval.func_ = [f1, dfunc1](std::string &test) -> std::string {
+            std::string s1 = f1(test);
+            if(s1.empty()) {
+                return std::string("check ") + dfunc1() + " succeeded improperly";
+            }
+            return std::string{};
+        };
+        newval.active_ = active_;
+        newval.application_index_ = application_index_;
+        return newval;
+    }
+
+  private:
+    void _merge_description(const Validator &val1, const Validator &val2, const std::string &merger) {
+
+        const std::function<std::string()> &dfunc1 = val1.desc_function_;
+        const std::function<std::string()> &dfunc2 = val2.desc_function_;
+
+        desc_function_ = [=]() {
+            std::string f1 = dfunc1();
+            std::string f2 = dfunc2();
+            if((f1.empty()) || (f2.empty())) {
+                return f1 + f2;
+            }
+            return std::string(1, '(') + f1 + ')' + merger + '(' + f2 + ')';
+        };
+    }
+};  // namespace CLI
+
+/// Class wrapping some of the accessors of Validator
+class CustomValidator : public Validator {
+  public:
+};
+// The implementation of the built in validators is using the Validator class;
+// the user is only expected to use the const (static) versions (since there's no setup).
+// Therefore, this is in detail.
+namespace detail {
+
+/// CLI enumeration of different file types
+enum class path_type { nonexistent, file, directory };
+
+#if defined CLI11_HAS_FILESYSTEM && CLI11_HAS_FILESYSTEM > 0
+/// get the type of the path from a file name
+inline path_type check_path(const char *file) noexcept {
+    std::error_code ec;
+    auto stat = std::filesystem::status(file, ec);
+    if(ec) {
+        return path_type::nonexistent;
+    }
+    switch(stat.type()) {
+    case std::filesystem::file_type::none:
+    case std::filesystem::file_type::not_found:
+        return path_type::nonexistent;
+    case std::filesystem::file_type::directory:
+        return path_type::directory;
+    case std::filesystem::file_type::symlink:
+    case std::filesystem::file_type::block:
+    case std::filesystem::file_type::character:
+    case std::filesystem::file_type::fifo:
+    case std::filesystem::file_type::socket:
+    case std::filesystem::file_type::regular:
+    case std::filesystem::file_type::unknown:
+    default:
+        return path_type::file;
+    }
+}
+#else
+/// get the type of the path from a file name
+inline path_type check_path(const char *file) noexcept {
+#if defined(_MSC_VER)
+    struct __stat64 buffer;
+    if(_stat64(file, &buffer) == 0) {
+        return ((buffer.st_mode & S_IFDIR) != 0) ? path_type::directory : path_type::file;
+    }
+#else
+    struct stat buffer;
+    if(stat(file, &buffer) == 0) {
+        return ((buffer.st_mode & S_IFDIR) != 0) ? path_type::directory : path_type::file;
+    }
+#endif
+    return path_type::nonexistent;
+}
+#endif
+/// Check for an existing file (returns error message if check fails)
+class ExistingFileValidator : public Validator {
+  public:
+    ExistingFileValidator() : Validator("FILE") {
+        func_ = [](std::string &filename) {
+            auto path_result = check_path(filename.c_str());
+            if(path_result == path_type::nonexistent) {
+                return "File does not exist: " + filename;
+            }
+            if(path_result == path_type::directory) {
+                return "File is actually a directory: " + filename;
+            }
+            return std::string();
+        };
+    }
+};
+
+/// Check for an existing directory (returns error message if check fails)
+class ExistingDirectoryValidator : public Validator {
+  public:
+    ExistingDirectoryValidator() : Validator("DIR") {
+        func_ = [](std::string &filename) {
+            auto path_result = check_path(filename.c_str());
+            if(path_result == path_type::nonexistent) {
+                return "Directory does not exist: " + filename;
+            }
+            if(path_result == path_type::file) {
+                return "Directory is actually a file: " + filename;
+            }
+            return std::string();
+        };
+    }
+};
+
+/// Check for an existing path
+class ExistingPathValidator : public Validator {
+  public:
+    ExistingPathValidator() : Validator("PATH(existing)") {
+        func_ = [](std::string &filename) {
+            auto path_result = check_path(filename.c_str());
+            if(path_result == path_type::nonexistent) {
+                return "Path does not exist: " + filename;
+            }
+            return std::string();
+        };
+    }
+};
+
+/// Check for an non-existing path
+class NonexistentPathValidator : public Validator {
+  public:
+    NonexistentPathValidator() : Validator("PATH(non-existing)") {
+        func_ = [](std::string &filename) {
+            auto path_result = check_path(filename.c_str());
+            if(path_result != path_type::nonexistent) {
+                return "Path already exists: " + filename;
+            }
+            return std::string();
+        };
+    }
+};
+
+/// Validate the given string is a legal ipv4 address
+class IPV4Validator : public Validator {
+  public:
+    IPV4Validator() : Validator("IPV4") {
+        func_ = [](std::string &ip_addr) {
+            auto result = CLI::detail::split(ip_addr, '.');
+            if(result.size() != 4) {
+                return std::string("Invalid IPV4 address must have four parts (") + ip_addr + ')';
+            }
+            int num;
+            for(const auto &var : result) {
+                bool retval = detail::lexical_cast(var, num);
+                if(!retval) {
+                    return std::string("Failed parsing number (") + var + ')';
+                }
+                if(num < 0 || num > 255) {
+                    return std::string("Each IP number must be between 0 and 255 ") + var;
+                }
+            }
+            return std::string();
+        };
+    }
+};
+
+}  // namespace detail
+
+// Static is not needed here, because global const implies static.
+
+/// Check for existing file (returns error message if check fails)
+const detail::ExistingFileValidator ExistingFile;
+
+/// Check for an existing directory (returns error message if check fails)
+const detail::ExistingDirectoryValidator ExistingDirectory;
+
+/// Check for an existing path
+const detail::ExistingPathValidator ExistingPath;
+
+/// Check for an non-existing path
+const detail::NonexistentPathValidator NonexistentPath;
+
+/// Check for an IP4 address
+const detail::IPV4Validator ValidIPV4;
+
+/// Validate the input as a particular type
+template <typename DesiredType> class TypeValidator : public Validator {
+  public:
+    explicit TypeValidator(const std::string &validator_name) : Validator(validator_name) {
+        func_ = [](std::string &input_string) {
+            auto val = DesiredType();
+            if(!detail::lexical_cast(input_string, val)) {
+                return std::string("Failed parsing ") + input_string + " as a " + detail::type_name<DesiredType>();
+            }
+            return std::string();
+        };
+    }
+    TypeValidator() : TypeValidator(detail::type_name<DesiredType>()) {}
+};
+
+/// Check for a number
+const TypeValidator<double> Number("NUMBER");
+
+/// Produce a range (factory). Min and max are inclusive.
+class Range : public Validator {
+  public:
+    /// This produces a range with min and max inclusive.
+    ///
+    /// Note that the constructor is templated, but the struct is not, so C++17 is not
+    /// needed to provide nice syntax for Range(a,b).
+    template <typename T>
+    Range(T min_val, T max_val, const std::string &validator_name = std::string{}) : Validator(validator_name) {
+        if(validator_name.empty()) {
+            std::stringstream out;
+            out << detail::type_name<T>() << " in [" << min_val << " - " << max_val << "]";
+            description(out.str());
+        }
+
+        func_ = [min_val, max_val](std::string &input) {
+            T val;
+            bool converted = detail::lexical_cast(input, val);
+            if((!converted) || (val < min_val || val > max_val))
+                return std::string("Value ") + input + " not in range " + std::to_string(min_val) + " to " +
+                       std::to_string(max_val);
+
+            return std::string{};
+        };
+    }
+
+    /// Range of one value is 0 to value
+    template <typename T>
+    explicit Range(T max_val, const std::string &validator_name = std::string{})
+        : Range(static_cast<T>(0), max_val, validator_name) {}
+};
+
+/// Check for a non negative number
+const Range NonNegativeNumber((std::numeric_limits<double>::max)(), "NONNEGATIVE");
+
+/// Check for a positive valued number (val>0.0), min() her is the smallest positive number
+const Range PositiveNumber((std::numeric_limits<double>::min)(), (std::numeric_limits<double>::max)(), "POSITIVE");
+
+/// Produce a bounded range (factory). Min and max are inclusive.
+class Bound : public Validator {
+  public:
+    /// This bounds a value with min and max inclusive.
+    ///
+    /// Note that the constructor is templated, but the struct is not, so C++17 is not
+    /// needed to provide nice syntax for Range(a,b).
+    template <typename T> Bound(T min_val, T max_val) {
+        std::stringstream out;
+        out << detail::type_name<T>() << " bounded to [" << min_val << " - " << max_val << "]";
+        description(out.str());
+
+        func_ = [min_val, max_val](std::string &input) {
+            T val;
+            bool converted = detail::lexical_cast(input, val);
+            if(!converted) {
+                return std::string("Value ") + input + " could not be converted";
+            }
+            if(val < min_val)
+                input = detail::to_string(min_val);
+            else if(val > max_val)
+                input = detail::to_string(max_val);
+
+            return std::string{};
+        };
+    }
+
+    /// Range of one value is 0 to value
+    template <typename T> explicit Bound(T max_val) : Bound(static_cast<T>(0), max_val) {}
+};
+
+namespace detail {
+template <typename T,
+          enable_if_t<is_copyable_ptr<typename std::remove_reference<T>::type>::value, detail::enabler> = detail::dummy>
+auto smart_deref(T value) -> decltype(*value) {
+    return *value;
+}
+
+template <
+    typename T,
+    enable_if_t<!is_copyable_ptr<typename std::remove_reference<T>::type>::value, detail::enabler> = detail::dummy>
+typename std::remove_reference<T>::type &smart_deref(T &value) {
+    return value;
+}
+/// Generate a string representation of a set
+template <typename T> std::string generate_set(const T &set) {
+    using element_t = typename detail::element_type<T>::type;
+    using iteration_type_t = typename detail::pair_adaptor<element_t>::value_type;  // the type of the object pair
+    std::string out(1, '{');
+    out.append(detail::join(
+        detail::smart_deref(set),
+        [](const iteration_type_t &v) { return detail::pair_adaptor<element_t>::first(v); },
+        ","));
+    out.push_back('}');
+    return out;
+}
+
+/// Generate a string representation of a map
+template <typename T> std::string generate_map(const T &map, bool key_only = false) {
+    using element_t = typename detail::element_type<T>::type;
+    using iteration_type_t = typename detail::pair_adaptor<element_t>::value_type;  // the type of the object pair
+    std::string out(1, '{');
+    out.append(detail::join(
+        detail::smart_deref(map),
+        [key_only](const iteration_type_t &v) {
+            std::string res{detail::to_string(detail::pair_adaptor<element_t>::first(v))};
+
+            if(!key_only) {
+                res.append("->");
+                res += detail::to_string(detail::pair_adaptor<element_t>::second(v));
+            }
+            return res;
+        },
+        ","));
+    out.push_back('}');
+    return out;
+}
+
+template <typename C, typename V> struct has_find {
+    template <typename CC, typename VV>
+    static auto test(int) -> decltype(std::declval<CC>().find(std::declval<VV>()), std::true_type());
+    template <typename, typename> static auto test(...) -> decltype(std::false_type());
+
+    static const auto value = decltype(test<C, V>(0))::value;
+    using type = std::integral_constant<bool, value>;
+};
+
+/// A search function
+template <typename T, typename V, enable_if_t<!has_find<T, V>::value, detail::enabler> = detail::dummy>
+auto search(const T &set, const V &val) -> std::pair<bool, decltype(std::begin(detail::smart_deref(set)))> {
+    using element_t = typename detail::element_type<T>::type;
+    auto &setref = detail::smart_deref(set);
+    auto it = std::find_if(std::begin(setref), std::end(setref), [&val](decltype(*std::begin(setref)) v) {
+        return (detail::pair_adaptor<element_t>::first(v) == val);
+    });
+    return {(it != std::end(setref)), it};
+}
+
+/// A search function that uses the built in find function
+template <typename T, typename V, enable_if_t<has_find<T, V>::value, detail::enabler> = detail::dummy>
+auto search(const T &set, const V &val) -> std::pair<bool, decltype(std::begin(detail::smart_deref(set)))> {
+    auto &setref = detail::smart_deref(set);
+    auto it = setref.find(val);
+    return {(it != std::end(setref)), it};
+}
+
+/// A search function with a filter function
+template <typename T, typename V>
+auto search(const T &set, const V &val, const std::function<V(V)> &filter_function)
+    -> std::pair<bool, decltype(std::begin(detail::smart_deref(set)))> {
+    using element_t = typename detail::element_type<T>::type;
+    // do the potentially faster first search
+    auto res = search(set, val);
+    if((res.first) || (!(filter_function))) {
+        return res;
+    }
+    // if we haven't found it do the longer linear search with all the element translations
+    auto &setref = detail::smart_deref(set);
+    auto it = std::find_if(std::begin(setref), std::end(setref), [&](decltype(*std::begin(setref)) v) {
+        V a{detail::pair_adaptor<element_t>::first(v)};
+        a = filter_function(a);
+        return (a == val);
+    });
+    return {(it != std::end(setref)), it};
+}
+
+// the following suggestion was made by Nikita Ofitserov(@himikof)
+// done in templates to prevent compiler warnings on negation of unsigned numbers
+
+/// Do a check for overflow on signed numbers
+template <typename T>
+inline typename std::enable_if<std::is_signed<T>::value, T>::type overflowCheck(const T &a, const T &b) {
+    if((a > 0) == (b > 0)) {
+        return ((std::numeric_limits<T>::max)() / (std::abs)(a) < (std::abs)(b));
+    } else {
+        return ((std::numeric_limits<T>::min)() / (std::abs)(a) > -(std::abs)(b));
+    }
+}
+/// Do a check for overflow on unsigned numbers
+template <typename T>
+inline typename std::enable_if<!std::is_signed<T>::value, T>::type overflowCheck(const T &a, const T &b) {
+    return ((std::numeric_limits<T>::max)() / a < b);
+}
+
+/// Performs a *= b; if it doesn't cause integer overflow. Returns false otherwise.
+template <typename T> typename std::enable_if<std::is_integral<T>::value, bool>::type checked_multiply(T &a, T b) {
+    if(a == 0 || b == 0 || a == 1 || b == 1) {
+        a *= b;
+        return true;
+    }
+    if(a == (std::numeric_limits<T>::min)() || b == (std::numeric_limits<T>::min)()) {
+        return false;
+    }
+    if(overflowCheck(a, b)) {
+        return false;
+    }
+    a *= b;
+    return true;
+}
+
+/// Performs a *= b; if it doesn't equal infinity. Returns false otherwise.
+template <typename T>
+typename std::enable_if<std::is_floating_point<T>::value, bool>::type checked_multiply(T &a, T b) {
+    T c = a * b;
+    if(std::isinf(c) && !std::isinf(a) && !std::isinf(b)) {
+        return false;
+    }
+    a = c;
+    return true;
+}
+
+}  // namespace detail
+/// Verify items are in a set
+class IsMember : public Validator {
+  public:
+    using filter_fn_t = std::function<std::string(std::string)>;
+
+    /// This allows in-place construction using an initializer list
+    template <typename T, typename... Args>
+    IsMember(std::initializer_list<T> values, Args &&...args)
+        : IsMember(std::vector<T>(values), std::forward<Args>(args)...) {}
+
+    /// This checks to see if an item is in a set (empty function)
+    template <typename T> explicit IsMember(T &&set) : IsMember(std::forward<T>(set), nullptr) {}
+
+    /// This checks to see if an item is in a set: pointer or copy version. You can pass in a function that will filter
+    /// both sides of the comparison before computing the comparison.
+    template <typename T, typename F> explicit IsMember(T set, F filter_function) {
+
+        // Get the type of the contained item - requires a container have ::value_type
+        // if the type does not have first_type and second_type, these are both value_type
+        using element_t = typename detail::element_type<T>::type;             // Removes (smart) pointers if needed
+        using item_t = typename detail::pair_adaptor<element_t>::first_type;  // Is value_type if not a map
+
+        using local_item_t = typename IsMemberType<item_t>::type;  // This will convert bad types to good ones
+                                                                   // (const char * to std::string)
+
+        // Make a local copy of the filter function, using a std::function if not one already
+        std::function<local_item_t(local_item_t)> filter_fn = filter_function;
+
+        // This is the type name for help, it will take the current version of the set contents
+        desc_function_ = [set]() { return detail::generate_set(detail::smart_deref(set)); };
+
+        // This is the function that validates
+        // It stores a copy of the set pointer-like, so shared_ptr will stay alive
+        func_ = [set, filter_fn](std::string &input) {
+            local_item_t b;
+            if(!detail::lexical_cast(input, b)) {
+                throw ValidationError(input);  // name is added later
+            }
+            if(filter_fn) {
+                b = filter_fn(b);
+            }
+            auto res = detail::search(set, b, filter_fn);
+            if(res.first) {
+                // Make sure the version in the input string is identical to the one in the set
+                if(filter_fn) {
+                    input = detail::value_string(detail::pair_adaptor<element_t>::first(*(res.second)));
+                }
+
+                // Return empty error string (success)
+                return std::string{};
+            }
+
+            // If you reach this point, the result was not found
+            return input + " not in " + detail::generate_set(detail::smart_deref(set));
+        };
+    }
+
+    /// You can pass in as many filter functions as you like, they nest (string only currently)
+    template <typename T, typename... Args>
+    IsMember(T &&set, filter_fn_t filter_fn_1, filter_fn_t filter_fn_2, Args &&...other)
+        : IsMember(
+              std::forward<T>(set),
+              [filter_fn_1, filter_fn_2](std::string a) { return filter_fn_2(filter_fn_1(a)); },
+              other...) {}
+};
+
+/// definition of the default transformation object
+template <typename T> using TransformPairs = std::vector<std::pair<std::string, T>>;
+
+/// Translate named items to other or a value set
+class Transformer : public Validator {
+  public:
+    using filter_fn_t = std::function<std::string(std::string)>;
+
+    /// This allows in-place construction
+    template <typename... Args>
+    Transformer(std::initializer_list<std::pair<std::string, std::string>> values, Args &&...args)
+        : Transformer(TransformPairs<std::string>(values), std::forward<Args>(args)...) {}
+
+    /// direct map of std::string to std::string
+    template <typename T> explicit Transformer(T &&mapping) : Transformer(std::forward<T>(mapping), nullptr) {}
+
+    /// This checks to see if an item is in a set: pointer or copy version. You can pass in a function that will filter
+    /// both sides of the comparison before computing the comparison.
+    template <typename T, typename F> explicit Transformer(T mapping, F filter_function) {
+
+        static_assert(detail::pair_adaptor<typename detail::element_type<T>::type>::value,
+                      "mapping must produce value pairs");
+        // Get the type of the contained item - requires a container have ::value_type
+        // if the type does not have first_type and second_type, these are both value_type
+        using element_t = typename detail::element_type<T>::type;             // Removes (smart) pointers if needed
+        using item_t = typename detail::pair_adaptor<element_t>::first_type;  // Is value_type if not a map
+        using local_item_t = typename IsMemberType<item_t>::type;             // Will convert bad types to good ones
+                                                                              // (const char * to std::string)
+
+        // Make a local copy of the filter function, using a std::function if not one already
+        std::function<local_item_t(local_item_t)> filter_fn = filter_function;
+
+        // This is the type name for help, it will take the current version of the set contents
+        desc_function_ = [mapping]() { return detail::generate_map(detail::smart_deref(mapping)); };
+
+        func_ = [mapping, filter_fn](std::string &input) {
+            local_item_t b;
+            if(!detail::lexical_cast(input, b)) {
+                return std::string();
+                // there is no possible way we can match anything in the mapping if we can't convert so just return
+            }
+            if(filter_fn) {
+                b = filter_fn(b);
+            }
+            auto res = detail::search(mapping, b, filter_fn);
+            if(res.first) {
+                input = detail::value_string(detail::pair_adaptor<element_t>::second(*res.second));
+            }
+            return std::string{};
+        };
+    }
+
+    /// You can pass in as many filter functions as you like, they nest
+    template <typename T, typename... Args>
+    Transformer(T &&mapping, filter_fn_t filter_fn_1, filter_fn_t filter_fn_2, Args &&...other)
+        : Transformer(
+              std::forward<T>(mapping),
+              [filter_fn_1, filter_fn_2](std::string a) { return filter_fn_2(filter_fn_1(a)); },
+              other...) {}
+};
+
+/// translate named items to other or a value set
+class CheckedTransformer : public Validator {
+  public:
+    using filter_fn_t = std::function<std::string(std::string)>;
+
+    /// This allows in-place construction
+    template <typename... Args>
+    CheckedTransformer(std::initializer_list<std::pair<std::string, std::string>> values, Args &&...args)
+        : CheckedTransformer(TransformPairs<std::string>(values), std::forward<Args>(args)...) {}
+
+    /// direct map of std::string to std::string
+    template <typename T> explicit CheckedTransformer(T mapping) : CheckedTransformer(std::move(mapping), nullptr) {}
+
+    /// This checks to see if an item is in a set: pointer or copy version. You can pass in a function that will filter
+    /// both sides of the comparison before computing the comparison.
+    template <typename T, typename F> explicit CheckedTransformer(T mapping, F filter_function) {
+
+        static_assert(detail::pair_adaptor<typename detail::element_type<T>::type>::value,
+                      "mapping must produce value pairs");
+        // Get the type of the contained item - requires a container have ::value_type
+        // if the type does not have first_type and second_type, these are both value_type
+        using element_t = typename detail::element_type<T>::type;             // Removes (smart) pointers if needed
+        using item_t = typename detail::pair_adaptor<element_t>::first_type;  // Is value_type if not a map
+        using local_item_t = typename IsMemberType<item_t>::type;             // Will convert bad types to good ones
+                                                                              // (const char * to std::string)
+        using iteration_type_t = typename detail::pair_adaptor<element_t>::value_type;  // the type of the object pair
+
+        // Make a local copy of the filter function, using a std::function if not one already
+        std::function<local_item_t(local_item_t)> filter_fn = filter_function;
+
+        auto tfunc = [mapping]() {
+            std::string out("value in ");
+            out += detail::generate_map(detail::smart_deref(mapping)) + " OR {";
+            out += detail::join(
+                detail::smart_deref(mapping),
+                [](const iteration_type_t &v) { return detail::to_string(detail::pair_adaptor<element_t>::second(v)); },
+                ",");
+            out.push_back('}');
+            return out;
+        };
+
+        desc_function_ = tfunc;
+
+        func_ = [mapping, tfunc, filter_fn](std::string &input) {
+            local_item_t b;
+            bool converted = detail::lexical_cast(input, b);
+            if(converted) {
+                if(filter_fn) {
+                    b = filter_fn(b);
+                }
+                auto res = detail::search(mapping, b, filter_fn);
+                if(res.first) {
+                    input = detail::value_string(detail::pair_adaptor<element_t>::second(*res.second));
+                    return std::string{};
+                }
+            }
+            for(const auto &v : detail::smart_deref(mapping)) {
+                auto output_string = detail::value_string(detail::pair_adaptor<element_t>::second(v));
+                if(output_string == input) {
+                    return std::string();
+                }
+            }
+
+            return "Check " + input + " " + tfunc() + " FAILED";
+        };
+    }
+
+    /// You can pass in as many filter functions as you like, they nest
+    template <typename T, typename... Args>
+    CheckedTransformer(T &&mapping, filter_fn_t filter_fn_1, filter_fn_t filter_fn_2, Args &&...other)
+        : CheckedTransformer(
+              std::forward<T>(mapping),
+              [filter_fn_1, filter_fn_2](std::string a) { return filter_fn_2(filter_fn_1(a)); },
+              other...) {}
+};
+
+/// Helper function to allow ignore_case to be passed to IsMember or Transform
+inline std::string ignore_case(std::string item) { return detail::to_lower(item); }
+
+/// Helper function to allow ignore_underscore to be passed to IsMember or Transform
+inline std::string ignore_underscore(std::string item) { return detail::remove_underscore(item); }
+
+/// Helper function to allow checks to ignore spaces to be passed to IsMember or Transform
+inline std::string ignore_space(std::string item) {
+    item.erase(std::remove(std::begin(item), std::end(item), ' '), std::end(item));
+    item.erase(std::remove(std::begin(item), std::end(item), '\t'), std::end(item));
+    return item;
+}
+
+/// Multiply a number by a factor using given mapping.
+/// Can be used to write transforms for SIZE or DURATION inputs.
+///
+/// Example:
+///   With mapping = `{"b"->1, "kb"->1024, "mb"->1024*1024}`
+///   one can recognize inputs like "100", "12kb", "100 MB",
+///   that will be automatically transformed to 100, 14448, 104857600.
+///
+/// Output number type matches the type in the provided mapping.
+/// Therefore, if it is required to interpret real inputs like "0.42 s",
+/// the mapping should be of a type <string, float> or <string, double>.
+class AsNumberWithUnit : public Validator {
+  public:
+    /// Adjust AsNumberWithUnit behavior.
+    /// CASE_SENSITIVE/CASE_INSENSITIVE controls how units are matched.
+    /// UNIT_OPTIONAL/UNIT_REQUIRED throws ValidationError
+    ///   if UNIT_REQUIRED is set and unit literal is not found.
+    enum Options {
+        CASE_SENSITIVE = 0,
+        CASE_INSENSITIVE = 1,
+        UNIT_OPTIONAL = 0,
+        UNIT_REQUIRED = 2,
+        DEFAULT = CASE_INSENSITIVE | UNIT_OPTIONAL
+    };
+
+    template <typename Number>
+    explicit AsNumberWithUnit(std::map<std::string, Number> mapping,
+                              Options opts = DEFAULT,
+                              const std::string &unit_name = "UNIT") {
+        description(generate_description<Number>(unit_name, opts));
+        validate_mapping(mapping, opts);
+
+        // transform function
+        func_ = [mapping, opts](std::string &input) -> std::string {
+            Number num;
+
+            detail::rtrim(input);
+            if(input.empty()) {
+                throw ValidationError("Input is empty");
+            }
+
+            // Find split position between number and prefix
+            auto unit_begin = input.end();
+            while(unit_begin > input.begin() && std::isalpha(*(unit_begin - 1), std::locale())) {
+                --unit_begin;
+            }
+
+            std::string unit{unit_begin, input.end()};
+            input.resize(static_cast<std::size_t>(std::distance(input.begin(), unit_begin)));
+            detail::trim(input);
+
+            if(opts & UNIT_REQUIRED && unit.empty()) {
+                throw ValidationError("Missing mandatory unit");
+            }
+            if(opts & CASE_INSENSITIVE) {
+                unit = detail::to_lower(unit);
+            }
+            if(unit.empty()) {
+                if(!detail::lexical_cast(input, num)) {
+                    throw ValidationError(std::string("Value ") + input + " could not be converted to " +
+                                          detail::type_name<Number>());
+                }
+                // No need to modify input if no unit passed
+                return {};
+            }
+
+            // find corresponding factor
+            auto it = mapping.find(unit);
+            if(it == mapping.end()) {
+                throw ValidationError(unit +
+                                      " unit not recognized. "
+                                      "Allowed values: " +
+                                      detail::generate_map(mapping, true));
+            }
+
+            if(!input.empty()) {
+                bool converted = detail::lexical_cast(input, num);
+                if(!converted) {
+                    throw ValidationError(std::string("Value ") + input + " could not be converted to " +
+                                          detail::type_name<Number>());
+                }
+                // perform safe multiplication
+                bool ok = detail::checked_multiply(num, it->second);
+                if(!ok) {
+                    throw ValidationError(detail::to_string(num) + " multiplied by " + unit +
+                                          " factor would cause number overflow. Use smaller value.");
+                }
+            } else {
+                num = static_cast<Number>(it->second);
+            }
+
+            input = detail::to_string(num);
+
+            return {};
+        };
+    }
+
+  private:
+    /// Check that mapping contains valid units.
+    /// Update mapping for CASE_INSENSITIVE mode.
+    template <typename Number> static void validate_mapping(std::map<std::string, Number> &mapping, Options opts) {
+        for(auto &kv : mapping) {
+            if(kv.first.empty()) {
+                throw ValidationError("Unit must not be empty.");
+            }
+            if(!detail::isalpha(kv.first)) {
+                throw ValidationError("Unit must contain only letters.");
+            }
+        }
+
+        // make all units lowercase if CASE_INSENSITIVE
+        if(opts & CASE_INSENSITIVE) {
+            std::map<std::string, Number> lower_mapping;
+            for(auto &kv : mapping) {
+                auto s = detail::to_lower(kv.first);
+                if(lower_mapping.count(s)) {
+                    throw ValidationError(std::string("Several matching lowercase unit representations are found: ") +
+                                          s);
+                }
+                lower_mapping[detail::to_lower(kv.first)] = kv.second;
+            }
+            mapping = std::move(lower_mapping);
+        }
+    }
+
+    /// Generate description like this: NUMBER [UNIT]
+    template <typename Number> static std::string generate_description(const std::string &name, Options opts) {
+        std::stringstream out;
+        out << detail::type_name<Number>() << ' ';
+        if(opts & UNIT_REQUIRED) {
+            out << name;
+        } else {
+            out << '[' << name << ']';
+        }
+        return out.str();
+    }
+};
+
+/// Converts a human-readable size string (with unit literal) to uin64_t size.
+/// Example:
+///   "100" => 100
+///   "1 b" => 100
+///   "10Kb" => 10240 // you can configure this to be interpreted as kilobyte (*1000) or kibibyte (*1024)
+///   "10 KB" => 10240
+///   "10 kb" => 10240
+///   "10 kib" => 10240 // *i, *ib are always interpreted as *bibyte (*1024)
+///   "10kb" => 10240
+///   "2 MB" => 2097152
+///   "2 EiB" => 2^61 // Units up to exibyte are supported
+class AsSizeValue : public AsNumberWithUnit {
+  public:
+    using result_t = std::uint64_t;
+
+    /// If kb_is_1000 is true,
+    /// interpret 'kb', 'k' as 1000 and 'kib', 'ki' as 1024
+    /// (same applies to higher order units as well).
+    /// Otherwise, interpret all literals as factors of 1024.
+    /// The first option is formally correct, but
+    /// the second interpretation is more wide-spread
+    /// (see https://en.wikipedia.org/wiki/Binary_prefix).
+    explicit AsSizeValue(bool kb_is_1000) : AsNumberWithUnit(get_mapping(kb_is_1000)) {
+        if(kb_is_1000) {
+            description("SIZE [b, kb(=1000b), kib(=1024b), ...]");
+        } else {
+            description("SIZE [b, kb(=1024b), ...]");
+        }
+    }
+
+  private:
+    /// Get <size unit, factor> mapping
+    static std::map<std::string, result_t> init_mapping(bool kb_is_1000) {
+        std::map<std::string, result_t> m;
+        result_t k_factor = kb_is_1000 ? 1000 : 1024;
+        result_t ki_factor = 1024;
+        result_t k = 1;
+        result_t ki = 1;
+        m["b"] = 1;
+        for(std::string p : {"k", "m", "g", "t", "p", "e"}) {
+            k *= k_factor;
+            ki *= ki_factor;
+            m[p] = k;
+            m[p + "b"] = k;
+            m[p + "i"] = ki;
+            m[p + "ib"] = ki;
+        }
+        return m;
+    }
+
+    /// Cache calculated mapping
+    static std::map<std::string, result_t> get_mapping(bool kb_is_1000) {
+        if(kb_is_1000) {
+            static auto m = init_mapping(true);
+            return m;
+        } else {
+            static auto m = init_mapping(false);
+            return m;
+        }
+    }
+};
+
+namespace detail {
+/// Split a string into a program name and command line arguments
+/// the string is assumed to contain a file name followed by other arguments
+/// the return value contains is a pair with the first argument containing the program name and the second
+/// everything else.
+inline std::pair<std::string, std::string> split_program_name(std::string commandline) {
+    // try to determine the programName
+    std::pair<std::string, std::string> vals;
+    trim(commandline);
+    auto esp = commandline.find_first_of(' ', 1);
+    while(detail::check_path(commandline.substr(0, esp).c_str()) != path_type::file) {
+        esp = commandline.find_first_of(' ', esp + 1);
+        if(esp == std::string::npos) {
+            // if we have reached the end and haven't found a valid file just assume the first argument is the
+            // program name
+            if(commandline[0] == '"' || commandline[0] == '\'' || commandline[0] == '`') {
+                bool embeddedQuote = false;
+                auto keyChar = commandline[0];
+                auto end = commandline.find_first_of(keyChar, 1);
+                while((end != std::string::npos) && (commandline[end - 1] == '\\')) {  // deal with escaped quotes
+                    end = commandline.find_first_of(keyChar, end + 1);
+                    embeddedQuote = true;
+                }
+                if(end != std::string::npos) {
+                    vals.first = commandline.substr(1, end - 1);
+                    esp = end + 1;
+                    if(embeddedQuote) {
+                        vals.first = find_and_replace(vals.first, std::string("\\") + keyChar, std::string(1, keyChar));
+                    }
+                } else {
+                    esp = commandline.find_first_of(' ', 1);
+                }
+            } else {
+                esp = commandline.find_first_of(' ', 1);
+            }
+
+            break;
+        }
+    }
+    if(vals.first.empty()) {
+        vals.first = commandline.substr(0, esp);
+        rtrim(vals.first);
+    }
+
+    // strip the program name
+    vals.second = (esp != std::string::npos) ? commandline.substr(esp + 1) : std::string{};
+    ltrim(vals.second);
+    return vals;
+}
+
+}  // namespace detail
+/// @}
+
+
+
+
+class Option;
+class App;
+
+/// This enum signifies the type of help requested
+///
+/// This is passed in by App; all user classes must accept this as
+/// the second argument.
+
+enum class AppFormatMode {
+    Normal,  ///< The normal, detailed help
+    All,     ///< A fully expanded help
+    Sub,     ///< Used when printed as part of expanded subcommand
+};
+
+/// This is the minimum requirements to run a formatter.
+///
+/// A user can subclass this is if they do not care at all
+/// about the structure in CLI::Formatter.
+class FormatterBase {
+  protected:
+    /// @name Options
+    ///@{
+
+    /// The width of the first column
+    std::size_t column_width_{30};
+
+    /// @brief The required help printout labels (user changeable)
+    /// Values are Needs, Excludes, etc.
+    std::map<std::string, std::string> labels_{};
+
+    ///@}
+    /// @name Basic
+    ///@{
+
+  public:
+    FormatterBase() = default;
+    FormatterBase(const FormatterBase &) = default;
+    FormatterBase(FormatterBase &&) = default;
+
+    /// Adding a destructor in this form to work around bug in GCC 4.7
+    virtual ~FormatterBase() noexcept {}  // NOLINT(modernize-use-equals-default)
+
+    /// This is the key method that puts together help
+    virtual std::string make_help(const App *, std::string, AppFormatMode) const = 0;
+
+    ///@}
+    /// @name Setters
+    ///@{
+
+    /// Set the "REQUIRED" label
+    void label(std::string key, std::string val) { labels_[key] = val; }
+
+    /// Set the column width
+    void column_width(std::size_t val) { column_width_ = val; }
+
+    ///@}
+    /// @name Getters
+    ///@{
+
+    /// Get the current value of a name (REQUIRED, etc.)
+    std::string get_label(std::string key) const {
+        if(labels_.find(key) == labels_.end())
+            return key;
+        else
+            return labels_.at(key);
+    }
+
+    /// Get the current column width
+    std::size_t get_column_width() const { return column_width_; }
+
+    ///@}
+};
+
+/// This is a specialty override for lambda functions
+class FormatterLambda final : public FormatterBase {
+    using funct_t = std::function<std::string(const App *, std::string, AppFormatMode)>;
+
+    /// The lambda to hold and run
+    funct_t lambda_;
+
+  public:
+    /// Create a FormatterLambda with a lambda function
+    explicit FormatterLambda(funct_t funct) : lambda_(std::move(funct)) {}
+
+    /// Adding a destructor (mostly to make GCC 4.7 happy)
+    ~FormatterLambda() noexcept override {}  // NOLINT(modernize-use-equals-default)
+
+    /// This will simply call the lambda function
+    std::string make_help(const App *app, std::string name, AppFormatMode mode) const override {
+        return lambda_(app, name, mode);
+    }
+};
+
+/// This is the default Formatter for CLI11. It pretty prints help output, and is broken into quite a few
+/// overridable methods, to be highly customizable with minimal effort.
+class Formatter : public FormatterBase {
+  public:
+    Formatter() = default;
+    Formatter(const Formatter &) = default;
+    Formatter(Formatter &&) = default;
+
+    /// @name Overridables
+    ///@{
+
+    /// This prints out a group of options with title
+    ///
+    virtual std::string make_group(std::string group, bool is_positional, std::vector<const Option *> opts) const;
+
+    /// This prints out just the positionals "group"
+    virtual std::string make_positionals(const App *app) const;
+
+    /// This prints out all the groups of options
+    std::string make_groups(const App *app, AppFormatMode mode) const;
+
+    /// This prints out all the subcommands
+    virtual std::string make_subcommands(const App *app, AppFormatMode mode) const;
+
+    /// This prints out a subcommand
+    virtual std::string make_subcommand(const App *sub) const;
+
+    /// This prints out a subcommand in help-all
+    virtual std::string make_expanded(const App *sub) const;
+
+    /// This prints out all the groups of options
+    virtual std::string make_footer(const App *app) const;
+
+    /// This displays the description line
+    virtual std::string make_description(const App *app) const;
+
+    /// This displays the usage line
+    virtual std::string make_usage(const App *app, std::string name) const;
+
+    /// This puts everything together
+    std::string make_help(const App * /*app*/, std::string, AppFormatMode) const override;
+
+    ///@}
+    /// @name Options
+    ///@{
+
+    /// This prints out an option help line, either positional or optional form
+    virtual std::string make_option(const Option *opt, bool is_positional) const {
+        std::stringstream out;
+        detail::format_help(
+            out, make_option_name(opt, is_positional) + make_option_opts(opt), make_option_desc(opt), column_width_);
+        return out.str();
+    }
+
+    /// @brief This is the name part of an option, Default: left column
+    virtual std::string make_option_name(const Option *, bool) const;
+
+    /// @brief This is the options part of the name, Default: combined into left column
+    virtual std::string make_option_opts(const Option *) const;
+
+    /// @brief This is the description. Default: Right column, on new line if left column too large
+    virtual std::string make_option_desc(const Option *) const;
+
+    /// @brief This is used to print the name on the USAGE line
+    virtual std::string make_option_usage(const Option *opt) const;
+
+    ///@}
+};
+
+
+
+
+using results_t = std::vector<std::string>;
+/// callback function definition
+using callback_t = std::function<bool(const results_t &)>;
+
+class Option;
+class App;
+
+using Option_p = std::unique_ptr<Option>;
+/// Enumeration of the multiOption Policy selection
+enum class MultiOptionPolicy : char {
+    Throw,      //!< Throw an error if any extra arguments were given
+    TakeLast,   //!< take only the last Expected number of arguments
+    TakeFirst,  //!< take only the first Expected number of arguments
+    Join,       //!< merge all the arguments together into a single string via the delimiter character default('\n')
+    TakeAll     //!< just get all the passed argument regardless
+};
+
+/// This is the CRTP base class for Option and OptionDefaults. It was designed this way
+/// to share parts of the class; an OptionDefaults can copy to an Option.
+template <typename CRTP> class OptionBase {
+    friend App;
+
+  protected:
+    /// The group membership
+    std::string group_ = std::string("Options");
+
+    /// True if this is a required option
+    bool required_{false};
+
+    /// Ignore the case when matching (option, not value)
+    bool ignore_case_{false};
+
+    /// Ignore underscores when matching (option, not value)
+    bool ignore_underscore_{false};
+
+    /// Allow this option to be given in a configuration file
+    bool configurable_{true};
+
+    /// Disable overriding flag values with '=value'
+    bool disable_flag_override_{false};
+
+    /// Specify a delimiter character for vector arguments
+    char delimiter_{'\0'};
+
+    /// Automatically capture default value
+    bool always_capture_default_{false};
+
+    /// Policy for handling multiple arguments beyond the expected Max
+    MultiOptionPolicy multi_option_policy_{MultiOptionPolicy::Throw};
+
+    /// Copy the contents to another similar class (one based on OptionBase)
+    template <typename T> void copy_to(T *other) const {
+        other->group(group_);
+        other->required(required_);
+        other->ignore_case(ignore_case_);
+        other->ignore_underscore(ignore_underscore_);
+        other->configurable(configurable_);
+        other->disable_flag_override(disable_flag_override_);
+        other->delimiter(delimiter_);
+        other->always_capture_default(always_capture_default_);
+        other->multi_option_policy(multi_option_policy_);
+    }
+
+  public:
+    // setters
+
+    /// Changes the group membership
+    CRTP *group(const std::string &name) {
+        if(!detail::valid_alias_name_string(name)) {
+            throw IncorrectConstruction("Group names may not contain newlines or null characters");
+        }
+        group_ = name;
+        return static_cast<CRTP *>(this);
+    }
+
+    /// Set the option as required
+    CRTP *required(bool value = true) {
+        required_ = value;
+        return static_cast<CRTP *>(this);
+    }
+
+    /// Support Plumbum term
+    CRTP *mandatory(bool value = true) { return required(value); }
+
+    CRTP *always_capture_default(bool value = true) {
+        always_capture_default_ = value;
+        return static_cast<CRTP *>(this);
+    }
+
+    // Getters
+
+    /// Get the group of this option
+    const std::string &get_group() const { return group_; }
+
+    /// True if this is a required option
+    bool get_required() const { return required_; }
+
+    /// The status of ignore case
+    bool get_ignore_case() const { return ignore_case_; }
+
+    /// The status of ignore_underscore
+    bool get_ignore_underscore() const { return ignore_underscore_; }
+
+    /// The status of configurable
+    bool get_configurable() const { return configurable_; }
+
+    /// The status of configurable
+    bool get_disable_flag_override() const { return disable_flag_override_; }
+
+    /// Get the current delimiter char
+    char get_delimiter() const { return delimiter_; }
+
+    /// Return true if this will automatically capture the default value for help printing
+    bool get_always_capture_default() const { return always_capture_default_; }
+
+    /// The status of the multi option policy
+    MultiOptionPolicy get_multi_option_policy() const { return multi_option_policy_; }
+
+    // Shortcuts for multi option policy
+
+    /// Set the multi option policy to take last
+    CRTP *take_last() {
+        auto self = static_cast<CRTP *>(this);
+        self->multi_option_policy(MultiOptionPolicy::TakeLast);
+        return self;
+    }
+
+    /// Set the multi option policy to take last
+    CRTP *take_first() {
+        auto self = static_cast<CRTP *>(this);
+        self->multi_option_policy(MultiOptionPolicy::TakeFirst);
+        return self;
+    }
+
+    /// Set the multi option policy to take all arguments
+    CRTP *take_all() {
+        auto self = static_cast<CRTP *>(this);
+        self->multi_option_policy(MultiOptionPolicy::TakeAll);
+        return self;
+    }
+
+    /// Set the multi option policy to join
+    CRTP *join() {
+        auto self = static_cast<CRTP *>(this);
+        self->multi_option_policy(MultiOptionPolicy::Join);
+        return self;
+    }
+
+    /// Set the multi option policy to join with a specific delimiter
+    CRTP *join(char delim) {
+        auto self = static_cast<CRTP *>(this);
+        self->delimiter_ = delim;
+        self->multi_option_policy(MultiOptionPolicy::Join);
+        return self;
+    }
+
+    /// Allow in a configuration file
+    CRTP *configurable(bool value = true) {
+        configurable_ = value;
+        return static_cast<CRTP *>(this);
+    }
+
+    /// Allow in a configuration file
+    CRTP *delimiter(char value = '\0') {
+        delimiter_ = value;
+        return static_cast<CRTP *>(this);
+    }
+};
+
+/// This is a version of OptionBase that only supports setting values,
+/// for defaults. It is stored as the default option in an App.
+class OptionDefaults : public OptionBase<OptionDefaults> {
+  public:
+    OptionDefaults() = default;
+
+    // Methods here need a different implementation if they are Option vs. OptionDefault
+
+    /// Take the last argument if given multiple times
+    OptionDefaults *multi_option_policy(MultiOptionPolicy value = MultiOptionPolicy::Throw) {
+        multi_option_policy_ = value;
+        return this;
+    }
+
+    /// Ignore the case of the option name
+    OptionDefaults *ignore_case(bool value = true) {
+        ignore_case_ = value;
+        return this;
+    }
+
+    /// Ignore underscores in the option name
+    OptionDefaults *ignore_underscore(bool value = true) {
+        ignore_underscore_ = value;
+        return this;
+    }
+
+    /// Disable overriding flag values with an '=<value>' segment
+    OptionDefaults *disable_flag_override(bool value = true) {
+        disable_flag_override_ = value;
+        return this;
+    }
+
+    /// set a delimiter character to split up single arguments to treat as multiple inputs
+    OptionDefaults *delimiter(char value = '\0') {
+        delimiter_ = value;
+        return this;
+    }
+};
+
+class Option : public OptionBase<Option> {
+    friend App;
+
+  protected:
+    /// @name Names
+    ///@{
+
+    /// A list of the short names (`-a`) without the leading dashes
+    std::vector<std::string> snames_{};
+
+    /// A list of the long names (`--long`) without the leading dashes
+    std::vector<std::string> lnames_{};
+
+    /// A list of the flag names with the appropriate default value, the first part of the pair should be duplicates of
+    /// what is in snames or lnames but will trigger a particular response on a flag
+    std::vector<std::pair<std::string, std::string>> default_flag_values_{};
+
+    /// a list of flag names with specified default values;
+    std::vector<std::string> fnames_{};
+
+    /// A positional name
+    std::string pname_{};
+
+    /// If given, check the environment for this option
+    std::string envname_{};
+
+    ///@}
+    /// @name Help
+    ///@{
+
+    /// The description for help strings
+    std::string description_{};
+
+    /// A human readable default value, either manually set, captured, or captured by default
+    std::string default_str_{};
+
+    /// If given, replace the text that describes the option type and usage in the help text
+    std::string option_text_{};
+
+    /// A human readable type value, set when App creates this
+    ///
+    /// This is a lambda function so "types" can be dynamic, such as when a set prints its contents.
+    std::function<std::string()> type_name_{[]() { return std::string(); }};
+
+    /// Run this function to capture a default (ignore if empty)
+    std::function<std::string()> default_function_{};
+
+    ///@}
+    /// @name Configuration
+    ///@{
+
+    /// The number of arguments that make up one option. max is the nominal type size, min is the minimum number of
+    /// strings
+    int type_size_max_{1};
+    /// The minimum number of arguments an option should be expecting
+    int type_size_min_{1};
+
+    /// The minimum number of expected values
+    int expected_min_{1};
+    /// The maximum number of expected values
+    int expected_max_{1};
+
+    /// A list of Validators to run on each value parsed
+    std::vector<Validator> validators_{};
+
+    /// A list of options that are required with this option
+    std::set<Option *> needs_{};
+
+    /// A list of options that are excluded with this option
+    std::set<Option *> excludes_{};
+
+    ///@}
+    /// @name Other
+    ///@{
+
+    /// link back up to the parent App for fallthrough
+    App *parent_{nullptr};
+
+    /// Options store a callback to do all the work
+    callback_t callback_{};
+
+    ///@}
+    /// @name Parsing results
+    ///@{
+
+    /// complete Results of parsing
+    results_t results_{};
+    /// results after reduction
+    results_t proc_results_{};
+    /// enumeration for the option state machine
+    enum class option_state : char {
+        parsing = 0,       //!< The option is currently collecting parsed results
+        validated = 2,     //!< the results have been validated
+        reduced = 4,       //!< a subset of results has been generated
+        callback_run = 6,  //!< the callback has been executed
+    };
+    /// Whether the callback has run (needed for INI parsing)
+    option_state current_option_state_{option_state::parsing};
+    /// Specify that extra args beyond type_size_max should be allowed
+    bool allow_extra_args_{false};
+    /// Specify that the option should act like a flag vs regular option
+    bool flag_like_{false};
+    /// Control option to run the callback to set the default
+    bool run_callback_for_default_{false};
+    /// flag indicating a separator needs to be injected after each argument call
+    bool inject_separator_{false};
+    /// flag indicating that the option should trigger the validation and callback chain on each result when loaded
+    bool trigger_on_result_{false};
+    /// flag indicating that the option should force the callback regardless if any results present
+    bool force_callback_{false};
+    ///@}
+
+    /// Making an option by hand is not defined, it must be made by the App class
+    Option(std::string option_name, std::string option_description, callback_t callback, App *parent)
+        : description_(std::move(option_description)), parent_(parent), callback_(std::move(callback)) {
+        std::tie(snames_, lnames_, pname_) = detail::get_names(detail::split_names(option_name));
+    }
+
+  public:
+    /// @name Basic
+    ///@{
+
+    Option(const Option &) = delete;
+    Option &operator=(const Option &) = delete;
+
+    /// Count the total number of times an option was passed
+    std::size_t count() const { return results_.size(); }
+
+    /// True if the option was not passed
+    bool empty() const { return results_.empty(); }
+
+    /// This bool operator returns true if any arguments were passed or the option callback is forced
+    explicit operator bool() const { return !empty() || force_callback_; }
+
+    /// Clear the parsed results (mostly for testing)
+    void clear() {
+        results_.clear();
+        current_option_state_ = option_state::parsing;
+    }
+
+    ///@}
+    /// @name Setting options
+    ///@{
+
+    /// Set the number of expected arguments
+    Option *expected(int value) {
+        if(value < 0) {
+            expected_min_ = -value;
+            if(expected_max_ < expected_min_) {
+                expected_max_ = expected_min_;
+            }
+            allow_extra_args_ = true;
+            flag_like_ = false;
+        } else if(value == detail::expected_max_vector_size) {
+            expected_min_ = 1;
+            expected_max_ = detail::expected_max_vector_size;
+            allow_extra_args_ = true;
+            flag_like_ = false;
+        } else {
+            expected_min_ = value;
+            expected_max_ = value;
+            flag_like_ = (expected_min_ == 0);
+        }
+        return this;
+    }
+
+    /// Set the range of expected arguments
+    Option *expected(int value_min, int value_max) {
+        if(value_min < 0) {
+            value_min = -value_min;
+        }
+
+        if(value_max < 0) {
+            value_max = detail::expected_max_vector_size;
+        }
+        if(value_max < value_min) {
+            expected_min_ = value_max;
+            expected_max_ = value_min;
+        } else {
+            expected_max_ = value_max;
+            expected_min_ = value_min;
+        }
+
+        return this;
+    }
+    /// Set the value of allow_extra_args which allows extra value arguments on the flag or option to be included
+    /// with each instance
+    Option *allow_extra_args(bool value = true) {
+        allow_extra_args_ = value;
+        return this;
+    }
+    /// Get the current value of allow extra args
+    bool get_allow_extra_args() const { return allow_extra_args_; }
+    /// Set the value of trigger_on_parse which specifies that the option callback should be triggered on every parse
+    Option *trigger_on_parse(bool value = true) {
+        trigger_on_result_ = value;
+        return this;
+    }
+    /// The status of trigger on parse
+    bool get_trigger_on_parse() const { return trigger_on_result_; }
+
+    /// Set the value of force_callback
+    Option *force_callback(bool value = true) {
+        force_callback_ = value;
+        return this;
+    }
+    /// The status of force_callback
+    bool get_force_callback() const { return force_callback_; }
+
+    /// Set the value of run_callback_for_default which controls whether the callback function should be called to set
+    /// the default This is controlled automatically but could be manipulated by the user.
+    Option *run_callback_for_default(bool value = true) {
+        run_callback_for_default_ = value;
+        return this;
+    }
+    /// Get the current value of run_callback_for_default
+    bool get_run_callback_for_default() const { return run_callback_for_default_; }
+
+    /// Adds a Validator with a built in type name
+    Option *check(Validator validator, const std::string &validator_name = "") {
+        validator.non_modifying();
+        validators_.push_back(std::move(validator));
+        if(!validator_name.empty())
+            validators_.back().name(validator_name);
+        return this;
+    }
+
+    /// Adds a Validator. Takes a const string& and returns an error message (empty if conversion/check is okay).
+    Option *check(std::function<std::string(const std::string &)> Validator,
+                  std::string Validator_description = "",
+                  std::string Validator_name = "") {
+        validators_.emplace_back(Validator, std::move(Validator_description), std::move(Validator_name));
+        validators_.back().non_modifying();
+        return this;
+    }
+
+    /// Adds a transforming Validator with a built in type name
+    Option *transform(Validator Validator, const std::string &Validator_name = "") {
+        validators_.insert(validators_.begin(), std::move(Validator));
+        if(!Validator_name.empty())
+            validators_.front().name(Validator_name);
+        return this;
+    }
+
+    /// Adds a Validator-like function that can change result
+    Option *transform(const std::function<std::string(std::string)> &func,
+                      std::string transform_description = "",
+                      std::string transform_name = "") {
+        validators_.insert(validators_.begin(),
+                           Validator(
+                               [func](std::string &val) {
+                                   val = func(val);
+                                   return std::string{};
+                               },
+                               std::move(transform_description),
+                               std::move(transform_name)));
+
+        return this;
+    }
+
+    /// Adds a user supplied function to run on each item passed in (communicate though lambda capture)
+    Option *each(const std::function<void(std::string)> &func) {
+        validators_.emplace_back(
+            [func](std::string &inout) {
+                func(inout);
+                return std::string{};
+            },
+            std::string{});
+        return this;
+    }
+    /// Get a named Validator
+    Validator *get_validator(const std::string &Validator_name = "") {
+        for(auto &Validator : validators_) {
+            if(Validator_name == Validator.get_name()) {
+                return &Validator;
+            }
+        }
+        if((Validator_name.empty()) && (!validators_.empty())) {
+            return &(validators_.front());
+        }
+        throw OptionNotFound(std::string{"Validator "} + Validator_name + " Not Found");
+    }
+
+    /// Get a Validator by index NOTE: this may not be the order of definition
+    Validator *get_validator(int index) {
+        // This is an signed int so that it is not equivalent to a pointer.
+        if(index >= 0 && index < static_cast<int>(validators_.size())) {
+            return &(validators_[static_cast<decltype(validators_)::size_type>(index)]);
+        }
+        throw OptionNotFound("Validator index is not valid");
+    }
+
+    /// Sets required options
+    Option *needs(Option *opt) {
+        if(opt != this) {
+            needs_.insert(opt);
+        }
+        return this;
+    }
+
+    /// Can find a string if needed
+    template <typename T = App> Option *needs(std::string opt_name) {
+        auto opt = static_cast<T *>(parent_)->get_option_no_throw(opt_name);
+        if(opt == nullptr) {
+            throw IncorrectConstruction::MissingOption(opt_name);
+        }
+        return needs(opt);
+    }
+
+    /// Any number supported, any mix of string and Opt
+    template <typename A, typename B, typename... ARG> Option *needs(A opt, B opt1, ARG... args) {
+        needs(opt);
+        return needs(opt1, args...);
+    }
+
+    /// Remove needs link from an option. Returns true if the option really was in the needs list.
+    bool remove_needs(Option *opt) {
+        auto iterator = std::find(std::begin(needs_), std::end(needs_), opt);
+
+        if(iterator == std::end(needs_)) {
+            return false;
+        }
+        needs_.erase(iterator);
+        return true;
+    }
+
+    /// Sets excluded options
+    Option *excludes(Option *opt) {
+        if(opt == this) {
+            throw(IncorrectConstruction("and option cannot exclude itself"));
+        }
+        excludes_.insert(opt);
+
+        // Help text should be symmetric - excluding a should exclude b
+        opt->excludes_.insert(this);
+
+        // Ignoring the insert return value, excluding twice is now allowed.
+        // (Mostly to allow both directions to be excluded by user, even though the library does it for you.)
+
+        return this;
+    }
+
+    /// Can find a string if needed
+    template <typename T = App> Option *excludes(std::string opt_name) {
+        auto opt = static_cast<T *>(parent_)->get_option_no_throw(opt_name);
+        if(opt == nullptr) {
+            throw IncorrectConstruction::MissingOption(opt_name);
+        }
+        return excludes(opt);
+    }
+
+    /// Any number supported, any mix of string and Opt
+    template <typename A, typename B, typename... ARG> Option *excludes(A opt, B opt1, ARG... args) {
+        excludes(opt);
+        return excludes(opt1, args...);
+    }
+
+    /// Remove needs link from an option. Returns true if the option really was in the needs list.
+    bool remove_excludes(Option *opt) {
+        auto iterator = std::find(std::begin(excludes_), std::end(excludes_), opt);
+
+        if(iterator == std::end(excludes_)) {
+            return false;
+        }
+        excludes_.erase(iterator);
+        return true;
+    }
+
+    /// Sets environment variable to read if no option given
+    Option *envname(std::string name) {
+        envname_ = std::move(name);
+        return this;
+    }
+
+    /// Ignore case
+    ///
+    /// The template hides the fact that we don't have the definition of App yet.
+    /// You are never expected to add an argument to the template here.
+    template <typename T = App> Option *ignore_case(bool value = true) {
+        if(!ignore_case_ && value) {
+            ignore_case_ = value;
+            auto *parent = static_cast<T *>(parent_);
+            for(const Option_p &opt : parent->options_) {
+                if(opt.get() == this) {
+                    continue;
+                }
+                auto &omatch = opt->matching_name(*this);
+                if(!omatch.empty()) {
+                    ignore_case_ = false;
+                    throw OptionAlreadyAdded("adding ignore case caused a name conflict with " + omatch);
+                }
+            }
+        } else {
+            ignore_case_ = value;
+        }
+        return this;
+    }
+
+    /// Ignore underscores in the option names
+    ///
+    /// The template hides the fact that we don't have the definition of App yet.
+    /// You are never expected to add an argument to the template here.
+    template <typename T = App> Option *ignore_underscore(bool value = true) {
+
+        if(!ignore_underscore_ && value) {
+            ignore_underscore_ = value;
+            auto *parent = static_cast<T *>(parent_);
+            for(const Option_p &opt : parent->options_) {
+                if(opt.get() == this) {
+                    continue;
+                }
+                auto &omatch = opt->matching_name(*this);
+                if(!omatch.empty()) {
+                    ignore_underscore_ = false;
+                    throw OptionAlreadyAdded("adding ignore underscore caused a name conflict with " + omatch);
+                }
+            }
+        } else {
+            ignore_underscore_ = value;
+        }
+        return this;
+    }
+
+    /// Take the last argument if given multiple times (or another policy)
+    Option *multi_option_policy(MultiOptionPolicy value = MultiOptionPolicy::Throw) {
+        if(value != multi_option_policy_) {
+            if(multi_option_policy_ == MultiOptionPolicy::Throw && expected_max_ == detail::expected_max_vector_size &&
+               expected_min_ > 1) {  // this bizarre condition is to maintain backwards compatibility
+                                     // with the previous behavior of expected_ with vectors
+                expected_max_ = expected_min_;
+            }
+            multi_option_policy_ = value;
+            current_option_state_ = option_state::parsing;
+        }
+        return this;
+    }
+
+    /// Disable flag overrides values, e.g. --flag=<value> is not allowed
+    Option *disable_flag_override(bool value = true) {
+        disable_flag_override_ = value;
+        return this;
+    }
+    ///@}
+    /// @name Accessors
+    ///@{
+
+    /// The number of arguments the option expects
+    int get_type_size() const { return type_size_min_; }
+
+    /// The minimum number of arguments the option expects
+    int get_type_size_min() const { return type_size_min_; }
+    /// The maximum number of arguments the option expects
+    int get_type_size_max() const { return type_size_max_; }
+
+    /// Return the inject_separator flag
+    int get_inject_separator() const { return inject_separator_; }
+
+    /// The environment variable associated to this value
+    std::string get_envname() const { return envname_; }
+
+    /// The set of options needed
+    std::set<Option *> get_needs() const { return needs_; }
+
+    /// The set of options excluded
+    std::set<Option *> get_excludes() const { return excludes_; }
+
+    /// The default value (for help printing)
+    std::string get_default_str() const { return default_str_; }
+
+    /// Get the callback function
+    callback_t get_callback() const { return callback_; }
+
+    /// Get the long names
+    const std::vector<std::string> &get_lnames() const { return lnames_; }
+
+    /// Get the short names
+    const std::vector<std::string> &get_snames() const { return snames_; }
+
+    /// Get the flag names with specified default values
+    const std::vector<std::string> &get_fnames() const { return fnames_; }
+    /// Get a single name for the option, first of lname, pname, sname, envname
+    const std::string &get_single_name() const {
+        if(!lnames_.empty()) {
+            return lnames_[0];
+        }
+        if(!pname_.empty()) {
+            return pname_;
+        }
+        if(!snames_.empty()) {
+            return snames_[0];
+        }
+        return envname_;
+    }
+    /// The number of times the option expects to be included
+    int get_expected() const { return expected_min_; }
+
+    /// The number of times the option expects to be included
+    int get_expected_min() const { return expected_min_; }
+    /// The max number of times the option expects to be included
+    int get_expected_max() const { return expected_max_; }
+
+    /// The total min number of expected  string values to be used
+    int get_items_expected_min() const { return type_size_min_ * expected_min_; }
+
+    /// Get the maximum number of items expected to be returned and used for the callback
+    int get_items_expected_max() const {
+        int t = type_size_max_;
+        return detail::checked_multiply(t, expected_max_) ? t : detail::expected_max_vector_size;
+    }
+    /// The total min number of expected  string values to be used
+    int get_items_expected() const { return get_items_expected_min(); }
+
+    /// True if the argument can be given directly
+    bool get_positional() const { return pname_.length() > 0; }
+
+    /// True if option has at least one non-positional name
+    bool nonpositional() const { return (snames_.size() + lnames_.size()) > 0; }
+
+    /// True if option has description
+    bool has_description() const { return description_.length() > 0; }
+
+    /// Get the description
+    const std::string &get_description() const { return description_; }
+
+    /// Set the description
+    Option *description(std::string option_description) {
+        description_ = std::move(option_description);
+        return this;
+    }
+
+    Option *option_text(std::string text) {
+        option_text_ = std::move(text);
+        return this;
+    }
+
+    const std::string &get_option_text() const { return option_text_; }
+
+    ///@}
+    /// @name Help tools
+    ///@{
+
+    /// \brief Gets a comma separated list of names.
+    /// Will include / prefer the positional name if positional is true.
+    /// If all_options is false, pick just the most descriptive name to show.
+    /// Use `get_name(true)` to get the positional name (replaces `get_pname`)
+    std::string get_name(bool positional = false,  ///< Show the positional name
+                         bool all_options = false  ///< Show every option
+    ) const {
+        if(get_group().empty())
+            return {};  // Hidden
+
+        if(all_options) {
+
+            std::vector<std::string> name_list;
+
+            /// The all list will never include a positional unless asked or that's the only name.
+            if((positional && (!pname_.empty())) || (snames_.empty() && lnames_.empty())) {
+                name_list.push_back(pname_);
+            }
+            if((get_items_expected() == 0) && (!fnames_.empty())) {
+                for(const std::string &sname : snames_) {
+                    name_list.push_back("-" + sname);
+                    if(check_fname(sname)) {
+                        name_list.back() += "{" + get_flag_value(sname, "") + "}";
+                    }
+                }
+
+                for(const std::string &lname : lnames_) {
+                    name_list.push_back("--" + lname);
+                    if(check_fname(lname)) {
+                        name_list.back() += "{" + get_flag_value(lname, "") + "}";
+                    }
+                }
+            } else {
+                for(const std::string &sname : snames_)
+                    name_list.push_back("-" + sname);
+
+                for(const std::string &lname : lnames_)
+                    name_list.push_back("--" + lname);
+            }
+
+            return detail::join(name_list);
+        }
+
+        // This returns the positional name no matter what
+        if(positional)
+            return pname_;
+
+        // Prefer long name
+        if(!lnames_.empty())
+            return std::string(2, '-') + lnames_[0];
+
+        // Or short name if no long name
+        if(!snames_.empty())
+            return std::string(1, '-') + snames_[0];
+
+        // If positional is the only name, it's okay to use that
+        return pname_;
+    }
+
+    ///@}
+    /// @name Parser tools
+    ///@{
+
+    /// Process the callback
+    void run_callback() {
+        if(force_callback_ && results_.empty()) {
+            add_result(default_str_);
+        }
+        if(current_option_state_ == option_state::parsing) {
+            _validate_results(results_);
+            current_option_state_ = option_state::validated;
+        }
+
+        if(current_option_state_ < option_state::reduced) {
+            _reduce_results(proc_results_, results_);
+            current_option_state_ = option_state::reduced;
+        }
+        if(current_option_state_ >= option_state::reduced) {
+            current_option_state_ = option_state::callback_run;
+            if(!(callback_)) {
+                return;
+            }
+            const results_t &send_results = proc_results_.empty() ? results_ : proc_results_;
+            bool local_result = callback_(send_results);
+
+            if(!local_result)
+                throw ConversionError(get_name(), results_);
+        }
+    }
+
+    /// If options share any of the same names, find it
+    const std::string &matching_name(const Option &other) const {
+        static const std::string estring;
+        for(const std::string &sname : snames_)
+            if(other.check_sname(sname))
+                return sname;
+        for(const std::string &lname : lnames_)
+            if(other.check_lname(lname))
+                return lname;
+
+        if(ignore_case_ ||
+           ignore_underscore_) {  // We need to do the inverse, in case we are ignore_case or ignore underscore
+            for(const std::string &sname : other.snames_)
+                if(check_sname(sname))
+                    return sname;
+            for(const std::string &lname : other.lnames_)
+                if(check_lname(lname))
+                    return lname;
+        }
+        return estring;
+    }
+    /// If options share any of the same names, they are equal (not counting positional)
+    bool operator==(const Option &other) const { return !matching_name(other).empty(); }
+
+    /// Check a name. Requires "-" or "--" for short / long, supports positional name
+    bool check_name(const std::string &name) const {
+
+        if(name.length() > 2 && name[0] == '-' && name[1] == '-')
+            return check_lname(name.substr(2));
+        if(name.length() > 1 && name.front() == '-')
+            return check_sname(name.substr(1));
+        if(!pname_.empty()) {
+            std::string local_pname = pname_;
+            std::string local_name = name;
+            if(ignore_underscore_) {
+                local_pname = detail::remove_underscore(local_pname);
+                local_name = detail::remove_underscore(local_name);
+            }
+            if(ignore_case_) {
+                local_pname = detail::to_lower(local_pname);
+                local_name = detail::to_lower(local_name);
+            }
+            if(local_name == local_pname) {
+                return true;
+            }
+        }
+
+        if(!envname_.empty()) {
+            // this needs to be the original since envname_ shouldn't match on case insensitivity
+            return (name == envname_);
+        }
+        return false;
+    }
+
+    /// Requires "-" to be removed from string
+    bool check_sname(std::string name) const {
+        return (detail::find_member(std::move(name), snames_, ignore_case_) >= 0);
+    }
+
+    /// Requires "--" to be removed from string
+    bool check_lname(std::string name) const {
+        return (detail::find_member(std::move(name), lnames_, ignore_case_, ignore_underscore_) >= 0);
+    }
+
+    /// Requires "--" to be removed from string
+    bool check_fname(std::string name) const {
+        if(fnames_.empty()) {
+            return false;
+        }
+        return (detail::find_member(std::move(name), fnames_, ignore_case_, ignore_underscore_) >= 0);
+    }
+
+    /// Get the value that goes for a flag, nominally gets the default value but allows for overrides if not
+    /// disabled
+    std::string get_flag_value(const std::string &name, std::string input_value) const {
+        static const std::string trueString{"true"};
+        static const std::string falseString{"false"};
+        static const std::string emptyString{"{}"};
+        // check for disable flag override_
+        if(disable_flag_override_) {
+            if(!((input_value.empty()) || (input_value == emptyString))) {
+                auto default_ind = detail::find_member(name, fnames_, ignore_case_, ignore_underscore_);
+                if(default_ind >= 0) {
+                    // We can static cast this to std::size_t because it is more than 0 in this block
+                    if(default_flag_values_[static_cast<std::size_t>(default_ind)].second != input_value) {
+                        throw(ArgumentMismatch::FlagOverride(name));
+                    }
+                } else {
+                    if(input_value != trueString) {
+                        throw(ArgumentMismatch::FlagOverride(name));
+                    }
+                }
+            }
+        }
+        auto ind = detail::find_member(name, fnames_, ignore_case_, ignore_underscore_);
+        if((input_value.empty()) || (input_value == emptyString)) {
+            if(flag_like_) {
+                return (ind < 0) ? trueString : default_flag_values_[static_cast<std::size_t>(ind)].second;
+            } else {
+                return (ind < 0) ? default_str_ : default_flag_values_[static_cast<std::size_t>(ind)].second;
+            }
+        }
+        if(ind < 0) {
+            return input_value;
+        }
+        if(default_flag_values_[static_cast<std::size_t>(ind)].second == falseString) {
+            try {
+                auto val = detail::to_flag_value(input_value);
+                return (val == 1) ? falseString : (val == (-1) ? trueString : std::to_string(-val));
+            } catch(const std::invalid_argument &) {
+                return input_value;
+            }
+        } else {
+            return input_value;
+        }
+    }
+
+    /// Puts a result at the end
+    Option *add_result(std::string s) {
+        _add_result(std::move(s), results_);
+        current_option_state_ = option_state::parsing;
+        return this;
+    }
+
+    /// Puts a result at the end and get a count of the number of arguments actually added
+    Option *add_result(std::string s, int &results_added) {
+        results_added = _add_result(std::move(s), results_);
+        current_option_state_ = option_state::parsing;
+        return this;
+    }
+
+    /// Puts a result at the end
+    Option *add_result(std::vector<std::string> s) {
+        current_option_state_ = option_state::parsing;
+        for(auto &str : s) {
+            _add_result(std::move(str), results_);
+        }
+        return this;
+    }
+
+    /// Get the current complete results set
+    const results_t &results() const { return results_; }
+
+    /// Get a copy of the results
+    results_t reduced_results() const {
+        results_t res = proc_results_.empty() ? results_ : proc_results_;
+        if(current_option_state_ < option_state::reduced) {
+            if(current_option_state_ == option_state::parsing) {
+                res = results_;
+                _validate_results(res);
+            }
+            if(!res.empty()) {
+                results_t extra;
+                _reduce_results(extra, res);
+                if(!extra.empty()) {
+                    res = std::move(extra);
+                }
+            }
+        }
+        return res;
+    }
+
+    /// Get the results as a specified type
+    template <typename T> void results(T &output) const {
+        bool retval;
+        if(current_option_state_ >= option_state::reduced || (results_.size() == 1 && validators_.empty())) {
+            const results_t &res = (proc_results_.empty()) ? results_ : proc_results_;
+            retval = detail::lexical_conversion<T, T>(res, output);
+        } else {
+            results_t res;
+            if(results_.empty()) {
+                if(!default_str_.empty()) {
+                    // _add_results takes an rvalue only
+                    _add_result(std::string(default_str_), res);
+                    _validate_results(res);
+                    results_t extra;
+                    _reduce_results(extra, res);
+                    if(!extra.empty()) {
+                        res = std::move(extra);
+                    }
+                } else {
+                    res.emplace_back();
+                }
+            } else {
+                res = reduced_results();
+            }
+            retval = detail::lexical_conversion<T, T>(res, output);
+        }
+        if(!retval) {
+            throw ConversionError(get_name(), results_);
+        }
+    }
+
+    /// Return the results as the specified type
+    template <typename T> T as() const {
+        T output;
+        results(output);
+        return output;
+    }
+
+    /// See if the callback has been run already
+    bool get_callback_run() const { return (current_option_state_ == option_state::callback_run); }
+
+    ///@}
+    /// @name Custom options
+    ///@{
+
+    /// Set the type function to run when displayed on this option
+    Option *type_name_fn(std::function<std::string()> typefun) {
+        type_name_ = std::move(typefun);
+        return this;
+    }
+
+    /// Set a custom option typestring
+    Option *type_name(std::string typeval) {
+        type_name_fn([typeval]() { return typeval; });
+        return this;
+    }
+
+    /// Set a custom option size
+    Option *type_size(int option_type_size) {
+        if(option_type_size < 0) {
+            // this section is included for backwards compatibility
+            type_size_max_ = -option_type_size;
+            type_size_min_ = -option_type_size;
+            expected_max_ = detail::expected_max_vector_size;
+        } else {
+            type_size_max_ = option_type_size;
+            if(type_size_max_ < detail::expected_max_vector_size) {
+                type_size_min_ = option_type_size;
+            } else {
+                inject_separator_ = true;
+            }
+            if(type_size_max_ == 0)
+                required_ = false;
+        }
+        return this;
+    }
+    /// Set a custom option type size range
+    Option *type_size(int option_type_size_min, int option_type_size_max) {
+        if(option_type_size_min < 0 || option_type_size_max < 0) {
+            // this section is included for backwards compatibility
+            expected_max_ = detail::expected_max_vector_size;
+            option_type_size_min = (std::abs)(option_type_size_min);
+            option_type_size_max = (std::abs)(option_type_size_max);
+        }
+
+        if(option_type_size_min > option_type_size_max) {
+            type_size_max_ = option_type_size_min;
+            type_size_min_ = option_type_size_max;
+        } else {
+            type_size_min_ = option_type_size_min;
+            type_size_max_ = option_type_size_max;
+        }
+        if(type_size_max_ == 0) {
+            required_ = false;
+        }
+        if(type_size_max_ >= detail::expected_max_vector_size) {
+            inject_separator_ = true;
+        }
+        return this;
+    }
+
+    /// Set the value of the separator injection flag
+    void inject_separator(bool value = true) { inject_separator_ = value; }
+
+    /// Set a capture function for the default. Mostly used by App.
+    Option *default_function(const std::function<std::string()> &func) {
+        default_function_ = func;
+        return this;
+    }
+
+    /// Capture the default value from the original value (if it can be captured)
+    Option *capture_default_str() {
+        if(default_function_) {
+            default_str_ = default_function_();
+        }
+        return this;
+    }
+
+    /// Set the default value string representation (does not change the contained value)
+    Option *default_str(std::string val) {
+        default_str_ = std::move(val);
+        return this;
+    }
+
+    /// Set the default value and validate the results and run the callback if appropriate to set the value into the
+    /// bound value only available for types that can be converted to a string
+    template <typename X> Option *default_val(const X &val) {
+        std::string val_str = detail::to_string(val);
+        auto old_option_state = current_option_state_;
+        results_t old_results{std::move(results_)};
+        results_.clear();
+        try {
+            add_result(val_str);
+            // if trigger_on_result_ is set the callback already ran
+            if(run_callback_for_default_ && !trigger_on_result_) {
+                run_callback();  // run callback sets the state we need to reset it again
+                current_option_state_ = option_state::parsing;
+            } else {
+                _validate_results(results_);
+                current_option_state_ = old_option_state;
+            }
+        } catch(const CLI::Error &) {
+            // this should be done
+            results_ = std::move(old_results);
+            current_option_state_ = old_option_state;
+            throw;
+        }
+        results_ = std::move(old_results);
+        default_str_ = std::move(val_str);
+        return this;
+    }
+
+    /// Get the full typename for this option
+    std::string get_type_name() const {
+        std::string full_type_name = type_name_();
+        if(!validators_.empty()) {
+            for(auto &Validator : validators_) {
+                std::string vtype = Validator.get_description();
+                if(!vtype.empty()) {
+                    full_type_name += ":" + vtype;
+                }
+            }
+        }
+        return full_type_name;
+    }
+
+  private:
+    /// Run the results through the Validators
+    void _validate_results(results_t &res) const {
+        // Run the Validators (can change the string)
+        if(!validators_.empty()) {
+            if(type_size_max_ > 1) {  // in this context index refers to the index in the type
+                int index = 0;
+                if(get_items_expected_max() < static_cast<int>(res.size()) &&
+                   multi_option_policy_ == CLI::MultiOptionPolicy::TakeLast) {
+                    // create a negative index for the earliest ones
+                    index = get_items_expected_max() - static_cast<int>(res.size());
+                }
+
+                for(std::string &result : res) {
+                    if(detail::is_separator(result) && type_size_max_ != type_size_min_ && index >= 0) {
+                        index = 0;  // reset index for variable size chunks
+                        continue;
+                    }
+                    auto err_msg = _validate(result, (index >= 0) ? (index % type_size_max_) : index);
+                    if(!err_msg.empty())
+                        throw ValidationError(get_name(), err_msg);
+                    ++index;
+                }
+            } else {
+                int index = 0;
+                if(expected_max_ < static_cast<int>(res.size()) &&
+                   multi_option_policy_ == CLI::MultiOptionPolicy::TakeLast) {
+                    // create a negative index for the earliest ones
+                    index = expected_max_ - static_cast<int>(res.size());
+                }
+                for(std::string &result : res) {
+                    auto err_msg = _validate(result, index);
+                    ++index;
+                    if(!err_msg.empty())
+                        throw ValidationError(get_name(), err_msg);
+                }
+            }
+        }
+    }
+
+    /** reduce the results in accordance with the MultiOptionPolicy
+    @param[out] res results are assigned to res if there if they are different
+    */
+    void _reduce_results(results_t &res, const results_t &original) const {
+
+        // max num items expected or length of vector, always at least 1
+        // Only valid for a trimming policy
+
+        res.clear();
+        // Operation depends on the policy setting
+        switch(multi_option_policy_) {
+        case MultiOptionPolicy::TakeAll:
+            break;
+        case MultiOptionPolicy::TakeLast: {
+            // Allow multi-option sizes (including 0)
+            std::size_t trim_size = std::min<std::size_t>(
+                static_cast<std::size_t>(std::max<int>(get_items_expected_max(), 1)), original.size());
+            if(original.size() != trim_size) {
+                res.assign(original.end() - static_cast<results_t::difference_type>(trim_size), original.end());
+            }
+        } break;
+        case MultiOptionPolicy::TakeFirst: {
+            std::size_t trim_size = std::min<std::size_t>(
+                static_cast<std::size_t>(std::max<int>(get_items_expected_max(), 1)), original.size());
+            if(original.size() != trim_size) {
+                res.assign(original.begin(), original.begin() + static_cast<results_t::difference_type>(trim_size));
+            }
+        } break;
+        case MultiOptionPolicy::Join:
+            if(results_.size() > 1) {
+                res.push_back(detail::join(original, std::string(1, (delimiter_ == '\0') ? '\n' : delimiter_)));
+            }
+            break;
+        case MultiOptionPolicy::Throw:
+        default: {
+            auto num_min = static_cast<std::size_t>(get_items_expected_min());
+            auto num_max = static_cast<std::size_t>(get_items_expected_max());
+            if(num_min == 0) {
+                num_min = 1;
+            }
+            if(num_max == 0) {
+                num_max = 1;
+            }
+            if(original.size() < num_min) {
+                throw ArgumentMismatch::AtLeast(get_name(), static_cast<int>(num_min), original.size());
+            }
+            if(original.size() > num_max) {
+                throw ArgumentMismatch::AtMost(get_name(), static_cast<int>(num_max), original.size());
+            }
+            break;
+        }
+        }
+    }
+
+    // Run a result through the Validators
+    std::string _validate(std::string &result, int index) const {
+        std::string err_msg;
+        if(result.empty() && expected_min_ == 0) {
+            // an empty with nothing expected is allowed
+            return err_msg;
+        }
+        for(const auto &vali : validators_) {
+            auto v = vali.get_application_index();
+            if(v == -1 || v == index) {
+                try {
+                    err_msg = vali(result);
+                } catch(const ValidationError &err) {
+                    err_msg = err.what();
+                }
+                if(!err_msg.empty())
+                    break;
+            }
+        }
+
+        return err_msg;
+    }
+
+    /// Add a single result to the result set, taking into account delimiters
+    int _add_result(std::string &&result, std::vector<std::string> &res) const {
+        int result_count = 0;
+        if(allow_extra_args_ && !result.empty() && result.front() == '[' &&
+           result.back() == ']') {  // this is now a vector string likely from the default or user entry
+            result.pop_back();
+
+            for(auto &var : CLI::detail::split(result.substr(1), ',')) {
+                if(!var.empty()) {
+                    result_count += _add_result(std::move(var), res);
+                }
+            }
+            return result_count;
+        }
+        if(delimiter_ == '\0') {
+            res.push_back(std::move(result));
+            ++result_count;
+        } else {
+            if((result.find_first_of(delimiter_) != std::string::npos)) {
+                for(const auto &var : CLI::detail::split(result, delimiter_)) {
+                    if(!var.empty()) {
+                        res.push_back(var);
+                        ++result_count;
+                    }
+                }
+            } else {
+                res.push_back(std::move(result));
+                ++result_count;
+            }
+        }
+        return result_count;
+    }
+};  // namespace CLI
+
+
+
+
+#ifndef CLI11_PARSE
+#define CLI11_PARSE(app, argc, argv)                                                                                   \
+    try {                                                                                                              \
+        (app).parse((argc), (argv));                                                                                   \
+    } catch(const CLI::ParseError &e) {                                                                                \
+        return (app).exit(e);                                                                                          \
+    }
+#endif
+
+namespace detail {
+enum class Classifier { NONE, POSITIONAL_MARK, SHORT, LONG, WINDOWS_STYLE, SUBCOMMAND, SUBCOMMAND_TERMINATOR };
+struct AppFriend;
+}  // namespace detail
+
+namespace FailureMessage {
+std::string simple(const App *app, const Error &e);
+std::string help(const App *app, const Error &e);
+}  // namespace FailureMessage
+
+/// enumeration of modes of how to deal with extras in config files
+
+enum class config_extras_mode : char { error = 0, ignore, ignore_all, capture };
+
+class App;
+
+using App_p = std::shared_ptr<App>;
+
+class Option_group;
+/// Creates a command line program, with very few defaults.
+/** To use, create a new `Program()` instance with `argc`, `argv`, and a help description. The templated
+ *  add_option methods make it easy to prepare options. Remember to call `.start` before starting your
+ * program, so that the options can be evaluated and the help option doesn't accidentally run your program. */
+class App {
+    friend Option;
+    friend detail::AppFriend;
+
+  protected:
+    // This library follows the Google style guide for member names ending in underscores
+
+    /// @name Basics
+    ///@{
+
+    /// Subcommand name or program name (from parser if name is empty)
+    std::string name_{};
+
+    /// Description of the current program/subcommand
+    std::string description_{};
+
+    /// If true, allow extra arguments (ie, don't throw an error). INHERITABLE
+    bool allow_extras_{false};
+
+    /// If ignore, allow extra arguments in the ini file (ie, don't throw an error). INHERITABLE
+    /// if error error on an extra argument, and if capture feed it to the app
+    config_extras_mode allow_config_extras_{config_extras_mode::ignore};
+
+    ///  If true, return immediately on an unrecognized option (implies allow_extras) INHERITABLE
+    bool prefix_command_{false};
+
+    /// If set to true the name was automatically generated from the command line vs a user set name
+    bool has_automatic_name_{false};
+
+    /// If set to true the subcommand is required to be processed and used, ignored for main app
+    bool required_{false};
+
+    /// If set to true the subcommand is disabled and cannot be used, ignored for main app
+    bool disabled_{false};
+
+    /// Flag indicating that the pre_parse_callback has been triggered
+    bool pre_parse_called_{false};
+
+    /// Flag indicating that the callback for the subcommand should be executed immediately on parse completion which is
+    /// before help or ini files are processed. INHERITABLE
+    bool immediate_callback_{false};
+
+    /// This is a function that runs prior to the start of parsing
+    std::function<void(std::size_t)> pre_parse_callback_{};
+
+    /// This is a function that runs when parsing has finished.
+    std::function<void()> parse_complete_callback_{};
+
+    /// This is a function that runs when all processing has completed
+    std::function<void()> final_callback_{};
+
+    ///@}
+    /// @name Options
+    ///@{
+
+    /// The default values for options, customizable and changeable INHERITABLE
+    OptionDefaults option_defaults_{};
+
+    /// The list of options, stored locally
+    std::vector<Option_p> options_{};
+
+    ///@}
+    /// @name Help
+    ///@{
+
+    /// Footer to put after all options in the help output INHERITABLE
+    std::string footer_{};
+
+    /// This is a function that generates a footer to put after all other options in help output
+    std::function<std::string()> footer_callback_{};
+
+    /// A pointer to the help flag if there is one INHERITABLE
+    Option *help_ptr_{nullptr};
+
+    /// A pointer to the help all flag if there is one INHERITABLE
+    Option *help_all_ptr_{nullptr};
+
+    /// A pointer to a version flag if there is one
+    Option *version_ptr_{nullptr};
+
+    /// This is the formatter for help printing. Default provided. INHERITABLE (same pointer)
+    std::shared_ptr<FormatterBase> formatter_{new Formatter()};
+
+    /// The error message printing function INHERITABLE
+    std::function<std::string(const App *, const Error &e)> failure_message_{FailureMessage::simple};
+
+    ///@}
+    /// @name Parsing
+    ///@{
+
+    using missing_t = std::vector<std::pair<detail::Classifier, std::string>>;
+
+    /// Pair of classifier, string for missing options. (extra detail is removed on returning from parse)
+    ///
+    /// This is faster and cleaner than storing just a list of strings and reparsing. This may contain the -- separator.
+    missing_t missing_{};
+
+    /// This is a list of pointers to options with the original parse order
+    std::vector<Option *> parse_order_{};
+
+    /// This is a list of the subcommands collected, in order
+    std::vector<App *> parsed_subcommands_{};
+
+    /// this is a list of subcommands that are exclusionary to this one
+    std::set<App *> exclude_subcommands_{};
+
+    /// This is a list of options which are exclusionary to this App, if the options were used this subcommand should
+    /// not be
+    std::set<Option *> exclude_options_{};
+
+    /// this is a list of subcommands or option groups that are required by this one, the list is not mutual,  the
+    /// listed subcommands do not require this one
+    std::set<App *> need_subcommands_{};
+
+    /// This is a list of options which are required by this app, the list is not mutual, listed options do not need the
+    /// subcommand not be
+    std::set<Option *> need_options_{};
+
+    ///@}
+    /// @name Subcommands
+    ///@{
+
+    /// Storage for subcommand list
+    std::vector<App_p> subcommands_{};
+
+    /// If true, the program name is not case sensitive INHERITABLE
+    bool ignore_case_{false};
+
+    /// If true, the program should ignore underscores INHERITABLE
+    bool ignore_underscore_{false};
+
+    /// Allow subcommand fallthrough, so that parent commands can collect commands after subcommand.  INHERITABLE
+    bool fallthrough_{false};
+
+    /// Allow '/' for options for Windows like options. Defaults to true on Windows, false otherwise. INHERITABLE
+    bool allow_windows_style_options_{
+#ifdef _WIN32
+        true
+#else
+        false
+#endif
+    };
+    /// specify that positional arguments come at the end of the argument sequence not inheritable
+    bool positionals_at_end_{false};
+
+    enum class startup_mode : char { stable, enabled, disabled };
+    /// specify the startup mode for the app
+    /// stable=no change, enabled= startup enabled, disabled=startup disabled
+    startup_mode default_startup{startup_mode::stable};
+
+    /// if set to true the subcommand can be triggered via configuration files INHERITABLE
+    bool configurable_{false};
+
+    /// If set to true positional options are validated before assigning INHERITABLE
+    bool validate_positionals_{false};
+
+    /// indicator that the subcommand is silent and won't show up in subcommands list
+    /// This is potentially useful as a modifier subcommand
+    bool silent_{false};
+
+    /// Counts the number of times this command/subcommand was parsed
+    std::uint32_t parsed_{0U};
+
+    /// Minimum required subcommands (not inheritable!)
+    std::size_t require_subcommand_min_{0};
+
+    /// Max number of subcommands allowed (parsing stops after this number). 0 is unlimited INHERITABLE
+    std::size_t require_subcommand_max_{0};
+
+    /// Minimum required options (not inheritable!)
+    std::size_t require_option_min_{0};
+
+    /// Max number of options allowed. 0 is unlimited (not inheritable)
+    std::size_t require_option_max_{0};
+
+    /// A pointer to the parent if this is a subcommand
+    App *parent_{nullptr};
+
+    /// The group membership INHERITABLE
+    std::string group_{"Subcommands"};
+
+    /// Alias names for the subcommand
+    std::vector<std::string> aliases_{};
+
+    ///@}
+    /// @name Config
+    ///@{
+
+    /// Pointer to the config option
+    Option *config_ptr_{nullptr};
+
+    /// This is the formatter for help printing. Default provided. INHERITABLE (same pointer)
+    std::shared_ptr<Config> config_formatter_{new ConfigTOML()};
+
+    ///@}
+
+    /// Special private constructor for subcommand
+    App(std::string app_description, std::string app_name, App *parent)
+        : name_(std::move(app_name)), description_(std::move(app_description)), parent_(parent) {
+        // Inherit if not from a nullptr
+        if(parent_ != nullptr) {
+            if(parent_->help_ptr_ != nullptr)
+                set_help_flag(parent_->help_ptr_->get_name(false, true), parent_->help_ptr_->get_description());
+            if(parent_->help_all_ptr_ != nullptr)
+                set_help_all_flag(parent_->help_all_ptr_->get_name(false, true),
+                                  parent_->help_all_ptr_->get_description());
+
+            /// OptionDefaults
+            option_defaults_ = parent_->option_defaults_;
+
+            // INHERITABLE
+            failure_message_ = parent_->failure_message_;
+            allow_extras_ = parent_->allow_extras_;
+            allow_config_extras_ = parent_->allow_config_extras_;
+            prefix_command_ = parent_->prefix_command_;
+            immediate_callback_ = parent_->immediate_callback_;
+            ignore_case_ = parent_->ignore_case_;
+            ignore_underscore_ = parent_->ignore_underscore_;
+            fallthrough_ = parent_->fallthrough_;
+            validate_positionals_ = parent_->validate_positionals_;
+            configurable_ = parent_->configurable_;
+            allow_windows_style_options_ = parent_->allow_windows_style_options_;
+            group_ = parent_->group_;
+            footer_ = parent_->footer_;
+            formatter_ = parent_->formatter_;
+            config_formatter_ = parent_->config_formatter_;
+            require_subcommand_max_ = parent_->require_subcommand_max_;
+        }
+    }
+
+  public:
+    /// @name Basic
+    ///@{
+
+    /// Create a new program. Pass in the same arguments as main(), along with a help string.
+    explicit App(std::string app_description = "", std::string app_name = "")
+        : App(app_description, app_name, nullptr) {
+        set_help_flag("-h,--help", "Print this help message and exit");
+    }
+
+    App(const App &) = delete;
+    App &operator=(const App &) = delete;
+
+    /// virtual destructor
+    virtual ~App() = default;
+
+    /// Set a callback for execution when all parsing and processing has completed
+    ///
+    /// Due to a bug in c++11,
+    /// it is not possible to overload on std::function (fixed in c++14
+    /// and backported to c++11 on newer compilers). Use capture by reference
+    /// to get a pointer to App if needed.
+    App *callback(std::function<void()> app_callback) {
+        if(immediate_callback_) {
+            parse_complete_callback_ = std::move(app_callback);
+        } else {
+            final_callback_ = std::move(app_callback);
+        }
+        return this;
+    }
+
+    /// Set a callback for execution when all parsing and processing has completed
+    /// aliased as callback
+    App *final_callback(std::function<void()> app_callback) {
+        final_callback_ = std::move(app_callback);
+        return this;
+    }
+
+    /// Set a callback to execute when parsing has completed for the app
+    ///
+    App *parse_complete_callback(std::function<void()> pc_callback) {
+        parse_complete_callback_ = std::move(pc_callback);
+        return this;
+    }
+
+    /// Set a callback to execute prior to parsing.
+    ///
+    App *preparse_callback(std::function<void(std::size_t)> pp_callback) {
+        pre_parse_callback_ = std::move(pp_callback);
+        return this;
+    }
+
+    /// Set a name for the app (empty will use parser to set the name)
+    App *name(std::string app_name = "") {
+
+        if(parent_ != nullptr) {
+            auto oname = name_;
+            name_ = app_name;
+            auto &res = _compare_subcommand_names(*this, *_get_fallthrough_parent());
+            if(!res.empty()) {
+                name_ = oname;
+                throw(OptionAlreadyAdded(app_name + " conflicts with existing subcommand names"));
+            }
+        } else {
+            name_ = app_name;
+        }
+        has_automatic_name_ = false;
+        return this;
+    }
+
+    /// Set an alias for the app
+    App *alias(std::string app_name) {
+        if(app_name.empty() || !detail::valid_alias_name_string(app_name)) {
+            throw IncorrectConstruction("Aliases may not be empty or contain newlines or null characters");
+        }
+        if(parent_ != nullptr) {
+            aliases_.push_back(app_name);
+            auto &res = _compare_subcommand_names(*this, *_get_fallthrough_parent());
+            if(!res.empty()) {
+                aliases_.pop_back();
+                throw(OptionAlreadyAdded("alias already matches an existing subcommand: " + app_name));
+            }
+        } else {
+            aliases_.push_back(app_name);
+        }
+
+        return this;
+    }
+
+    /// Remove the error when extras are left over on the command line.
+    App *allow_extras(bool allow = true) {
+        allow_extras_ = allow;
+        return this;
+    }
+
+    /// Remove the error when extras are left over on the command line.
+    App *required(bool require = true) {
+        required_ = require;
+        return this;
+    }
+
+    /// Disable the subcommand or option group
+    App *disabled(bool disable = true) {
+        disabled_ = disable;
+        return this;
+    }
+
+    /// silence the subcommand from showing up in the processed list
+    App *silent(bool silence = true) {
+        silent_ = silence;
+        return this;
+    }
+
+    /// Set the subcommand to be disabled by default, so on clear(), at the start of each parse it is disabled
+    App *disabled_by_default(bool disable = true) {
+        if(disable) {
+            default_startup = startup_mode::disabled;
+        } else {
+            default_startup = (default_startup == startup_mode::enabled) ? startup_mode::enabled : startup_mode::stable;
+        }
+        return this;
+    }
+
+    /// Set the subcommand to be enabled by default, so on clear(), at the start of each parse it is enabled (not
+    /// disabled)
+    App *enabled_by_default(bool enable = true) {
+        if(enable) {
+            default_startup = startup_mode::enabled;
+        } else {
+            default_startup =
+                (default_startup == startup_mode::disabled) ? startup_mode::disabled : startup_mode::stable;
+        }
+        return this;
+    }
+
+    /// Set the subcommand callback to be executed immediately on subcommand completion
+    App *immediate_callback(bool immediate = true) {
+        immediate_callback_ = immediate;
+        if(immediate_callback_) {
+            if(final_callback_ && !(parse_complete_callback_)) {
+                std::swap(final_callback_, parse_complete_callback_);
+            }
+        } else if(!(final_callback_) && parse_complete_callback_) {
+            std::swap(final_callback_, parse_complete_callback_);
+        }
+        return this;
+    }
+
+    /// Set the subcommand to validate positional arguments before assigning
+    App *validate_positionals(bool validate = true) {
+        validate_positionals_ = validate;
+        return this;
+    }
+
+    /// ignore extras in config files
+    App *allow_config_extras(bool allow = true) {
+        if(allow) {
+            allow_config_extras_ = config_extras_mode::capture;
+            allow_extras_ = true;
+        } else {
+            allow_config_extras_ = config_extras_mode::error;
+        }
+        return this;
+    }
+
+    /// ignore extras in config files
+    App *allow_config_extras(config_extras_mode mode) {
+        allow_config_extras_ = mode;
+        return this;
+    }
+
+    /// Do not parse anything after the first unrecognized option and return
+    App *prefix_command(bool allow = true) {
+        prefix_command_ = allow;
+        return this;
+    }
+
+    /// Ignore case. Subcommands inherit value.
+    App *ignore_case(bool value = true) {
+        if(value && !ignore_case_) {
+            ignore_case_ = true;
+            auto *p = (parent_ != nullptr) ? _get_fallthrough_parent() : this;
+            auto &match = _compare_subcommand_names(*this, *p);
+            if(!match.empty()) {
+                ignore_case_ = false;  // we are throwing so need to be exception invariant
+                throw OptionAlreadyAdded("ignore case would cause subcommand name conflicts: " + match);
+            }
+        }
+        ignore_case_ = value;
+        return this;
+    }
+
+    /// Allow windows style options, such as `/opt`. First matching short or long name used. Subcommands inherit
+    /// value.
+    App *allow_windows_style_options(bool value = true) {
+        allow_windows_style_options_ = value;
+        return this;
+    }
+
+    /// Specify that the positional arguments are only at the end of the sequence
+    App *positionals_at_end(bool value = true) {
+        positionals_at_end_ = value;
+        return this;
+    }
+
+    /// Specify that the subcommand can be triggered by a config file
+    App *configurable(bool value = true) {
+        configurable_ = value;
+        return this;
+    }
+
+    /// Ignore underscore. Subcommands inherit value.
+    App *ignore_underscore(bool value = true) {
+        if(value && !ignore_underscore_) {
+            ignore_underscore_ = true;
+            auto *p = (parent_ != nullptr) ? _get_fallthrough_parent() : this;
+            auto &match = _compare_subcommand_names(*this, *p);
+            if(!match.empty()) {
+                ignore_underscore_ = false;
+                throw OptionAlreadyAdded("ignore underscore would cause subcommand name conflicts: " + match);
+            }
+        }
+        ignore_underscore_ = value;
+        return this;
+    }
+
+    /// Set the help formatter
+    App *formatter(std::shared_ptr<FormatterBase> fmt) {
+        formatter_ = fmt;
+        return this;
+    }
+
+    /// Set the help formatter
+    App *formatter_fn(std::function<std::string(const App *, std::string, AppFormatMode)> fmt) {
+        formatter_ = std::make_shared<FormatterLambda>(fmt);
+        return this;
+    }
+
+    /// Set the config formatter
+    App *config_formatter(std::shared_ptr<Config> fmt) {
+        config_formatter_ = fmt;
+        return this;
+    }
+
+    /// Check to see if this subcommand was parsed, true only if received on command line.
+    bool parsed() const { return parsed_ > 0; }
+
+    /// Get the OptionDefault object, to set option defaults
+    OptionDefaults *option_defaults() { return &option_defaults_; }
+
+    ///@}
+    /// @name Adding options
+    ///@{
+
+    /// Add an option, will automatically understand the type for common types.
+    ///
+    /// To use, create a variable with the expected type, and pass it in after the name.
+    /// After start is called, you can use count to see if the value was passed, and
+    /// the value will be initialized properly. Numbers, vectors, and strings are supported.
+    ///
+    /// ->required(), ->default, and the validators are options,
+    /// The positional options take an optional number of arguments.
+    ///
+    /// For example,
+    ///
+    ///     std::string filename;
+    ///     program.add_option("filename", filename, "description of filename");
+    ///
+    Option *add_option(std::string option_name,
+                       callback_t option_callback,
+                       std::string option_description = "",
+                       bool defaulted = false,
+                       std::function<std::string()> func = {}) {
+        Option myopt{option_name, option_description, option_callback, this};
+
+        if(std::find_if(std::begin(options_), std::end(options_), [&myopt](const Option_p &v) {
+               return *v == myopt;
+           }) == std::end(options_)) {
+            options_.emplace_back();
+            Option_p &option = options_.back();
+            option.reset(new Option(option_name, option_description, option_callback, this));
+
+            // Set the default string capture function
+            option->default_function(func);
+
+            // For compatibility with CLI11 1.7 and before, capture the default string here
+            if(defaulted)
+                option->capture_default_str();
+
+            // Transfer defaults to the new option
+            option_defaults_.copy_to(option.get());
+
+            // Don't bother to capture if we already did
+            if(!defaulted && option->get_always_capture_default())
+                option->capture_default_str();
+
+            return option.get();
+        }
+        // we know something matches now find what it is so we can produce more error information
+        for(auto &opt : options_) {
+            auto &matchname = opt->matching_name(myopt);
+            if(!matchname.empty()) {
+                throw(OptionAlreadyAdded("added option matched existing option name: " + matchname));
+            }
+        }
+        // this line should not be reached the above loop should trigger the throw
+        throw(OptionAlreadyAdded("added option matched existing option name"));  // LCOV_EXCL_LINE
+    }
+
+    /// Add option for assigning to a variable
+    template <typename AssignTo,
+              typename ConvertTo = AssignTo,
+              enable_if_t<!std::is_const<ConvertTo>::value, detail::enabler> = detail::dummy>
+    Option *add_option(std::string option_name,
+                       AssignTo &variable,  ///< The variable to set
+                       std::string option_description = "") {
+
+        auto fun = [&variable](const CLI::results_t &res) {  // comment for spacing
+            return detail::lexical_conversion<AssignTo, ConvertTo>(res, variable);
+        };
+
+        Option *opt = add_option(option_name, fun, option_description, false, [&variable]() {
+            return CLI::detail::checked_to_string<AssignTo, ConvertTo>(variable);
+        });
+        opt->type_name(detail::type_name<ConvertTo>());
+        // these must be actual lvalues since (std::max) sometimes is defined in terms of references and references
+        // to structs used in the evaluation can be temporary so that would cause issues.
+        auto Tcount = detail::type_count<AssignTo>::value;
+        auto XCcount = detail::type_count<ConvertTo>::value;
+        opt->type_size(detail::type_count_min<ConvertTo>::value, (std::max)(Tcount, XCcount));
+        opt->expected(detail::expected_count<ConvertTo>::value);
+        opt->run_callback_for_default();
+        return opt;
+    }
+
+    /// Add option for assigning to a variable
+    template <typename AssignTo, enable_if_t<!std::is_const<AssignTo>::value, detail::enabler> = detail::dummy>
+    Option *add_option_no_stream(std::string option_name,
+                                 AssignTo &variable,  ///< The variable to set
+                                 std::string option_description = "") {
+
+        auto fun = [&variable](const CLI::results_t &res) {  // comment for spacing
+            return detail::lexical_conversion<AssignTo, AssignTo>(res, variable);
+        };
+
+        Option *opt = add_option(option_name, fun, option_description, false, []() { return std::string{}; });
+        opt->type_name(detail::type_name<AssignTo>());
+        opt->type_size(detail::type_count_min<AssignTo>::value, detail::type_count<AssignTo>::value);
+        opt->expected(detail::expected_count<AssignTo>::value);
+        opt->run_callback_for_default();
+        return opt;
+    }
+
+    /// Add option for a callback of a specific type
+    template <typename ArgType>
+    Option *add_option_function(std::string option_name,
+                                const std::function<void(const ArgType &)> &func,  ///< the callback to execute
+                                std::string option_description = "") {
+
+        auto fun = [func](const CLI::results_t &res) {
+            ArgType variable;
+            bool result = detail::lexical_conversion<ArgType, ArgType>(res, variable);
+            if(result) {
+                func(variable);
+            }
+            return result;
+        };
+
+        Option *opt = add_option(option_name, std::move(fun), option_description, false);
+        opt->type_name(detail::type_name<ArgType>());
+        opt->type_size(detail::type_count_min<ArgType>::value, detail::type_count<ArgType>::value);
+        opt->expected(detail::expected_count<ArgType>::value);
+        return opt;
+    }
+
+    /// Add option with no description or variable assignment
+    Option *add_option(std::string option_name) {
+        return add_option(option_name, CLI::callback_t{}, std::string{}, false);
+    }
+
+    /// Add option with description but with no variable assignment or callback
+    template <typename T,
+              enable_if_t<std::is_const<T>::value && std::is_constructible<std::string, T>::value, detail::enabler> =
+                  detail::dummy>
+    Option *add_option(std::string option_name, T &option_description) {
+        return add_option(option_name, CLI::callback_t(), option_description, false);
+    }
+
+    /// Set a help flag, replace the existing one if present
+    Option *set_help_flag(std::string flag_name = "", const std::string &help_description = "") {
+        // take flag_description by const reference otherwise add_flag tries to assign to help_description
+        if(help_ptr_ != nullptr) {
+            remove_option(help_ptr_);
+            help_ptr_ = nullptr;
+        }
+
+        // Empty name will simply remove the help flag
+        if(!flag_name.empty()) {
+            help_ptr_ = add_flag(flag_name, help_description);
+            help_ptr_->configurable(false);
+        }
+
+        return help_ptr_;
+    }
+
+    /// Set a help all flag, replaced the existing one if present
+    Option *set_help_all_flag(std::string help_name = "", const std::string &help_description = "") {
+        // take flag_description by const reference otherwise add_flag tries to assign to flag_description
+        if(help_all_ptr_ != nullptr) {
+            remove_option(help_all_ptr_);
+            help_all_ptr_ = nullptr;
+        }
+
+        // Empty name will simply remove the help all flag
+        if(!help_name.empty()) {
+            help_all_ptr_ = add_flag(help_name, help_description);
+            help_all_ptr_->configurable(false);
+        }
+
+        return help_all_ptr_;
+    }
+
+    /// Set a version flag and version display string, replace the existing one if present
+    Option *set_version_flag(std::string flag_name = "",
+                             const std::string &versionString = "",
+                             const std::string &version_help = "Display program version information and exit") {
+        // take flag_description by const reference otherwise add_flag tries to assign to version_description
+        if(version_ptr_ != nullptr) {
+            remove_option(version_ptr_);
+            version_ptr_ = nullptr;
+        }
+
+        // Empty name will simply remove the version flag
+        if(!flag_name.empty()) {
+            version_ptr_ = add_flag_callback(
+                flag_name, [versionString]() { throw(CLI::CallForVersion(versionString, 0)); }, version_help);
+            version_ptr_->configurable(false);
+        }
+
+        return version_ptr_;
+    }
+    /// Generate the version string through a callback function
+    Option *set_version_flag(std::string flag_name,
+                             std::function<std::string()> vfunc,
+                             const std::string &version_help = "Display program version information and exit") {
+        if(version_ptr_ != nullptr) {
+            remove_option(version_ptr_);
+            version_ptr_ = nullptr;
+        }
+
+        // Empty name will simply remove the version flag
+        if(!flag_name.empty()) {
+            version_ptr_ = add_flag_callback(
+                flag_name, [vfunc]() { throw(CLI::CallForVersion(vfunc(), 0)); }, version_help);
+            version_ptr_->configurable(false);
+        }
+
+        return version_ptr_;
+    }
+
+  private:
+    /// Internal function for adding a flag
+    Option *_add_flag_internal(std::string flag_name, CLI::callback_t fun, std::string flag_description) {
+        Option *opt;
+        if(detail::has_default_flag_values(flag_name)) {
+            // check for default values and if it has them
+            auto flag_defaults = detail::get_default_flag_values(flag_name);
+            detail::remove_default_flag_values(flag_name);
+            opt = add_option(std::move(flag_name), std::move(fun), std::move(flag_description), false);
+            for(const auto &fname : flag_defaults)
+                opt->fnames_.push_back(fname.first);
+            opt->default_flag_values_ = std::move(flag_defaults);
+        } else {
+            opt = add_option(std::move(flag_name), std::move(fun), std::move(flag_description), false);
+        }
+        // flags cannot have positional values
+        if(opt->get_positional()) {
+            auto pos_name = opt->get_name(true);
+            remove_option(opt);
+            throw IncorrectConstruction::PositionalFlag(pos_name);
+        }
+        opt->multi_option_policy(MultiOptionPolicy::TakeLast);
+        opt->expected(0);
+        opt->required(false);
+        return opt;
+    }
+
+  public:
+    /// Add a flag with no description or variable assignment
+    Option *add_flag(std::string flag_name) { return _add_flag_internal(flag_name, CLI::callback_t(), std::string{}); }
+
+    /// Add flag with description but with no variable assignment or callback
+    /// takes a constant string,  if a variable string is passed that variable will be assigned the results from the
+    /// flag
+    template <typename T,
+              enable_if_t<std::is_const<T>::value && std::is_constructible<std::string, T>::value, detail::enabler> =
+                  detail::dummy>
+    Option *add_flag(std::string flag_name, T &flag_description) {
+        return _add_flag_internal(flag_name, CLI::callback_t(), flag_description);
+    }
+
+    /// Add option for flag with integer result - defaults to allowing multiple passings, but can be forced to one
+    /// if `multi_option_policy(CLI::MultiOptionPolicy::Throw)` is used.
+    template <typename T,
+              enable_if_t<std::is_constructible<T, std::int64_t>::value && !is_bool<T>::value, detail::enabler> =
+                  detail::dummy>
+    Option *add_flag(std::string flag_name,
+                     T &flag_count,  ///< A variable holding the count
+                     std::string flag_description = "") {
+        flag_count = 0;
+        CLI::callback_t fun = [&flag_count](const CLI::results_t &res) {
+            try {
+                detail::sum_flag_vector(res, flag_count);
+            } catch(const std::invalid_argument &) {
+                return false;
+            }
+            return true;
+        };
+        return _add_flag_internal(flag_name, std::move(fun), std::move(flag_description))
+            ->multi_option_policy(MultiOptionPolicy::TakeAll);
+    }
+
+    /// Other type version accepts all other types that are not vectors such as bool, enum, string or other classes
+    /// that can be converted from a string
+    template <typename T,
+              enable_if_t<!detail::is_mutable_container<T>::value && !std::is_const<T>::value &&
+                              (!std::is_constructible<T, std::int64_t>::value || is_bool<T>::value) &&
+                              !std::is_constructible<std::function<void(int)>, T>::value,
+                          detail::enabler> = detail::dummy>
+    Option *add_flag(std::string flag_name,
+                     T &flag_result,  ///< A variable holding true if passed
+                     std::string flag_description = "") {
+
+        CLI::callback_t fun = [&flag_result](const CLI::results_t &res) {
+            return CLI::detail::lexical_cast(res[0], flag_result);
+        };
+        return _add_flag_internal(flag_name, std::move(fun), std::move(flag_description))->run_callback_for_default();
+    }
+
+    /// Vector version to capture multiple flags.
+    template <typename T,
+              enable_if_t<!std::is_assignable<std::function<void(std::int64_t)> &, T>::value, detail::enabler> =
+                  detail::dummy>
+    Option *add_flag(std::string flag_name,
+                     std::vector<T> &flag_results,  ///< A vector of values with the flag results
+                     std::string flag_description = "") {
+        CLI::callback_t fun = [&flag_results](const CLI::results_t &res) {
+            bool retval = true;
+            for(const auto &elem : res) {
+                flag_results.emplace_back();
+                retval &= detail::lexical_cast(elem, flag_results.back());
+            }
+            return retval;
+        };
+        return _add_flag_internal(flag_name, std::move(fun), std::move(flag_description))
+            ->multi_option_policy(MultiOptionPolicy::TakeAll)
+            ->run_callback_for_default();
+    }
+
+    /// Add option for callback that is triggered with a true flag and takes no arguments
+    Option *add_flag_callback(std::string flag_name,
+                              std::function<void(void)> function,  ///< A function to call, void(void)
+                              std::string flag_description = "") {
+
+        CLI::callback_t fun = [function](const CLI::results_t &res) {
+            bool trigger{false};
+            auto result = CLI::detail::lexical_cast(res[0], trigger);
+            if(result && trigger) {
+                function();
+            }
+            return result;
+        };
+        return _add_flag_internal(flag_name, std::move(fun), std::move(flag_description));
+    }
+
+    /// Add option for callback with an integer value
+    Option *add_flag_function(std::string flag_name,
+                              std::function<void(std::int64_t)> function,  ///< A function to call, void(int)
+                              std::string flag_description = "") {
+
+        CLI::callback_t fun = [function](const CLI::results_t &res) {
+            std::int64_t flag_count = 0;
+            detail::sum_flag_vector(res, flag_count);
+            function(flag_count);
+            return true;
+        };
+        return _add_flag_internal(flag_name, std::move(fun), std::move(flag_description))
+            ->multi_option_policy(MultiOptionPolicy::TakeAll);
+    }
+
+#ifdef CLI11_CPP14
+    /// Add option for callback (C++14 or better only)
+    Option *add_flag(std::string flag_name,
+                     std::function<void(std::int64_t)> function,  ///< A function to call, void(std::int64_t)
+                     std::string flag_description = "") {
+        return add_flag_function(std::move(flag_name), std::move(function), std::move(flag_description));
+    }
+#endif
+
+    /// Set a configuration ini file option, or clear it if no name passed
+    Option *set_config(std::string option_name = "",
+                       std::string default_filename = "",
+                       const std::string &help_message = "Read an ini file",
+                       bool config_required = false) {
+
+        // Remove existing config if present
+        if(config_ptr_ != nullptr) {
+            remove_option(config_ptr_);
+            config_ptr_ = nullptr;  // need to remove the config_ptr completely
+        }
+
+        // Only add config if option passed
+        if(!option_name.empty()) {
+            config_ptr_ = add_option(option_name, help_message);
+            if(config_required) {
+                config_ptr_->required();
+            }
+            if(!default_filename.empty()) {
+                config_ptr_->default_str(std::move(default_filename));
+            }
+            config_ptr_->configurable(false);
+        }
+
+        return config_ptr_;
+    }
+
+    /// Removes an option from the App. Takes an option pointer. Returns true if found and removed.
+    bool remove_option(Option *opt) {
+        // Make sure no links exist
+        for(Option_p &op : options_) {
+            op->remove_needs(opt);
+            op->remove_excludes(opt);
+        }
+
+        if(help_ptr_ == opt)
+            help_ptr_ = nullptr;
+        if(help_all_ptr_ == opt)
+            help_all_ptr_ = nullptr;
+
+        auto iterator =
+            std::find_if(std::begin(options_), std::end(options_), [opt](const Option_p &v) { return v.get() == opt; });
+        if(iterator != std::end(options_)) {
+            options_.erase(iterator);
+            return true;
+        }
+        return false;
+    }
+
+    /// creates an option group as part of the given app
+    template <typename T = Option_group>
+    T *add_option_group(std::string group_name, std::string group_description = "") {
+        if(!detail::valid_alias_name_string(group_name)) {
+            throw IncorrectConstruction("option group names may not contain newlines or null characters");
+        }
+        auto option_group = std::make_shared<T>(std::move(group_description), group_name, this);
+        auto ptr = option_group.get();
+        // move to App_p for overload resolution on older gcc versions
+        App_p app_ptr = std::dynamic_pointer_cast<App>(option_group);
+        add_subcommand(std::move(app_ptr));
+        return ptr;
+    }
+
+    ///@}
+    /// @name Subcommands
+    ///@{
+
+    /// Add a subcommand. Inherits INHERITABLE and OptionDefaults, and help flag
+    App *add_subcommand(std::string subcommand_name = "", std::string subcommand_description = "") {
+        if(!subcommand_name.empty() && !detail::valid_name_string(subcommand_name)) {
+            if(!detail::valid_first_char(subcommand_name[0])) {
+                throw IncorrectConstruction(
+                    "Subcommand name starts with invalid character, '!' and '-' are not allowed");
+            }
+            for(auto c : subcommand_name) {
+                if(!detail::valid_later_char(c)) {
+                    throw IncorrectConstruction(std::string("Subcommand name contains invalid character ('") + c +
+                                                "'), all characters are allowed except"
+                                                "'=',':','{','}', and ' '");
+                }
+            }
+        }
+        CLI::App_p subcom = std::shared_ptr<App>(new App(std::move(subcommand_description), subcommand_name, this));
+        return add_subcommand(std::move(subcom));
+    }
+
+    /// Add a previously created app as a subcommand
+    App *add_subcommand(CLI::App_p subcom) {
+        if(!subcom)
+            throw IncorrectConstruction("passed App is not valid");
+        auto ckapp = (name_.empty() && parent_ != nullptr) ? _get_fallthrough_parent() : this;
+        auto &mstrg = _compare_subcommand_names(*subcom, *ckapp);
+        if(!mstrg.empty()) {
+            throw(OptionAlreadyAdded("subcommand name or alias matches existing subcommand: " + mstrg));
+        }
+        subcom->parent_ = this;
+        subcommands_.push_back(std::move(subcom));
+        return subcommands_.back().get();
+    }
+
+    /// Removes a subcommand from the App. Takes a subcommand pointer. Returns true if found and removed.
+    bool remove_subcommand(App *subcom) {
+        // Make sure no links exist
+        for(App_p &sub : subcommands_) {
+            sub->remove_excludes(subcom);
+            sub->remove_needs(subcom);
+        }
+
+        auto iterator = std::find_if(
+            std::begin(subcommands_), std::end(subcommands_), [subcom](const App_p &v) { return v.get() == subcom; });
+        if(iterator != std::end(subcommands_)) {
+            subcommands_.erase(iterator);
+            return true;
+        }
+        return false;
+    }
+    /// Check to see if a subcommand is part of this command (doesn't have to be in command line)
+    /// returns the first subcommand if passed a nullptr
+    App *get_subcommand(const App *subcom) const {
+        if(subcom == nullptr)
+            throw OptionNotFound("nullptr passed");
+        for(const App_p &subcomptr : subcommands_)
+            if(subcomptr.get() == subcom)
+                return subcomptr.get();
+        throw OptionNotFound(subcom->get_name());
+    }
+
+    /// Check to see if a subcommand is part of this command (text version)
+    App *get_subcommand(std::string subcom) const {
+        auto subc = _find_subcommand(subcom, false, false);
+        if(subc == nullptr)
+            throw OptionNotFound(subcom);
+        return subc;
+    }
+    /// Get a pointer to subcommand by index
+    App *get_subcommand(int index = 0) const {
+        if(index >= 0) {
+            auto uindex = static_cast<unsigned>(index);
+            if(uindex < subcommands_.size())
+                return subcommands_[uindex].get();
+        }
+        throw OptionNotFound(std::to_string(index));
+    }
+
+    /// Check to see if a subcommand is part of this command and get a shared_ptr to it
+    CLI::App_p get_subcommand_ptr(App *subcom) const {
+        if(subcom == nullptr)
+            throw OptionNotFound("nullptr passed");
+        for(const App_p &subcomptr : subcommands_)
+            if(subcomptr.get() == subcom)
+                return subcomptr;
+        throw OptionNotFound(subcom->get_name());
+    }
+
+    /// Check to see if a subcommand is part of this command (text version)
+    CLI::App_p get_subcommand_ptr(std::string subcom) const {
+        for(const App_p &subcomptr : subcommands_)
+            if(subcomptr->check_name(subcom))
+                return subcomptr;
+        throw OptionNotFound(subcom);
+    }
+
+    /// Get an owning pointer to subcommand by index
+    CLI::App_p get_subcommand_ptr(int index = 0) const {
+        if(index >= 0) {
+            auto uindex = static_cast<unsigned>(index);
+            if(uindex < subcommands_.size())
+                return subcommands_[uindex];
+        }
+        throw OptionNotFound(std::to_string(index));
+    }
+
+    /// Check to see if an option group is part of this App
+    App *get_option_group(std::string group_name) const {
+        for(const App_p &app : subcommands_) {
+            if(app->name_.empty() && app->group_ == group_name) {
+                return app.get();
+            }
+        }
+        throw OptionNotFound(group_name);
+    }
+
+    /// No argument version of count counts the number of times this subcommand was
+    /// passed in. The main app will return 1. Unnamed subcommands will also return 1 unless
+    /// otherwise modified in a callback
+    std::size_t count() const { return parsed_; }
+
+    /// Get a count of all the arguments processed in options and subcommands, this excludes arguments which were
+    /// treated as extras.
+    std::size_t count_all() const {
+        std::size_t cnt{0};
+        for(auto &opt : options_) {
+            cnt += opt->count();
+        }
+        for(auto &sub : subcommands_) {
+            cnt += sub->count_all();
+        }
+        if(!get_name().empty()) {  // for named subcommands add the number of times the subcommand was called
+            cnt += parsed_;
+        }
+        return cnt;
+    }
+
+    /// Changes the group membership
+    App *group(std::string group_name) {
+        group_ = group_name;
+        return this;
+    }
+
+    /// The argumentless form of require subcommand requires 1 or more subcommands
+    App *require_subcommand() {
+        require_subcommand_min_ = 1;
+        require_subcommand_max_ = 0;
+        return this;
+    }
+
+    /// Require a subcommand to be given (does not affect help call)
+    /// The number required can be given. Negative values indicate maximum
+    /// number allowed (0 for any number). Max number inheritable.
+    App *require_subcommand(int value) {
+        if(value < 0) {
+            require_subcommand_min_ = 0;
+            require_subcommand_max_ = static_cast<std::size_t>(-value);
+        } else {
+            require_subcommand_min_ = static_cast<std::size_t>(value);
+            require_subcommand_max_ = static_cast<std::size_t>(value);
+        }
+        return this;
+    }
+
+    /// Explicitly control the number of subcommands required. Setting 0
+    /// for the max means unlimited number allowed. Max number inheritable.
+    App *require_subcommand(std::size_t min, std::size_t max) {
+        require_subcommand_min_ = min;
+        require_subcommand_max_ = max;
+        return this;
+    }
+
+    /// The argumentless form of require option requires 1 or more options be used
+    App *require_option() {
+        require_option_min_ = 1;
+        require_option_max_ = 0;
+        return this;
+    }
+
+    /// Require an option to be given (does not affect help call)
+    /// The number required can be given. Negative values indicate maximum
+    /// number allowed (0 for any number).
+    App *require_option(int value) {
+        if(value < 0) {
+            require_option_min_ = 0;
+            require_option_max_ = static_cast<std::size_t>(-value);
+        } else {
+            require_option_min_ = static_cast<std::size_t>(value);
+            require_option_max_ = static_cast<std::size_t>(value);
+        }
+        return this;
+    }
+
+    /// Explicitly control the number of options required. Setting 0
+    /// for the max means unlimited number allowed. Max number inheritable.
+    App *require_option(std::size_t min, std::size_t max) {
+        require_option_min_ = min;
+        require_option_max_ = max;
+        return this;
+    }
+
+    /// Stop subcommand fallthrough, so that parent commands cannot collect commands after subcommand.
+    /// Default from parent, usually set on parent.
+    App *fallthrough(bool value = true) {
+        fallthrough_ = value;
+        return this;
+    }
+
+    /// Check to see if this subcommand was parsed, true only if received on command line.
+    /// This allows the subcommand to be directly checked.
+    explicit operator bool() const { return parsed_ > 0; }
+
+    ///@}
+    /// @name Extras for subclassing
+    ///@{
+
+    /// This allows subclasses to inject code before callbacks but after parse.
+    ///
+    /// This does not run if any errors or help is thrown.
+    virtual void pre_callback() {}
+
+    ///@}
+    /// @name Parsing
+    ///@{
+    //
+    /// Reset the parsed data
+    void clear() {
+
+        parsed_ = 0;
+        pre_parse_called_ = false;
+
+        missing_.clear();
+        parsed_subcommands_.clear();
+        for(const Option_p &opt : options_) {
+            opt->clear();
+        }
+        for(const App_p &subc : subcommands_) {
+            subc->clear();
+        }
+    }
+
+    /// Parses the command line - throws errors.
+    /// This must be called after the options are in but before the rest of the program.
+    void parse(int argc, const char *const *argv) {
+        // If the name is not set, read from command line
+        if(name_.empty() || has_automatic_name_) {
+            has_automatic_name_ = true;
+            name_ = argv[0];
+        }
+
+        std::vector<std::string> args;
+        args.reserve(static_cast<std::size_t>(argc) - 1);
+        for(int i = argc - 1; i > 0; i--)
+            args.emplace_back(argv[i]);
+        parse(std::move(args));
+    }
+
+    /// Parse a single string as if it contained command line arguments.
+    /// This function splits the string into arguments then calls parse(std::vector<std::string> &)
+    /// the function takes an optional boolean argument specifying if the programName is included in the string to
+    /// process
+    void parse(std::string commandline, bool program_name_included = false) {
+
+        if(program_name_included) {
+            auto nstr = detail::split_program_name(commandline);
+            if((name_.empty()) || (has_automatic_name_)) {
+                has_automatic_name_ = true;
+                name_ = nstr.first;
+            }
+            commandline = std::move(nstr.second);
+        } else {
+            detail::trim(commandline);
+        }
+        // the next section of code is to deal with quoted arguments after an '=' or ':' for windows like operations
+        if(!commandline.empty()) {
+            commandline = detail::find_and_modify(commandline, "=", detail::escape_detect);
+            if(allow_windows_style_options_)
+                commandline = detail::find_and_modify(commandline, ":", detail::escape_detect);
+        }
+
+        auto args = detail::split_up(std::move(commandline));
+        // remove all empty strings
+        args.erase(std::remove(args.begin(), args.end(), std::string{}), args.end());
+        std::reverse(args.begin(), args.end());
+
+        parse(std::move(args));
+    }
+
+    /// The real work is done here. Expects a reversed vector.
+    /// Changes the vector to the remaining options.
+    void parse(std::vector<std::string> &args) {
+        // Clear if parsed
+        if(parsed_ > 0)
+            clear();
+
+        // parsed_ is incremented in commands/subcommands,
+        // but placed here to make sure this is cleared when
+        // running parse after an error is thrown, even by _validate or _configure.
+        parsed_ = 1;
+        _validate();
+        _configure();
+        // set the parent as nullptr as this object should be the top now
+        parent_ = nullptr;
+        parsed_ = 0;
+
+        _parse(args);
+        run_callback();
+    }
+
+    /// The real work is done here. Expects a reversed vector.
+    void parse(std::vector<std::string> &&args) {
+        // Clear if parsed
+        if(parsed_ > 0)
+            clear();
+
+        // parsed_ is incremented in commands/subcommands,
+        // but placed here to make sure this is cleared when
+        // running parse after an error is thrown, even by _validate or _configure.
+        parsed_ = 1;
+        _validate();
+        _configure();
+        // set the parent as nullptr as this object should be the top now
+        parent_ = nullptr;
+        parsed_ = 0;
+
+        _parse(std::move(args));
+        run_callback();
+    }
+
+    void parse_from_stream(std::istream &input) {
+        if(parsed_ == 0) {
+            _validate();
+            _configure();
+            // set the parent as nullptr as this object should be the top now
+        }
+
+        _parse_stream(input);
+        run_callback();
+    }
+    /// Provide a function to print a help message. The function gets access to the App pointer and error.
+    void failure_message(std::function<std::string(const App *, const Error &e)> function) {
+        failure_message_ = function;
+    }
+
+    /// Print a nice error message and return the exit code
+    int exit(const Error &e, std::ostream &out = std::cout, std::ostream &err = std::cerr) const {
+
+        /// Avoid printing anything if this is a CLI::RuntimeError
+        if(e.get_name() == "RuntimeError")
+            return e.get_exit_code();
+
+        if(e.get_name() == "CallForHelp") {
+            out << help();
+            return e.get_exit_code();
+        }
+
+        if(e.get_name() == "CallForAllHelp") {
+            out << help("", AppFormatMode::All);
+            return e.get_exit_code();
+        }
+
+        if(e.get_name() == "CallForVersion") {
+            out << e.what() << std::endl;
+            return e.get_exit_code();
+        }
+
+        if(e.get_exit_code() != static_cast<int>(ExitCodes::Success)) {
+            if(failure_message_)
+                err << failure_message_(this, e) << std::flush;
+        }
+
+        return e.get_exit_code();
+    }
+
+    ///@}
+    /// @name Post parsing
+    ///@{
+
+    /// Counts the number of times the given option was passed.
+    std::size_t count(std::string option_name) const { return get_option(option_name)->count(); }
+
+    /// Get a subcommand pointer list to the currently selected subcommands (after parsing by default, in command
+    /// line order; use parsed = false to get the original definition list.)
+    std::vector<App *> get_subcommands() const { return parsed_subcommands_; }
+
+    /// Get a filtered subcommand pointer list from the original definition list. An empty function will provide all
+    /// subcommands (const)
+    std::vector<const App *> get_subcommands(const std::function<bool(const App *)> &filter) const {
+        std::vector<const App *> subcomms(subcommands_.size());
+        std::transform(std::begin(subcommands_), std::end(subcommands_), std::begin(subcomms), [](const App_p &v) {
+            return v.get();
+        });
+
+        if(filter) {
+            subcomms.erase(std::remove_if(std::begin(subcomms),
+                                          std::end(subcomms),
+                                          [&filter](const App *app) { return !filter(app); }),
+                           std::end(subcomms));
+        }
+
+        return subcomms;
+    }
+
+    /// Get a filtered subcommand pointer list from the original definition list. An empty function will provide all
+    /// subcommands
+    std::vector<App *> get_subcommands(const std::function<bool(App *)> &filter) {
+        std::vector<App *> subcomms(subcommands_.size());
+        std::transform(std::begin(subcommands_), std::end(subcommands_), std::begin(subcomms), [](const App_p &v) {
+            return v.get();
+        });
+
+        if(filter) {
+            subcomms.erase(
+                std::remove_if(std::begin(subcomms), std::end(subcomms), [&filter](App *app) { return !filter(app); }),
+                std::end(subcomms));
+        }
+
+        return subcomms;
+    }
+
+    /// Check to see if given subcommand was selected
+    bool got_subcommand(const App *subcom) const {
+        // get subcom needed to verify that this was a real subcommand
+        return get_subcommand(subcom)->parsed_ > 0;
+    }
+
+    /// Check with name instead of pointer to see if subcommand was selected
+    bool got_subcommand(std::string subcommand_name) const { return get_subcommand(subcommand_name)->parsed_ > 0; }
+
+    /// Sets excluded options for the subcommand
+    App *excludes(Option *opt) {
+        if(opt == nullptr) {
+            throw OptionNotFound("nullptr passed");
+        }
+        exclude_options_.insert(opt);
+        return this;
+    }
+
+    /// Sets excluded subcommands for the subcommand
+    App *excludes(App *app) {
+        if(app == nullptr) {
+            throw OptionNotFound("nullptr passed");
+        }
+        if(app == this) {
+            throw OptionNotFound("cannot self reference in needs");
+        }
+        auto res = exclude_subcommands_.insert(app);
+        // subcommand exclusion should be symmetric
+        if(res.second) {
+            app->exclude_subcommands_.insert(this);
+        }
+        return this;
+    }
+
+    App *needs(Option *opt) {
+        if(opt == nullptr) {
+            throw OptionNotFound("nullptr passed");
+        }
+        need_options_.insert(opt);
+        return this;
+    }
+
+    App *needs(App *app) {
+        if(app == nullptr) {
+            throw OptionNotFound("nullptr passed");
+        }
+        if(app == this) {
+            throw OptionNotFound("cannot self reference in needs");
+        }
+        need_subcommands_.insert(app);
+        return this;
+    }
+
+    /// Removes an option from the excludes list of this subcommand
+    bool remove_excludes(Option *opt) {
+        auto iterator = std::find(std::begin(exclude_options_), std::end(exclude_options_), opt);
+        if(iterator == std::end(exclude_options_)) {
+            return false;
+        }
+        exclude_options_.erase(iterator);
+        return true;
+    }
+
+    /// Removes a subcommand from the excludes list of this subcommand
+    bool remove_excludes(App *app) {
+        auto iterator = std::find(std::begin(exclude_subcommands_), std::end(exclude_subcommands_), app);
+        if(iterator == std::end(exclude_subcommands_)) {
+            return false;
+        }
+        auto other_app = *iterator;
+        exclude_subcommands_.erase(iterator);
+        other_app->remove_excludes(this);
+        return true;
+    }
+
+    /// Removes an option from the needs list of this subcommand
+    bool remove_needs(Option *opt) {
+        auto iterator = std::find(std::begin(need_options_), std::end(need_options_), opt);
+        if(iterator == std::end(need_options_)) {
+            return false;
+        }
+        need_options_.erase(iterator);
+        return true;
+    }
+
+    /// Removes a subcommand from the needs list of this subcommand
+    bool remove_needs(App *app) {
+        auto iterator = std::find(std::begin(need_subcommands_), std::end(need_subcommands_), app);
+        if(iterator == std::end(need_subcommands_)) {
+            return false;
+        }
+        need_subcommands_.erase(iterator);
+        return true;
+    }
+
+    ///@}
+    /// @name Help
+    ///@{
+
+    /// Set footer.
+    App *footer(std::string footer_string) {
+        footer_ = std::move(footer_string);
+        return this;
+    }
+    /// Set footer.
+    App *footer(std::function<std::string()> footer_function) {
+        footer_callback_ = std::move(footer_function);
+        return this;
+    }
+    /// Produce a string that could be read in as a config of the current values of the App. Set default_also to
+    /// include default arguments. write_descriptions will print a description for the App and for each option.
+    std::string config_to_str(bool default_also = false, bool write_description = false) const {
+        return config_formatter_->to_config(this, default_also, write_description, "");
+    }
+
+    /// Makes a help message, using the currently configured formatter
+    /// Will only do one subcommand at a time
+    std::string help(std::string prev = "", AppFormatMode mode = AppFormatMode::Normal) const {
+        if(prev.empty())
+            prev = get_name();
+        else
+            prev += " " + get_name();
+
+        // Delegate to subcommand if needed
+        auto selected_subcommands = get_subcommands();
+        if(!selected_subcommands.empty()) {
+            return selected_subcommands.at(0)->help(prev, mode);
+        }
+        return formatter_->make_help(this, prev, mode);
+    }
+
+    /// Displays a version string
+    std::string version() const {
+        std::string val;
+        if(version_ptr_ != nullptr) {
+            auto rv = version_ptr_->results();
+            version_ptr_->clear();
+            version_ptr_->add_result("true");
+            try {
+                version_ptr_->run_callback();
+            } catch(const CLI::CallForVersion &cfv) {
+                val = cfv.what();
+            }
+            version_ptr_->clear();
+            version_ptr_->add_result(rv);
+        }
+        return val;
+    }
+    ///@}
+    /// @name Getters
+    ///@{
+
+    /// Access the formatter
+    std::shared_ptr<FormatterBase> get_formatter() const { return formatter_; }
+
+    /// Access the config formatter
+    std::shared_ptr<Config> get_config_formatter() const { return config_formatter_; }
+
+    /// Access the config formatter as a configBase pointer
+    std::shared_ptr<ConfigBase> get_config_formatter_base() const {
+        // This is safer as a dynamic_cast if we have RTTI, as Config -> ConfigBase
+#if defined(__cpp_rtti) || (defined(__GXX_RTTI) && __GXX_RTTI) || (defined(_HAS_STATIC_RTTI) && (_HAS_STATIC_RTTI == 0))
+        return std::dynamic_pointer_cast<ConfigBase>(config_formatter_);
+#else
+        return std::static_pointer_cast<ConfigBase>(config_formatter_);
+#endif
+    }
+
+    /// Get the app or subcommand description
+    std::string get_description() const { return description_; }
+
+    /// Set the description of the app
+    App *description(std::string app_description) {
+        description_ = std::move(app_description);
+        return this;
+    }
+
+    /// Get the list of options (user facing function, so returns raw pointers), has optional filter function
+    std::vector<const Option *> get_options(const std::function<bool(const Option *)> filter = {}) const {
+        std::vector<const Option *> options(options_.size());
+        std::transform(std::begin(options_), std::end(options_), std::begin(options), [](const Option_p &val) {
+            return val.get();
+        });
+
+        if(filter) {
+            options.erase(std::remove_if(std::begin(options),
+                                         std::end(options),
+                                         [&filter](const Option *opt) { return !filter(opt); }),
+                          std::end(options));
+        }
+
+        return options;
+    }
+
+    /// Non-const version of the above
+    std::vector<Option *> get_options(const std::function<bool(Option *)> filter = {}) {
+        std::vector<Option *> options(options_.size());
+        std::transform(std::begin(options_), std::end(options_), std::begin(options), [](const Option_p &val) {
+            return val.get();
+        });
+
+        if(filter) {
+            options.erase(
+                std::remove_if(std::begin(options), std::end(options), [&filter](Option *opt) { return !filter(opt); }),
+                std::end(options));
+        }
+
+        return options;
+    }
+
+    /// Get an option by name (noexcept non-const version)
+    Option *get_option_no_throw(std::string option_name) noexcept {
+        for(Option_p &opt : options_) {
+            if(opt->check_name(option_name)) {
+                return opt.get();
+            }
+        }
+        for(auto &subc : subcommands_) {
+            // also check down into nameless subcommands
+            if(subc->get_name().empty()) {
+                auto opt = subc->get_option_no_throw(option_name);
+                if(opt != nullptr) {
+                    return opt;
+                }
+            }
+        }
+        return nullptr;
+    }
+
+    /// Get an option by name (noexcept const version)
+    const Option *get_option_no_throw(std::string option_name) const noexcept {
+        for(const Option_p &opt : options_) {
+            if(opt->check_name(option_name)) {
+                return opt.get();
+            }
+        }
+        for(const auto &subc : subcommands_) {
+            // also check down into nameless subcommands
+            if(subc->get_name().empty()) {
+                auto opt = subc->get_option_no_throw(option_name);
+                if(opt != nullptr) {
+                    return opt;
+                }
+            }
+        }
+        return nullptr;
+    }
+
+    /// Get an option by name
+    const Option *get_option(std::string option_name) const {
+        auto opt = get_option_no_throw(option_name);
+        if(opt == nullptr) {
+            throw OptionNotFound(option_name);
+        }
+        return opt;
+    }
+
+    /// Get an option by name (non-const version)
+    Option *get_option(std::string option_name) {
+        auto opt = get_option_no_throw(option_name);
+        if(opt == nullptr) {
+            throw OptionNotFound(option_name);
+        }
+        return opt;
+    }
+
+    /// Shortcut bracket operator for getting a pointer to an option
+    const Option *operator[](const std::string &option_name) const { return get_option(option_name); }
+
+    /// Shortcut bracket operator for getting a pointer to an option
+    const Option *operator[](const char *option_name) const { return get_option(option_name); }
+
+    /// Check the status of ignore_case
+    bool get_ignore_case() const { return ignore_case_; }
+
+    /// Check the status of ignore_underscore
+    bool get_ignore_underscore() const { return ignore_underscore_; }
+
+    /// Check the status of fallthrough
+    bool get_fallthrough() const { return fallthrough_; }
+
+    /// Check the status of the allow windows style options
+    bool get_allow_windows_style_options() const { return allow_windows_style_options_; }
+
+    /// Check the status of the allow windows style options
+    bool get_positionals_at_end() const { return positionals_at_end_; }
+
+    /// Check the status of the allow windows style options
+    bool get_configurable() const { return configurable_; }
+
+    /// Get the group of this subcommand
+    const std::string &get_group() const { return group_; }
+
+    /// Generate and return the footer.
+    std::string get_footer() const { return (footer_callback_) ? footer_callback_() + '\n' + footer_ : footer_; }
+
+    /// Get the required min subcommand value
+    std::size_t get_require_subcommand_min() const { return require_subcommand_min_; }
+
+    /// Get the required max subcommand value
+    std::size_t get_require_subcommand_max() const { return require_subcommand_max_; }
+
+    /// Get the required min option value
+    std::size_t get_require_option_min() const { return require_option_min_; }
+
+    /// Get the required max option value
+    std::size_t get_require_option_max() const { return require_option_max_; }
+
+    /// Get the prefix command status
+    bool get_prefix_command() const { return prefix_command_; }
+
+    /// Get the status of allow extras
+    bool get_allow_extras() const { return allow_extras_; }
+
+    /// Get the status of required
+    bool get_required() const { return required_; }
+
+    /// Get the status of disabled
+    bool get_disabled() const { return disabled_; }
+
+    /// Get the status of silence
+    bool get_silent() const { return silent_; }
+
+    /// Get the status of disabled
+    bool get_immediate_callback() const { return immediate_callback_; }
+
+    /// Get the status of disabled by default
+    bool get_disabled_by_default() const { return (default_startup == startup_mode::disabled); }
+
+    /// Get the status of disabled by default
+    bool get_enabled_by_default() const { return (default_startup == startup_mode::enabled); }
+    /// Get the status of validating positionals
+    bool get_validate_positionals() const { return validate_positionals_; }
+
+    /// Get the status of allow extras
+    config_extras_mode get_allow_config_extras() const { return allow_config_extras_; }
+
+    /// Get a pointer to the help flag.
+    Option *get_help_ptr() { return help_ptr_; }
+
+    /// Get a pointer to the help flag. (const)
+    const Option *get_help_ptr() const { return help_ptr_; }
+
+    /// Get a pointer to the help all flag. (const)
+    const Option *get_help_all_ptr() const { return help_all_ptr_; }
+
+    /// Get a pointer to the config option.
+    Option *get_config_ptr() { return config_ptr_; }
+
+    /// Get a pointer to the config option. (const)
+    const Option *get_config_ptr() const { return config_ptr_; }
+
+    /// Get a pointer to the version option.
+    Option *get_version_ptr() { return version_ptr_; }
+
+    /// Get a pointer to the version option. (const)
+    const Option *get_version_ptr() const { return version_ptr_; }
+
+    /// Get the parent of this subcommand (or nullptr if main app)
+    App *get_parent() { return parent_; }
+
+    /// Get the parent of this subcommand (or nullptr if main app) (const version)
+    const App *get_parent() const { return parent_; }
+
+    /// Get the name of the current app
+    const std::string &get_name() const { return name_; }
+
+    /// Get the aliases of the current app
+    const std::vector<std::string> &get_aliases() const { return aliases_; }
+
+    /// clear all the aliases of the current App
+    App *clear_aliases() {
+        aliases_.clear();
+        return this;
+    }
+
+    /// Get a display name for an app
+    std::string get_display_name(bool with_aliases = false) const {
+        if(name_.empty()) {
+            return std::string("[Option Group: ") + get_group() + "]";
+        }
+        if(aliases_.empty() || !with_aliases) {
+            return name_;
+        }
+        std::string dispname = name_;
+        for(const auto &lalias : aliases_) {
+            dispname.push_back(',');
+            dispname.push_back(' ');
+            dispname.append(lalias);
+        }
+        return dispname;
+    }
+
+    /// Check the name, case insensitive and underscore insensitive if set
+    bool check_name(std::string name_to_check) const {
+        std::string local_name = name_;
+        if(ignore_underscore_) {
+            local_name = detail::remove_underscore(name_);
+            name_to_check = detail::remove_underscore(name_to_check);
+        }
+        if(ignore_case_) {
+            local_name = detail::to_lower(name_);
+            name_to_check = detail::to_lower(name_to_check);
+        }
+
+        if(local_name == name_to_check) {
+            return true;
+        }
+        for(auto les : aliases_) {
+            if(ignore_underscore_) {
+                les = detail::remove_underscore(les);
+            }
+            if(ignore_case_) {
+                les = detail::to_lower(les);
+            }
+            if(les == name_to_check) {
+                return true;
+            }
+        }
+        return false;
+    }
+
+    /// Get the groups available directly from this option (in order)
+    std::vector<std::string> get_groups() const {
+        std::vector<std::string> groups;
+
+        for(const Option_p &opt : options_) {
+            // Add group if it is not already in there
+            if(std::find(groups.begin(), groups.end(), opt->get_group()) == groups.end()) {
+                groups.push_back(opt->get_group());
+            }
+        }
+
+        return groups;
+    }
+
+    /// This gets a vector of pointers with the original parse order
+    const std::vector<Option *> &parse_order() const { return parse_order_; }
+
+    /// This returns the missing options from the current subcommand
+    std::vector<std::string> remaining(bool recurse = false) const {
+        std::vector<std::string> miss_list;
+        for(const std::pair<detail::Classifier, std::string> &miss : missing_) {
+            miss_list.push_back(std::get<1>(miss));
+        }
+        // Get from a subcommand that may allow extras
+        if(recurse) {
+            if(!allow_extras_) {
+                for(const auto &sub : subcommands_) {
+                    if(sub->name_.empty() && !sub->missing_.empty()) {
+                        for(const std::pair<detail::Classifier, std::string> &miss : sub->missing_) {
+                            miss_list.push_back(std::get<1>(miss));
+                        }
+                    }
+                }
+            }
+            // Recurse into subcommands
+
+            for(const App *sub : parsed_subcommands_) {
+                std::vector<std::string> output = sub->remaining(recurse);
+                std::copy(std::begin(output), std::end(output), std::back_inserter(miss_list));
+            }
+        }
+        return miss_list;
+    }
+
+    /// This returns the missing options in a form ready for processing by another command line program
+    std::vector<std::string> remaining_for_passthrough(bool recurse = false) const {
+        std::vector<std::string> miss_list = remaining(recurse);
+        std::reverse(std::begin(miss_list), std::end(miss_list));
+        return miss_list;
+    }
+
+    /// This returns the number of remaining options, minus the -- separator
+    std::size_t remaining_size(bool recurse = false) const {
+        auto remaining_options = static_cast<std::size_t>(std::count_if(
+            std::begin(missing_), std::end(missing_), [](const std::pair<detail::Classifier, std::string> &val) {
+                return val.first != detail::Classifier::POSITIONAL_MARK;
+            }));
+
+        if(recurse) {
+            for(const App_p &sub : subcommands_) {
+                remaining_options += sub->remaining_size(recurse);
+            }
+        }
+        return remaining_options;
+    }
+
+    ///@}
+
+  protected:
+    /// Check the options to make sure there are no conflicts.
+    ///
+    /// Currently checks to see if multiple positionals exist with unlimited args and checks if the min and max options
+    /// are feasible
+    void _validate() const {
+        // count the number of positional only args
+        auto pcount = std::count_if(std::begin(options_), std::end(options_), [](const Option_p &opt) {
+            return opt->get_items_expected_max() >= detail::expected_max_vector_size && !opt->nonpositional();
+        });
+        if(pcount > 1) {
+            auto pcount_req = std::count_if(std::begin(options_), std::end(options_), [](const Option_p &opt) {
+                return opt->get_items_expected_max() >= detail::expected_max_vector_size && !opt->nonpositional() &&
+                       opt->get_required();
+            });
+            if(pcount - pcount_req > 1) {
+                throw InvalidError(name_);
+            }
+        }
+
+        std::size_t nameless_subs{0};
+        for(const App_p &app : subcommands_) {
+            app->_validate();
+            if(app->get_name().empty())
+                ++nameless_subs;
+        }
+
+        if(require_option_min_ > 0) {
+            if(require_option_max_ > 0) {
+                if(require_option_max_ < require_option_min_) {
+                    throw(InvalidError("Required min options greater than required max options",
+                                       ExitCodes::InvalidError));
+                }
+            }
+            if(require_option_min_ > (options_.size() + nameless_subs)) {
+                throw(InvalidError("Required min options greater than number of available options",
+                                   ExitCodes::InvalidError));
+            }
+        }
+    }
+
+    /// configure subcommands to enable parsing through the current object
+    /// set the correct fallthrough and prefix for nameless subcommands and manage the automatic enable or disable
+    /// makes sure parent is set correctly
+    void _configure() {
+        if(default_startup == startup_mode::enabled) {
+            disabled_ = false;
+        } else if(default_startup == startup_mode::disabled) {
+            disabled_ = true;
+        }
+        for(const App_p &app : subcommands_) {
+            if(app->has_automatic_name_) {
+                app->name_.clear();
+            }
+            if(app->name_.empty()) {
+                app->fallthrough_ = false;  // make sure fallthrough_ is false to prevent infinite loop
+                app->prefix_command_ = false;
+            }
+            // make sure the parent is set to be this object in preparation for parse
+            app->parent_ = this;
+            app->_configure();
+        }
+    }
+
+    /// Internal function to run (App) callback, bottom up
+    void run_callback(bool final_mode = false, bool suppress_final_callback = false) {
+        pre_callback();
+        // in the main app if immediate_callback_ is set it runs the main callback before the used subcommands
+        if(!final_mode && parse_complete_callback_) {
+            parse_complete_callback_();
+        }
+        // run the callbacks for the received subcommands
+        for(App *subc : get_subcommands()) {
+            subc->run_callback(true, suppress_final_callback);
+        }
+        // now run callbacks for option_groups
+        for(auto &subc : subcommands_) {
+            if(subc->name_.empty() && subc->count_all() > 0) {
+                subc->run_callback(true, suppress_final_callback);
+            }
+        }
+
+        // finally run the main callback
+        if(final_callback_ && (parsed_ > 0) && (!suppress_final_callback)) {
+            if(!name_.empty() || count_all() > 0 || parent_ == nullptr) {
+                final_callback_();
+            }
+        }
+    }
+
+    /// Check to see if a subcommand is valid. Give up immediately if subcommand max has been reached.
+    bool _valid_subcommand(const std::string &current, bool ignore_used = true) const {
+        // Don't match if max has been reached - but still check parents
+        if(require_subcommand_max_ != 0 && parsed_subcommands_.size() >= require_subcommand_max_) {
+            return parent_ != nullptr && parent_->_valid_subcommand(current, ignore_used);
+        }
+        auto com = _find_subcommand(current, true, ignore_used);
+        if(com != nullptr) {
+            return true;
+        }
+        // Check parent if exists, else return false
+        return parent_ != nullptr && parent_->_valid_subcommand(current, ignore_used);
+    }
+
+    /// Selects a Classifier enum based on the type of the current argument
+    detail::Classifier _recognize(const std::string &current, bool ignore_used_subcommands = true) const {
+        std::string dummy1, dummy2;
+
+        if(current == "--")
+            return detail::Classifier::POSITIONAL_MARK;
+        if(_valid_subcommand(current, ignore_used_subcommands))
+            return detail::Classifier::SUBCOMMAND;
+        if(detail::split_long(current, dummy1, dummy2))
+            return detail::Classifier::LONG;
+        if(detail::split_short(current, dummy1, dummy2)) {
+            if(dummy1[0] >= '0' && dummy1[0] <= '9') {
+                if(get_option_no_throw(std::string{'-', dummy1[0]}) == nullptr) {
+                    return detail::Classifier::NONE;
+                }
+            }
+            return detail::Classifier::SHORT;
+        }
+        if((allow_windows_style_options_) && (detail::split_windows_style(current, dummy1, dummy2)))
+            return detail::Classifier::WINDOWS_STYLE;
+        if((current == "++") && !name_.empty() && parent_ != nullptr)
+            return detail::Classifier::SUBCOMMAND_TERMINATOR;
+        return detail::Classifier::NONE;
+    }
+
+    // The parse function is now broken into several parts, and part of process
+
+    /// Read and process a configuration file (main app only)
+    void _process_config_file() {
+        if(config_ptr_ != nullptr) {
+            bool config_required = config_ptr_->get_required();
+            auto file_given = config_ptr_->count() > 0;
+            auto config_files = config_ptr_->as<std::vector<std::string>>();
+            if(config_files.empty() || config_files.front().empty()) {
+                if(config_required) {
+                    throw FileError::Missing("no specified config file");
+                }
+                return;
+            }
+            for(auto rit = config_files.rbegin(); rit != config_files.rend(); ++rit) {
+                const auto &config_file = *rit;
+                auto path_result = detail::check_path(config_file.c_str());
+                if(path_result == detail::path_type::file) {
+                    try {
+                        std::vector<ConfigItem> values = config_formatter_->from_file(config_file);
+                        _parse_config(values);
+                        if(!file_given) {
+                            config_ptr_->add_result(config_file);
+                        }
+                    } catch(const FileError &) {
+                        if(config_required || file_given)
+                            throw;
+                    }
+                } else if(config_required || file_given) {
+                    throw FileError::Missing(config_file);
+                }
+            }
+        }
+    }
+
+    /// Get envname options if not yet passed. Runs on *all* subcommands.
+    void _process_env() {
+        for(const Option_p &opt : options_) {
+            if(opt->count() == 0 && !opt->envname_.empty()) {
+                char *buffer = nullptr;
+                std::string ename_string;
+
+#ifdef _MSC_VER
+                // Windows version
+                std::size_t sz = 0;
+                if(_dupenv_s(&buffer, &sz, opt->envname_.c_str()) == 0 && buffer != nullptr) {
+                    ename_string = std::string(buffer);
+                    free(buffer);
+                }
+#else
+                // This also works on Windows, but gives a warning
+                buffer = std::getenv(opt->envname_.c_str());
+                if(buffer != nullptr)
+                    ename_string = std::string(buffer);
+#endif
+
+                if(!ename_string.empty()) {
+                    opt->add_result(ename_string);
+                }
+            }
+        }
+
+        for(App_p &sub : subcommands_) {
+            if(sub->get_name().empty() || !sub->parse_complete_callback_)
+                sub->_process_env();
+        }
+    }
+
+    /// Process callbacks. Runs on *all* subcommands.
+    void _process_callbacks() {
+
+        for(App_p &sub : subcommands_) {
+            // process the priority option_groups first
+            if(sub->get_name().empty() && sub->parse_complete_callback_) {
+                if(sub->count_all() > 0) {
+                    sub->_process_callbacks();
+                    sub->run_callback();
+                }
+            }
+        }
+
+        for(const Option_p &opt : options_) {
+            if((*opt) && !opt->get_callback_run()) {
+                opt->run_callback();
+            }
+        }
+        for(App_p &sub : subcommands_) {
+            if(!sub->parse_complete_callback_) {
+                sub->_process_callbacks();
+            }
+        }
+    }
+
+    /// Run help flag processing if any are found.
+    ///
+    /// The flags allow recursive calls to remember if there was a help flag on a parent.
+    void _process_help_flags(bool trigger_help = false, bool trigger_all_help = false) const {
+        const Option *help_ptr = get_help_ptr();
+        const Option *help_all_ptr = get_help_all_ptr();
+
+        if(help_ptr != nullptr && help_ptr->count() > 0)
+            trigger_help = true;
+        if(help_all_ptr != nullptr && help_all_ptr->count() > 0)
+            trigger_all_help = true;
+
+        // If there were parsed subcommands, call those. First subcommand wins if there are multiple ones.
+        if(!parsed_subcommands_.empty()) {
+            for(const App *sub : parsed_subcommands_)
+                sub->_process_help_flags(trigger_help, trigger_all_help);
+
+            // Only the final subcommand should call for help. All help wins over help.
+        } else if(trigger_all_help) {
+            throw CallForAllHelp();
+        } else if(trigger_help) {
+            throw CallForHelp();
+        }
+    }
+
+    /// Verify required options and cross requirements. Subcommands too (only if selected).
+    void _process_requirements() {
+        // check excludes
+        bool excluded{false};
+        std::string excluder;
+        for(auto &opt : exclude_options_) {
+            if(opt->count() > 0) {
+                excluded = true;
+                excluder = opt->get_name();
+            }
+        }
+        for(auto &subc : exclude_subcommands_) {
+            if(subc->count_all() > 0) {
+                excluded = true;
+                excluder = subc->get_display_name();
+            }
+        }
+        if(excluded) {
+            if(count_all() > 0) {
+                throw ExcludesError(get_display_name(), excluder);
+            }
+            // if we are excluded but didn't receive anything, just return
+            return;
+        }
+
+        // check excludes
+        bool missing_needed{false};
+        std::string missing_need;
+        for(auto &opt : need_options_) {
+            if(opt->count() == 0) {
+                missing_needed = true;
+                missing_need = opt->get_name();
+            }
+        }
+        for(auto &subc : need_subcommands_) {
+            if(subc->count_all() == 0) {
+                missing_needed = true;
+                missing_need = subc->get_display_name();
+            }
+        }
+        if(missing_needed) {
+            if(count_all() > 0) {
+                throw RequiresError(get_display_name(), missing_need);
+            }
+            // if we missing something but didn't have any options, just return
+            return;
+        }
+
+        std::size_t used_options = 0;
+        for(const Option_p &opt : options_) {
+
+            if(opt->count() != 0) {
+                ++used_options;
+            }
+            // Required but empty
+            if(opt->get_required() && opt->count() == 0) {
+                throw RequiredError(opt->get_name());
+            }
+            // Requires
+            for(const Option *opt_req : opt->needs_)
+                if(opt->count() > 0 && opt_req->count() == 0)
+                    throw RequiresError(opt->get_name(), opt_req->get_name());
+            // Excludes
+            for(const Option *opt_ex : opt->excludes_)
+                if(opt->count() > 0 && opt_ex->count() != 0)
+                    throw ExcludesError(opt->get_name(), opt_ex->get_name());
+        }
+        // check for the required number of subcommands
+        if(require_subcommand_min_ > 0) {
+            auto selected_subcommands = get_subcommands();
+            if(require_subcommand_min_ > selected_subcommands.size())
+                throw RequiredError::Subcommand(require_subcommand_min_);
+        }
+
+        // Max error cannot occur, the extra subcommand will parse as an ExtrasError or a remaining item.
+
+        // run this loop to check how many unnamed subcommands were actually used since they are considered options
+        // from the perspective of an App
+        for(App_p &sub : subcommands_) {
+            if(sub->disabled_)
+                continue;
+            if(sub->name_.empty() && sub->count_all() > 0) {
+                ++used_options;
+            }
+        }
+
+        if(require_option_min_ > used_options || (require_option_max_ > 0 && require_option_max_ < used_options)) {
+            auto option_list = detail::join(options_, [this](const Option_p &ptr) {
+                if(ptr.get() == help_ptr_ || ptr.get() == help_all_ptr_) {
+                    return std::string{};
+                }
+                return ptr->get_name(false, true);
+            });
+
+            auto subc_list = get_subcommands([](App *app) { return ((app->get_name().empty()) && (!app->disabled_)); });
+            if(!subc_list.empty()) {
+                option_list += "," + detail::join(subc_list, [](const App *app) { return app->get_display_name(); });
+            }
+            throw RequiredError::Option(require_option_min_, require_option_max_, used_options, option_list);
+        }
+
+        // now process the requirements for subcommands if needed
+        for(App_p &sub : subcommands_) {
+            if(sub->disabled_)
+                continue;
+            if(sub->name_.empty() && sub->required_ == false) {
+                if(sub->count_all() == 0) {
+                    if(require_option_min_ > 0 && require_option_min_ <= used_options) {
+                        continue;
+                        // if we have met the requirement and there is nothing in this option group skip checking
+                        // requirements
+                    }
+                    if(require_option_max_ > 0 && used_options >= require_option_min_) {
+                        continue;
+                        // if we have met the requirement and there is nothing in this option group skip checking
+                        // requirements
+                    }
+                }
+            }
+            if(sub->count() > 0 || sub->name_.empty()) {
+                sub->_process_requirements();
+            }
+
+            if(sub->required_ && sub->count_all() == 0) {
+                throw(CLI::RequiredError(sub->get_display_name()));
+            }
+        }
+    }
+
+    /// Process callbacks and such.
+    void _process() {
+        CLI::FileError fe("ne");
+        bool caught_error{false};
+        try {
+            // the config file might generate a FileError but that should not be processed until later in the process
+            // to allow for help, version and other errors to generate first.
+            _process_config_file();
+            // process env shouldn't throw but no reason to process it if config generated an error
+            _process_env();
+        } catch(const CLI::FileError &fe2) {
+            fe = fe2;
+            caught_error = true;
+        }
+        // callbacks and help_flags can generate exceptions which should take priority over the config file error if one
+        // exists
+        _process_callbacks();
+        _process_help_flags();
+
+        if(caught_error) {
+            throw CLI::FileError(std::move(fe));
+        }
+
+        _process_requirements();
+    }
+
+    /// Throw an error if anything is left over and should not be.
+    void _process_extras() {
+        if(!(allow_extras_ || prefix_command_)) {
+            std::size_t num_left_over = remaining_size();
+            if(num_left_over > 0) {
+                throw ExtrasError(name_, remaining(false));
+            }
+        }
+
+        for(App_p &sub : subcommands_) {
+            if(sub->count() > 0)
+                sub->_process_extras();
+        }
+    }
+
+    /// Throw an error if anything is left over and should not be.
+    /// Modifies the args to fill in the missing items before throwing.
+    void _process_extras(std::vector<std::string> &args) {
+        if(!(allow_extras_ || prefix_command_)) {
+            std::size_t num_left_over = remaining_size();
+            if(num_left_over > 0) {
+                args = remaining(false);
+                throw ExtrasError(name_, args);
+            }
+        }
+
+        for(App_p &sub : subcommands_) {
+            if(sub->count() > 0)
+                sub->_process_extras(args);
+        }
+    }
+
+    /// Internal function to recursively increment the parsed counter on the current app as well unnamed subcommands
+    void increment_parsed() {
+        ++parsed_;
+        for(App_p &sub : subcommands_) {
+            if(sub->get_name().empty())
+                sub->increment_parsed();
+        }
+    }
+    /// Internal parse function
+    void _parse(std::vector<std::string> &args) {
+        increment_parsed();
+        _trigger_pre_parse(args.size());
+        bool positional_only = false;
+
+        while(!args.empty()) {
+            if(!_parse_single(args, positional_only)) {
+                break;
+            }
+        }
+
+        if(parent_ == nullptr) {
+            _process();
+
+            // Throw error if any items are left over (depending on settings)
+            _process_extras(args);
+
+            // Convert missing (pairs) to extras (string only) ready for processing in another app
+            args = remaining_for_passthrough(false);
+        } else if(parse_complete_callback_) {
+            _process_env();
+            _process_callbacks();
+            _process_help_flags();
+            _process_requirements();
+            run_callback(false, true);
+        }
+    }
+
+    /// Internal parse function
+    void _parse(std::vector<std::string> &&args) {
+        // this can only be called by the top level in which case parent == nullptr by definition
+        // operation is simplified
+        increment_parsed();
+        _trigger_pre_parse(args.size());
+        bool positional_only = false;
+
+        while(!args.empty()) {
+            _parse_single(args, positional_only);
+        }
+        _process();
+
+        // Throw error if any items are left over (depending on settings)
+        _process_extras();
+    }
+
+    /// Internal function to parse a stream
+    void _parse_stream(std::istream &input) {
+        auto values = config_formatter_->from_config(input);
+        _parse_config(values);
+        increment_parsed();
+        _trigger_pre_parse(values.size());
+        _process();
+
+        // Throw error if any items are left over (depending on settings)
+        _process_extras();
+    }
+
+    /// Parse one config param, return false if not found in any subcommand, remove if it is
+    ///
+    /// If this has more than one dot.separated.name, go into the subcommand matching it
+    /// Returns true if it managed to find the option, if false you'll need to remove the arg manually.
+    void _parse_config(const std::vector<ConfigItem> &args) {
+        for(const ConfigItem &item : args) {
+            if(!_parse_single_config(item) && allow_config_extras_ == config_extras_mode::error)
+                throw ConfigError::Extras(item.fullname());
+        }
+    }
+
+    /// Fill in a single config option
+    bool _parse_single_config(const ConfigItem &item, std::size_t level = 0) {
+        if(level < item.parents.size()) {
+            try {
+                auto subcom = get_subcommand(item.parents.at(level));
+                auto result = subcom->_parse_single_config(item, level + 1);
+
+                return result;
+            } catch(const OptionNotFound &) {
+                return false;
+            }
+        }
+        // check for section open
+        if(item.name == "++") {
+            if(configurable_) {
+                increment_parsed();
+                _trigger_pre_parse(2);
+                if(parent_ != nullptr) {
+                    parent_->parsed_subcommands_.push_back(this);
+                }
+            }
+            return true;
+        }
+        // check for section close
+        if(item.name == "--") {
+            if(configurable_) {
+                _process_callbacks();
+                _process_requirements();
+                run_callback();
+            }
+            return true;
+        }
+        Option *op = get_option_no_throw("--" + item.name);
+        if(op == nullptr) {
+            if(item.name.size() == 1) {
+                op = get_option_no_throw("-" + item.name);
+            }
+        }
+        if(op == nullptr) {
+            op = get_option_no_throw(item.name);
+        }
+        if(op == nullptr) {
+            // If the option was not present
+            if(get_allow_config_extras() == config_extras_mode::capture)
+                // Should we worry about classifying the extras properly?
+                missing_.emplace_back(detail::Classifier::NONE, item.fullname());
+            return false;
+        }
+
+        if(!op->get_configurable()) {
+            if(get_allow_config_extras() == config_extras_mode::ignore_all) {
+                return false;
+            }
+            throw ConfigError::NotConfigurable(item.fullname());
+        }
+
+        if(op->empty()) {
+            // Flag parsing
+            if(op->get_expected_min() == 0) {
+                auto res = config_formatter_->to_flag(item);
+                res = op->get_flag_value(item.name, res);
+
+                op->add_result(res);
+
+            } else {
+                op->add_result(item.inputs);
+                op->run_callback();
+            }
+        }
+
+        return true;
+    }
+
+    /// Parse "one" argument (some may eat more than one), delegate to parent if fails, add to missing if missing
+    /// from main return false if the parse has failed and needs to return to parent
+    bool _parse_single(std::vector<std::string> &args, bool &positional_only) {
+        bool retval = true;
+        detail::Classifier classifier = positional_only ? detail::Classifier::NONE : _recognize(args.back());
+        switch(classifier) {
+        case detail::Classifier::POSITIONAL_MARK:
+            args.pop_back();
+            positional_only = true;
+            if((!_has_remaining_positionals()) && (parent_ != nullptr)) {
+                retval = false;
+            } else {
+                _move_to_missing(classifier, "--");
+            }
+            break;
+        case detail::Classifier::SUBCOMMAND_TERMINATOR:
+            // treat this like a positional mark if in the parent app
+            args.pop_back();
+            retval = false;
+            break;
+        case detail::Classifier::SUBCOMMAND:
+            retval = _parse_subcommand(args);
+            break;
+        case detail::Classifier::LONG:
+        case detail::Classifier::SHORT:
+        case detail::Classifier::WINDOWS_STYLE:
+            // If already parsed a subcommand, don't accept options_
+            _parse_arg(args, classifier);
+            break;
+        case detail::Classifier::NONE:
+            // Probably a positional or something for a parent (sub)command
+            retval = _parse_positional(args, false);
+            if(retval && positionals_at_end_) {
+                positional_only = true;
+            }
+            break;
+            // LCOV_EXCL_START
+        default:
+            throw HorribleError("unrecognized classifier (you should not see this!)");
+            // LCOV_EXCL_STOP
+        }
+        return retval;
+    }
+
+    /// Count the required remaining positional arguments
+    std::size_t _count_remaining_positionals(bool required_only = false) const {
+        std::size_t retval = 0;
+        for(const Option_p &opt : options_) {
+            if(opt->get_positional() && (!required_only || opt->get_required())) {
+                if(opt->get_items_expected_min() > 0 &&
+                   static_cast<int>(opt->count()) < opt->get_items_expected_min()) {
+                    retval += static_cast<std::size_t>(opt->get_items_expected_min()) - opt->count();
+                }
+            }
+        }
+        return retval;
+    }
+
+    /// Count the required remaining positional arguments
+    bool _has_remaining_positionals() const {
+        for(const Option_p &opt : options_) {
+            if(opt->get_positional() && ((static_cast<int>(opt->count()) < opt->get_items_expected_min()))) {
+                return true;
+            }
+        }
+
+        return false;
+    }
+
+    /// Parse a positional, go up the tree to check
+    /// @param haltOnSubcommand if set to true the operation will not process subcommands merely return false
+    /// Return true if the positional was used false otherwise
+    bool _parse_positional(std::vector<std::string> &args, bool haltOnSubcommand) {
+
+        const std::string &positional = args.back();
+
+        if(positionals_at_end_) {
+            // deal with the case of required arguments at the end which should take precedence over other arguments
+            auto arg_rem = args.size();
+            auto remreq = _count_remaining_positionals(true);
+            if(arg_rem <= remreq) {
+                for(const Option_p &opt : options_) {
+                    if(opt->get_positional() && opt->required_) {
+                        if(static_cast<int>(opt->count()) < opt->get_items_expected_min()) {
+                            if(validate_positionals_) {
+                                std::string pos = positional;
+                                pos = opt->_validate(pos, 0);
+                                if(!pos.empty()) {
+                                    continue;
+                                }
+                            }
+                            opt->add_result(positional);
+                            parse_order_.push_back(opt.get());
+                            args.pop_back();
+                            return true;
+                        }
+                    }
+                }
+            }
+        }
+        for(const Option_p &opt : options_) {
+            // Eat options, one by one, until done
+            if(opt->get_positional() &&
+               (static_cast<int>(opt->count()) < opt->get_items_expected_min() || opt->get_allow_extra_args())) {
+                if(validate_positionals_) {
+                    std::string pos = positional;
+                    pos = opt->_validate(pos, 0);
+                    if(!pos.empty()) {
+                        continue;
+                    }
+                }
+                opt->add_result(positional);
+                parse_order_.push_back(opt.get());
+                args.pop_back();
+                return true;
+            }
+        }
+
+        for(auto &subc : subcommands_) {
+            if((subc->name_.empty()) && (!subc->disabled_)) {
+                if(subc->_parse_positional(args, false)) {
+                    if(!subc->pre_parse_called_) {
+                        subc->_trigger_pre_parse(args.size());
+                    }
+                    return true;
+                }
+            }
+        }
+        // let the parent deal with it if possible
+        if(parent_ != nullptr && fallthrough_)
+            return _get_fallthrough_parent()->_parse_positional(args, static_cast<bool>(parse_complete_callback_));
+
+        /// Try to find a local subcommand that is repeated
+        auto com = _find_subcommand(args.back(), true, false);
+        if(com != nullptr && (require_subcommand_max_ == 0 || require_subcommand_max_ > parsed_subcommands_.size())) {
+            if(haltOnSubcommand) {
+                return false;
+            }
+            args.pop_back();
+            com->_parse(args);
+            return true;
+        }
+        /// now try one last gasp at subcommands that have been executed before, go to root app and try to find a
+        /// subcommand in a broader way, if one exists let the parent deal with it
+        auto parent_app = (parent_ != nullptr) ? _get_fallthrough_parent() : this;
+        com = parent_app->_find_subcommand(args.back(), true, false);
+        if(com != nullptr && (com->parent_->require_subcommand_max_ == 0 ||
+                              com->parent_->require_subcommand_max_ > com->parent_->parsed_subcommands_.size())) {
+            return false;
+        }
+
+        if(positionals_at_end_) {
+            throw CLI::ExtrasError(name_, args);
+        }
+        /// If this is an option group don't deal with it
+        if(parent_ != nullptr && name_.empty()) {
+            return false;
+        }
+        /// We are out of other options this goes to missing
+        _move_to_missing(detail::Classifier::NONE, positional);
+        args.pop_back();
+        if(prefix_command_) {
+            while(!args.empty()) {
+                _move_to_missing(detail::Classifier::NONE, args.back());
+                args.pop_back();
+            }
+        }
+
+        return true;
+    }
+
+    /// Locate a subcommand by name with two conditions, should disabled subcommands be ignored, and should used
+    /// subcommands be ignored
+    App *_find_subcommand(const std::string &subc_name, bool ignore_disabled, bool ignore_used) const noexcept {
+        for(const App_p &com : subcommands_) {
+            if(com->disabled_ && ignore_disabled)
+                continue;
+            if(com->get_name().empty()) {
+                auto subc = com->_find_subcommand(subc_name, ignore_disabled, ignore_used);
+                if(subc != nullptr) {
+                    return subc;
+                }
+            }
+            if(com->check_name(subc_name)) {
+                if((!*com) || !ignore_used)
+                    return com.get();
+            }
+        }
+        return nullptr;
+    }
+
+    /// Parse a subcommand, modify args and continue
+    ///
+    /// Unlike the others, this one will always allow fallthrough
+    /// return true if the subcommand was processed false otherwise
+    bool _parse_subcommand(std::vector<std::string> &args) {
+        if(_count_remaining_positionals(/* required */ true) > 0) {
+            _parse_positional(args, false);
+            return true;
+        }
+        auto com = _find_subcommand(args.back(), true, true);
+        if(com != nullptr) {
+            args.pop_back();
+            if(!com->silent_) {
+                parsed_subcommands_.push_back(com);
+            }
+            com->_parse(args);
+            auto parent_app = com->parent_;
+            while(parent_app != this) {
+                parent_app->_trigger_pre_parse(args.size());
+                if(!com->silent_) {
+                    parent_app->parsed_subcommands_.push_back(com);
+                }
+                parent_app = parent_app->parent_;
+            }
+            return true;
+        }
+
+        if(parent_ == nullptr)
+            throw HorribleError("Subcommand " + args.back() + " missing");
+        return false;
+    }
+
+    /// Parse a short (false) or long (true) argument, must be at the top of the list
+    /// return true if the argument was processed or false if nothing was done
+    bool _parse_arg(std::vector<std::string> &args, detail::Classifier current_type) {
+
+        std::string current = args.back();
+
+        std::string arg_name;
+        std::string value;
+        std::string rest;
+
+        switch(current_type) {
+        case detail::Classifier::LONG:
+            if(!detail::split_long(current, arg_name, value))
+                throw HorribleError("Long parsed but missing (you should not see this):" + args.back());
+            break;
+        case detail::Classifier::SHORT:
+            if(!detail::split_short(current, arg_name, rest))
+                throw HorribleError("Short parsed but missing! You should not see this");
+            break;
+        case detail::Classifier::WINDOWS_STYLE:
+            if(!detail::split_windows_style(current, arg_name, value))
+                throw HorribleError("windows option parsed but missing! You should not see this");
+            break;
+        case detail::Classifier::SUBCOMMAND:
+        case detail::Classifier::SUBCOMMAND_TERMINATOR:
+        case detail::Classifier::POSITIONAL_MARK:
+        case detail::Classifier::NONE:
+        default:
+            throw HorribleError("parsing got called with invalid option! You should not see this");
+        }
+
+        auto op_ptr =
+            std::find_if(std::begin(options_), std::end(options_), [arg_name, current_type](const Option_p &opt) {
+                if(current_type == detail::Classifier::LONG)
+                    return opt->check_lname(arg_name);
+                if(current_type == detail::Classifier::SHORT)
+                    return opt->check_sname(arg_name);
+                // this will only get called for detail::Classifier::WINDOWS_STYLE
+                return opt->check_lname(arg_name) || opt->check_sname(arg_name);
+            });
+
+        // Option not found
+        if(op_ptr == std::end(options_)) {
+            for(auto &subc : subcommands_) {
+                if(subc->name_.empty() && !subc->disabled_) {
+                    if(subc->_parse_arg(args, current_type)) {
+                        if(!subc->pre_parse_called_) {
+                            subc->_trigger_pre_parse(args.size());
+                        }
+                        return true;
+                    }
+                }
+            }
+            // If a subcommand, try the main command
+            if(parent_ != nullptr && fallthrough_)
+                return _get_fallthrough_parent()->_parse_arg(args, current_type);
+            // don't capture missing if this is a nameless subcommand
+            if(parent_ != nullptr && name_.empty()) {
+                return false;
+            }
+            // Otherwise, add to missing
+            args.pop_back();
+            _move_to_missing(current_type, current);
+            return true;
+        }
+
+        args.pop_back();
+
+        // Get a reference to the pointer to make syntax bearable
+        Option_p &op = *op_ptr;
+        /// if we require a separator add it here
+        if(op->get_inject_separator()) {
+            if(!op->results().empty() && !op->results().back().empty()) {
+                op->add_result(std::string{});
+            }
+        }
+        if(op->get_trigger_on_parse() && op->current_option_state_ == Option::option_state::callback_run) {
+            op->clear();
+        }
+        int min_num = (std::min)(op->get_type_size_min(), op->get_items_expected_min());
+        int max_num = op->get_items_expected_max();
+        // check container like options to limit the argument size to a single type if the allow_extra_flags argument is
+        // set. 16 is somewhat arbitrary (needs to be at least 4)
+        if(max_num >= detail::expected_max_vector_size / 16 && !op->get_allow_extra_args()) {
+            auto tmax = op->get_type_size_max();
+            max_num = detail::checked_multiply(tmax, op->get_expected_min()) ? tmax : detail::expected_max_vector_size;
+        }
+        // Make sure we always eat the minimum for unlimited vectors
+        int collected = 0;     // total number of arguments collected
+        int result_count = 0;  // local variable for number of results in a single arg string
+        // deal with purely flag like things
+        if(max_num == 0) {
+            auto res = op->get_flag_value(arg_name, value);
+            op->add_result(res);
+            parse_order_.push_back(op.get());
+        } else if(!value.empty()) {  // --this=value
+            op->add_result(value, result_count);
+            parse_order_.push_back(op.get());
+            collected += result_count;
+            // -Trest
+        } else if(!rest.empty()) {
+            op->add_result(rest, result_count);
+            parse_order_.push_back(op.get());
+            rest = "";
+            collected += result_count;
+        }
+
+        // gather the minimum number of arguments
+        while(min_num > collected && !args.empty()) {
+            std::string current_ = args.back();
+            args.pop_back();
+            op->add_result(current_, result_count);
+            parse_order_.push_back(op.get());
+            collected += result_count;
+        }
+
+        if(min_num > collected) {  // if we have run out of arguments and the minimum was not met
+            throw ArgumentMismatch::TypedAtLeast(op->get_name(), min_num, op->get_type_name());
+        }
+
+        if(max_num > collected || op->get_allow_extra_args()) {  // we allow optional arguments
+            auto remreqpos = _count_remaining_positionals(true);
+            // we have met the minimum now optionally check up to the maximum
+            while((collected < max_num || op->get_allow_extra_args()) && !args.empty() &&
+                  _recognize(args.back(), false) == detail::Classifier::NONE) {
+                // If any required positionals remain, don't keep eating
+                if(remreqpos >= args.size()) {
+                    break;
+                }
+
+                op->add_result(args.back(), result_count);
+                parse_order_.push_back(op.get());
+                args.pop_back();
+                collected += result_count;
+            }
+
+            // Allow -- to end an unlimited list and "eat" it
+            if(!args.empty() && _recognize(args.back()) == detail::Classifier::POSITIONAL_MARK)
+                args.pop_back();
+            // optional flag that didn't receive anything now get the default value
+            if(min_num == 0 && max_num > 0 && collected == 0) {
+                auto res = op->get_flag_value(arg_name, std::string{});
+                op->add_result(res);
+                parse_order_.push_back(op.get());
+            }
+        }
+
+        // if we only partially completed a type then add an empty string for later processing
+        if(min_num > 0 && op->get_type_size_max() != min_num && (collected % op->get_type_size_max()) != 0) {
+            op->add_result(std::string{});
+        }
+        if(op->get_trigger_on_parse()) {
+            op->run_callback();
+        }
+        if(!rest.empty()) {
+            rest = "-" + rest;
+            args.push_back(rest);
+        }
+        return true;
+    }
+
+    /// Trigger the pre_parse callback if needed
+    void _trigger_pre_parse(std::size_t remaining_args) {
+        if(!pre_parse_called_) {
+            pre_parse_called_ = true;
+            if(pre_parse_callback_) {
+                pre_parse_callback_(remaining_args);
+            }
+        } else if(immediate_callback_) {
+            if(!name_.empty()) {
+                auto pcnt = parsed_;
+                auto extras = std::move(missing_);
+                clear();
+                parsed_ = pcnt;
+                pre_parse_called_ = true;
+                missing_ = std::move(extras);
+            }
+        }
+    }
+
+    /// Get the appropriate parent to fallthrough to which is the first one that has a name or the main app
+    App *_get_fallthrough_parent() {
+        if(parent_ == nullptr) {
+            throw(HorribleError("No Valid parent"));
+        }
+        auto fallthrough_parent = parent_;
+        while((fallthrough_parent->parent_ != nullptr) && (fallthrough_parent->get_name().empty())) {
+            fallthrough_parent = fallthrough_parent->parent_;
+        }
+        return fallthrough_parent;
+    }
+
+    /// Helper function to run through all possible comparisons of subcommand names to check there is no overlap
+    const std::string &_compare_subcommand_names(const App &subcom, const App &base) const {
+        static const std::string estring;
+        if(subcom.disabled_) {
+            return estring;
+        }
+        for(auto &subc : base.subcommands_) {
+            if(subc.get() != &subcom) {
+                if(subc->disabled_) {
+                    continue;
+                }
+                if(!subcom.get_name().empty()) {
+                    if(subc->check_name(subcom.get_name())) {
+                        return subcom.get_name();
+                    }
+                }
+                if(!subc->get_name().empty()) {
+                    if(subcom.check_name(subc->get_name())) {
+                        return subc->get_name();
+                    }
+                }
+                for(const auto &les : subcom.aliases_) {
+                    if(subc->check_name(les)) {
+                        return les;
+                    }
+                }
+                // this loop is needed in case of ignore_underscore or ignore_case on one but not the other
+                for(const auto &les : subc->aliases_) {
+                    if(subcom.check_name(les)) {
+                        return les;
+                    }
+                }
+                // if the subcommand is an option group we need to check deeper
+                if(subc->get_name().empty()) {
+                    auto &cmpres = _compare_subcommand_names(subcom, *subc);
+                    if(!cmpres.empty()) {
+                        return cmpres;
+                    }
+                }
+                // if the test subcommand is an option group we need to check deeper
+                if(subcom.get_name().empty()) {
+                    auto &cmpres = _compare_subcommand_names(*subc, subcom);
+                    if(!cmpres.empty()) {
+                        return cmpres;
+                    }
+                }
+            }
+        }
+        return estring;
+    }
+    /// Helper function to place extra values in the most appropriate position
+    void _move_to_missing(detail::Classifier val_type, const std::string &val) {
+        if(allow_extras_ || subcommands_.empty()) {
+            missing_.emplace_back(val_type, val);
+            return;
+        }
+        // allow extra arguments to be places in an option group if it is allowed there
+        for(auto &subc : subcommands_) {
+            if(subc->name_.empty() && subc->allow_extras_) {
+                subc->missing_.emplace_back(val_type, val);
+                return;
+            }
+        }
+        // if we haven't found any place to put them yet put them in missing
+        missing_.emplace_back(val_type, val);
+    }
+
+  public:
+    /// function that could be used by subclasses of App to shift options around into subcommands
+    void _move_option(Option *opt, App *app) {
+        if(opt == nullptr) {
+            throw OptionNotFound("the option is NULL");
+        }
+        // verify that the give app is actually a subcommand
+        bool found = false;
+        for(auto &subc : subcommands_) {
+            if(app == subc.get()) {
+                found = true;
+            }
+        }
+        if(!found) {
+            throw OptionNotFound("The Given app is not a subcommand");
+        }
+
+        if((help_ptr_ == opt) || (help_all_ptr_ == opt))
+            throw OptionAlreadyAdded("cannot move help options");
+
+        if(config_ptr_ == opt)
+            throw OptionAlreadyAdded("cannot move config file options");
+
+        auto iterator =
+            std::find_if(std::begin(options_), std::end(options_), [opt](const Option_p &v) { return v.get() == opt; });
+        if(iterator != std::end(options_)) {
+            const auto &opt_p = *iterator;
+            if(std::find_if(std::begin(app->options_), std::end(app->options_), [&opt_p](const Option_p &v) {
+                   return (*v == *opt_p);
+               }) == std::end(app->options_)) {
+                // only erase after the insertion was successful
+                app->options_.push_back(std::move(*iterator));
+                options_.erase(iterator);
+            } else {
+                throw OptionAlreadyAdded("option was not located: " + opt->get_name());
+            }
+        } else {
+            throw OptionNotFound("could not locate the given Option");
+        }
+    }
+};  // namespace CLI
+
+/// Extension of App to better manage groups of options
+class Option_group : public App {
+  public:
+    Option_group(std::string group_description, std::string group_name, App *parent)
+        : App(std::move(group_description), "", parent) {
+        group(group_name);
+        // option groups should have automatic fallthrough
+    }
+    using App::add_option;
+    /// Add an existing option to the Option_group
+    Option *add_option(Option *opt) {
+        if(get_parent() == nullptr) {
+            throw OptionNotFound("Unable to locate the specified option");
+        }
+        get_parent()->_move_option(opt, this);
+        return opt;
+    }
+    /// Add an existing option to the Option_group
+    void add_options(Option *opt) { add_option(opt); }
+    /// Add a bunch of options to the group
+    template <typename... Args> void add_options(Option *opt, Args... args) {
+        add_option(opt);
+        add_options(args...);
+    }
+    using App::add_subcommand;
+    /// Add an existing subcommand to be a member of an option_group
+    App *add_subcommand(App *subcom) {
+        App_p subc = subcom->get_parent()->get_subcommand_ptr(subcom);
+        subc->get_parent()->remove_subcommand(subcom);
+        add_subcommand(std::move(subc));
+        return subcom;
+    }
+};
+/// Helper function to enable one option group/subcommand when another is used
+inline void TriggerOn(App *trigger_app, App *app_to_enable) {
+    app_to_enable->enabled_by_default(false);
+    app_to_enable->disabled_by_default();
+    trigger_app->preparse_callback([app_to_enable](std::size_t) { app_to_enable->disabled(false); });
+}
+
+/// Helper function to enable one option group/subcommand when another is used
+inline void TriggerOn(App *trigger_app, std::vector<App *> apps_to_enable) {
+    for(auto &app : apps_to_enable) {
+        app->enabled_by_default(false);
+        app->disabled_by_default();
+    }
+
+    trigger_app->preparse_callback([apps_to_enable](std::size_t) {
+        for(auto &app : apps_to_enable) {
+            app->disabled(false);
+        }
+    });
+}
+
+/// Helper function to disable one option group/subcommand when another is used
+inline void TriggerOff(App *trigger_app, App *app_to_enable) {
+    app_to_enable->disabled_by_default(false);
+    app_to_enable->enabled_by_default();
+    trigger_app->preparse_callback([app_to_enable](std::size_t) { app_to_enable->disabled(); });
+}
+
+/// Helper function to disable one option group/subcommand when another is used
+inline void TriggerOff(App *trigger_app, std::vector<App *> apps_to_enable) {
+    for(auto &app : apps_to_enable) {
+        app->disabled_by_default(false);
+        app->enabled_by_default();
+    }
+
+    trigger_app->preparse_callback([apps_to_enable](std::size_t) {
+        for(auto &app : apps_to_enable) {
+            app->disabled();
+        }
+    });
+}
+
+/// Helper function to mark an option as deprecated
+inline void deprecate_option(Option *opt, const std::string &replacement = "") {
+    Validator deprecate_warning{[opt, replacement](std::string &) {
+                                    std::cout << opt->get_name() << " is deprecated please use '" << replacement
+                                              << "' instead\n";
+                                    return std::string();
+                                },
+                                "DEPRECATED"};
+    deprecate_warning.application_index(0);
+    opt->check(deprecate_warning);
+    if(!replacement.empty()) {
+        opt->description(opt->get_description() + " DEPRECATED: please use '" + replacement + "' instead");
+    }
+}
+
+/// Helper function to mark an option as deprecated
+inline void deprecate_option(App *app, const std::string &option_name, const std::string &replacement = "") {
+    auto opt = app->get_option(option_name);
+    deprecate_option(opt, replacement);
+}
+
+/// Helper function to mark an option as deprecated
+inline void deprecate_option(App &app, const std::string &option_name, const std::string &replacement = "") {
+    auto opt = app.get_option(option_name);
+    deprecate_option(opt, replacement);
+}
+
+/// Helper function to mark an option as retired
+inline void retire_option(App *app, Option *opt) {
+    App temp;
+    auto option_copy = temp.add_option(opt->get_name(false, true))
+                           ->type_size(opt->get_type_size_min(), opt->get_type_size_max())
+                           ->expected(opt->get_expected_min(), opt->get_expected_max())
+                           ->allow_extra_args(opt->get_allow_extra_args());
+
+    app->remove_option(opt);
+    auto opt2 = app->add_option(option_copy->get_name(false, true), "option has been retired and has no effect")
+                    ->type_name("RETIRED")
+                    ->default_str("RETIRED")
+                    ->type_size(option_copy->get_type_size_min(), option_copy->get_type_size_max())
+                    ->expected(option_copy->get_expected_min(), option_copy->get_expected_max())
+                    ->allow_extra_args(option_copy->get_allow_extra_args());
+
+    Validator retired_warning{[opt2](std::string &) {
+                                  std::cout << "WARNING " << opt2->get_name() << " is retired and has no effect\n";
+                                  return std::string();
+                              },
+                              ""};
+    retired_warning.application_index(0);
+    opt2->check(retired_warning);
+}
+
+/// Helper function to mark an option as retired
+inline void retire_option(App &app, Option *opt) { retire_option(&app, opt); }
+
+/// Helper function to mark an option as retired
+inline void retire_option(App *app, const std::string &option_name) {
+
+    auto opt = app->get_option_no_throw(option_name);
+    if(opt != nullptr) {
+        retire_option(app, opt);
+        return;
+    }
+    auto opt2 = app->add_option(option_name, "option has been retired and has no effect")
+                    ->type_name("RETIRED")
+                    ->expected(0, 1)
+                    ->default_str("RETIRED");
+    Validator retired_warning{[opt2](std::string &) {
+                                  std::cout << "WARNING " << opt2->get_name() << " is retired and has no effect\n";
+                                  return std::string();
+                              },
+                              ""};
+    retired_warning.application_index(0);
+    opt2->check(retired_warning);
+}
+
+/// Helper function to mark an option as retired
+inline void retire_option(App &app, const std::string &option_name) { retire_option(&app, option_name); }
+
+namespace FailureMessage {
+
+/// Printout a clean, simple message on error (the default in CLI11 1.5+)
+inline std::string simple(const App *app, const Error &e) {
+    std::string header = std::string(e.what()) + "\n";
+    std::vector<std::string> names;
+
+    // Collect names
+    if(app->get_help_ptr() != nullptr)
+        names.push_back(app->get_help_ptr()->get_name());
+
+    if(app->get_help_all_ptr() != nullptr)
+        names.push_back(app->get_help_all_ptr()->get_name());
+
+    // If any names found, suggest those
+    if(!names.empty())
+        header += "Run with " + detail::join(names, " or ") + " for more information.\n";
+
+    return header;
+}
+
+/// Printout the full help string on error (if this fn is set, the old default for CLI11)
+inline std::string help(const App *app, const Error &e) {
+    std::string header = std::string("ERROR: ") + e.get_name() + ": " + e.what() + "\n";
+    header += app->help();
+    return header;
+}
+
+}  // namespace FailureMessage
+
+namespace detail {
+/// This class is simply to allow tests access to App's protected functions
+struct AppFriend {
+#ifdef CLI11_CPP14
+
+    /// Wrap _parse_short, perfectly forward arguments and return
+    template <typename... Args> static decltype(auto) parse_arg(App *app, Args &&...args) {
+        return app->_parse_arg(std::forward<Args>(args)...);
+    }
+
+    /// Wrap _parse_subcommand, perfectly forward arguments and return
+    template <typename... Args> static decltype(auto) parse_subcommand(App *app, Args &&...args) {
+        return app->_parse_subcommand(std::forward<Args>(args)...);
+    }
+#else
+    /// Wrap _parse_short, perfectly forward arguments and return
+    template <typename... Args>
+    static auto parse_arg(App *app, Args &&...args) ->
+        typename std::result_of<decltype (&App::_parse_arg)(App, Args...)>::type {
+        return app->_parse_arg(std::forward<Args>(args)...);
+    }
+
+    /// Wrap _parse_subcommand, perfectly forward arguments and return
+    template <typename... Args>
+    static auto parse_subcommand(App *app, Args &&...args) ->
+        typename std::result_of<decltype (&App::_parse_subcommand)(App, Args...)>::type {
+        return app->_parse_subcommand(std::forward<Args>(args)...);
+    }
+#endif
+    /// Wrap the fallthrough parent function to make sure that is working correctly
+    static App *get_fallthrough_parent(App *app) { return app->_get_fallthrough_parent(); }
+};
+}  // namespace detail
+
+
+
+
+namespace detail {
+
+inline std::string convert_arg_for_ini(const std::string &arg, char stringQuote = '"', char characterQuote = '\'') {
+    if(arg.empty()) {
+        return std::string(2, stringQuote);
+    }
+    // some specifically supported strings
+    if(arg == "true" || arg == "false" || arg == "nan" || arg == "inf") {
+        return arg;
+    }
+    // floating point conversion can convert some hex codes, but don't try that here
+    if(arg.compare(0, 2, "0x") != 0 && arg.compare(0, 2, "0X") != 0) {
+        double val;
+        if(detail::lexical_cast(arg, val)) {
+            return arg;
+        }
+    }
+    // just quote a single non numeric character
+    if(arg.size() == 1) {
+        return std::string(1, characterQuote) + arg + characterQuote;
+    }
+    // handle hex, binary or octal arguments
+    if(arg.front() == '0') {
+        if(arg[1] == 'x') {
+            if(std::all_of(arg.begin() + 2, arg.end(), [](char x) {
+                   return (x >= '0' && x <= '9') || (x >= 'A' && x <= 'F') || (x >= 'a' && x <= 'f');
+               })) {
+                return arg;
+            }
+        } else if(arg[1] == 'o') {
+            if(std::all_of(arg.begin() + 2, arg.end(), [](char x) { return (x >= '0' && x <= '7'); })) {
+                return arg;
+            }
+        } else if(arg[1] == 'b') {
+            if(std::all_of(arg.begin() + 2, arg.end(), [](char x) { return (x == '0' || x == '1'); })) {
+                return arg;
+            }
+        }
+    }
+    if(arg.find_first_of(stringQuote) == std::string::npos) {
+        return std::string(1, stringQuote) + arg + stringQuote;
+    } else {
+        return characterQuote + arg + characterQuote;
+    }
+}
+
+/// Comma separated join, adds quotes if needed
+inline std::string ini_join(const std::vector<std::string> &args,
+                            char sepChar = ',',
+                            char arrayStart = '[',
+                            char arrayEnd = ']',
+                            char stringQuote = '"',
+                            char characterQuote = '\'') {
+    std::string joined;
+    if(args.size() > 1 && arrayStart != '\0') {
+        joined.push_back(arrayStart);
+    }
+    std::size_t start = 0;
+    for(const auto &arg : args) {
+        if(start++ > 0) {
+            joined.push_back(sepChar);
+            if(isspace(sepChar) == 0) {
+                joined.push_back(' ');
+            }
+        }
+        joined.append(convert_arg_for_ini(arg, stringQuote, characterQuote));
+    }
+    if(args.size() > 1 && arrayEnd != '\0') {
+        joined.push_back(arrayEnd);
+    }
+    return joined;
+}
+
+inline std::vector<std::string> generate_parents(const std::string &section, std::string &name, char parentSeparator) {
+    std::vector<std::string> parents;
+    if(detail::to_lower(section) != "default") {
+        if(section.find(parentSeparator) != std::string::npos) {
+            parents = detail::split(section, parentSeparator);
+        } else {
+            parents = {section};
+        }
+    }
+    if(name.find(parentSeparator) != std::string::npos) {
+        std::vector<std::string> plist = detail::split(name, parentSeparator);
+        name = plist.back();
+        detail::remove_quotes(name);
+        plist.pop_back();
+        parents.insert(parents.end(), plist.begin(), plist.end());
+    }
+
+    // clean up quotes on the parents
+    for(auto &parent : parents) {
+        detail::remove_quotes(parent);
+    }
+    return parents;
+}
+
+/// assuming non default segments do a check on the close and open of the segments in a configItem structure
+inline void
+checkParentSegments(std::vector<ConfigItem> &output, const std::string &currentSection, char parentSeparator) {
+
+    std::string estring;
+    auto parents = detail::generate_parents(currentSection, estring, parentSeparator);
+    if(!output.empty() && output.back().name == "--") {
+        std::size_t msize = (parents.size() > 1U) ? parents.size() : 2;
+        while(output.back().parents.size() >= msize) {
+            output.push_back(output.back());
+            output.back().parents.pop_back();
+        }
+
+        if(parents.size() > 1) {
+            std::size_t common = 0;
+            std::size_t mpair = (std::min)(output.back().parents.size(), parents.size() - 1);
+            for(std::size_t ii = 0; ii < mpair; ++ii) {
+                if(output.back().parents[ii] != parents[ii]) {
+                    break;
+                }
+                ++common;
+            }
+            if(common == mpair) {
+                output.pop_back();
+            } else {
+                while(output.back().parents.size() > common + 1) {
+                    output.push_back(output.back());
+                    output.back().parents.pop_back();
+                }
+            }
+            for(std::size_t ii = common; ii < parents.size() - 1; ++ii) {
+                output.emplace_back();
+                output.back().parents.assign(parents.begin(), parents.begin() + static_cast<std::ptrdiff_t>(ii) + 1);
+                output.back().name = "++";
+            }
+        }
+    } else if(parents.size() > 1) {
+        for(std::size_t ii = 0; ii < parents.size() - 1; ++ii) {
+            output.emplace_back();
+            output.back().parents.assign(parents.begin(), parents.begin() + static_cast<std::ptrdiff_t>(ii) + 1);
+            output.back().name = "++";
+        }
+    }
+
+    // insert a section end which is just an empty items_buffer
+    output.emplace_back();
+    output.back().parents = std::move(parents);
+    output.back().name = "++";
+}
+}  // namespace detail
+
+inline std::vector<ConfigItem> ConfigBase::from_config(std::istream &input) const {
+    std::string line;
+    std::string currentSection = "default";
+    std::string previousSection = "default";
+    std::vector<ConfigItem> output;
+    bool isDefaultArray = (arrayStart == '[' && arrayEnd == ']' && arraySeparator == ',');
+    bool isINIArray = (arrayStart == '\0' || arrayStart == ' ') && arrayStart == arrayEnd;
+    bool inSection{false};
+    char aStart = (isINIArray) ? '[' : arrayStart;
+    char aEnd = (isINIArray) ? ']' : arrayEnd;
+    char aSep = (isINIArray && arraySeparator == ' ') ? ',' : arraySeparator;
+    int currentSectionIndex{0};
+    while(getline(input, line)) {
+        std::vector<std::string> items_buffer;
+        std::string name;
+
+        detail::trim(line);
+        std::size_t len = line.length();
+        // lines have to be at least 3 characters to have any meaning to CLI just skip the rest
+        if(len < 3) {
+            continue;
+        }
+        if(line.front() == '[' && line.back() == ']') {
+            if(currentSection != "default") {
+                // insert a section end which is just an empty items_buffer
+                output.emplace_back();
+                output.back().parents = detail::generate_parents(currentSection, name, parentSeparatorChar);
+                output.back().name = "--";
+            }
+            currentSection = line.substr(1, len - 2);
+            // deal with double brackets for TOML
+            if(currentSection.size() > 1 && currentSection.front() == '[' && currentSection.back() == ']') {
+                currentSection = currentSection.substr(1, currentSection.size() - 2);
+            }
+            if(detail::to_lower(currentSection) == "default") {
+                currentSection = "default";
+            } else {
+                detail::checkParentSegments(output, currentSection, parentSeparatorChar);
+            }
+            inSection = false;
+            if(currentSection == previousSection) {
+                ++currentSectionIndex;
+            } else {
+                currentSectionIndex = 0;
+                previousSection = currentSection;
+            }
+            continue;
+        }
+
+        // comment lines
+        if(line.front() == ';' || line.front() == '#' || line.front() == commentChar) {
+            continue;
+        }
+
+        // Find = in string, split and recombine
+        auto pos = line.find(valueDelimiter);
+        if(pos != std::string::npos) {
+            name = detail::trim_copy(line.substr(0, pos));
+            std::string item = detail::trim_copy(line.substr(pos + 1));
+            auto cloc = item.find(commentChar);
+            if(cloc != std::string::npos) {
+                item.erase(cloc, std::string::npos);
+                detail::trim(item);
+            }
+            if(item.size() > 1 && item.front() == aStart) {
+                for(std::string multiline; item.back() != aEnd && std::getline(input, multiline);) {
+                    detail::trim(multiline);
+                    item += multiline;
+                }
+                items_buffer = detail::split_up(item.substr(1, item.length() - 2), aSep);
+            } else if((isDefaultArray || isINIArray) && item.find_first_of(aSep) != std::string::npos) {
+                items_buffer = detail::split_up(item, aSep);
+            } else if((isDefaultArray || isINIArray) && item.find_first_of(' ') != std::string::npos) {
+                items_buffer = detail::split_up(item);
+            } else {
+                items_buffer = {item};
+            }
+        } else {
+            name = detail::trim_copy(line);
+            auto cloc = name.find(commentChar);
+            if(cloc != std::string::npos) {
+                name.erase(cloc, std::string::npos);
+                detail::trim(name);
+            }
+
+            items_buffer = {"true"};
+        }
+        if(name.find(parentSeparatorChar) == std::string::npos) {
+            detail::remove_quotes(name);
+        }
+        // clean up quotes on the items
+        for(auto &it : items_buffer) {
+            detail::remove_quotes(it);
+        }
+
+        std::vector<std::string> parents = detail::generate_parents(currentSection, name, parentSeparatorChar);
+        if(parents.size() > maximumLayers) {
+            continue;
+        }
+        if(!configSection.empty() && !inSection) {
+            if(parents.empty() || parents.front() != configSection) {
+                continue;
+            }
+            if(configIndex >= 0 && currentSectionIndex != configIndex) {
+                continue;
+            }
+            parents.erase(parents.begin());
+            inSection = true;
+        }
+        if(!output.empty() && name == output.back().name && parents == output.back().parents) {
+            output.back().inputs.insert(output.back().inputs.end(), items_buffer.begin(), items_buffer.end());
+        } else {
+            output.emplace_back();
+            output.back().parents = std::move(parents);
+            output.back().name = std::move(name);
+            output.back().inputs = std::move(items_buffer);
+        }
+    }
+    if(currentSection != "default") {
+        // insert a section end which is just an empty items_buffer
+        std::string ename;
+        output.emplace_back();
+        output.back().parents = detail::generate_parents(currentSection, ename, parentSeparatorChar);
+        output.back().name = "--";
+        while(output.back().parents.size() > 1) {
+            output.push_back(output.back());
+            output.back().parents.pop_back();
+        }
+    }
+    return output;
+}
+
+inline std::string
+ConfigBase::to_config(const App *app, bool default_also, bool write_description, std::string prefix) const {
+    std::stringstream out;
+    std::string commentLead;
+    commentLead.push_back(commentChar);
+    commentLead.push_back(' ');
+
+    std::vector<std::string> groups = app->get_groups();
+    bool defaultUsed = false;
+    groups.insert(groups.begin(), std::string("Options"));
+    if(write_description && (app->get_configurable() || app->get_parent() == nullptr || app->get_name().empty())) {
+        out << commentLead << detail::fix_newlines(commentLead, app->get_description()) << '\n';
+    }
+    for(auto &group : groups) {
+        if(group == "Options" || group.empty()) {
+            if(defaultUsed) {
+                continue;
+            }
+            defaultUsed = true;
+        }
+        if(write_description && group != "Options" && !group.empty()) {
+            out << '\n' << commentLead << group << " Options\n";
+        }
+        for(const Option *opt : app->get_options({})) {
+
+            // Only process options that are configurable
+            if(opt->get_configurable()) {
+                if(opt->get_group() != group) {
+                    if(!(group == "Options" && opt->get_group().empty())) {
+                        continue;
+                    }
+                }
+                std::string name = prefix + opt->get_single_name();
+                std::string value = detail::ini_join(
+                    opt->reduced_results(), arraySeparator, arrayStart, arrayEnd, stringQuote, characterQuote);
+
+                if(value.empty() && default_also) {
+                    if(!opt->get_default_str().empty()) {
+                        value = detail::convert_arg_for_ini(opt->get_default_str(), stringQuote, characterQuote);
+                    } else if(opt->get_expected_min() == 0) {
+                        value = "false";
+                    } else if(opt->get_run_callback_for_default()) {
+                        value = "\"\"";  // empty string default value
+                    }
+                }
+
+                if(!value.empty()) {
+                    if(write_description && opt->has_description()) {
+                        out << '\n';
+                        out << commentLead << detail::fix_newlines(commentLead, opt->get_description()) << '\n';
+                    }
+                    out << name << valueDelimiter << value << '\n';
+                }
+            }
+        }
+    }
+    auto subcommands = app->get_subcommands({});
+    for(const App *subcom : subcommands) {
+        if(subcom->get_name().empty()) {
+            if(write_description && !subcom->get_group().empty()) {
+                out << '\n' << commentLead << subcom->get_group() << " Options\n";
+            }
+            out << to_config(subcom, default_also, write_description, prefix);
+        }
+    }
+
+    for(const App *subcom : subcommands) {
+        if(!subcom->get_name().empty()) {
+            if(subcom->get_configurable() && app->got_subcommand(subcom)) {
+                if(!prefix.empty() || app->get_parent() == nullptr) {
+                    out << '[' << prefix << subcom->get_name() << "]\n";
+                } else {
+                    std::string subname = app->get_name() + parentSeparatorChar + subcom->get_name();
+                    auto p = app->get_parent();
+                    while(p->get_parent() != nullptr) {
+                        subname = p->get_name() + parentSeparatorChar + subname;
+                        p = p->get_parent();
+                    }
+                    out << '[' << subname << "]\n";
+                }
+                out << to_config(subcom, default_also, write_description, "");
+            } else {
+                out << to_config(
+                    subcom, default_also, write_description, prefix + subcom->get_name() + parentSeparatorChar);
+            }
+        }
+    }
+
+    return out.str();
+}
+
+
+
+
+inline std::string
+Formatter::make_group(std::string group, bool is_positional, std::vector<const Option *> opts) const {
+    std::stringstream out;
+
+    out << "\n" << group << ":\n";
+    for(const Option *opt : opts) {
+        out << make_option(opt, is_positional);
+    }
+
+    return out.str();
+}
+
+inline std::string Formatter::make_positionals(const App *app) const {
+    std::vector<const Option *> opts =
+        app->get_options([](const Option *opt) { return !opt->get_group().empty() && opt->get_positional(); });
+
+    if(opts.empty())
+        return std::string();
+
+    return make_group(get_label("Positionals"), true, opts);
+}
+
+inline std::string Formatter::make_groups(const App *app, AppFormatMode mode) const {
+    std::stringstream out;
+    std::vector<std::string> groups = app->get_groups();
+
+    // Options
+    for(const std::string &group : groups) {
+        std::vector<const Option *> opts = app->get_options([app, mode, &group](const Option *opt) {
+            return opt->get_group() == group                     // Must be in the right group
+                   && opt->nonpositional()                       // Must not be a positional
+                   && (mode != AppFormatMode::Sub                // If mode is Sub, then
+                       || (app->get_help_ptr() != opt            // Ignore help pointer
+                           && app->get_help_all_ptr() != opt));  // Ignore help all pointer
+        });
+        if(!group.empty() && !opts.empty()) {
+            out << make_group(group, false, opts);
+
+            if(group != groups.back())
+                out << "\n";
+        }
+    }
+
+    return out.str();
+}
+
+inline std::string Formatter::make_description(const App *app) const {
+    std::string desc = app->get_description();
+    auto min_options = app->get_require_option_min();
+    auto max_options = app->get_require_option_max();
+    if(app->get_required()) {
+        desc += " REQUIRED ";
+    }
+    if((max_options == min_options) && (min_options > 0)) {
+        if(min_options == 1) {
+            desc += " \n[Exactly 1 of the following options is required]";
+        } else {
+            desc += " \n[Exactly " + std::to_string(min_options) + "options from the following list are required]";
+        }
+    } else if(max_options > 0) {
+        if(min_options > 0) {
+            desc += " \n[Between " + std::to_string(min_options) + " and " + std::to_string(max_options) +
+                    " of the follow options are required]";
+        } else {
+            desc += " \n[At most " + std::to_string(max_options) + " of the following options are allowed]";
+        }
+    } else if(min_options > 0) {
+        desc += " \n[At least " + std::to_string(min_options) + " of the following options are required]";
+    }
+    return (!desc.empty()) ? desc + "\n" : std::string{};
+}
+
+inline std::string Formatter::make_usage(const App *app, std::string name) const {
+    std::stringstream out;
+
+    out << get_label("Usage") << ":" << (name.empty() ? "" : " ") << name;
+
+    std::vector<std::string> groups = app->get_groups();
+
+    // Print an Options badge if any options exist
+    std::vector<const Option *> non_pos_options =
+        app->get_options([](const Option *opt) { return opt->nonpositional(); });
+    if(!non_pos_options.empty())
+        out << " [" << get_label("OPTIONS") << "]";
+
+    // Positionals need to be listed here
+    std::vector<const Option *> positionals = app->get_options([](const Option *opt) { return opt->get_positional(); });
+
+    // Print out positionals if any are left
+    if(!positionals.empty()) {
+        // Convert to help names
+        std::vector<std::string> positional_names(positionals.size());
+        std::transform(positionals.begin(), positionals.end(), positional_names.begin(), [this](const Option *opt) {
+            return make_option_usage(opt);
+        });
+
+        out << " " << detail::join(positional_names, " ");
+    }
+
+    // Add a marker if subcommands are expected or optional
+    if(!app->get_subcommands(
+               [](const CLI::App *subc) { return ((!subc->get_disabled()) && (!subc->get_name().empty())); })
+            .empty()) {
+        out << " " << (app->get_require_subcommand_min() == 0 ? "[" : "")
+            << get_label(app->get_require_subcommand_max() < 2 || app->get_require_subcommand_min() > 1 ? "SUBCOMMAND"
+                                                                                                        : "SUBCOMMANDS")
+            << (app->get_require_subcommand_min() == 0 ? "]" : "");
+    }
+
+    out << std::endl;
+
+    return out.str();
+}
+
+inline std::string Formatter::make_footer(const App *app) const {
+    std::string footer = app->get_footer();
+    if(footer.empty()) {
+        return std::string{};
+    }
+    return footer + "\n";
+}
+
+inline std::string Formatter::make_help(const App *app, std::string name, AppFormatMode mode) const {
+
+    // This immediately forwards to the make_expanded method. This is done this way so that subcommands can
+    // have overridden formatters
+    if(mode == AppFormatMode::Sub)
+        return make_expanded(app);
+
+    std::stringstream out;
+    if((app->get_name().empty()) && (app->get_parent() != nullptr)) {
+        if(app->get_group() != "Subcommands") {
+            out << app->get_group() << ':';
+        }
+    }
+
+    out << make_description(app);
+    out << make_usage(app, name);
+    out << make_positionals(app);
+    out << make_groups(app, mode);
+    out << make_subcommands(app, mode);
+    out << '\n' << make_footer(app);
+
+    return out.str();
+}
+
+inline std::string Formatter::make_subcommands(const App *app, AppFormatMode mode) const {
+    std::stringstream out;
+
+    std::vector<const App *> subcommands = app->get_subcommands({});
+
+    // Make a list in definition order of the groups seen
+    std::vector<std::string> subcmd_groups_seen;
+    for(const App *com : subcommands) {
+        if(com->get_name().empty()) {
+            if(!com->get_group().empty()) {
+                out << make_expanded(com);
+            }
+            continue;
+        }
+        std::string group_key = com->get_group();
+        if(!group_key.empty() &&
+           std::find_if(subcmd_groups_seen.begin(), subcmd_groups_seen.end(), [&group_key](std::string a) {
+               return detail::to_lower(a) == detail::to_lower(group_key);
+           }) == subcmd_groups_seen.end())
+            subcmd_groups_seen.push_back(group_key);
+    }
+
+    // For each group, filter out and print subcommands
+    for(const std::string &group : subcmd_groups_seen) {
+        out << "\n" << group << ":\n";
+        std::vector<const App *> subcommands_group = app->get_subcommands(
+            [&group](const App *sub_app) { return detail::to_lower(sub_app->get_group()) == detail::to_lower(group); });
+        for(const App *new_com : subcommands_group) {
+            if(new_com->get_name().empty())
+                continue;
+            if(mode != AppFormatMode::All) {
+                out << make_subcommand(new_com);
+            } else {
+                out << new_com->help(new_com->get_name(), AppFormatMode::Sub);
+                out << "\n";
+            }
+        }
+    }
+
+    return out.str();
+}
+
+inline std::string Formatter::make_subcommand(const App *sub) const {
+    std::stringstream out;
+    detail::format_help(out, sub->get_display_name(true), sub->get_description(), column_width_);
+    return out.str();
+}
+
+inline std::string Formatter::make_expanded(const App *sub) const {
+    std::stringstream out;
+    out << sub->get_display_name(true) << "\n";
+
+    out << make_description(sub);
+    if(sub->get_name().empty() && !sub->get_aliases().empty()) {
+        detail::format_aliases(out, sub->get_aliases(), column_width_ + 2);
+    }
+    out << make_positionals(sub);
+    out << make_groups(sub, AppFormatMode::Sub);
+    out << make_subcommands(sub, AppFormatMode::Sub);
+
+    // Drop blank spaces
+    std::string tmp = detail::find_and_replace(out.str(), "\n\n", "\n");
+    tmp = tmp.substr(0, tmp.size() - 1);  // Remove the final '\n'
+
+    // Indent all but the first line (the name)
+    return detail::find_and_replace(tmp, "\n", "\n  ") + "\n";
+}
+
+inline std::string Formatter::make_option_name(const Option *opt, bool is_positional) const {
+    if(is_positional)
+        return opt->get_name(true, false);
+
+    return opt->get_name(false, true);
+}
+
+inline std::string Formatter::make_option_opts(const Option *opt) const {
+    std::stringstream out;
+
+    if(!opt->get_option_text().empty()) {
+        out << " " << opt->get_option_text();
+    } else {
+        if(opt->get_type_size() != 0) {
+            if(!opt->get_type_name().empty())
+                out << " " << get_label(opt->get_type_name());
+            if(!opt->get_default_str().empty())
+                out << "=" << opt->get_default_str();
+            if(opt->get_expected_max() == detail::expected_max_vector_size)
+                out << " ...";
+            else if(opt->get_expected_min() > 1)
+                out << " x " << opt->get_expected();
+
+            if(opt->get_required())
+                out << " " << get_label("REQUIRED");
+        }
+        if(!opt->get_envname().empty())
+            out << " (" << get_label("Env") << ":" << opt->get_envname() << ")";
+        if(!opt->get_needs().empty()) {
+            out << " " << get_label("Needs") << ":";
+            for(const Option *op : opt->get_needs())
+                out << " " << op->get_name();
+        }
+        if(!opt->get_excludes().empty()) {
+            out << " " << get_label("Excludes") << ":";
+            for(const Option *op : opt->get_excludes())
+                out << " " << op->get_name();
+        }
+    }
+    return out.str();
+}
+
+inline std::string Formatter::make_option_desc(const Option *opt) const { return opt->get_description(); }
+
+inline std::string Formatter::make_option_usage(const Option *opt) const {
+    // Note that these are positionals usages
+    std::stringstream out;
+    out << make_option_name(opt, true);
+    if(opt->get_expected_max() >= detail::expected_max_vector_size)
+        out << "...";
+    else if(opt->get_expected_max() > 1)
+        out << "(" << opt->get_expected() << "x)";
+
+    return opt->get_required() ? out.str() : "[" + out.str() + "]";
+}
+
+
+
+} // namespace CLI

From 359b50f721b9947fa9271ccab795d9d0df84f4a6 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Fri, 19 Nov 2021 13:44:27 -0500
Subject: [PATCH 22/46] Improve benchmark

---
 aux/test/aux_test_dft_helpers.h | 33 +++++++++++++++----------
 aux/test/check_idft_bench.cxx   | 43 ++++++++++++++++++++++-----------
 aux/test/check_idft_bench.sh    | 30 +++++++++++++++++++++++
 3 files changed, 79 insertions(+), 27 deletions(-)
 create mode 100755 aux/test/check_idft_bench.sh

diff --git a/aux/test/aux_test_dft_helpers.h b/aux/test/aux_test_dft_helpers.h
index db83d0fa8..240d5b667 100644
--- a/aux/test/aux_test_dft_helpers.h
+++ b/aux/test/aux_test_dft_helpers.h
@@ -5,6 +5,7 @@
 #include "WireCellUtil/PluginManager.h"
 #include "WireCellUtil/Exceptions.h"
 #include "WireCellUtil/Persist.h"
+#include "WireCellUtil/CLI11.hpp"
 
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IDFT.h"
@@ -100,19 +101,27 @@ namespace WireCell::Aux::Test {
         std::string tn{"FftwDFT"};
         std::string pi{"WireCellAux"};
         std::string cfg_name{""};
+        std::string output{""};
         Configuration cfg;
     };        
 
-    DftArgs make_dft_args(int argc, char* argv[]) 
+    // remove command name from main()'s argc/argv[0]
+    int make_dft_args(DftArgs& args, int argc, char** argv) 
     {
-        DftArgs ret;
-
-        if (argc > 1) ret.tn = argv[1];
-        if (argc > 2) ret.pi = argv[2];
-        if (argc > 3) {
+        CLI::App app{"wct dft test"};
+        app.add_option("-o,--output", args.output,
+                   "Output file")->type_size(1)->allow_extra_args(false);
+        app.add_option("-p,--plugin", args.pi,
+                   "Plugin")->type_size(1)->allow_extra_args(false);
+        app.add_option("-t,--typename", args.tn,
+                   "Type or Type:Name of IDFT imp")->type_size(1)->allow_extra_args(false);
+        app.add_option("-c,--config", args.cfg_name,
+                   "Config file for IDFT imp")->type_size(1)->allow_extra_args(false);
+        CLI11_PARSE(app, argc, argv);
+
+        if (not args.cfg_name.empty()) {
             // Either we get directly a "data" object 
-            ret.cfg_name = argv[3];
-            auto cfg = Persist::load(argv[3]);
+            auto cfg = Persist::load(args.cfg_name);
             // or we go searching a list for matching type/name.
             if (cfg.isArray()) {
                 for (auto one : cfg) {
@@ -121,17 +130,15 @@ namespace WireCell::Aux::Test {
                     if (not n.empty()) {
                         tn = tn + ":" + n;
                     }
-                    if (tn == ret.tn) {
+                    if (tn == args.tn) {
                         cfg = one["data"];
                         break;
                     }
                 }
             }
-            ret.cfg = cfg;
-
+            args.cfg = cfg;
         }
-        return ret;
-        //return make_dft(dft_tn, dft_pi, cfg);
+        return 0;
     }
 
     const double default_eps = 1e-8;
diff --git a/aux/test/check_idft_bench.cxx b/aux/test/check_idft_bench.cxx
index b7bd29100..a31029354 100644
--- a/aux/test/check_idft_bench.cxx
+++ b/aux/test/check_idft_bench.cxx
@@ -19,6 +19,16 @@ using complex_t = std::complex<float>;
 
 using transform_function = std::function<void(const complex_t* in, complex_t* out)>;
 
+void ignore_exception(const complex_t* in, complex_t* out, transform_function func)
+{
+    try {
+        func(in, out);
+    }
+    catch (...) {
+        std::cerr << "exception ignored\n";
+    }
+}
+
 const int nominal = 100'000'000;
 void doit(Stopwatch& sw, const std::string& name, int nrows, int ncols, transform_function func)
 {
@@ -28,32 +38,40 @@ void doit(Stopwatch& sw, const std::string& name, int nrows, int ncols, transfor
 
     std::vector<complex_t> in(size), out(size);
 
-    sw([&](){func(in.data(), in.data());}, {
+    sw([&](){ignore_exception(in.data(), in.data(), func);}, {
             {"nrows",nrows}, {"ncols",ncols}, {"func",name}, {"ntimes",1}, {"first",true}, {"in-place",true},
         });
 
     sw([&](){
         for (int count=0; count<ntimes+1; ++count) {
-            func(in.data(), in.data());
+            ignore_exception(in.data(), in.data(), func);
         }}, {
             {"nrows",nrows}, {"ncols",ncols}, {"func",name}, {"ntimes",ntimes}, {"first",false}, {"in-place",true},
         });
 
-    sw([&](){func(in.data(), out.data());}, {
+    sw([&](){ignore_exception(in.data(), out.data(), func);}, {
             {"nrows",nrows}, {"ncols",ncols}, {"func",name}, {"ntimes",1}, {"first",true}, {"in-place",false},
         });
 
     sw([&](){
         for (int count=0; count<ntimes+1; ++count) {
-            func(in.data(), out.data());
+            ignore_exception(in.data(), out.data(), func);
         }}, {
             {"nrows",nrows}, {"ncols",ncols}, {"func",name}, {"ntimes",ntimes}, {"first",false}, {"in-place",false},
         });
 }
 
+
 int main(int argc, char* argv[])
 {
-    auto args = make_dft_args(argc, argv);
+    DftArgs args;
+    int rc = make_dft_args(args, argc, argv);
+    if (rc) { return rc; }
+    if (args.output.empty()) {
+        std::cerr << "need output file" << std::endl;
+        return 0;
+    }
+    
     auto idft = make_dft(args.tn, args.pi, args.cfg);
 
     Stopwatch sw({
@@ -62,18 +80,15 @@ int main(int argc, char* argv[])
             {"config", object_t::parse(Persist::dumps(args.cfg))}, 
             {"config_file",args.cfg_name}});
 
-    std::string cname = args.cfg_name;
-    auto slash = cname.rfind("/");
-    if (slash != std::string::npos) {
-        cname = cname.substr(slash+1);
+    auto fname = args.output;
+    if (fname.empty()) {
+        fname = "/dev/stdout";
     }
-    cname = cname.substr(0, cname.rfind("."));
-    std::string fname = argv[0];
-    fname += "_" + args.pi + "_" + args.tn + "_" + cname + ".json";
     std::cerr << "writing to: " << fname << std::endl;
     
-
-    std::vector<int> oned_sizes{500, 512, 1000, 1024, 4096, 6000, 8192, 10000, 16384};
+    std::vector<int> oned_sizes{128, 256, 500, 512, 1000, 1024, 2000,
+        2048, 3000, 4096, 6000, 8192, 9375, 9503, 9592, 9595, 9600,
+        10000, 16384};
     for (auto size : oned_sizes) {
         doit(sw, "fwd1d", 1, size, [&](const complex_t* in, complex_t* out) {
             idft->fwd1d(in, out, size);
diff --git a/aux/test/check_idft_bench.sh b/aux/test/check_idft_bench.sh
new file mode 100755
index 000000000..0003c9207
--- /dev/null
+++ b/aux/test/check_idft_bench.sh
@@ -0,0 +1,30 @@
+#!/bin/bash
+
+# A do all script for IDFT benchmark with all known IDFTs
+# Note, this will almost certainly fail if a systen does not have:
+# 
+# - wire-cell-toolkit built at least under build/
+# - wire-cell-python built and in the environment
+# - run this script in-place in the source
+# - host has at exactly one GPU
+# - GPU has enough memory
+#
+# even if fails, it documents what to run
+
+tstdir="$(dirname $(realpath $BASH_SOURCE))"
+auxdir="$(dirname $tstdir)"
+topdir="$(dirname $auxdir)"
+blddir="$topdir/build"
+cib="$blddir/aux/check_idft_bench"
+
+torchcfg="$tstdir/test_idft_pytorch.jsonnet"
+
+set -x
+wirecell-aux run-idft-bench -o idft-bench-fftw-cpu.json $cib
+wirecell-aux run-idft-bench -o idft-bench-torch-cpu.json -p WireCellPytorch -t TorchDFT $cib
+wirecell-aux run-idft-bench -o idft-bench-torch-gpu.json -p WireCellPytorch -t TorchDFT -c $torchcfg $cib
+
+wirecell-aux plot-idft-bench -o idft-bench.pdf \
+             idft-bench-fftw-cpu.json  \
+             idft-bench-torch-cpu.json  \
+             idft-bench-torch-gpu.json

From bbe851db17b1ff67a6649d9b7fadfd4ffd93a280 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 22 Nov 2021 09:54:10 -0500
Subject: [PATCH 23/46] Fix regression in cli arg parsing

---
 aux/test/test_dfttools.cxx | 5 ++++-
 aux/test/test_idft.cxx     | 5 ++++-
 2 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/aux/test/test_dfttools.cxx b/aux/test/test_dfttools.cxx
index cc4b43157..cfa96349c 100644
--- a/aux/test/test_dfttools.cxx
+++ b/aux/test/test_dfttools.cxx
@@ -122,7 +122,10 @@ void test_1b(IDFT::pointer dft, int axis, int nrows=8, int ncols=4)
 
 int main(int argc, char* argv[])
 {
-    auto idft = make_dft_args(argc, argv);
+    DftArgs args;
+    int rc = make_dft_args(args, argc, argv);
+    if (rc) { return rc; }
+    auto idft = make_dft(args.tn, args.pi, args.cfg);
 
     test_1d_impulse(idft);
     test_2d_impulse(idft);
diff --git a/aux/test/test_idft.cxx b/aux/test/test_idft.cxx
index a4f337a5e..8e016bc2f 100644
--- a/aux/test/test_idft.cxx
+++ b/aux/test/test_idft.cxx
@@ -204,7 +204,10 @@ void test_2d_transpose(IDFT::pointer dft, int nrows, int ncols)
 
 int main(int argc, char* argv[])
 {
-    auto idft = make_dft_args(argc, argv);
+    DftArgs args;
+    int rc = make_dft_args(args, argc, argv);
+    if (rc) { return rc; }
+    auto idft = make_dft(args.tn, args.pi, args.cfg);
 
     test_1d_zero(idft);
     test_1d_impulse(idft);

From 0a49ef62c4b4dface1697ff20e7dee596ac7c794 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 22 Nov 2021 12:11:47 -0500
Subject: [PATCH 24/46] Remove obsolete 'zipper' based sim

---
 gen/inc/WireCellGen/DepoZipper.h   |  43 -----
 gen/inc/WireCellGen/Ductor.h       |  67 -------
 gen/inc/WireCellGen/ImpactZipper.h |  38 ----
 gen/src/DepoZipper.cxx             | 187 -------------------
 gen/src/Ductor.cxx                 | 289 -----------------------------
 gen/src/ImpactZipper.cxx           | 127 -------------
 6 files changed, 751 deletions(-)
 delete mode 100644 gen/inc/WireCellGen/DepoZipper.h
 delete mode 100644 gen/inc/WireCellGen/Ductor.h
 delete mode 100644 gen/inc/WireCellGen/ImpactZipper.h
 delete mode 100644 gen/src/DepoZipper.cxx
 delete mode 100644 gen/src/Ductor.cxx
 delete mode 100644 gen/src/ImpactZipper.cxx

diff --git a/gen/inc/WireCellGen/DepoZipper.h b/gen/inc/WireCellGen/DepoZipper.h
deleted file mode 100644
index bd9ec50e5..000000000
--- a/gen/inc/WireCellGen/DepoZipper.h
+++ /dev/null
@@ -1,43 +0,0 @@
-/** Make a frame from depos using an ImpactZipper.
-
-    See also the very similar DepoTransform which is newer and faster.
- */
-
-#ifndef WIRECELLGEN_DEPOZIPPER
-#define WIRECELLGEN_DEPOZIPPER
-
-#include "WireCellIface/IDepoFramer.h"
-#include "WireCellIface/IConfigurable.h"
-#include "WireCellIface/IRandom.h"
-#include "WireCellIface/IPlaneImpactResponse.h"
-#include "WireCellIface/IAnodePlane.h"
-
-namespace WireCell {
-    namespace Gen {
-
-        class DepoZipper : public IDepoFramer, public IConfigurable {
-           public:
-            DepoZipper();
-            virtual ~DepoZipper();
-
-            virtual bool operator()(const input_pointer& in, output_pointer& out);
-
-            virtual void configure(const WireCell::Configuration& cfg);
-            virtual WireCell::Configuration default_configuration() const;
-
-           private:
-            IAnodePlane::pointer m_anode;
-            IRandom::pointer m_rng;
-            std::vector<IPlaneImpactResponse::pointer> m_pirs;
-
-            double m_start_time;
-            double m_readout_time;
-            double m_tick;
-            double m_drift_speed;
-            double m_nsigma;
-            int m_frame_count;
-        };
-    }  // namespace Gen
-}  // namespace WireCell
-
-#endif
diff --git a/gen/inc/WireCellGen/Ductor.h b/gen/inc/WireCellGen/Ductor.h
deleted file mode 100644
index 60f348b4b..000000000
--- a/gen/inc/WireCellGen/Ductor.h
+++ /dev/null
@@ -1,67 +0,0 @@
-#ifndef WIRECELLGEN_DUCTOR
-#define WIRECELLGEN_DUCTOR
-
-#include "WireCellUtil/Pimpos.h"
-#include "WireCellUtil/Response.h"
-
-#include "WireCellIface/IConfigurable.h"
-#include "WireCellIface/IDuctor.h"
-
-#include "WireCellIface/IAnodeFace.h"
-#include "WireCellIface/IAnodePlane.h"
-#include "WireCellIface/IPlaneImpactResponse.h"
-#include "WireCellIface/IRandom.h"
-#include "WireCellUtil/Logging.h"
-
-#include <vector>
-
-namespace WireCell {
-    namespace Gen {
-
-        /** This IDuctor needs a Garfield2D field calculation data
-         * file in compressed JSON format as produced by Python module
-         * wirecell.sigproc.garfield.
-         */
-        class Ductor : public IDuctor, public IConfigurable {
-           public:
-            Ductor();
-            virtual ~Ductor(){};
-
-            // virtual void reset();
-            virtual bool operator()(const input_pointer& depo, output_queue& frames);
-
-            virtual void configure(const WireCell::Configuration& config);
-            virtual WireCell::Configuration default_configuration() const;
-
-           protected:
-            // The "Type:Name" of the IAnodePlane (default is "AnodePlane")
-            std::string m_anode_tn;
-            std::string m_rng_tn;
-            std::vector<std::string> m_pir_tns;
-
-            IAnodePlane::pointer m_anode;
-            IRandom::pointer m_rng;
-            std::vector<IPlaneImpactResponse::pointer> m_pirs;
-
-            IDepo::vector m_depos;
-
-            double m_start_time;
-            double m_readout_time;
-            double m_tick;
-            double m_drift_speed;
-            double m_nsigma;
-            bool m_fluctuate;
-            std::string m_mode;
-
-            int m_frame_count;
-            std::string m_tag;
-
-            virtual void process(output_queue& frames);
-            virtual ITrace::vector process_face(IAnodeFace::pointer face, const IDepo::vector& face_depos);
-            bool start_processing(const input_pointer& depo);
-            Log::logptr_t l;
-        };
-    }  // namespace Gen
-}  // namespace WireCell
-
-#endif
diff --git a/gen/inc/WireCellGen/ImpactZipper.h b/gen/inc/WireCellGen/ImpactZipper.h
deleted file mode 100644
index ca9d8db60..000000000
--- a/gen/inc/WireCellGen/ImpactZipper.h
+++ /dev/null
@@ -1,38 +0,0 @@
-#ifndef WIRECELL_IMPACTZIPPER
-#define WIRECELL_IMPACTZIPPER
-
-#include "WireCellIface/IPlaneImpactResponse.h"
-#include "WireCellGen/BinnedDiffusion.h"
-
-namespace WireCell {
-    namespace Gen {
-
-        /** An ImpactZipper "zips" up through all the impact positions
-         * along a wire plane convolving the response functions and
-         * the local drifted charge distribution producing a waveform
-         * on each central wire.
-         */
-        class ImpactZipper {
-            IPlaneImpactResponse::pointer m_pir;
-            BinnedDiffusion& m_bd;
-
-           public:
-            ImpactZipper(IPlaneImpactResponse::pointer pir, BinnedDiffusion& bd);
-            virtual ~ImpactZipper();
-
-            /// Return the wire's waveform.  If the response functions
-            /// are just field response (ie, instantaneous current)
-            /// then the waveforms are expressed as current integrated
-            /// over each sample bin and thus in units of charge.  If
-            /// the response functions include electronics response
-            /// then the waveforms are in units of voltage
-            /// representing the sampling of the output of the FEE
-            /// amplifiers.
-
-            // fixme: this should be a forward iterator so that it may cal bd.erase() safely to conserve memory
-            Waveform::realseq_t waveform(int wire) const;
-        };
-
-    }  // namespace Gen
-}  // namespace WireCell
-#endif /* WIRECELL_IMPACTZIPPER */
diff --git a/gen/src/DepoZipper.cxx b/gen/src/DepoZipper.cxx
deleted file mode 100644
index 07c0eeb5e..000000000
--- a/gen/src/DepoZipper.cxx
+++ /dev/null
@@ -1,187 +0,0 @@
-#include "WireCellGen/DepoZipper.h"
-#include "WireCellGen/ImpactZipper.h"
-#include "WireCellUtil/NamedFactory.h"
-#include "WireCellIface/IAnodePlane.h"
-#include "WireCellIface/SimpleTrace.h"
-#include "WireCellIface/SimpleFrame.h"
-#include "WireCellGen/BinnedDiffusion.h"
-#include "WireCellGen/ImpactZipper.h"
-#include "WireCellUtil/Units.h"
-#include "WireCellUtil/Point.h"
-
-WIRECELL_FACTORY(DepoZipper, WireCell::Gen::DepoZipper, WireCell::IDepoFramer, WireCell::IConfigurable)
-
-using namespace WireCell;
-using namespace std;
-
-Gen::DepoZipper::DepoZipper()
-  : m_start_time(0.0 * units::ns)
-  , m_readout_time(5.0 * units::ms)
-  , m_tick(0.5 * units::us)
-  , m_drift_speed(1.0 * units::mm / units::us)
-  , m_nsigma(3.0)
-  , m_frame_count(0)
-{
-}
-
-Gen::DepoZipper::~DepoZipper() {}
-
-void Gen::DepoZipper::configure(const WireCell::Configuration& cfg)
-{
-    auto anode_tn = get<string>(cfg, "anode", "");
-    m_anode = Factory::find_tn<IAnodePlane>(anode_tn);
-
-    m_nsigma = get<double>(cfg, "nsigma", m_nsigma);
-    bool fluctuate = get<bool>(cfg, "fluctuate", false);
-    m_rng = nullptr;
-    if (fluctuate) {
-        auto rng_tn = get<string>(cfg, "rng", "");
-        m_rng = Factory::find_tn<IRandom>(rng_tn);
-    }
-
-    m_readout_time = get<double>(cfg, "readout_time", m_readout_time);
-    m_tick = get<double>(cfg, "tick", m_tick);
-    m_start_time = get<double>(cfg, "start_time", m_start_time);
-    m_drift_speed = get<double>(cfg, "drift_speed", m_drift_speed);
-    m_frame_count = get<int>(cfg, "first_frame_number", m_frame_count);
-
-    auto jpirs = cfg["pirs"];
-    if (jpirs.isNull() or jpirs.empty()) {
-        THROW(ValueError() << errmsg{"Gen::Ductor: must configure with some plane impact response components"});
-    }
-    m_pirs.clear();
-    for (auto jpir : jpirs) {
-        auto tn = jpir.asString();
-        auto pir = Factory::find_tn<IPlaneImpactResponse>(tn);
-        m_pirs.push_back(pir);
-    }
-}
-WireCell::Configuration Gen::DepoZipper::default_configuration() const
-{
-    Configuration cfg;
-
-    /// How many Gaussian sigma due to diffusion to keep before truncating.
-    put(cfg, "nsigma", m_nsigma);
-
-    /// Whether to fluctuate the final Gaussian deposition.
-    put(cfg, "fluctuate", false);
-
-    /// The open a gate.  This is actually a "readin" time measured at
-    /// the input ("reference") plane.
-    put(cfg, "start_time", m_start_time);
-
-    /// The time span for each readout.  This is actually a "readin"
-    /// time span measured at the input ("reference") plane.
-    put(cfg, "readout_time", m_readout_time);
-
-    /// The sample period
-    put(cfg, "tick", m_tick);
-
-    /// The nominal speed of drifting electrons
-    put(cfg, "drift_speed", m_drift_speed);
-
-    /// Allow for a custom starting frame number
-    put(cfg, "first_frame_number", m_frame_count);
-
-    /// Name of component providing the anode plane.
-    put(cfg, "anode", "");
-    /// Name of component providing the anode pseudo random number generator.
-    put(cfg, "rng", "");
-
-    /// Plane impact responses
-    cfg["pirs"] = Json::arrayValue;
-
-    return cfg;
-}
-
-bool Gen::DepoZipper::operator()(const input_pointer& in, output_pointer& out)
-{
-    if (!in) {
-        out = nullptr;
-        cerr << "Gen::DepoZipper: EOS\n";
-        return true;
-    }
-
-    auto depos = in->depos();
-
-    Binning tbins(m_readout_time / m_tick, m_start_time, m_start_time + m_readout_time);
-    ITrace::vector traces;
-    for (auto face : m_anode->faces()) {
-        // Select the depos which are in this face's sensitive volume
-        IDepo::vector face_depos, dropped_depos;
-        auto bb = face->sensitive();
-        if (bb.empty()) {
-            cerr << "Gen::DepoZipper anode:" << m_anode->ident() << " face:" << face->ident()
-                 << " is marked insensitive, skipping\n";
-            continue;
-        }
-
-        for (auto depo : (*depos)) {
-            if (bb.inside(depo->pos())) {
-                face_depos.push_back(depo);
-            }
-            else {
-                dropped_depos.push_back(depo);
-            }
-        }
-
-        if (face_depos.size()) {
-            auto ray = bb.bounds();
-            cerr << "Gen::Ductor: anode:" << m_anode->ident() << " face:" << face->ident() << ": processing "
-                 << face_depos.size() << " depos spanning: t:[" << face_depos.front()->time() / units::ms << ", "
-                 << face_depos.back()->time() / units::ms << "]ms, bb: " << ray.first / units::cm << " --> "
-                 << ray.second / units::cm << "cm\n";
-        }
-        if (dropped_depos.size()) {
-            auto ray = bb.bounds();
-            cerr << "Gen::Ductor: anode:" << m_anode->ident() << " face:" << face->ident() << ": dropped "
-                 << dropped_depos.size() << " depos spanning: t:[" << dropped_depos.front()->time() / units::ms << ", "
-                 << dropped_depos.back()->time() / units::ms << "]ms, outside bb: " << ray.first / units::cm << " --> "
-                 << ray.second / units::cm << "cm\n";
-        }
-
-        int iplane = -1;
-        for (auto plane : face->planes()) {
-            ++iplane;
-
-            const Pimpos* pimpos = plane->pimpos();
-
-            Binning tbins(m_readout_time / m_tick, m_start_time, m_start_time + m_readout_time);
-
-            Gen::BinnedDiffusion bindiff(*pimpos, tbins, m_nsigma, m_rng);
-            for (auto depo : face_depos) {
-                bindiff.add(depo, depo->extent_long() / m_drift_speed, depo->extent_tran());
-            }
-
-            auto& wires = plane->wires();
-
-            auto pir = m_pirs.at(iplane);
-            Gen::ImpactZipper zipper(pir, bindiff);
-
-            const int nwires = pimpos->region_binning().nbins();
-            for (int iwire = 0; iwire < nwires; ++iwire) {
-                auto wave = zipper.waveform(iwire);
-
-                auto mm = Waveform::edge(wave);
-                if (mm.first == (int) wave.size()) {  // all zero
-                    continue;
-                }
-
-                int chid = wires[iwire]->channel();
-                int tbin = mm.first;
-
-                // std::cout << mm.first << " "<< mm.second << std::endl;
-
-                ITrace::ChargeSequence charge(wave.begin() + mm.first, wave.begin() + mm.second);
-                auto trace = make_shared<SimpleTrace>(chid, tbin, charge);
-                traces.push_back(trace);
-            }
-        }
-    }
-
-    auto frame = make_shared<SimpleFrame>(m_frame_count, m_start_time, traces, m_tick);
-    cerr << "Gen::DepoZipper: make frame " << m_frame_count << "\n";
-    ++m_frame_count;
-    out = frame;
-    return true;
-}
diff --git a/gen/src/Ductor.cxx b/gen/src/Ductor.cxx
deleted file mode 100644
index 9dcd8f264..000000000
--- a/gen/src/Ductor.cxx
+++ /dev/null
@@ -1,289 +0,0 @@
-#include "WireCellGen/Ductor.h"
-#include "WireCellGen/BinnedDiffusion.h"
-#include "WireCellGen/ImpactZipper.h"
-#include "WireCellUtil/Units.h"
-#include "WireCellUtil/Point.h"
-#include "WireCellUtil/NamedFactory.h"
-#include "WireCellIface/SimpleTrace.h"
-#include "WireCellIface/SimpleFrame.h"
-
-#include <string>
-
-WIRECELL_FACTORY(Ductor, WireCell::Gen::Ductor, WireCell::IDuctor, WireCell::IConfigurable)
-
-using namespace std;
-using namespace WireCell;
-
-Gen::Ductor::Ductor()
-  : m_anode_tn("AnodePlane")
-  , m_rng_tn("Random")
-  , m_start_time(0.0 * units::ns)
-  , m_readout_time(5.0 * units::ms)
-  , m_tick(0.5 * units::us)
-  , m_drift_speed(1.0 * units::mm / units::us)
-  , m_nsigma(3.0)
-  , m_fluctuate(true)
-  , m_mode("continuous")
-  , m_frame_count(0)
-  , l(Log::logger("sim"))
-{
-}
-
-WireCell::Configuration Gen::Ductor::default_configuration() const
-{
-    Configuration cfg;
-
-    /// How many Gaussian sigma due to diffusion to keep before truncating.
-    put(cfg, "nsigma", m_nsigma);
-
-    /// Whether to fluctuate the final Gaussian deposition.
-    put(cfg, "fluctuate", m_fluctuate);
-
-    /// The initial time for this ductor
-    put(cfg, "start_time", m_start_time);
-
-    /// The time span for each readout.
-    put(cfg, "readout_time", m_readout_time);
-
-    /// The sample period
-    put(cfg, "tick", m_tick);
-
-    /// If false then determine start time of each readout based on the
-    /// input depos.  This option is useful when running WCT sim on a
-    /// source of depos which have already been "chunked" in time.  If
-    /// true then this Ductor will continuously simulate all time in
-    /// "readout_time" frames leading to empty frames in the case of
-    /// some readout time with no depos.
-    put(cfg, "continuous", true);
-
-    /// Fixed mode simply reads out the same time window all the time.
-    /// It implies discontinuous (continuous == false).
-    put(cfg, "fixed", false);
-
-    /// The nominal speed of drifting electrons
-    put(cfg, "drift_speed", m_drift_speed);
-
-    /// Allow for a custom starting frame number
-    put(cfg, "first_frame_number", m_frame_count);
-
-    /// Name of component providing the anode plane.
-    put(cfg, "anode", m_anode_tn);
-    put(cfg, "rng", m_rng_tn);
-
-    cfg["pirs"] = Json::arrayValue;
-    /// don't set here so user must, but eg:
-    // cfg["pirs"][0] = "PlaneImpactResponseU";
-    // cfg["pirs"][1] = "PlaneImpactResponseV";
-    // cfg["pirs"][2] = "PlaneImpactResponseW";
-
-    // Tag to use for frame and traces will get this tag + the anode
-    // ID.
-    cfg["tag"] = "ductor";
-
-    return cfg;
-}
-
-void Gen::Ductor::configure(const WireCell::Configuration& cfg)
-{
-    m_anode_tn = get<string>(cfg, "anode", m_anode_tn);
-    m_anode = Factory::find_tn<IAnodePlane>(m_anode_tn);
-
-    m_nsigma = get<double>(cfg, "nsigma", m_nsigma);
-    bool continuous = get<bool>(cfg, "continuous", true);
-    bool fixed = get<bool>(cfg, "fixed", false);
-
-    m_mode = "continuous";
-    if (fixed) {
-        m_mode = "fixed";
-    }
-    else if (!continuous) {
-        m_mode = "discontinuous";
-    }
-
-    m_fluctuate = get<bool>(cfg, "fluctuate", m_fluctuate);
-    m_rng = nullptr;
-    if (m_fluctuate) {
-        m_rng_tn = get(cfg, "rng", m_rng_tn);
-        m_rng = Factory::find_tn<IRandom>(m_rng_tn);
-    }
-
-    m_readout_time = get<double>(cfg, "readout_time", m_readout_time);
-    m_tick = get<double>(cfg, "tick", m_tick);
-    m_start_time = get<double>(cfg, "start_time", m_start_time);
-    m_drift_speed = get<double>(cfg, "drift_speed", m_drift_speed);
-    m_frame_count = get<int>(cfg, "first_frame_number", m_frame_count);
-
-    auto jpirs = cfg["pirs"];
-    if (jpirs.isNull() or jpirs.empty()) {
-        l->critical("must configure with some plane impace response components");
-        THROW(ValueError() << errmsg{"Gen::Ductor: must configure with some plane impact response components"});
-    }
-    m_pirs.clear();
-    for (auto jpir : jpirs) {
-        auto tn = jpir.asString();
-        auto pir = Factory::find_tn<IPlaneImpactResponse>(tn);
-        m_pirs.push_back(pir);
-    }
-
-    m_tag = get<std::string>(cfg, "tag", "ductor");
-
-    l->debug("Ductor tagging {}, AnodePlane: {}, mode: {}, fluctuate: {}, time start: {} ms, readout time: {} ms, frame start: {}",
-             m_tag,
-             m_anode_tn, m_mode, (m_fluctuate ? "on" : "off"), m_start_time / units::ms, m_readout_time / units::ms,
-             m_frame_count);
-}
-
-ITrace::vector Gen::Ductor::process_face(IAnodeFace::pointer face, const IDepo::vector& face_depos)
-{
-    ITrace::vector traces;
-
-    int iplane = -1;
-    for (auto plane : face->planes()) {
-        ++iplane;
-
-        const Pimpos* pimpos = plane->pimpos();
-
-        Binning tbins(m_readout_time / m_tick, m_start_time, m_start_time + m_readout_time);
-
-        Gen::BinnedDiffusion bindiff(*pimpos, tbins, m_nsigma, m_rng);
-        for (auto depo : face_depos) {
-            bindiff.add(depo, depo->extent_long() / m_drift_speed, depo->extent_tran());
-        }
-
-        auto& wires = plane->wires();
-
-        auto pir = m_pirs.at(iplane);
-        Gen::ImpactZipper zipper(pir, bindiff);
-
-        const int nwires = pimpos->region_binning().nbins();
-        for (int iwire = 0; iwire < nwires; ++iwire) {
-            auto wave = zipper.waveform(iwire);
-
-            auto mm = Waveform::edge(wave);
-            if (mm.first == (int) wave.size()) {  // all zero
-                continue;
-            }
-
-            int chid = wires[iwire]->channel();
-            int tbin = mm.first;
-
-            ITrace::ChargeSequence charge(wave.begin() + mm.first, wave.begin() + mm.second);
-            auto trace = make_shared<SimpleTrace>(chid, tbin, charge);
-            traces.push_back(trace);
-        }
-    }
-    return traces;
-}
-
-void Gen::Ductor::process(output_queue& frames)
-{
-    ITrace::vector traces;
-
-    for (auto face : m_anode->faces()) {
-        // Select the depos which are in this face's sensitive volume
-        IDepo::vector face_depos, dropped_depos;
-        auto bb = face->sensitive();
-        if (bb.empty()) {
-            l->debug("anode: {} face: {} is marked insensitive, skipping", m_anode->ident(), face->ident());
-            continue;
-        }
-
-        for (auto depo : m_depos) {
-            if (bb.inside(depo->pos())) {
-                face_depos.push_back(depo);
-            }
-            else {
-                dropped_depos.push_back(depo);
-            }
-        }
-
-        if (face_depos.size()) {
-            auto ray = bb.bounds();
-            l->debug(
-                "anode: {}, face: {}, processing {} depos spanning "
-                "t:[{},{}]ms, bb:[{}-->{}]cm",
-                m_anode->ident(), face->ident(), face_depos.size(), face_depos.front()->time() / units::ms,
-                face_depos.back()->time() / units::ms, ray.first / units::cm, ray.second / units::cm);
-        }
-        if (dropped_depos.size()) {
-            auto ray = bb.bounds();
-            l->debug(
-                "anode: {}, face: {}, dropped {} depos spanning "
-                "t:[{},{}]ms, outside bb:[{}-->{}]cm",
-                m_anode->ident(), face->ident(), dropped_depos.size(), dropped_depos.front()->time() / units::ms,
-                dropped_depos.back()->time() / units::ms, ray.first / units::cm, ray.second / units::cm);
-        }
-
-        auto newtraces = process_face(face, face_depos);
-        traces.insert(traces.end(), newtraces.begin(), newtraces.end());
-    }
-
-    auto frame = make_shared<SimpleFrame>(m_frame_count, m_start_time, traces, m_tick);
-    IFrame::trace_list_t indices(traces.size());
-    for (size_t ind = 0; ind < traces.size(); ++ind) {
-        indices[ind] = ind;
-    }
-    frame->tag_traces(m_tag + std::to_string(m_anode->ident()), indices);
-    frame->tag_frame(m_tag);
-    frames.push_back(frame);
-    l->debug("made frame: {} with {} traces @ {}ms", m_frame_count, traces.size(), m_start_time / units::ms);
-
-    // fixme: what about frame overflow here?  If the depos extend
-    // beyond the readout where does their info go?  2nd order,
-    // diffusion and finite field response can cause depos near the
-    // end of the readout to have some portion of their waveforms
-    // lost?
-    m_depos.clear();
-
-    if (m_mode == "continuous") {
-        m_start_time += m_readout_time;
-    }
-
-    ++m_frame_count;
-}
-
-// Return true if ready to start processing and capture start time if
-// in continuous mode.
-bool Gen::Ductor::start_processing(const input_pointer& depo)
-{
-    if (!depo) {
-        return true;
-    }
-
-    if (m_mode == "fixed") {
-        // fixed mode waits until EOS
-        return false;
-    }
-
-    if (m_mode == "discontinuous") {
-        // discontinuous mode sets start time on first depo.
-        if (m_depos.empty()) {
-            m_start_time = depo->time();
-            return false;
-        }
-    }
-
-    // continuous and discontinuous modes follow Just Enough
-    // Processing(TM) strategy.
-
-    // Note: we use this depo time even if it may not actually be
-    // inside our sensitive volume.
-    bool ok = depo->time() > m_start_time + m_readout_time;
-    return ok;
-}
-
-bool Gen::Ductor::operator()(const input_pointer& depo, output_queue& frames)
-{
-    if (start_processing(depo)) {
-        process(frames);
-    }
-
-    if (depo) {
-        m_depos.push_back(depo);
-    }
-    else {
-        frames.push_back(nullptr);
-    }
-
-    return true;
-}
diff --git a/gen/src/ImpactZipper.cxx b/gen/src/ImpactZipper.cxx
deleted file mode 100644
index 193d0bed1..000000000
--- a/gen/src/ImpactZipper.cxx
+++ /dev/null
@@ -1,127 +0,0 @@
-#include "WireCellGen/ImpactZipper.h"
-#include "WireCellUtil/Testing.h"
-
-#include <iostream>  // debugging.
-using namespace std;
-
-using namespace WireCell;
-Gen::ImpactZipper::ImpactZipper(IPlaneImpactResponse::pointer pir, BinnedDiffusion& bd)
-  : m_pir(pir)
-  , m_bd(bd)
-{
-}
-
-Gen::ImpactZipper::~ImpactZipper() {}
-
-Waveform::realseq_t Gen::ImpactZipper::waveform(int iwire) const
-{
-    const double pitch_range = m_pir->pitch_range();
-
-    const auto pimpos = m_bd.pimpos();
-    const auto rb = pimpos.region_binning();
-    const auto ib = pimpos.impact_binning();
-    const double wire_pos = rb.center(iwire);
-
-    const int min_impact = ib.edge_index(wire_pos - 0.5 * pitch_range);
-    const int max_impact = ib.edge_index(wire_pos + 0.5 * pitch_range);
-    const int nsamples = m_bd.tbins().nbins();
-    Waveform::compseq_t total_spectrum(nsamples, Waveform::complex_t(0.0, 0.0));
-
-    int nfound = 0;
-    const bool share = true;
-    // const Waveform::complex_t complex_one_half(0.5,0.0);
-
-    // The BinnedDiffusion is indexed by absolute impact and the
-    // PlaneImpactResponse relative impact.
-    for (int imp = min_impact; imp <= max_impact; ++imp) {
-        // ImpactData
-        auto id = m_bd.impact_data(imp);
-        if (!id) {
-            // common as we are scanning all impacts covering a wire
-            // fixme: is there a way to predict this to avoid the query?
-            // std::cerr << "ImpactZipper: no data for absolute impact number: " << imp << std::endl;
-            continue;
-        }
-
-        const Waveform::compseq_t& charge_spectrum = id->spectrum();
-        // for interpolation
-        const Waveform::compseq_t& weightcharge_spectrum = id->weight_spectrum();
-
-        if (charge_spectrum.empty()) {
-            // should not happen
-            std::cerr << "ImpactZipper: no charge for absolute impact number: " << imp << std::endl;
-            continue;
-        }
-        if (weightcharge_spectrum.empty()) {
-            // weight == 0, should not happen
-            std::cerr << "ImpactZipper: no weight charge for absolute impact number: " << imp << std::endl;
-            continue;
-        }
-
-        const double imp_pos = ib.center(imp);
-        const double rel_imp_pos = imp_pos - wire_pos;
-        // std::cerr << "IZ: " << " imp=" << imp << " imp_pos=" << imp_pos << " rel_imp_pos=" << rel_imp_pos <<
-        // std::endl;
-
-        Waveform::compseq_t conv_spectrum(nsamples, Waveform::complex_t(0.0, 0.0));
-        if (share) {  // fixme: make a configurable option
-            TwoImpactResponses two_ir = m_pir->bounded(rel_imp_pos);
-            if (!two_ir.first || !two_ir.second) {
-                // std::cerr << "ImpactZipper: no impact response for absolute impact number: " << imp << std::endl;
-                continue;
-            }
-            // fixme: this is average, not interpolation.
-            Waveform::compseq_t rs1 = two_ir.first->spectrum();
-            Waveform::compseq_t rs2 = two_ir.second->spectrum();
-
-            for (int ind = 0; ind < nsamples; ++ind) {
-                // conv_spectrum[ind] = complex_one_half*(rs1[ind]+rs2[ind])*charge_spectrum[ind];
-
-                // linear interpolation: wQ*rs1 + (Q-wQ)*rs2
-                conv_spectrum[ind] = weightcharge_spectrum[ind] * rs1[ind] +
-                                     (charge_spectrum[ind] - weightcharge_spectrum[ind]) * rs2[ind];
-                /* debugging */
-                /* if(iwire == 1000 && ind>1000 && ind<2000) { */
-                /* std::cerr<<"rs1 spectrum: "<<imp<<"|"<<ind<<": "<<std::abs(rs1[ind])<<std::endl; */
-                /* std::cerr<<"rs2 spectrum: "<<imp<<"|"<<ind<<": "<<std::abs(rs2[ind])<<std::endl; */
-                /* std::cerr<<"rs1 charge spectrum "<<ind<<": "<<weightcharge_spectrum[ind]<<std::endl; */
-                /* std::cerr<<"rs2 charge spectrum "<<ind<<":
-                 * "<<charge_spectrum[ind]-weightcharge_spectrum[ind]<<std::endl; */
-                /* //std::cerr<<"rs1 charge spectrum "<<ind<<": "<<complex_one_half*charge_spectrum[ind]<<std::endl; */
-                /* //std::cerr<<"rs2 charge spectrum "<<ind<<": "<<complex_one_half*charge_spectrum[ind]<<std::endl; */
-                /* } */
-            }
-        }
-        else {
-            auto ir = m_pir->closest(rel_imp_pos);
-            if (!ir) {
-                // std::cerr << "ImpactZipper: no impact response for absolute impact number: " << imp << std::endl;
-                continue;
-            }
-            Waveform::compseq_t response_spectrum = ir->spectrum();
-            for (int ind = 0; ind < nsamples; ++ind) {
-                conv_spectrum[ind] = response_spectrum[ind] * charge_spectrum[ind];
-            }
-        }
-
-        ++nfound;
-        // std::cerr << "ImpactZipper: found:"<<nfound<<" for absolute impact number " << imp
-        //           << " csize=" << csize << " rsize=" << rsize << " rebin=" << rebinfactor
-        //           << std::endl;
-
-        Waveform::increase(total_spectrum, conv_spectrum);
-    }
-    // std::cerr << "ImpactZipper: found " << nfound << " in abs impact: ["  << min_impact << ","<< max_impact << "]\n";
-
-    // Clear memory assuming next call is iwire+1.
-    // fixme: this is a dumb way to go. Better to make an iterator.
-    m_bd.erase(0, min_impact);
-
-    if (!nfound) {
-        return Waveform::realseq_t(nsamples, 0.0);
-    }
-
-    auto waveform = Waveform::idft(total_spectrum);
-
-    return waveform;
-}

From 2bedce696fa7522aa2fbd45ddce86e05fb995e1e Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 22 Nov 2021 12:12:38 -0500
Subject: [PATCH 25/46] Pass IDFT::pointer by const ref

---
 aux/inc/WireCellAux/DftTools.h | 12 ++++++------
 aux/src/DftTools.cxx           |  8 ++++----
 2 files changed, 10 insertions(+), 10 deletions(-)

diff --git a/aux/inc/WireCellAux/DftTools.h b/aux/inc/WireCellAux/DftTools.h
index 20272bc3f..72b2d789a 100644
--- a/aux/inc/WireCellAux/DftTools.h
+++ b/aux/inc/WireCellAux/DftTools.h
@@ -20,14 +20,14 @@ namespace WireCell::Aux {
 
     // 1D with vectors
 
-    inline dft_vector_t fwd(IDFT::pointer dft, const dft_vector_t& seq)
+    inline dft_vector_t fwd(const IDFT::pointer& dft, const dft_vector_t& seq)
     {
         dft_vector_t ret(seq.size());
         dft->fwd1d(seq.data(), ret.data(), ret.size());
         return ret;
     }
 
-    inline dft_vector_t inv(IDFT::pointer dft, const dft_vector_t& spec)
+    inline dft_vector_t inv(const IDFT::pointer& dft, const dft_vector_t& spec)
     {
         dft_vector_t ret(spec.size());
         dft->inv1d(spec.data(), ret.data(), ret.size());
@@ -44,8 +44,8 @@ namespace WireCell::Aux {
     // from real or arr.real()() to convert result to real.
 
     // Transform both dimesions.
-    dft_array_t fwd(IDFT::pointer dft, const dft_array_t& arr);
-    dft_array_t inv(IDFT::pointer dft, const dft_array_t& arr);
+    dft_array_t fwd(const IDFT::pointer& dft, const dft_array_t& arr);
+    dft_array_t inv(const IDFT::pointer& dft, const dft_array_t& arr);
 
     // Transform a 2D array along one axis.
     //
@@ -60,8 +60,8 @@ namespace WireCell::Aux {
     // Note: internal storage order of an Eigen array may differ from
     // the logical order and indeed that of the array template type
     // order.  Neither is pertinent in setting the axis.
-    dft_array_t fwd(IDFT::pointer dft, const dft_array_t& arr, int axis);
-    dft_array_t inv(IDFT::pointer dft, const dft_array_t& arr, int axis);
+    dft_array_t fwd(const IDFT::pointer& dft, const dft_array_t& arr, int axis);
+    dft_array_t inv(const IDFT::pointer& dft, const dft_array_t& arr, int axis);
 
 
 }
diff --git a/aux/src/DftTools.cxx b/aux/src/DftTools.cxx
index 905cbcfa2..9623c5ca4 100644
--- a/aux/src/DftTools.cxx
+++ b/aux/src/DftTools.cxx
@@ -38,7 +38,7 @@ Aux::dft_array_t doit(const Aux::dft_array_t& arr, trans func)
 
 }
 
-Aux::dft_array_t Aux::fwd(IDFT::pointer dft, const Aux::dft_array_t& arr)
+Aux::dft_array_t Aux::fwd(const IDFT::pointer& dft, const Aux::dft_array_t& arr)
 {
     return doit(arr, [&](const complex_t* in_data,
                          complex_t* out_data,
@@ -47,7 +47,7 @@ Aux::dft_array_t Aux::fwd(IDFT::pointer dft, const Aux::dft_array_t& arr)
     });
 }
 
-Aux::dft_array_t Aux::inv(IDFT::pointer dft, const Aux::dft_array_t& arr)
+Aux::dft_array_t Aux::inv(const IDFT::pointer& dft, const Aux::dft_array_t& arr)
 {
     return doit(arr, [&](const complex_t* in_data,
                          complex_t* out_data,
@@ -103,7 +103,7 @@ Aux::dft_array_t doit1b(const Aux::dft_array_t& arr, int axis, trans func)
 // - We then have column-wise storage order but IDFT assumes row-wise
 // - so we reverse (nrows, ncols) and meaning of axis.
 
-Aux::dft_array_t Aux::fwd(IDFT::pointer dft, const Aux::dft_array_t& arr, int axis)
+Aux::dft_array_t Aux::fwd(const IDFT::pointer& dft, const Aux::dft_array_t& arr, int axis)
 {
     Aux::dft_array_t ret = arr; 
     dft->fwd1b(ret.data(), ret.data(), ret.cols(), ret.rows(), !axis);
@@ -117,7 +117,7 @@ Aux::dft_array_t Aux::fwd(IDFT::pointer dft, const Aux::dft_array_t& arr, int ax
     // });
 }
 
-Aux::dft_array_t Aux::inv(IDFT::pointer dft, const Aux::dft_array_t& arr, int axis)
+Aux::dft_array_t Aux::inv(const IDFT::pointer& dft, const Aux::dft_array_t& arr, int axis)
 {
     Aux::dft_array_t ret = arr; 
     dft->inv1b(ret.data(), ret.data(), ret.cols(), ret.rows(), !axis);

From ee42c720865a9e6c718bde3cce6e13d8b8222715 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 22 Nov 2021 12:12:48 -0500
Subject: [PATCH 26/46] Port gen to IDFT

---
 gen/inc/WireCellGen/AddCoherentNoise.h    |   2 +
 gen/inc/WireCellGen/AddNoise.h            |   2 +
 gen/inc/WireCellGen/BinnedDiffusion.h     |   6 +-
 gen/inc/WireCellGen/DepoTransform.h       |   5 +-
 gen/inc/WireCellGen/EmpiricalNoiseModel.h |   2 +
 gen/inc/WireCellGen/ImpactData.h          |   5 +-
 gen/inc/WireCellGen/ImpactTransform.h     |   7 +-
 gen/inc/WireCellGen/NoiseSource.h         |   2 +
 gen/inc/WireCellGen/PlaneImpactResponse.h |   2 +
 gen/inc/WireCellGen/TruthSmearer.h        |   2 +
 gen/inc/WireCellGen/TruthTraceID.h        |   2 +
 gen/src/AddCoherentNoise.cxx              |   9 +-
 gen/src/AddNoise.cxx                      |   9 +-
 gen/src/BinnedDiffusion.cxx               |   6 +-
 gen/src/DepoSplat.cxx                     |   2 +-
 gen/src/DepoTransform.cxx                 |   7 +-
 gen/src/EmpiricalNoiseModel.cxx           |  12 +-
 gen/src/ImpactData.cxx                    |  10 +-
 gen/src/ImpactTransform.cxx               | 257 +++++-----------------
 gen/src/Noise.cxx                         |   7 +-
 gen/src/Noise.h                           |  20 +-
 gen/src/NoiseSource.cxx                   |  10 +-
 gen/src/PlaneImpactResponse.cxx           |  30 ++-
 gen/src/TruthSmearer.cxx                  |  15 +-
 gen/src/TruthTraceID.cxx                  |  18 +-
 gen/test/test_empnomo.cxx                 |   7 +
 gen/test/test_pir.cxx                     |   9 +-
 util/inc/WireCellUtil/Array.h             |   6 +-
 28 files changed, 220 insertions(+), 251 deletions(-)

diff --git a/gen/inc/WireCellGen/AddCoherentNoise.h b/gen/inc/WireCellGen/AddCoherentNoise.h
index 58b93c6db..087da8bd2 100644
--- a/gen/inc/WireCellGen/AddCoherentNoise.h
+++ b/gen/inc/WireCellGen/AddCoherentNoise.h
@@ -7,6 +7,7 @@
 #include "WireCellIface/IFrameFilter.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IRandom.h"
+#include "WireCellIface/IDFT.h"
 #include "WireCellIface/IChannelSpectrum.h"
 #include "WireCellUtil/Waveform.h"
 #include "WireCellUtil/Logging.h"
@@ -36,6 +37,7 @@ namespace WireCell {
             typedef std::map<int, std::pair<int, std::vector<float>>> noise_map_t;
 
             IRandom::pointer m_rng;
+            IDFT::pointer m_dft;
 
             std::string m_spectra_file, m_rng_tn;
             int m_nsamples;
diff --git a/gen/inc/WireCellGen/AddNoise.h b/gen/inc/WireCellGen/AddNoise.h
index 662c2f3c8..6ad18b954 100644
--- a/gen/inc/WireCellGen/AddNoise.h
+++ b/gen/inc/WireCellGen/AddNoise.h
@@ -10,6 +10,7 @@
 #include "WireCellIface/IFrameFilter.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IRandom.h"
+#include "WireCellIface/IDFT.h"
 #include "WireCellIface/IChannelSpectrum.h"
 #include "WireCellUtil/Waveform.h"
 #include "WireCellAux/Logger.h"
@@ -35,6 +36,7 @@ namespace WireCell {
 
            private:
             IRandom::pointer m_rng;
+            IDFT::pointer m_dft;
             IChannelSpectrum::pointer m_model;
 
             std::string m_model_tn, m_rng_tn;
diff --git a/gen/inc/WireCellGen/BinnedDiffusion.h b/gen/inc/WireCellGen/BinnedDiffusion.h
index dc3a161e4..6366dc665 100644
--- a/gen/inc/WireCellGen/BinnedDiffusion.h
+++ b/gen/inc/WireCellGen/BinnedDiffusion.h
@@ -4,7 +4,9 @@
 #include "WireCellUtil/Pimpos.h"
 #include "WireCellUtil/Point.h"
 #include "WireCellUtil/Units.h"
+
 #include "WireCellIface/IDepo.h"
+#include "WireCellIface/IDFT.h"
 
 #include "WireCellGen/ImpactData.h"
 
@@ -45,7 +47,8 @@ namespace WireCell {
             /// Useful to client code to mark a calculation strategy.
             enum ImpactDataCalculationStrategy { constant = 1, linear = 2 };
 
-            BinnedDiffusion(const Pimpos& pimpos, const Binning& tbins, double nsigma = 3.0,
+            BinnedDiffusion(const Pimpos& pimpos, const IDFT::pointer& dft,
+                            const Binning& tbins, double nsigma = 3.0,
                             IRandom::pointer fluctuate = nullptr, ImpactDataCalculationStrategy calcstrat = linear);
 
             const Pimpos& pimpos() const { return m_pimpos; }
@@ -95,6 +98,7 @@ namespace WireCell {
 
            private:
             const Pimpos& m_pimpos;
+            const IDFT::pointer& m_dft;
             const Binning& m_tbins;
 
             double m_nsigma;
diff --git a/gen/inc/WireCellGen/DepoTransform.h b/gen/inc/WireCellGen/DepoTransform.h
index d2b8f9a0b..d58434dea 100644
--- a/gen/inc/WireCellGen/DepoTransform.h
+++ b/gen/inc/WireCellGen/DepoTransform.h
@@ -4,14 +4,16 @@
 #ifndef WIRECELLGEN_DEPOTRANSFORM
 #define WIRECELLGEN_DEPOTRANSFORM
 
+#include "WireCellAux/Logger.h"
+
 #include "WireCellIface/IDepoFramer.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IRandom.h"
+#include "WireCellIface/IDFT.h"
 #include "WireCellIface/IPlaneImpactResponse.h"
 #include "WireCellIface/IAnodePlane.h"
 #include "WireCellIface/WirePlaneId.h"
 #include "WireCellIface/IDepo.h"
-#include "WireCellAux/Logger.h"
 
 namespace WireCell {
     namespace Gen {
@@ -35,6 +37,7 @@ namespace WireCell {
            private:
             IAnodePlane::pointer m_anode;
             IRandom::pointer m_rng;
+            IDFT::pointer m_dft;
             std::vector<IPlaneImpactResponse::pointer> m_pirs;
 
             double m_start_time;
diff --git a/gen/inc/WireCellGen/EmpiricalNoiseModel.h b/gen/inc/WireCellGen/EmpiricalNoiseModel.h
index 513c85dac..424bfe33f 100644
--- a/gen/inc/WireCellGen/EmpiricalNoiseModel.h
+++ b/gen/inc/WireCellGen/EmpiricalNoiseModel.h
@@ -14,6 +14,7 @@
 #include "WireCellIface/IChannelSpectrum.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IAnodePlane.h"
+#include "WireCellIface/IDFT.h"
 #include "WireCellIface/IChannelStatus.h"
 
 #include "WireCellUtil/Units.h"
@@ -86,6 +87,7 @@ namespace WireCell {
            private:
             IAnodePlane::pointer m_anode;
             IChannelStatus::pointer m_chanstat;
+            IDFT::pointer m_dft;
 
             std::string m_spectra_file;
             int m_nsamples;
diff --git a/gen/inc/WireCellGen/ImpactData.h b/gen/inc/WireCellGen/ImpactData.h
index d775a09ff..d4d5a90af 100644
--- a/gen/inc/WireCellGen/ImpactData.h
+++ b/gen/inc/WireCellGen/ImpactData.h
@@ -4,6 +4,9 @@
  */
 
 #include "WireCellUtil/Waveform.h"
+
+#include "WireCellIface/IDFT.h"
+
 #include "WireCellGen/GaussianDiffusion.h"
 
 #include <memory>
@@ -56,7 +59,7 @@ namespace WireCell {
              * linear or constant (all = 0.5),
              * and honoring the Gaussian distribution (diffusion).
              */
-            void calculate(int nticks) const;
+            void calculate(const IDFT::pointer& dft, int nticks) const;
 
             /**  Return the time domain waveform of drifted/diffused
              *  charge at this impact position. See `calculate()`. */
diff --git a/gen/inc/WireCellGen/ImpactTransform.h b/gen/inc/WireCellGen/ImpactTransform.h
index 466072498..c3029e0e1 100644
--- a/gen/inc/WireCellGen/ImpactTransform.h
+++ b/gen/inc/WireCellGen/ImpactTransform.h
@@ -1,8 +1,11 @@
 #ifndef WIRECELL_IMPACTTRANSFORM
 #define WIRECELL_IMPACTTRANSFORM
 
-#include "WireCellIface/IPlaneImpactResponse.h"
 #include "WireCellGen/BinnedDiffusion_transform.h"
+
+#include "WireCellIface/IPlaneImpactResponse.h"
+#include "WireCellIface/IDFT.h"
+
 #include "WireCellUtil/Array.h"
 
 #include <Eigen/Sparse>
@@ -15,6 +18,7 @@ namespace WireCell {
          */
         class ImpactTransform {
             IPlaneImpactResponse::pointer m_pir;
+            IDFT::pointer m_dft;
             BinnedDiffusion_transform& m_bd;
 
             int m_num_group;     // how many 2D convolution is needed
@@ -32,6 +36,7 @@ namespace WireCell {
 
            public:
             ImpactTransform(IPlaneImpactResponse::pointer pir,
+                            const IDFT::pointer& dft,
                             BinnedDiffusion_transform& bd);
 
             virtual ~ImpactTransform();
diff --git a/gen/inc/WireCellGen/NoiseSource.h b/gen/inc/WireCellGen/NoiseSource.h
index 2d3d8840d..50c12c3b5 100644
--- a/gen/inc/WireCellGen/NoiseSource.h
+++ b/gen/inc/WireCellGen/NoiseSource.h
@@ -11,6 +11,7 @@
 #include "WireCellIface/IFrameSource.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IRandom.h"
+#include "WireCellIface/IDFT.h"
 #include "WireCellIface/IAnodePlane.h"
 #include "WireCellIface/IChannelSpectrum.h"
 #include "WireCellUtil/Waveform.h"
@@ -36,6 +37,7 @@ namespace WireCell {
 
            private:
             IRandom::pointer m_rng;
+            IDFT::pointer m_dft;
             IAnodePlane::pointer m_anode;
             IChannelSpectrum::pointer m_model;
             double m_time, m_stop, m_readout, m_tick;
diff --git a/gen/inc/WireCellGen/PlaneImpactResponse.h b/gen/inc/WireCellGen/PlaneImpactResponse.h
index 8f230e636..92701a9db 100644
--- a/gen/inc/WireCellGen/PlaneImpactResponse.h
+++ b/gen/inc/WireCellGen/PlaneImpactResponse.h
@@ -103,6 +103,7 @@ namespace WireCell {
             const std::vector<IImpactResponse::pointer>& irs() const { return m_ir; }
 
            private:
+
             std::string m_frname;
             std::vector<std::string> m_short;
             double m_overall_short_padding;
@@ -118,6 +119,7 @@ namespace WireCell {
             std::vector<IImpactResponse::pointer> m_ir;
             double m_half_extent, m_pitch, m_impact;
 
+            std::string m_dftname{"FftwDFT"};
             void build_responses();
         };
 
diff --git a/gen/inc/WireCellGen/TruthSmearer.h b/gen/inc/WireCellGen/TruthSmearer.h
index 3e35166d7..be700aafa 100644
--- a/gen/inc/WireCellGen/TruthSmearer.h
+++ b/gen/inc/WireCellGen/TruthSmearer.h
@@ -6,6 +6,7 @@
 
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IDuctor.h"
+#include "WireCellIface/IDFT.h"
 
 #include "WireCellIface/IAnodePlane.h"
 #include "WireCellIface/IRandom.h"
@@ -30,6 +31,7 @@ namespace WireCell {
 
             IAnodePlane::pointer m_anode;
             IRandom::pointer m_rng;
+            IDFT::pointer m_dft;
             IDepo::vector m_depos;
 
             double m_start_time;
diff --git a/gen/inc/WireCellGen/TruthTraceID.h b/gen/inc/WireCellGen/TruthTraceID.h
index b6c1c4608..a08af1e7b 100644
--- a/gen/inc/WireCellGen/TruthTraceID.h
+++ b/gen/inc/WireCellGen/TruthTraceID.h
@@ -10,6 +10,7 @@
 
 #include "WireCellIface/IAnodePlane.h"
 #include "WireCellIface/IRandom.h"
+#include "WireCellIface/IDFT.h"
 
 namespace WireCell {
     namespace Gen {
@@ -28,6 +29,7 @@ namespace WireCell {
 
             IAnodePlane::pointer m_anode;
             IRandom::pointer m_rng;
+            IDFT::pointer m_dft;
             IDepo::vector m_depos;
 
             double m_start_time;
diff --git a/gen/src/AddCoherentNoise.cxx b/gen/src/AddCoherentNoise.cxx
index 90fdde2a1..cd2c7e7bd 100644
--- a/gen/src/AddCoherentNoise.cxx
+++ b/gen/src/AddCoherentNoise.cxx
@@ -7,6 +7,8 @@
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/FFTBestLength.h"
 
+#include "WireCellAux/DftTools.h"
+
 #include "Noise.h"
 
 #include <iostream>
@@ -54,6 +56,7 @@ WireCell::Configuration Gen::AddCoherentNoise::default_configuration() const
     cfg["random_fluctuation_amplitude"] = m_fluctuation;
     cfg["period"] = m_period;
     cfg["normalization"] = m_normalization;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
 
     return cfg;
 }
@@ -68,6 +71,9 @@ void Gen::AddCoherentNoise::configure(const WireCell::Configuration& cfg)
     m_fluctuation = get<double>(cfg, "random_fluctuation_amplitude", m_fluctuation);
     m_normalization = get<int>(cfg, "normalization", m_normalization);
 
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     m_fft_length = fft_best_length(m_nsamples);
     gen_elec_resp_default();
 
@@ -141,7 +147,8 @@ bool Gen::AddCoherentNoise::operator()(const input_pointer& inframe, output_poin
             noise_freq[i] = tc;
         }
 
-        Waveform::realseq_t wave = WireCell::Waveform::idft(noise_freq);
+        // Waveform::realseq_t wave = WireCell::Waveform::idft(noise_freq);
+        auto wave = Waveform::real(Aux::inv(m_dft, noise_freq));
 
         // Add signal (be careful to double counting with the incoherent noise)
         Waveform::increase(wave, intrace->charge());
diff --git a/gen/src/AddNoise.cxx b/gen/src/AddNoise.cxx
index c56fea8a0..db306db5f 100644
--- a/gen/src/AddNoise.cxx
+++ b/gen/src/AddNoise.cxx
@@ -1,5 +1,7 @@
 #include "WireCellGen/AddNoise.h"
 
+#include "WireCellAux/DftTools.h"
+
 #include "WireCellIface/SimpleTrace.h"
 #include "WireCellIface/SimpleFrame.h"
 
@@ -36,6 +38,7 @@ WireCell::Configuration Gen::AddNoise::default_configuration() const
 
     cfg["model"] = m_model_tn;
     cfg["rng"] = m_rng_tn;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     cfg["nsamples"] = m_nsamples;
     cfg["replacement_percentage"] = m_rep_percent;
     return cfg;
@@ -45,6 +48,8 @@ void Gen::AddNoise::configure(const WireCell::Configuration& cfg)
 {
     m_rng_tn = get(cfg, "rng", m_rng_tn);
     m_rng = Factory::find_tn<IRandom>(m_rng_tn);
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
     m_model_tn = get(cfg, "model", m_model_tn);
     m_model = Factory::find_tn<IChannelSpectrum>(m_model_tn);
     m_nsamples = get<int>(cfg, "nsamples", m_nsamples);
@@ -66,7 +71,9 @@ bool Gen::AddNoise::operator()(const input_pointer& inframe, output_pointer& out
     for (const auto& intrace : *inframe->traces()) {
         int chid = intrace->channel();
         const auto& spec = (*m_model)(chid);
-        Waveform::realseq_t wave = Gen::Noise::generate_waveform(spec, m_rng, m_rep_percent);
+        auto cspec = Gen::Noise::generate_spectrum(spec, m_rng, m_rep_percent);
+        auto wave = Waveform::real(Aux::inv(m_dft, cspec));
+        // Waveform::realseq_t wave = Gen::Noise::generate_waveform(spec, m_rng, m_rep_percent);
 
         wave.resize(m_nsamples, 0);
         Waveform::increase(wave, intrace->charge());
diff --git a/gen/src/BinnedDiffusion.cxx b/gen/src/BinnedDiffusion.cxx
index 4127ba1ee..a855b9c97 100644
--- a/gen/src/BinnedDiffusion.cxx
+++ b/gen/src/BinnedDiffusion.cxx
@@ -7,9 +7,11 @@ using namespace std;
 
 using namespace WireCell;
 
-Gen::BinnedDiffusion::BinnedDiffusion(const Pimpos& pimpos, const Binning& tbins, double nsigma,
+Gen::BinnedDiffusion::BinnedDiffusion(const Pimpos& pimpos, const IDFT::pointer& dft,
+                                      const Binning& tbins, double nsigma,
                                       IRandom::pointer fluctuate, ImpactDataCalculationStrategy calcstrat)
   : m_pimpos(pimpos)
+  , m_dft(dft)
   , m_tbins(tbins)
   , m_nsigma(nsigma)
   , m_fluctuate(fluctuate)
@@ -127,7 +129,7 @@ Gen::ImpactData::pointer Gen::BinnedDiffusion::impact_data(int bin) const
         // diff->set_sampling(m_tbins, ib, m_nsigma, 0, m_calcstrat);
     }
 
-    idptr->calculate(m_tbins.nbins());
+    idptr->calculate(m_dft, m_tbins.nbins());
     return idptr;
 }
 
diff --git a/gen/src/DepoSplat.cxx b/gen/src/DepoSplat.cxx
index eb1ff16d6..47456cb9f 100644
--- a/gen/src/DepoSplat.cxx
+++ b/gen/src/DepoSplat.cxx
@@ -9,7 +9,7 @@
 
 // from ductor
 #include "WireCellGen/BinnedDiffusion.h"
-#include "WireCellGen/ImpactZipper.h"
+
 #include "WireCellUtil/Units.h"
 #include "WireCellUtil/Point.h"
 #include "WireCellUtil/NamedFactory.h"
diff --git a/gen/src/DepoTransform.cxx b/gen/src/DepoTransform.cxx
index a8beda4d6..023551199 100644
--- a/gen/src/DepoTransform.cxx
+++ b/gen/src/DepoTransform.cxx
@@ -77,6 +77,8 @@ void Gen::DepoTransform::configure(const WireCell::Configuration& cfg)
         auto rng_tn = get<string>(cfg, "rng", "");
         m_rng = Factory::find_tn<IRandom>(rng_tn);
     }
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
 
     m_readout_time = get<double>(cfg, "readout_time", m_readout_time);
     m_tick = get<double>(cfg, "tick", m_tick);
@@ -132,6 +134,9 @@ WireCell::Configuration Gen::DepoTransform::default_configuration() const
     /// Plane impact responses
     cfg["pirs"] = Json::arrayValue;
 
+    // type-name for the DFT to use
+    cfg["dft"] = "FftwDFT";
+
     return cfg;
 }
 
@@ -203,7 +208,7 @@ bool Gen::DepoTransform::operator()(const input_pointer& in, output_pointer& out
             auto& wires = plane->wires();
 
             auto pir = m_pirs.at(iplane);
-            Gen::ImpactTransform transform(pir, bindiff);
+            Gen::ImpactTransform transform(pir, m_dft, bindiff);
 
             const int nwires = pimpos->region_binning().nbins();
             for (int iwire = 0; iwire < nwires; ++iwire) {
diff --git a/gen/src/EmpiricalNoiseModel.cxx b/gen/src/EmpiricalNoiseModel.cxx
index 85df675a3..8a1d109c9 100644
--- a/gen/src/EmpiricalNoiseModel.cxx
+++ b/gen/src/EmpiricalNoiseModel.cxx
@@ -9,6 +9,8 @@
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/FFTBestLength.h"
 
+#include "WireCellAux/DftTools.h"
+
 #include <iostream>  // debug
 
 WIRECELL_FACTORY(EmpiricalNoiseModel,
@@ -89,6 +91,7 @@ WireCell::Configuration Gen::EmpiricalNoiseModel::default_configuration() const
     // cfg["gain_scale"] = m_gres;
     // cfg["freq_scale"] = m_fres;
     cfg["anode"] = m_anode_tn;  // name of IAnodePlane component
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
 
     return cfg;
 }
@@ -161,6 +164,9 @@ void Gen::EmpiricalNoiseModel::configure(const WireCell::Configuration& cfg)
 
     m_spectra_file = get(cfg, "spectra_file", m_spectra_file);
 
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     m_nsamples = get(cfg, "nsamples", m_nsamples);
     m_fft_length = fft_best_length(m_nsamples);
     // m_fft_length = m_nsamples;
@@ -352,7 +358,8 @@ const IChannelSpectrum::amplitude_t& Gen::EmpiricalNoiseModel::operator()(int ch
         if (resp1 == m_elec_resp_cache.end()) {
             Response::ColdElec elec_resp(10, ch_shaping);  // default at 1 mV/fC
             auto sig = elec_resp.generate(WireCell::Waveform::Domain(0, m_fft_length * m_period), m_fft_length);
-            auto filt = Waveform::dft(sig);
+            //auto filt = Waveform::dft(sig);
+            auto filt = Aux::fwd(m_dft, Waveform::complex(sig));
             auto ele_resp_amp = Waveform::magnitude(filt);
 
             ele_resp_amp.resize(m_elec_resp_freq.size());
@@ -365,7 +372,8 @@ const IChannelSpectrum::amplitude_t& Gen::EmpiricalNoiseModel::operator()(int ch
         if (resp2 == m_elec_resp_cache.end()) {
             Response::ColdElec elec_resp(10, db_shaping);  // default at 1 mV/fC
             auto sig = elec_resp.generate(WireCell::Waveform::Domain(0, m_fft_length * m_period), m_fft_length);
-            auto filt = Waveform::dft(sig);
+            // auto filt = Waveform::dft(sig);
+            auto filt = Aux::fwd(m_dft, Waveform::complex(sig));
             auto ele_resp_amp = Waveform::magnitude(filt);
 
             ele_resp_amp.resize(m_elec_resp_freq.size());
diff --git a/gen/src/ImpactData.cxx b/gen/src/ImpactData.cxx
index a3ed125b4..814b26127 100644
--- a/gen/src/ImpactData.cxx
+++ b/gen/src/ImpactData.cxx
@@ -1,5 +1,7 @@
 #include "WireCellGen/ImpactData.h"
 
+#include "WireCellAux/DftTools.h"
+
 #include <iostream>  // debugging
 
 using namespace WireCell;
@@ -19,7 +21,7 @@ Waveform::realseq_t& Gen::ImpactData::weightform() const { return m_weights; }
 
 Waveform::compseq_t& Gen::ImpactData::weight_spectrum() const { return m_weight_spectrum; }
 
-void Gen::ImpactData::calculate(int nticks) const
+void Gen::ImpactData::calculate(const IDFT::pointer& dft, int nticks) const
 {
     if (m_waveform.size() > 0) {
         return;
@@ -54,8 +56,10 @@ void Gen::ImpactData::calculate(int nticks) const
         }
     }
 
-    m_spectrum = Waveform::dft(m_waveform);
-    m_weight_spectrum = Waveform::dft(m_weights);
+    // m_spectrum = Waveform::dft(m_waveform);
+    m_spectrum = Aux::fwd(dft, Waveform::complex(m_waveform));
+    // m_weight_spectrum = Waveform::dft(m_weights);
+    m_weight_spectrum = Aux::fwd(dft, Waveform::complex(m_weights));
 }
 
 // std::pair<int,int> Gen::ImpactData::strip() const
diff --git a/gen/src/ImpactTransform.cxx b/gen/src/ImpactTransform.cxx
index 74739b453..90ff57540 100644
--- a/gen/src/ImpactTransform.cxx
+++ b/gen/src/ImpactTransform.cxx
@@ -1,33 +1,29 @@
 #include "WireCellGen/ImpactTransform.h"
+
+#include "WireCellAux/DftTools.h"
+
 #include "WireCellUtil/Testing.h"
 #include "WireCellUtil/FFTBestLength.h"
 #include "WireCellUtil/Exceptions.h"
+
 #include <iostream>  // debugging.
 using namespace std;
 
 using namespace WireCell;
 
 Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
+                                      const IDFT::pointer& dft,
                                       BinnedDiffusion_transform& bd)
   : m_pir(pir)
+  , m_dft(dft)
   , m_bd(bd)
 {
-    // for (int i=0;i!=210;i++){
-    //   double pos = -31.5 + 0.3*i+1e-9;0
-    //   m_pir->closest(pos);
-    // }
-
     // arrange the field response (210 in total, pitch_range/impact)
     // number of wires nwires ...
     m_num_group = std::round(m_pir->pitch() / m_pir->impact()) + 1;  // 11
     m_num_pad_wire = std::round((m_pir->nwires() - 1) / 2.);         // 10 for wires, 5 for PCB strips
 
     const auto pimpos = m_bd.pimpos();
-    //  const int nsamples = m_bd.tbins().nbins();
-    // const auto rb = pimpos.region_binning();
-    // const int nwires = rb.nbins();
-
-    //
     
     //std::cerr << "ImpactTransform: num_group:" << m_num_group << " num_pad_wire:" << m_num_pad_wire << std::endl;
     for (int i = 0; i != m_num_group; i++) {
@@ -43,10 +39,6 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
 
         //std::cerr << "ImpactTransform: " << rel_cen_imp_pos << std::endl;
         for (int j = 0; j != m_pir->nwires(); j++) {
-            // std::cerr << "ImpactTransform: "
-            //           << i << " " << j << " "
-            //           << rel_cen_imp_pos - (j-m_num_pad_wire)*m_pir->pitch()<< " "
-            //           << std::endl;
 
             try {
                 map_resp[j - m_num_pad_wire] = m_pir->closest(rel_cen_imp_pos - (j - m_num_pad_wire) * m_pir->pitch());
@@ -68,37 +60,21 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                 
             Waveform::compseq_t response_spectrum = map_resp[j - m_num_pad_wire]->spectrum();
 
-            //response_spectrum.size() << std::endl;
         }
-        // std::cout << m_vec_impact.back() << std::endl;
-        // std::cout << rel_cen_imp_pos << std::endl;
-        // std::cout << map_resp.size() << std::endl;
-        m_vec_map_resp.push_back(map_resp);
 
-        // Eigen::SparseMatrix<float> *mat = new Eigen::SparseMatrix<float>(nsamples,nwires);
-        //  mat.reserve(Eigen::VectorXi::Constant(nwires,1000));
-        // m_vec_spmatrix.push_back(mat);
+        m_vec_map_resp.push_back(map_resp);
 
         std::vector<std::tuple<int, int, double> > vec_charge;  // ch, time, charge
         m_vec_vec_charge.push_back(vec_charge);
     }
 
-    // m_bd.get_charge_matrix(m_vec_spmatrix, m_vec_impact);
-    // std::cout << nwires << " " << nsamples << std::endl;
-
     // now work on the charge part ...
     // trying to sampling ...
     m_bd.get_charge_vec(m_vec_vec_charge, m_vec_impact);
     // std::cout << nwires << " " << nsamples << std::endl;
 
-    // for (size_t i=0;i!=m_vec_vec_charge.size();i++){
-    //   std::cout << m_vec_vec_charge[i].size() << std::endl;
-    // }
-
     // length and width ...
 
-    //
-
     //    std::cout << nwires << " " << nsamples << std::endl;
     std::pair<int, int> impact_range = m_bd.impact_bin_range(m_bd.get_nsigma());
     std::pair<int, int> time_range = m_bd.time_bin_range(m_bd.get_nsigma());
@@ -120,15 +96,6 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
     int npad_wire = 0;
     const size_t ntotal_wires = fft_best_length(end_ch - start_ch + 2 * m_num_pad_wire, 1);
 
-    //   pow(2,std::ceil(log(end_ch - start_ch + 2 * m_num_pad_wire)/log(2)));
-    //  if (nwires == 2400){
-    // if (ntotal_wires > 2500)
-    //   ntotal_wires = 2500;
-    // }else if (nwires ==3456){
-    // if (ntotal_wires > 3600)
-    //   ntotal_wires = 3600;
-    //      npad_wire=72; //3600
-    //}
     npad_wire = (ntotal_wires - end_ch + start_ch) / 2;
     m_start_ch = start_ch - npad_wire;
     m_end_ch = end_ch + npad_wire;
@@ -138,29 +105,14 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
     int npad_time = m_pir->closest(0)->waveform_pad();
     const size_t ntotal_ticks = fft_best_length(end_tick - start_tick + npad_time);
 
-    // pow(2,std::ceil(log(end_tick - start_tick + npad_time)/log(2)));
-    // if (ntotal_ticks >9800 && nsamples <9800 && nsamples >9550)
-    //  ntotal_ticks = 9800;
     npad_time = ntotal_ticks - end_tick + start_tick;
     m_start_tick = start_tick;
     m_end_tick = end_tick + npad_time;
 
-    // m_end_tick = 16384;//nsamples;
-    // m_start_tick = 0;
-    // // std::cout << m_start_tick << " " << m_end_tick << std::endl;
-    // int npad_time = 0;
-    // int ntotal_ticks = pow(2,std::ceil(log(nsamples + npad_time)/log(2)));
-    // if (ntotal_ticks >9800 && nsamples <9800)
-    //   ntotal_ticks = 9800
-    // npad_time = ntotal_ticks - nsamples;
-    // m_start_tick = 0;
-    // m_end_tick = ntotal_ticks;
-
     Array::array_xxc acc_data_f_w =
         Array::array_xxc::Zero(end_ch - start_ch + 2 * npad_wire, m_end_tick - m_start_tick);
 
     int num_double = (m_vec_vec_charge.size() - 1) / 2;
-    // int num_double = (m_vec_spmatrix.size()-1)/2;
 
     // speed up version , first five
     for (int i = 0; i != num_double; i++) {
@@ -178,15 +130,6 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
         m_vec_vec_charge.at(i).clear();
         m_vec_vec_charge.at(i).shrink_to_fit();
 
-        // useing matrix form ...
-        // for (int k=0; k<m_vec_spmatrix.at(i)->outerSize(); ++k)
-        //   for (Eigen::SparseMatrix<float>::InnerIterator it(*m_vec_spmatrix.at(i),k); it; ++it){
-        // 	c_data(it.col()+npad_wire-start_ch,it.row()-m_start_tick) = it.value();
-        //   }
-        // delete m_vec_spmatrix.at(i);
-        // //m_vec_spmatrix.at(i).setZero();
-        // //m_vec_spmatrix.at(i).resize(0,0);
-
         // fill reverse order
         int ii = num_double * 2 - i;
         for (size_t j = 0; j != m_vec_vec_charge.at(ii).size(); j++) {
@@ -197,18 +140,12 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
         //    std::cout << ii << " " << m_vec_vec_charge.at(ii).size() << std::endl;
         m_vec_vec_charge.at(ii).clear();
         m_vec_vec_charge.at(ii).shrink_to_fit();
-        // for (int k=0; k<m_vec_spmatrix.at(ii)->outerSize(); ++k)
-        //   for (Eigen::SparseMatrix<float>::InnerIterator it(*m_vec_spmatrix.at(ii),k); it; ++it){
-        // 	c_data(it.col()+npad_wire-start_ch,it.row()-m_start_tick) = it.value();
-        //   }
-        // delete m_vec_spmatrix.at(ii);
-        // //    m_vec_spmatrix.at(ii).setZero();
-        // //m_vec_spmatrix.at(ii).resize(0,0);
 
         // Do FFT on time
-        c_data = Array::dft_cc(c_data, 0);
+        // c_data = Array::dft_cc(c_data, 0);
         // Do FFT on wire
-        c_data = Array::dft_cc(c_data, 1);
+        // c_data = Array::dft_cc(c_data, 1);
+        c_data = Aux::fwd(m_dft, c_data);
 
         // std::cout << i << std::endl;
         {
@@ -217,7 +154,8 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             {
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[0]->spectrum();
                 // do a inverse FFT
-                Waveform::realseq_t rs1_t = Waveform::idft(rs1);
+                // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
+                Waveform::realseq_t rs1_t = Waveform::real(Aux::inv(m_dft, rs1));
                 // pick the first xxx ticks
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
@@ -225,7 +163,8 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                     rs1_reduced.at(icol) = rs1_t[icol];
                 }
                 // do a FFT
-                rs1 = Waveform::dft(rs1_reduced);
+                // rs1 = Waveform::dft(rs1_reduced);
+                rs1 = Aux::fwd(m_dft, Waveform::complex(rs1_reduced));
 
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     resp_f_w(0, icol) = rs1[icol];
@@ -234,21 +173,25 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
 
             for (int irow = 0; irow != m_num_pad_wire; irow++) {
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[irow + 1]->spectrum();
-                Waveform::realseq_t rs1_t = Waveform::idft(rs1);
+                // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
+                Waveform::realseq_t rs1_t = Waveform::real(Aux::inv(m_dft, rs1));
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs1_t.size())) break;
                     rs1_reduced.at(icol) = rs1_t[icol];
                 }
-                rs1 = Waveform::dft(rs1_reduced);
+                // rs1 = Waveform::dft(rs1_reduced);
+                rs1 = Aux::fwd(m_dft, Waveform::complex(rs1_reduced));
                 Waveform::compseq_t rs2 = m_vec_map_resp.at(i)[-irow - 1]->spectrum();
-                Waveform::realseq_t rs2_t = Waveform::idft(rs2);
+                // Waveform::realseq_t rs2_t = Waveform::idft(rs2);
+                Waveform::realseq_t rs2_t = Waveform::real(Aux::inv(m_dft, rs2));
                 Waveform::realseq_t rs2_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs2_t.size())) break;
                     rs2_reduced.at(icol) = rs2_t[icol];
                 }
-                rs2 = Waveform::dft(rs2_reduced);
+                //rs2 = Waveform::dft(rs2_reduced);
+                rs2 = Aux::fwd(m_dft, Waveform::complex(rs2_reduced));
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     resp_f_w(irow + 1, icol) = rs1[icol];
                     resp_f_w(end_ch - start_ch - 1 - irow + 2 * npad_wire, icol) = rs2[icol];
@@ -257,13 +200,16 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             // std::cout << i << std::endl;
 
             // Do FFT on wire for response // slight larger
-            resp_f_w = Array::dft_cc(resp_f_w, 1);  // Now becomes the f and f in both time and wire domain ...
+            // resp_f_w = Array::dft_cc(resp_f_w, 1);  // Now becomes the f and f in both time and wire domain ...
+            resp_f_w = Aux::fwd(m_dft, resp_f_w, 0);
+
             // multiply them together
             c_data = c_data * resp_f_w;
         }
 
         // Do inverse FFT on wire
-        c_data = Array::idft_cc(c_data, 1);
+        // c_data = Array::idft_cc(c_data, 1);
+        c_data = Aux::inv(m_dft, c_data, 0);
 
         // Add to wire result in frequency
         acc_data_f_w += c_data;
@@ -290,18 +236,14 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             //      std::cout << i << " " << m_vec_vec_charge.at(i).size() << std::endl;
             m_vec_vec_charge.at(i).clear();
             m_vec_vec_charge.at(i).shrink_to_fit();
-            // for (int k=0; k<m_vec_spmatrix.at(i)->outerSize(); ++k)
-            // 	for (Eigen::SparseMatrix<float>::InnerIterator it(*m_vec_spmatrix.at(i),k); it; ++it){
-            // 	  data_t_w(it.col()+npad_wire-start_ch,it.row()-m_start_tick) = it.value();
-            // 	}
-            // delete m_vec_spmatrix.at(i);
-            // //      m_vec_spmatrix.at(i).setZero();
-            // // m_vec_spmatrix.at(i).resize(0,0);
 
             // Do FFT on time
-            data_f_w = Array::dft_rc(data_t_w, 0);
+            // data_f_w = Array::dft_rc(data_t_w, 0);
             // Do FFT on wire
-            data_f_w = Array::dft_cc(data_f_w, 1);
+            // data_f_w = Array::dft_cc(data_f_w, 1);
+            data_f_w = data_t_w.cast<IDFT::complex_t>();
+            data_f_w = Aux::fwd(m_dft, data_f_w);
+
         }
 
         {
@@ -310,16 +252,10 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
 
             {
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[0]->spectrum();
-                // Array::array_xxc temp_resp_f_w = Array::array_xxc::Zero(2*m_num_pad_wire+1,nsamples);
-                // for (int icol = 0; icol != nsamples; icol++){
-                //   temp_resp_f_w(0,icol) = rs1[icol];
-                // }
-                // Array::array_xxf temp_resp_t_w =
-                // Array::idft_cr(temp_resp_f_w,0).block(0,0,2*m_num_pad_wire+1,m_end_tick-m_start_tick); temp_resp_f_w
-                // = Array::dft_rc(temp_resp_t_w,0);
 
                 // do a inverse FFT
-                Waveform::realseq_t rs1_t = Waveform::idft(rs1);
+                // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
+                Waveform::realseq_t rs1_t = Waveform::real(Aux::inv(m_dft, rs1));
                 // pick the first xxx ticks
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 // std::cout << rs1.size() << " " << nsamples << " " << m_end_tick << " " <<  m_start_tick << std::endl;
@@ -329,7 +265,8 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                     //  std::cout << icol << " " << rs1_t[icol] << std::endl;
                 }
                 // do a FFT
-                rs1 = Waveform::dft(rs1_reduced);
+                // rs1 = Waveform::dft(rs1_reduced);
+                rs1 = Aux::fwd(m_dft, Waveform::complex(rs1_reduced));
 
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     //   std::cout << icol << " " << rs1[icol] << " " << temp_resp_f_w(0,icol) << std::endl;
@@ -338,131 +275,51 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             }
             for (int irow = 0; irow != m_num_pad_wire; irow++) {
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[irow + 1]->spectrum();
-                Waveform::realseq_t rs1_t = Waveform::idft(rs1);
+                // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
+                Waveform::realseq_t rs1_t = Waveform::real(Aux::inv(m_dft, rs1));
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs1_t.size())) break;
                     rs1_reduced.at(icol) = rs1_t[icol];
                 }
-                rs1 = Waveform::dft(rs1_reduced);
+                // rs1 = Waveform::dft(rs1_reduced);
+                rs1 = Aux::fwd(m_dft, Waveform::complex(rs1_reduced));
                 Waveform::compseq_t rs2 = m_vec_map_resp.at(i)[-irow - 1]->spectrum();
-                Waveform::realseq_t rs2_t = Waveform::idft(rs2);
+                // Waveform::realseq_t rs2_t = Waveform::idft(rs2);
+                Waveform::realseq_t rs2_t = Waveform::real(Aux::inv(m_dft, rs2));
                 Waveform::realseq_t rs2_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs2_t.size())) break;
                     rs2_reduced.at(icol) = rs2_t[icol];
                 }
-                rs2 = Waveform::dft(rs2_reduced);
+                // rs2 = Waveform::dft(rs2_reduced);
+                rs2 = Aux::fwd(m_dft, Waveform::complex(rs2_reduced));
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     resp_f_w(irow + 1, icol) = rs1[icol];
                     resp_f_w(end_ch - start_ch - 1 - irow + 2 * npad_wire, icol) = rs2[icol];
                 }
-                // for (int icol = 0; icol != nsamples; icol++){
-                //   resp_f_w(irow+1,icol) = rs1[icol];
-                //   resp_f_w(end_ch-start_ch-1-irow+2*npad_wire,icol) = rs2[icol];
-                // }
             }
             // Do FFT on wire for response // slight larger
-            resp_f_w = Array::dft_cc(resp_f_w, 1);  // Now becomes the f and f in both time and wire domain ...
+            // resp_f_w = Array::dft_cc(resp_f_w, 1);  // Now becomes the f and f in both time and wire domain ...
+            resp_f_w = Aux::fwd(m_dft, resp_f_w, 0);
             // multiply them together
             data_f_w = data_f_w * resp_f_w;
         }
 
         // Do inverse FFT on wire
-        data_f_w = Array::idft_cc(data_f_w, 1);
+        // data_f_w = Array::idft_cc(data_f_w, 1);
+        data_f_w = Aux::inv(m_dft, data_f_w, 0);
 
         // Add to wire result in frequency
         acc_data_f_w += data_f_w;
     }
 
-    // m_decon_data = Array::array_xxc::Zero(nwires,nsamples);
-    //    if (npad_wire!=0){
-    acc_data_f_w = Array::idft_cc(acc_data_f_w, 0);  //.block(npad_wire,0,nwires,nsamples);
+    // acc_data_f_w = Array::idft_cc(acc_data_f_w, 0);
+    acc_data_f_w = Aux::inv(m_dft, acc_data_f_w, 1); 
     Array::array_xxf real_m_decon_data = acc_data_f_w.real();
     Array::array_xxf img_m_decon_data = acc_data_f_w.imag().colwise().reverse();
     m_decon_data = real_m_decon_data + img_m_decon_data;
 
-    // std::cout << real_m_decon_data(40,5182) << " " << img_m_decon_data(40,5182) << std::endl;
-    //    std::cout << real_m_decon_data(40,5182-m_start_tick) << " " << img_m_decon_data(40,5182-m_start_tick) <<
-    //    std::endl;
-
-    //}else{
-    // Array::array_xxc temp_m_decon_data = Array::idft_cc(acc_data_f_w,0);
-    //   Array::array_xxf real_m_decon_data = temp_m_decon_data.real();
-    //   Array::array_xxf img_m_decon_data = temp_m_decon_data.imag().rowwise().reverse();
-    //   m_decon_data = real_m_decon_data + img_m_decon_data;
-    // }
-
-    // // prepare FFT, loop 11 of them ... (older version)
-    // for (size_t i=0;i!=m_vec_vec_charge.size();i++){
-    //   // fill response array in frequency domain
-    //   if (i!=10) continue;
-
-    //   Array::array_xxc data_f_w;
-    //   {
-    // 	Array::array_xxf data_t_w = Array::array_xxf::Zero(nwires+2*npad_wire,nsamples);
-    // 	// fill charge array in time-wire domain // slightly larger
-    // 	for (size_t j=0;j!=m_vec_vec_charge.at(i).size();j++){
-    // 	  data_t_w(std::get<0>(m_vec_vec_charge.at(i).at(j))+npad_wire,std::get<1>(m_vec_vec_charge.at(i).at(j))) +=
-    // std::get<2>(m_vec_vec_charge.at(i).at(j));
-    // 	}
-    // 	m_vec_vec_charge.at(i).clear();
-
-    // 	// Do FFT on time
-    // 	data_f_w = Array::dft_rc(data_t_w,0);
-    // 	// Do FFT on wire
-    // 	data_f_w = Array::dft_cc(data_f_w,1);
-    //   }
-
-    //   {
-    // 	Array::array_xxc resp_f_w = Array::array_xxc::Zero(nwires+2*npad_wire,nsamples);
-    // 	{
-    // 	  Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[0]->spectrum();
-    // 	  for (int icol = 0; icol != nsamples; icol++){
-    // 	    resp_f_w(0,icol) = rs1[icol];
-    // 	  }
-    // 	}
-    // 	for (int irow = 0; irow!=m_num_pad_wire;irow++){
-    // 	  Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[irow+1]->spectrum();
-    // 	  Waveform::compseq_t rs2 = m_vec_map_resp.at(i)[-irow-1]->spectrum();
-    // 	  for (int icol = 0; icol != nsamples; icol++){
-    // 	    resp_f_w(irow+1,icol) = rs1[icol];
-    // 	    resp_f_w(nwires-1-irow+2*npad_wire,icol) = rs2[icol];
-    // 	  }
-    // 	}
-    // 	// Do FFT on wire for response // slight larger
-    // 	resp_f_w = Array::dft_cc(resp_f_w,1); // Now becomes the f and f in both time and wire domain ...
-    // 	// multiply them together
-    // 	data_f_w = data_f_w * resp_f_w;
-    //   }
-
-    //   // Do inverse FFT on wire
-    //   data_f_w = Array::idft_cc(data_f_w,1);
-
-    //   // Add to wire result in frequency
-    //   acc_data_f_w += data_f_w;
-    // }
-    // m_vec_vec_charge.clear();
-
-    // // do inverse FFT on time for the final results ...
-
-    // if (npad_wire!=0){
-    //   Array::array_xxf temp_m_decon_data = Array::idft_cr(acc_data_f_w,0);
-    //   m_decon_data = temp_m_decon_data.block(npad_wire,0,nwires,nsamples);
-    // }else{
-    //   m_decon_data = Array::idft_cr(acc_data_f_w,0);
-    // }
-
-    //    std::cout << m_decon_data(40,5195-m_start_tick)/units::mV << " " <<
-    //    m_decon_data(40,5195-m_start_tick)/units::mV << std::endl;
-
-    //  m_vec_spmatrix.clear();
-    // m_vec_spmatrix.shrink_to_fit();
-
-    // int nrows = resp_f_w.rows();
-    // int ncols = resp_f_w.cols();
-    // log->debug("ImpactTransform: # of channels: {} # of ticks: {}", m_decon_data.rows(), m_decon_data.cols());
-
 }  // constructor
 
 Gen::ImpactTransform::~ImpactTransform() {}
@@ -479,9 +336,6 @@ Waveform::realseq_t Gen::ImpactTransform::waveform(int iwire) const
             if (i >= m_start_tick && i < m_end_tick) {
                 wf.at(i) = m_decon_data(iwire - m_start_ch, i - m_start_tick);
             }
-            else {
-                // wf.at(i) = 1e-25;
-            }
             // std::cout << m_decon_data(iwire-m_start_ch,i-m_start_tick) << std::endl;
         }
 
@@ -489,19 +343,20 @@ Waveform::realseq_t Gen::ImpactTransform::waveform(int iwire) const
             // now convolute with the long-range response ...
             const size_t nlength = fft_best_length(nsamples + m_pir->closest(0)->long_aux_waveform_pad());
 
-            // nlength = nsamples;
-
             //   std::cout << nlength << " " << nsamples + m_pir->closest(0)->long_aux_waveform_pad() << std::endl;
 
             wf.resize(nlength, 0);
             Waveform::realseq_t long_resp = m_pir->closest(0)->long_aux_waveform();
             long_resp.resize(nlength, 0);
-            Waveform::compseq_t spec = Waveform::dft(wf);
-            Waveform::compseq_t long_spec = Waveform::dft(long_resp);
+            // Waveform::compseq_t spec = Waveform::dft(wf);
+            Waveform::compseq_t spec = Aux::fwd(m_dft, Waveform::complex(wf));
+            // Waveform::compseq_t long_spec = Waveform::dft(long_resp);
+            Waveform::compseq_t long_spec = Aux::fwd(m_dft, Waveform::complex(long_resp));
             for (size_t i = 0; i != nlength; i++) {
                 spec.at(i) *= long_spec.at(i);
             }
-            wf = Waveform::idft(spec);
+            // wf = Waveform::idft(spec);
+            wf = Waveform::real(Aux::inv(m_dft, spec));
             wf.resize(nsamples, 0);
         }
 
diff --git a/gen/src/Noise.cxx b/gen/src/Noise.cxx
index 8fbb86ad0..ee8350b97 100644
--- a/gen/src/Noise.cxx
+++ b/gen/src/Noise.cxx
@@ -4,7 +4,7 @@
 
 using namespace WireCell;
 
-Waveform::realseq_t Gen::Noise::generate_waveform(const std::vector<float>& spec, IRandom::pointer rng, double replace)
+Waveform::compseq_t Gen::Noise::generate_spectrum(const std::vector<float>& spec, IRandom::pointer rng, double replace)
 {
     // reuse randomes a bit to optimize speed.
     static std::vector<double> random_real_part;
@@ -49,6 +49,7 @@ Waveform::realseq_t Gen::Noise::generate_waveform(const std::vector<float>& spec
         noise_freq.at(i + int(spec.size()) - shift).imag(random_imag_part.at(i) * amplitude);
     }
 
-    Waveform::realseq_t noise_time = WireCell::Waveform::idft(noise_freq);
-    return noise_time;
+    return noise_freq;
+    // Waveform::realseq_t noise_time = WireCell::Waveform::idft(noise_freq);
+    // return noise_time;
 }
diff --git a/gen/src/Noise.h b/gen/src/Noise.h
index a671dad40..4f8e21d4d 100644
--- a/gen/src/Noise.h
+++ b/gen/src/Noise.h
@@ -1,18 +1,16 @@
 // This is some "private" code shared by a couple of components in gen.
-//
-// fixme: this is a candidate for turning into an interface.
 
 #include "WireCellIface/IRandom.h"
 #include "WireCellUtil/Waveform.h"
 
 #include <vector>
 
-namespace WireCell {
-    namespace Gen {
-        namespace Noise {
-            // Generate a time series waveform given a spectral amplitude
-            WireCell::Waveform::realseq_t generate_waveform(const std::vector<float>& spec, IRandom::pointer rng,
-                                                            double replace = 0.02);
-        }  // namespace Noise
-    }      // namespace Gen
-}  // namespace WireCell
+namespace WireCell::Gen::Noise {
+    // Generate a time series waveform given a spectral amplitude
+    // WireCell::Waveform::realseq_t generate_waveform(const std::vector<float>& spec, IRandom::pointer rng,
+    //                                                 double replace = 0.02);
+
+    // Generate specific noise spectrum.  Caller likely wants to Aux::inv() it and take Waveform::real().
+    WireCell::Waveform::compseq_t generate_spectrum(const std::vector<float>& spec, IRandom::pointer rng,
+                                                    double replace = 0.02);
+}
diff --git a/gen/src/NoiseSource.cxx b/gen/src/NoiseSource.cxx
index 28e511044..48dfc5334 100644
--- a/gen/src/NoiseSource.cxx
+++ b/gen/src/NoiseSource.cxx
@@ -1,5 +1,7 @@
 #include "WireCellGen/NoiseSource.h"
 
+#include "WireCellAux/DftTools.h"
+
 #include "WireCellIface/SimpleTrace.h"
 #include "WireCellIface/SimpleFrame.h"
 
@@ -48,6 +50,7 @@ WireCell::Configuration Gen::NoiseSource::default_configuration() const
     cfg["anode"] = m_anode_tn;
     cfg["model"] = m_model_tn;
     cfg["rng"] = m_rng_tn;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     cfg["nsamples"] = m_nsamples;
     cfg["replacement_percentage"] = m_rep_percent;
     return cfg;
@@ -60,6 +63,8 @@ void Gen::NoiseSource::configure(const WireCell::Configuration& cfg)
     if (!m_rng) {
         THROW(KeyError() << errmsg{"failed to get IRandom: " + m_rng_tn});
     }
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
 
     m_anode_tn = get(cfg, "anode", m_anode_tn);
     m_anode = Factory::find_tn<IAnodePlane>(m_anode_tn);
@@ -104,7 +109,10 @@ bool Gen::NoiseSource::operator()(IFrame::pointer& frame)
     for (auto chid : m_anode->channels()) {
         const auto& spec = (*m_model)(chid);
 
-        Waveform::realseq_t noise = Gen::Noise::generate_waveform(spec, m_rng, m_rep_percent);
+        //Waveform::realseq_t noise = Gen::Noise::generate_waveform(spec, m_rng, m_rep_percent);
+        auto cnoise = Gen::Noise::generate_spectrum(spec, m_rng, m_rep_percent);
+        auto noise = Waveform::real(Aux::inv(m_dft, cnoise));
+
         //	std::cout << noise.size() << " " << nsamples << std::endl;
         noise.resize(m_nsamples, 0);
         auto trace = make_shared<SimpleTrace>(chid, tbin, noise);
diff --git a/gen/src/PlaneImpactResponse.cxx b/gen/src/PlaneImpactResponse.cxx
index c4ce24bf5..1d875fe3a 100644
--- a/gen/src/PlaneImpactResponse.cxx
+++ b/gen/src/PlaneImpactResponse.cxx
@@ -1,10 +1,16 @@
+#include "WireCellGen/PlaneImpactResponse.h"
+
+#include "WireCellAux/DftTools.h"
+
 #include "WireCellIface/IFieldResponse.h"
 #include "WireCellIface/IWaveform.h"
-#include "WireCellGen/PlaneImpactResponse.h"
+#include "WireCellIface/IDFT.h"
+
 #include "WireCellUtil/Testing.h"
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/FFTBestLength.h"
 
+
 WIRECELL_FACTORY(PlaneImpactResponse,
                  WireCell::Gen::PlaneImpactResponse,
                  WireCell::INamed,
@@ -41,6 +47,7 @@ WireCell::Configuration Gen::PlaneImpactResponse::default_configuration() const
     cfg["nticks"] = 10000;
     // sample period of response waveforms
     cfg["tick"] = 0.5 * units::us;
+    cfg["dft"] = m_dftname;     // type-name for the DFT to use
     return cfg;
 }
 
@@ -73,11 +80,14 @@ void Gen::PlaneImpactResponse::configure(const WireCell::Configuration& cfg)
     m_nbins = (size_t) get(cfg, "nticks", (int) m_nbins);
     m_tick = get(cfg, "tick", m_tick);
 
+    m_dftname = get<std::string>(cfg, "dft", m_dftname);
     build_responses();
 }
 
 void Gen::PlaneImpactResponse::build_responses()
 {
+    auto dft = Factory::find_tn<IDFT>(m_dftname);
+
     auto ifr = Factory::find_tn<IFieldResponse>(m_frname);
 
     const size_t n_short_length = fft_best_length(m_overall_short_padding / m_tick);
@@ -101,7 +111,8 @@ void Gen::PlaneImpactResponse::build_responses()
         }
         // note: we are ignoring waveform_start which will introduce
         // an arbitrary phase shift....
-        auto spec = Waveform::dft(wave);
+        // auto spec = Waveform::dft(wave);
+        auto spec = Aux::fwd(dft, Waveform::complex(wave));
         for (size_t ibin = 0; ibin < n_short_length; ++ibin) {
             short_spec[ibin] *= spec[ibin];
         }
@@ -127,14 +138,16 @@ void Gen::PlaneImpactResponse::build_responses()
         }
         // note: we are ignoring waveform_start which will introduce
         // an arbitrary phase shift....
-        auto spec = Waveform::dft(wave);
+        // auto spec = Waveform::dft(wave);
+        auto spec = Aux::fwd(dft, Waveform::complex(wave));
         for (size_t ibin = 0; ibin < n_long_length; ++ibin) {
             long_spec[ibin] *= spec[ibin];
         }
     }
     WireCell::Waveform::realseq_t long_wf;
-    if (nlong > 0) long_wf = Waveform::idft(long_spec);
-
+    if (nlong > 0) {
+        long_wf = Waveform::real(Aux::inv(dft, long_spec));
+    }
     const auto& fr = ifr->field_response();
     const auto& pr = *fr.plane(m_plane_ident);
     const int npaths = pr.paths.size();
@@ -219,7 +232,8 @@ void Gen::PlaneImpactResponse::build_responses()
             // sum up over coarse ticks.
             wave[bin] += induced_charge;
         }
-        WireCell::Waveform::compseq_t spec = Waveform::dft(wave);
+        // WireCell::Waveform::compseq_t spec = Waveform::dft(wave);
+        WireCell::Waveform::compseq_t spec = Aux::fwd(dft, Waveform::complex(wave));
 
         // Convolve with short responses
         if (nshort) {
@@ -227,7 +241,9 @@ void Gen::PlaneImpactResponse::build_responses()
                 spec[find] *= short_spec[find];
             }
         }
-        Waveform::realseq_t wf = Waveform::idft(spec);
+        // Waveform::realseq_t wf = Waveform::idft(spec);
+        Waveform::realseq_t wf = Waveform::real(Aux::inv(dft, spec));
+
         wf.resize(m_nbins, 0);
 
         IImpactResponse::pointer ir =
diff --git a/gen/src/TruthSmearer.cxx b/gen/src/TruthSmearer.cxx
index eb70632eb..9bc19459c 100644
--- a/gen/src/TruthSmearer.cxx
+++ b/gen/src/TruthSmearer.cxx
@@ -1,6 +1,6 @@
 #include "WireCellGen/TruthSmearer.h"
 #include "WireCellGen/BinnedDiffusion.h"
-#include "WireCellGen/ImpactZipper.h"
+
 #include "WireCellUtil/Units.h"
 #include "WireCellUtil/Point.h"
 #include "WireCellUtil/NamedFactory.h"
@@ -97,6 +97,9 @@ WireCell::Configuration Gen::TruthSmearer::default_configuration() const
     put(cfg, "anode", m_anode_tn);
     put(cfg, "rng", m_rng_tn);
 
+    // Name for the DFTer
+    cfg["dft"] = "FftwDFT";
+
     return cfg;
 }
 
@@ -118,6 +121,9 @@ void Gen::TruthSmearer::configure(const WireCell::Configuration& cfg)
         m_rng = Factory::find_tn<IRandom>(m_rng_tn);
     }
 
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     m_readout_time = get<double>(cfg, "readout_time", m_readout_time);
     m_tick = get<double>(cfg, "tick", m_tick);
     m_start_time = get<double>(cfg, "start_time", m_start_time);
@@ -165,7 +171,7 @@ void Gen::TruthSmearer::process(output_queue& frames)
                 tick = tbins.binsize();
             }
 
-            Gen::BinnedDiffusion bindiff(*pimpos, tbins, m_nsigma, m_rng);
+            Gen::BinnedDiffusion bindiff(*pimpos, m_dft, tbins, m_nsigma, m_rng);
             for (auto depo : face_depos) {
                 // time filter smearing
                 double extent_time = depo->extent_long() / m_drift_speed;
@@ -193,9 +199,6 @@ void Gen::TruthSmearer::process(output_queue& frames)
             const double impact = ib.binsize();
             const int nwires = rb.nbins();
             for (int iwire = 0; iwire < nwires; ++iwire) {
-                ///  Similar to ImpactZipper::waveform
-                ///  No convolution
-                ///  m_waveform from BinnedDiffusion::impact_data()
 
                 const double wire_pos = rb.center(iwire);
 
@@ -239,7 +242,7 @@ void Gen::TruthSmearer::process(output_queue& frames)
 
                     Waveform::realseq_t charge_spectrum = id->waveform();
                     if (charge_spectrum.empty()) {
-                        std::cerr << "impactZipper: no charge spectrum for absolute impact number: " << imp << endl;
+                        std::cerr << "TruthSmearer: no charge spectrum for absolute impact number: " << imp << endl;
                         continue;
                     }
 
diff --git a/gen/src/TruthTraceID.cxx b/gen/src/TruthTraceID.cxx
index df60ecba1..16d8bc33b 100644
--- a/gen/src/TruthTraceID.cxx
+++ b/gen/src/TruthTraceID.cxx
@@ -1,10 +1,14 @@
 #include "WireCellGen/TruthTraceID.h"
 #include "WireCellGen/BinnedDiffusion.h"
+
+#include "WireCellAux/DftTools.h"
+
+#include "WireCellIface/SimpleTrace.h"
+#include "WireCellIface/SimpleFrame.h"
+
 #include "WireCellUtil/Units.h"
 #include "WireCellUtil/Point.h"
 #include "WireCellUtil/NamedFactory.h"
-#include "WireCellIface/SimpleTrace.h"
-#include "WireCellIface/SimpleFrame.h"
 
 #include <string>
 
@@ -54,6 +58,7 @@ WireCell::Configuration Gen::TruthTraceID::default_configuration() const
     put(cfg, "first_frame_number", m_frame_count);
     put(cfg, "anode", m_anode_tn);
     put(cfg, "rng", m_rng_tn);
+    put(cfg, "dft", "FftwDFT"); // type-name for the DFT to use
     put(cfg, "truth_type", m_truth_type);
     put(cfg, "number_induction_wire", m_num_ind_wire);
     put(cfg, "number_collection_wire", m_num_col_wire);
@@ -86,6 +91,8 @@ void Gen::TruthTraceID::configure(const WireCell::Configuration& cfg)
         m_rng_tn = get(cfg, "rng", m_rng_tn);
         m_rng = Factory::find_tn<IRandom>(m_rng_tn);
     }
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
 
     m_readout_time = get<double>(cfg, "readout_time", m_readout_time);
     m_tick = get<double>(cfg, "tick", m_tick);
@@ -139,7 +146,7 @@ void Gen::TruthTraceID::process(output_queue& frames)
             auto timeTruth = hf_time.generate(timeBins);
 
             // ### apply diffusion at wire plane ###
-            Gen::BinnedDiffusion bindiff(*pimpos, tbins, m_nsigma, m_rng);
+            Gen::BinnedDiffusion bindiff(*pimpos, m_dft, tbins, m_nsigma, m_rng);
             for (auto depo : m_depos) {
                 bindiff.add(depo, depo->extent_long() / m_drift_speed, depo->extent_tran());
 
@@ -193,8 +200,9 @@ void Gen::TruthTraceID::process(output_queue& frames)
                     }
                     bindiff.erase(0, min_impact);
 
-                    Waveform::realseq_t wave(nsamples, 0.0);
-                    wave = Waveform::idft(total_spectrum);
+                    // Waveform::realseq_t wave(nsamples, 0.0);
+                    // wave = Waveform::idft(total_spectrum);
+                    Waveform::realseq_t wave = Waveform::real(Aux::inv(m_dft, total_spectrum));
                     auto mm = Waveform::edge(wave);
                     if (mm.first == (int) wave.size()) {
                         continue;
diff --git a/gen/test/test_empnomo.cxx b/gen/test/test_empnomo.cxx
index 2e7269761..0565647a6 100644
--- a/gen/test/test_empnomo.cxx
+++ b/gen/test/test_empnomo.cxx
@@ -5,6 +5,7 @@
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellIface/IChannelStatus.h"
 #include "WireCellIface/IChannelSpectrum.h"
+#include "WireCellIface/IDFT.h"
 
 #include <cstdlib>
 #include <string>
@@ -16,6 +17,9 @@ using namespace WireCell;
 
 int main(int argc, char* argv[])
 {
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+
     std::string detector = "uboone";
 
     // In the real WCT this is done by wire-cell and driven by user
@@ -25,6 +29,9 @@ int main(int argc, char* argv[])
     cerr << "Using AnodePlane: \"" << anode_tns[0] << "\"\n";
 
     {
+        {
+            Factory::lookup_tn<IDFT>("FftwDFT");
+        }
         {
             auto icfg = Factory::lookup<IConfigurable>("StaticChannelStatus");
             // In the real app this would be in a JSON or Jsonnet config
diff --git a/gen/test/test_pir.cxx b/gen/test/test_pir.cxx
index 0846c6a70..016aba3ac 100644
--- a/gen/test/test_pir.cxx
+++ b/gen/test/test_pir.cxx
@@ -1,7 +1,10 @@
+#include "WireCellGen/PlaneImpactResponse.h"
+
+#include "WireCellIface/IDFT.h"
+
 #include "WireCellUtil/PluginManager.h"
 #include "WireCellUtil/Testing.h"
 #include "WireCellUtil/NamedFactory.h"
-#include "WireCellGen/PlaneImpactResponse.h"
 #include "WireCellUtil/Units.h"
 #include "WireCellUtil/Logging.h"
 
@@ -16,6 +19,7 @@ int main(int argc, char* argv[]) {
     Log::set_level("debug");
 
     PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
     pm.add("WireCellGen");
     pm.add("WireCellSigProc");
 
@@ -24,6 +28,9 @@ int main(int argc, char* argv[]) {
         response_file = argv[1];
     };
 
+    {
+        Factory::lookup_tn<IDFT>("FftwDFT");
+    }
     {
         auto icfg = Factory::lookup<IConfigurable>("FieldResponse");
         auto cfg = icfg->default_configuration();
diff --git a/util/inc/WireCellUtil/Array.h b/util/inc/WireCellUtil/Array.h
index 00504775c..2b30a272e 100644
--- a/util/inc/WireCellUtil/Array.h
+++ b/util/inc/WireCellUtil/Array.h
@@ -73,7 +73,11 @@ namespace WireCell {
 
         /** Partial, 1D DFT and inverse DFT along one dimension of an
          * array.  Each row is transformed if dim=0, each column if
-         * dim=1.  The transfer is either real->complex (rc),
+         * dim=1.  
+         *
+         * NOTE: this is backward from numpy.fft and IDFT convention!.
+         *
+         * The transfer is either real->complex (rc),
          * complex->complex(cc) or complex->real(cr).
          *
          * The full 2D DFT should be used unless an intermediate

From c499a53d6884938bbb58a2b20b4110282b1841b0 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 23 Nov 2021 16:25:54 -0500
Subject: [PATCH 27/46] First draft removal of hard-wired DFT in favor of IDFT.

Tests still needed.
---
 aux/inc/WireCellAux/DftTools.h                |  72 ++-
 aux/src/DftTools.cxx                          | 100 +++--
 aux/src/TaggedTensorSetFrame.cxx              |   2 +
 aux/test/test_taggedframetensorset.cxx        |   2 +
 gen/inc/WireCellGen/Misconfigure.h            |   3 +
 gen/inc/WireCellGen/PerChannelVariation.h     |   4 +
 gen/inc/WireCellGen/PlaneImpactResponse.h     |   6 +-
 gen/src/EmpiricalNoiseModel.cxx               |   4 +-
 gen/src/ImpactData.cxx                        |   4 +-
 gen/src/ImpactTransform.cxx                   |  30 +-
 gen/src/Misconfigure.cxx                      |  21 +-
 gen/src/NoiseSource.cxx                       |   2 +-
 gen/src/PerChannelVariation.cxx               |  22 +-
 gen/src/PlaneImpactResponse.cxx               |  14 +-
 gen/src/TruthTraceID.cxx                      |   2 +-
 root/test/test_binneddiffusion.cxx            |  13 +-
 root/test/test_convo.cxx                      |  15 +-
 root/test/test_convo_binning.cxx              |  21 +-
 root/test/test_fft.cxx                        |  29 +-
 root/test/test_fft_speed.cxx                  |  15 +-
 root/test/test_fieldresp.cxx                  |  14 +-
 root/test/test_impactresponse.cxx             |  22 +-
 root/test/test_impactzipper.cxx               | 421 ------------------
 root/test/test_misconfigure.cxx               |  20 +-
 root/test/test_rcresponse.cxx                 |  10 +-
 sig/inc/WireCellSig/Decon2DFilter.h           |   5 +-
 sig/inc/WireCellSig/Decon2DResponse.h         |   6 +-
 sig/src/Decon2DFilter.cxx                     |  33 +-
 sig/src/Decon2DResponse.cxx                   |  65 ++-
 sigproc/inc/WireCellSigProc/L1SPFilter.h      |   5 +-
 sigproc/inc/WireCellSigProc/Microboone.h      |  18 +-
 .../inc/WireCellSigProc/OmniChannelNoiseDB.h  |   2 +
 sigproc/inc/WireCellSigProc/OmnibusSigProc.h  |   9 +-
 sigproc/inc/WireCellSigProc/Protodune.h       |  19 +-
 .../WireCellSigProc/SimpleChannelNoiseDB.h    |  11 +-
 sigproc/src/L1SPFilter.cxx                    |  42 +-
 sigproc/src/Microboone.cxx                    | 166 ++-----
 sigproc/src/OmniChannelNoiseDB.cxx            |  21 +-
 sigproc/src/OmnibusSigProc.cxx                | 106 +++--
 sigproc/src/Protodune.cxx                     | 182 ++------
 sigproc/src/SimpleChannelNoiseDB.cxx          |  25 +-
 sigproc/test/test_partial.cxx                 |  12 +-
 sigproc/test/test_simple_channel_noisedb.cxx  |   8 +
 sigproc/test/test_zero_padding.cxx            |  12 +-
 util/inc/WireCellUtil/Array.h                 |  14 +-
 util/inc/WireCellUtil/Waveform.h              |  54 +--
 util/src/Array.cxx                            | 406 ++++++++---------
 util/src/Waveform.cxx                         | 148 +++---
 util/test/test_array.cxx                      | 170 +++----
 util/test/test_waveform.cxx                   |  25 --
 50 files changed, 1083 insertions(+), 1349 deletions(-)
 delete mode 100644 root/test/test_impactzipper.cxx

diff --git a/aux/inc/WireCellAux/DftTools.h b/aux/inc/WireCellAux/DftTools.h
index 72b2d789a..b072fc684 100644
--- a/aux/inc/WireCellAux/DftTools.h
+++ b/aux/inc/WireCellAux/DftTools.h
@@ -16,36 +16,87 @@ namespace WireCell::Aux {
 
     // std::vector based functions
 
-    using dft_vector_t = std::vector<complex_t>;
+    using real_vector_t = std::vector<float>;
+    using complex_vector_t = std::vector<complex_t>;
 
     // 1D with vectors
 
-    inline dft_vector_t fwd(const IDFT::pointer& dft, const dft_vector_t& seq)
+    // Perform forward c2c transform on vector.
+    inline complex_vector_t fwd(const IDFT::pointer& dft, const complex_vector_t& seq)
     {
-        dft_vector_t ret(seq.size());
+        complex_vector_t ret(seq.size());
         dft->fwd1d(seq.data(), ret.data(), ret.size());
         return ret;
     }
 
-    inline dft_vector_t inv(const IDFT::pointer& dft, const dft_vector_t& spec)
+    // Perform forward r2c transform on vector.
+    inline complex_vector_t fwd_r2c(const IDFT::pointer& dft, const real_vector_t& vec)
     {
-        dft_vector_t ret(spec.size());
+        complex_vector_t cvec(vec.size());
+        std::transform(vec.begin(), vec.end(), cvec.begin(),
+                       [](float re) { return Aux::complex_t(re,0.0); } );
+        return fwd(dft, cvec);
+    }
+
+    // Perform inverse c2c transform on vector.
+    inline complex_vector_t inv(const IDFT::pointer& dft, const complex_vector_t& spec)
+    {
+        complex_vector_t ret(spec.size());
         dft->inv1d(spec.data(), ret.data(), ret.size());
         return ret;
     }
 
+    // Perform inverse c2r transform on vector.
+    inline real_vector_t inv_c2r(const IDFT::pointer& dft, const complex_vector_t& spec)
+    {
+        auto cvec = inv(dft, spec);
+        real_vector_t rvec(cvec.size());
+        std::transform(cvec.begin(), cvec.end(), rvec.begin(),
+                       [](const Aux::complex_t& c) { return std::real(c); });
+        return rvec;
+        
+    }
+
+    // 1D high-level interface
+
+    /// Convovle in1 and in2.  Returned vecgtor has size sum of sizes
+    /// of in1 and in2 less one element in order to assure no periodic
+    /// aliasing.  Caller need not (should not) pad either input.
+    /// Caller is free to truncate result as required.
+    real_vector_t convolve(const IDFT::pointer& dft,
+                           const real_vector_t& in1,
+                           const real_vector_t& in2);
+
+
+    /// Replace response res1 in meas with response res2.
+    ///
+    /// This will compute the FFT of all three, in frequency space will form:
+    ///
+    ///     meas * resp2 / resp1
+    ///
+    /// apply the inverse FFT and return its real part.
+    ///
+    /// The output vector is long enough to assure no periodic
+    /// aliasing.  In general, caller should NOT pre-pad any input.
+    /// Any subsequent truncation of result is up to caller.
+    real_vector_t replace(const IDFT::pointer& dft,
+                          const real_vector_t& meas,
+                          const real_vector_t& res1,
+                          const real_vector_t& res2);
+
+
     // Eigen array based functions
 
     /// A complex, 2D array.  Use Array::cast<type>() if you need to
     /// convert to/from real.
-    using dft_array_t = Eigen::ArrayXXcf;
+    using complex_array_t = Eigen::ArrayXXcf;
     
     // 2D with Eigen arrays.  Use eg arr.cast<complex_>() to provde
     // from real or arr.real()() to convert result to real.
 
     // Transform both dimesions.
-    dft_array_t fwd(const IDFT::pointer& dft, const dft_array_t& arr);
-    dft_array_t inv(const IDFT::pointer& dft, const dft_array_t& arr);
+    complex_array_t fwd(const IDFT::pointer& dft, const complex_array_t& arr);
+    complex_array_t inv(const IDFT::pointer& dft, const complex_array_t& arr);
 
     // Transform a 2D array along one axis.
     //
@@ -60,9 +111,8 @@ namespace WireCell::Aux {
     // Note: internal storage order of an Eigen array may differ from
     // the logical order and indeed that of the array template type
     // order.  Neither is pertinent in setting the axis.
-    dft_array_t fwd(const IDFT::pointer& dft, const dft_array_t& arr, int axis);
-    dft_array_t inv(const IDFT::pointer& dft, const dft_array_t& arr, int axis);
-
+    complex_array_t fwd(const IDFT::pointer& dft, const complex_array_t& arr, int axis);
+    complex_array_t inv(const IDFT::pointer& dft, const complex_array_t& arr, int axis);
 
 }
 
diff --git a/aux/src/DftTools.cxx b/aux/src/DftTools.cxx
index 9623c5ca4..e0eb83e2c 100644
--- a/aux/src/DftTools.cxx
+++ b/aux/src/DftTools.cxx
@@ -1,4 +1,6 @@
 #include "WireCellAux/DftTools.h"
+#include <algorithm>
+
 
 using namespace WireCell;
 using namespace WireCell::Aux;
@@ -14,7 +16,7 @@ using ROWM = Eigen::Array<Aux::complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen:
 using COLM = Eigen::Array<Aux::complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen::ColMajor>;
 
 template<typename trans>
-Aux::dft_array_t doit(const Aux::dft_array_t& arr, trans func)
+Aux::complex_array_t doit(const Aux::complex_array_t& arr, trans func)
 {
     // Nominally, eigen storage memory is in column-major order
     const Aux::complex_t* in_data = arr.data();
@@ -28,7 +30,7 @@ Aux::dft_array_t doit(const Aux::dft_array_t& arr, trans func)
         nrows = arr.rows();
     }
 
-    Aux::dft_vector_t out_vec(nrows*ncols);
+    Aux::complex_vector_t out_vec(nrows*ncols);
     func(in_data, out_vec.data(), nrows, ncols);
 
     if (flipped) {
@@ -38,7 +40,7 @@ Aux::dft_array_t doit(const Aux::dft_array_t& arr, trans func)
 
 }
 
-Aux::dft_array_t Aux::fwd(const IDFT::pointer& dft, const Aux::dft_array_t& arr)
+Aux::complex_array_t Aux::fwd(const IDFT::pointer& dft, const Aux::complex_array_t& arr)
 {
     return doit(arr, [&](const complex_t* in_data,
                          complex_t* out_data,
@@ -47,7 +49,7 @@ Aux::dft_array_t Aux::fwd(const IDFT::pointer& dft, const Aux::dft_array_t& arr)
     });
 }
 
-Aux::dft_array_t Aux::inv(const IDFT::pointer& dft, const Aux::dft_array_t& arr)
+Aux::complex_array_t Aux::inv(const IDFT::pointer& dft, const Aux::complex_array_t& arr)
 {
     return doit(arr, [&](const complex_t* in_data,
                          complex_t* out_data,
@@ -56,10 +58,8 @@ Aux::dft_array_t Aux::inv(const IDFT::pointer& dft, const Aux::dft_array_t& arr)
     });
 }
 
-#include <iostream> // debug
-
 template<typename trans>
-Aux::dft_array_t doit1b(const Aux::dft_array_t& arr, int axis, trans func)
+Aux::complex_array_t doit1b(const Aux::complex_array_t& arr, int axis, trans func)
 {
     // We must provide a flat array with storage order such with
     // logical axis-major ordering.
@@ -67,14 +67,11 @@ Aux::dft_array_t doit1b(const Aux::dft_array_t& arr, int axis, trans func)
     const int nrows = arr.rows(); // "logical"
     const int ncols = arr.cols(); // shape
 
-    std::cerr << "nrows="<<nrows<<", ncols="<<ncols
-              << ", axis="<<axis<<", IsRowMajor:"<<arr.IsRowMajor<<"\n";
-
     // If storage order matches "axis-major"
     if ( (axis == 1 and arr.IsRowMajor)
          or
          (axis == 0 and not arr.IsRowMajor) ) {
-        Aux::dft_vector_t out_vec(nrows*ncols);
+        Aux::complex_vector_t out_vec(nrows*ncols);
         func(in_data, out_vec.data(), ncols, nrows);
         if (arr.IsRowMajor) {
             // note, returning makes a copy and will perform an actual
@@ -103,29 +100,76 @@ Aux::dft_array_t doit1b(const Aux::dft_array_t& arr, int axis, trans func)
 // - We then have column-wise storage order but IDFT assumes row-wise
 // - so we reverse (nrows, ncols) and meaning of axis.
 
-Aux::dft_array_t Aux::fwd(const IDFT::pointer& dft, const Aux::dft_array_t& arr, int axis)
+Aux::complex_array_t Aux::fwd(const IDFT::pointer& dft, 
+                              const Aux::complex_array_t& arr, 
+                              int axis)
 {
-    Aux::dft_array_t ret = arr; 
+    Aux::complex_array_t ret = arr; 
     dft->fwd1b(ret.data(), ret.data(), ret.cols(), ret.rows(), !axis);
     return ret;
-
-    // return doit1b(arr, axis,
-    //               [&](const complex_t* in_data,
-    //                   complex_t* out_data,
-    //                   int nrows, int ncols) {
-    //     dft->fwd1b(in_data, out_data, nrows, ncols);
-    // });
 }
 
-Aux::dft_array_t Aux::inv(const IDFT::pointer& dft, const Aux::dft_array_t& arr, int axis)
+Aux::complex_array_t Aux::inv(const IDFT::pointer& dft,
+                              const Aux::complex_array_t& arr,
+                              int axis)
 {
-    Aux::dft_array_t ret = arr; 
+    Aux::complex_array_t ret = arr; 
     dft->inv1b(ret.data(), ret.data(), ret.cols(), ret.rows(), !axis);
     return ret;
-    // return doit1b(arr, axis,
-    //               [&](const complex_t* in_data,
-    //                   complex_t* out_data,
-    //                   int nrows, int ncols) {
-    //     dft->inv1b(in_data, out_data, nrows, ncols);
-    // });
+}
+
+
+Aux::real_vector_t Aux::convolve(const IDFT::pointer& dft,
+                                 const Aux::real_vector_t& in1,
+                                 const Aux::real_vector_t& in2)
+{
+    size_t size = in1.size() + in2.size() - 1;
+    Aux::complex_vector_t cin1(size,0), cin2(size,0);
+
+    std::transform(in1.begin(), in1.end(), cin1.begin(),
+                   [](float re) { return Aux::complex_t(re,0.0); } );
+    std::transform(in2.begin(), in2.end(), cin2.begin(),
+                   [](float re) { return Aux::complex_t(re,0.0); } );
+
+    dft->fwd1d(cin1.data(), cin1.data(), size);
+    dft->fwd1d(cin2.data(), cin2.data(), size);
+
+    for (size_t ind=0; ind<size; ++ind) {
+        cin1[ind] *= cin2[ind];
+    }
+
+    Aux::real_vector_t ret(size);
+    std::transform(cin1.begin(), cin1.end(), ret.begin(),
+                   [](const complex_t& c) { return std::real(c); });
+    return ret;
+}
+
+Aux::real_vector_t Aux::replace(const IDFT::pointer& dft,
+                                const Aux::real_vector_t& meas,
+                                const Aux::real_vector_t& res1,
+                                const Aux::real_vector_t& res2)
+{
+    size_t sizes[3] = {meas.size(), res1.size(), res2.size()};
+    size_t size = sizes[0] + sizes[1] + sizes[2] - *std::min_element(sizes, sizes + 3) - 1;
+
+    Aux::complex_vector_t cmeas(size,0), cres1(size,0), cres2(size,0);
+    std::transform(meas.begin(), meas.end(), cmeas.begin(),
+                   [](float re) { return Aux::complex_t(re,0.0); } );
+    std::transform(res1.begin(), res1.end(), cres1.begin(),
+                   [](float re) { return Aux::complex_t(re,0.0); } );
+    std::transform(res2.begin(), res2.end(), cres2.begin(),
+                   [](float re) { return Aux::complex_t(re,0.0); } );
+
+    dft->fwd1d(cmeas.data(), cmeas.data(), size);
+    dft->fwd1d(cres1.data(), cres1.data(), size);
+    dft->fwd1d(cres2.data(), cres2.data(), size);
+
+    for (size_t ind=0; ind<size; ++ind) {
+        cmeas[ind] *= res2[ind]/res1[ind];
+    }
+    Aux::real_vector_t ret(size);
+    std::transform(cmeas.begin(), cmeas.end(), ret.begin(),
+                   [](const complex_t& c) { return std::real(c); });
+
+    return ret;
 }
diff --git a/aux/src/TaggedTensorSetFrame.cxx b/aux/src/TaggedTensorSetFrame.cxx
index 0a4c4db80..4cbbe7e23 100644
--- a/aux/src/TaggedTensorSetFrame.cxx
+++ b/aux/src/TaggedTensorSetFrame.cxx
@@ -4,6 +4,8 @@
 #include "WireCellIface/SimpleFrame.h"
 #include "WireCellUtil/NamedFactory.h"
 
+#include <Eigen/Core>
+
 WIRECELL_FACTORY(TaggedTensorSetFrame, WireCell::Aux::TaggedTensorSetFrame, WireCell::ITensorSetFrame,
                  WireCell::IConfigurable)
 
diff --git a/aux/test/test_taggedframetensorset.cxx b/aux/test/test_taggedframetensorset.cxx
index 529fda632..ee20a01a3 100644
--- a/aux/test/test_taggedframetensorset.cxx
+++ b/aux/test/test_taggedframetensorset.cxx
@@ -12,6 +12,8 @@
 #include "WireCellUtil/Testing.h"
 #include "WireCellUtil/Logging.h"
 
+#include <Eigen/Core>
+
 using namespace WireCell;
 
 int main()
diff --git a/gen/inc/WireCellGen/Misconfigure.h b/gen/inc/WireCellGen/Misconfigure.h
index 8c6da84a4..1bc59f664 100644
--- a/gen/inc/WireCellGen/Misconfigure.h
+++ b/gen/inc/WireCellGen/Misconfigure.h
@@ -23,6 +23,8 @@
 
 #include "WireCellIface/IFrameFilter.h"
 #include "WireCellIface/IConfigurable.h"
+#include "WireCellIface/IDFT.h"
+
 #include "WireCellUtil/Waveform.h"
 
 #include <unordered_set>
@@ -45,6 +47,7 @@ namespace WireCell {
            private:
             Waveform::realseq_t m_from, m_to;
             bool m_truncate;
+            IDFT::pointer m_dft;
         };
     }  // namespace Gen
 }  // namespace WireCell
diff --git a/gen/inc/WireCellGen/PerChannelVariation.h b/gen/inc/WireCellGen/PerChannelVariation.h
index 756f3087d..3ce79573e 100644
--- a/gen/inc/WireCellGen/PerChannelVariation.h
+++ b/gen/inc/WireCellGen/PerChannelVariation.h
@@ -21,6 +21,8 @@
 #include "WireCellIface/IFrameFilter.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IChannelResponse.h"
+#include "WireCellIface/IDFT.h"
+
 #include "WireCellUtil/Waveform.h"
 
 #include <unordered_set>
@@ -46,6 +48,8 @@ namespace WireCell {
             int m_nsamples;
             WireCell::Waveform::realseq_t m_from;
             bool m_truncate;
+            IDFT::pointer m_dft;
+
         };
     }  // namespace Gen
 }  // namespace WireCell
diff --git a/gen/inc/WireCellGen/PlaneImpactResponse.h b/gen/inc/WireCellGen/PlaneImpactResponse.h
index 92701a9db..ec304c865 100644
--- a/gen/inc/WireCellGen/PlaneImpactResponse.h
+++ b/gen/inc/WireCellGen/PlaneImpactResponse.h
@@ -28,7 +28,9 @@ namespace WireCell {
             int m_long_waveform_pad;
 
            public:
-            ImpactResponse(int impact, const Waveform::realseq_t& wf, int waveform_pad,
+            ImpactResponse(int impact,
+                           const Waveform::compseq_t& spectrum,
+                           const Waveform::realseq_t& wf, int waveform_pad,
                            const Waveform::realseq_t& long_wf, int long_waveform_pad)
               : m_impact(impact)
               , m_waveform(wf)
@@ -36,7 +38,7 @@ namespace WireCell {
               , m_long_waveform(long_wf)
               , m_long_waveform_pad(long_waveform_pad)
             {
-                m_spectrum = Waveform::dft(m_waveform);
+                // m_spectrum = Waveform::dft(m_waveform);
             }
 
             /// Frequency-domain spectrum of response
diff --git a/gen/src/EmpiricalNoiseModel.cxx b/gen/src/EmpiricalNoiseModel.cxx
index 8a1d109c9..79db5a957 100644
--- a/gen/src/EmpiricalNoiseModel.cxx
+++ b/gen/src/EmpiricalNoiseModel.cxx
@@ -359,7 +359,7 @@ const IChannelSpectrum::amplitude_t& Gen::EmpiricalNoiseModel::operator()(int ch
             Response::ColdElec elec_resp(10, ch_shaping);  // default at 1 mV/fC
             auto sig = elec_resp.generate(WireCell::Waveform::Domain(0, m_fft_length * m_period), m_fft_length);
             //auto filt = Waveform::dft(sig);
-            auto filt = Aux::fwd(m_dft, Waveform::complex(sig));
+            auto filt = Aux::fwd_r2c(m_dft, sig);
             auto ele_resp_amp = Waveform::magnitude(filt);
 
             ele_resp_amp.resize(m_elec_resp_freq.size());
@@ -373,7 +373,7 @@ const IChannelSpectrum::amplitude_t& Gen::EmpiricalNoiseModel::operator()(int ch
             Response::ColdElec elec_resp(10, db_shaping);  // default at 1 mV/fC
             auto sig = elec_resp.generate(WireCell::Waveform::Domain(0, m_fft_length * m_period), m_fft_length);
             // auto filt = Waveform::dft(sig);
-            auto filt = Aux::fwd(m_dft, Waveform::complex(sig));
+            auto filt = Aux::fwd_r2c(m_dft, sig);
             auto ele_resp_amp = Waveform::magnitude(filt);
 
             ele_resp_amp.resize(m_elec_resp_freq.size());
diff --git a/gen/src/ImpactData.cxx b/gen/src/ImpactData.cxx
index 814b26127..89191abc8 100644
--- a/gen/src/ImpactData.cxx
+++ b/gen/src/ImpactData.cxx
@@ -57,9 +57,9 @@ void Gen::ImpactData::calculate(const IDFT::pointer& dft, int nticks) const
     }
 
     // m_spectrum = Waveform::dft(m_waveform);
-    m_spectrum = Aux::fwd(dft, Waveform::complex(m_waveform));
+    m_spectrum = Aux::fwd_r2c(dft, m_waveform);
     // m_weight_spectrum = Waveform::dft(m_weights);
-    m_weight_spectrum = Aux::fwd(dft, Waveform::complex(m_weights));
+    m_weight_spectrum = Aux::fwd_r2c(dft, m_weights);
 }
 
 // std::pair<int,int> Gen::ImpactData::strip() const
diff --git a/gen/src/ImpactTransform.cxx b/gen/src/ImpactTransform.cxx
index 90ff57540..abcebfc21 100644
--- a/gen/src/ImpactTransform.cxx
+++ b/gen/src/ImpactTransform.cxx
@@ -155,7 +155,7 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[0]->spectrum();
                 // do a inverse FFT
                 // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
-                Waveform::realseq_t rs1_t = Waveform::real(Aux::inv(m_dft, rs1));
+                Waveform::realseq_t rs1_t = Aux::inv_c2r(m_dft, rs1);
                 // pick the first xxx ticks
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
@@ -164,7 +164,7 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                 }
                 // do a FFT
                 // rs1 = Waveform::dft(rs1_reduced);
-                rs1 = Aux::fwd(m_dft, Waveform::complex(rs1_reduced));
+                rs1 = Aux::fwd_r2c(m_dft, rs1_reduced);
 
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     resp_f_w(0, icol) = rs1[icol];
@@ -174,24 +174,24 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             for (int irow = 0; irow != m_num_pad_wire; irow++) {
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[irow + 1]->spectrum();
                 // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
-                Waveform::realseq_t rs1_t = Waveform::real(Aux::inv(m_dft, rs1));
+                Waveform::realseq_t rs1_t = Aux::inv_c2r(m_dft, rs1);
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs1_t.size())) break;
                     rs1_reduced.at(icol) = rs1_t[icol];
                 }
                 // rs1 = Waveform::dft(rs1_reduced);
-                rs1 = Aux::fwd(m_dft, Waveform::complex(rs1_reduced));
+                rs1 = Aux::fwd_r2c(m_dft, rs1_reduced);
                 Waveform::compseq_t rs2 = m_vec_map_resp.at(i)[-irow - 1]->spectrum();
                 // Waveform::realseq_t rs2_t = Waveform::idft(rs2);
-                Waveform::realseq_t rs2_t = Waveform::real(Aux::inv(m_dft, rs2));
+                Waveform::realseq_t rs2_t = Aux::inv_c2r(m_dft, rs2);
                 Waveform::realseq_t rs2_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs2_t.size())) break;
                     rs2_reduced.at(icol) = rs2_t[icol];
                 }
                 //rs2 = Waveform::dft(rs2_reduced);
-                rs2 = Aux::fwd(m_dft, Waveform::complex(rs2_reduced));
+                rs2 = Aux::fwd_r2c(m_dft, rs2_reduced);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     resp_f_w(irow + 1, icol) = rs1[icol];
                     resp_f_w(end_ch - start_ch - 1 - irow + 2 * npad_wire, icol) = rs2[icol];
@@ -255,7 +255,7 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
 
                 // do a inverse FFT
                 // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
-                Waveform::realseq_t rs1_t = Waveform::real(Aux::inv(m_dft, rs1));
+                Waveform::realseq_t rs1_t = Aux::inv_c2r(m_dft, rs1);
                 // pick the first xxx ticks
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 // std::cout << rs1.size() << " " << nsamples << " " << m_end_tick << " " <<  m_start_tick << std::endl;
@@ -266,7 +266,7 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                 }
                 // do a FFT
                 // rs1 = Waveform::dft(rs1_reduced);
-                rs1 = Aux::fwd(m_dft, Waveform::complex(rs1_reduced));
+                rs1 = Aux::fwd_r2c(m_dft, rs1_reduced);
 
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     //   std::cout << icol << " " << rs1[icol] << " " << temp_resp_f_w(0,icol) << std::endl;
@@ -276,24 +276,24 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             for (int irow = 0; irow != m_num_pad_wire; irow++) {
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[irow + 1]->spectrum();
                 // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
-                Waveform::realseq_t rs1_t = Waveform::real(Aux::inv(m_dft, rs1));
+                Waveform::realseq_t rs1_t = Aux::inv_c2r(m_dft, rs1);
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs1_t.size())) break;
                     rs1_reduced.at(icol) = rs1_t[icol];
                 }
                 // rs1 = Waveform::dft(rs1_reduced);
-                rs1 = Aux::fwd(m_dft, Waveform::complex(rs1_reduced));
+                rs1 = Aux::fwd_r2c(m_dft, rs1_reduced);
                 Waveform::compseq_t rs2 = m_vec_map_resp.at(i)[-irow - 1]->spectrum();
                 // Waveform::realseq_t rs2_t = Waveform::idft(rs2);
-                Waveform::realseq_t rs2_t = Waveform::real(Aux::inv(m_dft, rs2));
+                Waveform::realseq_t rs2_t = Aux::inv_c2r(m_dft, rs2);
                 Waveform::realseq_t rs2_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs2_t.size())) break;
                     rs2_reduced.at(icol) = rs2_t[icol];
                 }
                 // rs2 = Waveform::dft(rs2_reduced);
-                rs2 = Aux::fwd(m_dft, Waveform::complex(rs2_reduced));
+                rs2 = Aux::fwd_r2c(m_dft, rs2_reduced);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     resp_f_w(irow + 1, icol) = rs1[icol];
                     resp_f_w(end_ch - start_ch - 1 - irow + 2 * npad_wire, icol) = rs2[icol];
@@ -349,14 +349,14 @@ Waveform::realseq_t Gen::ImpactTransform::waveform(int iwire) const
             Waveform::realseq_t long_resp = m_pir->closest(0)->long_aux_waveform();
             long_resp.resize(nlength, 0);
             // Waveform::compseq_t spec = Waveform::dft(wf);
-            Waveform::compseq_t spec = Aux::fwd(m_dft, Waveform::complex(wf));
+            Waveform::compseq_t spec = Aux::fwd_r2c(m_dft, wf);
             // Waveform::compseq_t long_spec = Waveform::dft(long_resp);
-            Waveform::compseq_t long_spec = Aux::fwd(m_dft, Waveform::complex(long_resp));
+            Waveform::compseq_t long_spec = Aux::fwd_r2c(m_dft, long_resp);
             for (size_t i = 0; i != nlength; i++) {
                 spec.at(i) *= long_spec.at(i);
             }
             // wf = Waveform::idft(spec);
-            wf = Waveform::real(Aux::inv(m_dft, spec));
+            wf = Aux::inv_c2r(m_dft, spec);
             wf.resize(nsamples, 0);
         }
 
diff --git a/gen/src/Misconfigure.cxx b/gen/src/Misconfigure.cxx
index a5273cac5..9a42c3a65 100644
--- a/gen/src/Misconfigure.cxx
+++ b/gen/src/Misconfigure.cxx
@@ -1,9 +1,14 @@
 #include "WireCellGen/Misconfigure.h"
+
+#include "WireCellAux/DftTools.h"
+
+#include "WireCellIface/SimpleFrame.h"
+#include "WireCellIface/SimpleTrace.h"
+
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/Response.h"
 #include "WireCellUtil/Waveform.h"
-#include "WireCellIface/SimpleFrame.h"
-#include "WireCellIface/SimpleTrace.h"
+
 
 WIRECELL_FACTORY(Misconfigure, WireCell::Gen::Misconfigure, WireCell::IFrameFilter, WireCell::IConfigurable)
 
@@ -41,6 +46,8 @@ WireCell::Configuration Gen::Misconfigure::default_configuration() const
     /// needs to be handled in some way by the user.
     cfg["truncate"] = true;
 
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
+
     return cfg;
 }
 
@@ -54,6 +61,9 @@ void Gen::Misconfigure::configure(const WireCell::Configuration& cfg)
     m_to = Response::ColdElec(cfg["to"]["gain"].asDouble(), cfg["to"]["shaping"].asDouble()).generate(bins);
 
     m_truncate = cfg["truncate"].asBool();
+
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
 }
 
 bool Gen::Misconfigure::operator()(const input_pointer& in, output_pointer& out)
@@ -72,9 +82,12 @@ bool Gen::Misconfigure::operator()(const input_pointer& in, output_pointer& out)
     size_t ntraces = traces->size();
     ITrace::vector out_traces(ntraces);
     for (size_t ind = 0; ind < ntraces; ++ind) {
-        auto trace = traces->at(ind);
+        const auto& trace = traces->at(ind);
 
-        auto wave = Waveform::replace_convolve(trace->charge(), m_to, m_from, m_truncate);
+        // auto wave = Waveform::replace_convolve(trace->charge(), m_to, m_from, m_truncate);
+        const auto& charge = trace->charge();
+        auto wave = Aux::replace(m_dft, charge, m_to, m_from);
+        wave.resize(charge.size());
         out_traces[ind] = std::make_shared<SimpleTrace>(trace->channel(), trace->tbin(), wave);
     }
 
diff --git a/gen/src/NoiseSource.cxx b/gen/src/NoiseSource.cxx
index 48dfc5334..76f6974d5 100644
--- a/gen/src/NoiseSource.cxx
+++ b/gen/src/NoiseSource.cxx
@@ -111,7 +111,7 @@ bool Gen::NoiseSource::operator()(IFrame::pointer& frame)
 
         //Waveform::realseq_t noise = Gen::Noise::generate_waveform(spec, m_rng, m_rep_percent);
         auto cnoise = Gen::Noise::generate_spectrum(spec, m_rng, m_rep_percent);
-        auto noise = Waveform::real(Aux::inv(m_dft, cnoise));
+        auto noise = Aux::inv_c2r(m_dft, cnoise);
 
         //	std::cout << noise.size() << " " << nsamples << std::endl;
         noise.resize(m_nsamples, 0);
diff --git a/gen/src/PerChannelVariation.cxx b/gen/src/PerChannelVariation.cxx
index 2af90496b..af702b752 100644
--- a/gen/src/PerChannelVariation.cxx
+++ b/gen/src/PerChannelVariation.cxx
@@ -1,9 +1,13 @@
 #include "WireCellGen/PerChannelVariation.h"
+
+#include "WireCellAux/DftTools.h"
+
+#include "WireCellIface/SimpleFrame.h"
+#include "WireCellIface/SimpleTrace.h"
+
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/Response.h"
 #include "WireCellUtil/Waveform.h"
-#include "WireCellIface/SimpleFrame.h"
-#include "WireCellIface/SimpleTrace.h"
 
 #include <string>
 
@@ -41,11 +45,15 @@ WireCell::Configuration Gen::PerChannelVariation::default_configuration() const
     /// ch-by-ch electronics responses by calibration
     cfg["per_chan_resp"] = "";
 
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     return cfg;
 }
 
 void Gen::PerChannelVariation::configure(const WireCell::Configuration& cfg)
 {
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     m_per_chan_resp = get<std::string>(cfg, "per_chan_resp", "");
 
     if (!m_per_chan_resp.empty()) {
@@ -64,6 +72,7 @@ void Gen::PerChannelVariation::configure(const WireCell::Configuration& cfg)
     m_truncate = cfg["truncate"].asBool();
 }
 
+
 bool Gen::PerChannelVariation::operator()(const input_pointer& in, output_pointer& out)
 {
     if (!in) {
@@ -86,11 +95,14 @@ bool Gen::PerChannelVariation::operator()(const input_pointer& in, output_pointe
     size_t ntraces = traces->size();
     ITrace::vector out_traces(ntraces);
     for (size_t ind = 0; ind < ntraces; ++ind) {
-        auto trace = traces->at(ind);
+        const auto& trace = traces->at(ind);
         auto chid = trace->channel();
         Waveform::realseq_t tch_resp = m_cr->channel_response(chid);
-        tch_resp.resize(m_nsamples, 0);
-        auto wave = Waveform::replace_convolve(trace->charge(), tch_resp, m_from, m_truncate);
+        // tch_resp.resize(m_nsamples, 0);
+        // auto wave = Waveform::replace_convolve(trace->charge(), tch_resp, m_from, m_truncate);
+        const auto& charge = trace->charge();
+        auto wave = Aux::replace(m_dft, charge, tch_resp, m_from);
+        wave.resize(charge.size());
         out_traces[ind] = std::make_shared<SimpleTrace>(chid, trace->tbin(), wave);
     }
 
diff --git a/gen/src/PlaneImpactResponse.cxx b/gen/src/PlaneImpactResponse.cxx
index 1d875fe3a..d5e74eee3 100644
--- a/gen/src/PlaneImpactResponse.cxx
+++ b/gen/src/PlaneImpactResponse.cxx
@@ -112,7 +112,7 @@ void Gen::PlaneImpactResponse::build_responses()
         // note: we are ignoring waveform_start which will introduce
         // an arbitrary phase shift....
         // auto spec = Waveform::dft(wave);
-        auto spec = Aux::fwd(dft, Waveform::complex(wave));
+        auto spec = Aux::fwd_r2c(dft, wave);
         for (size_t ibin = 0; ibin < n_short_length; ++ibin) {
             short_spec[ibin] *= spec[ibin];
         }
@@ -139,14 +139,14 @@ void Gen::PlaneImpactResponse::build_responses()
         // note: we are ignoring waveform_start which will introduce
         // an arbitrary phase shift....
         // auto spec = Waveform::dft(wave);
-        auto spec = Aux::fwd(dft, Waveform::complex(wave));
+        auto spec = Aux::fwd_r2c(dft, wave);
         for (size_t ibin = 0; ibin < n_long_length; ++ibin) {
             long_spec[ibin] *= spec[ibin];
         }
     }
     WireCell::Waveform::realseq_t long_wf;
     if (nlong > 0) {
-        long_wf = Waveform::real(Aux::inv(dft, long_spec));
+        long_wf = Aux::inv_c2r(dft, long_spec);
     }
     const auto& fr = ifr->field_response();
     const auto& pr = *fr.plane(m_plane_ident);
@@ -233,7 +233,7 @@ void Gen::PlaneImpactResponse::build_responses()
             wave[bin] += induced_charge;
         }
         // WireCell::Waveform::compseq_t spec = Waveform::dft(wave);
-        WireCell::Waveform::compseq_t spec = Aux::fwd(dft, Waveform::complex(wave));
+        WireCell::Waveform::compseq_t spec = Aux::fwd_r2c(dft, wave);
 
         // Convolve with short responses
         if (nshort) {
@@ -242,13 +242,15 @@ void Gen::PlaneImpactResponse::build_responses()
             }
         }
         // Waveform::realseq_t wf = Waveform::idft(spec);
-        Waveform::realseq_t wf = Waveform::real(Aux::inv(dft, spec));
+        Waveform::realseq_t wf = Aux::inv_c2r(dft, spec);
 
         wf.resize(m_nbins, 0);
+        spec = Aux::fwd_r2c(dft, wf);
 
         IImpactResponse::pointer ir =
             std::make_shared<Gen::ImpactResponse>(
-                ipath, wf, m_overall_short_padding / m_tick,
+                ipath,
+                spec, wf, m_overall_short_padding / m_tick,
                 long_wf, m_long_padding / m_tick);
         m_ir.push_back(ir);
     }
diff --git a/gen/src/TruthTraceID.cxx b/gen/src/TruthTraceID.cxx
index 16d8bc33b..512693f2f 100644
--- a/gen/src/TruthTraceID.cxx
+++ b/gen/src/TruthTraceID.cxx
@@ -202,7 +202,7 @@ void Gen::TruthTraceID::process(output_queue& frames)
 
                     // Waveform::realseq_t wave(nsamples, 0.0);
                     // wave = Waveform::idft(total_spectrum);
-                    Waveform::realseq_t wave = Waveform::real(Aux::inv(m_dft, total_spectrum));
+                    Waveform::realseq_t wave = Aux::inv_c2r(m_dft, total_spectrum);
                     auto mm = Waveform::edge(wave);
                     if (mm.first == (int) wave.size()) {
                         continue;
diff --git a/root/test/test_binneddiffusion.cxx b/root/test/test_binneddiffusion.cxx
index 751a0664d..cd14504bd 100644
--- a/root/test/test_binneddiffusion.cxx
+++ b/root/test/test_binneddiffusion.cxx
@@ -1,3 +1,5 @@
+#include "WireCellAux/DftTools.h"
+
 #include "WireCellGen/BinnedDiffusion.h"
 #include "WireCellIface/SimpleDepo.h"
 #include "WireCellUtil/ExecMon.h"
@@ -30,11 +32,14 @@ struct Meta {
     ExecMon em;
     const char* name;
 
-    Meta(const char* name)
+    IDFT::pointer idft;
+
+    Meta(const char* name, IDFT::pointer idft)
       //: theApp(new TApplication (name,0,0))
       : canvas(new TCanvas("canvas", "canvas", 500, 500))
       , em(name)
       , name(name)
+      , idft(idft)
     {
         print("[");
     }
@@ -74,7 +79,7 @@ void test_track(Meta& meta, double charge, double track_time, const Ray& track_r
     const auto rbins = pimpos.region_binning();
     const auto ibins = pimpos.impact_binning();
 
-    Gen::BinnedDiffusion bd(pimpos, tbins, ndiffision_sigma, fluctuate);
+    Gen::BinnedDiffusion bd(pimpos, meta.idft, tbins, ndiffision_sigma, fluctuate);
 
     auto track_start = track_ray.first;
     auto track_dir = ray_unit(track_ray);
@@ -231,18 +236,20 @@ int main(int argc, char* argv[])
 {
     PluginManager& pm = PluginManager::instance();
     pm.add("WireCellGen");
+    pm.add("WireCellAux");
     {
         auto rngcfg = Factory::lookup<IConfigurable>("Random");
         auto cfg = rngcfg->default_configuration();
         rngcfg->configure(cfg);
     }
     auto rng = Factory::lookup<IRandom>("Random");
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
 
     const char* me = argv[0];
 
     TFile* rootfile = TFile::Open(Form("%s.root", me), "RECREATE");
 
-    Meta meta(me);
+    Meta meta(me, idft);
     gStyle->SetOptStat(0);
 
     const double track_time = t0 + 10 * units::ns;
diff --git a/root/test/test_convo.cxx b/root/test/test_convo.cxx
index b6a64a7a1..d2bb9d343 100644
--- a/root/test/test_convo.cxx
+++ b/root/test/test_convo.cxx
@@ -1,3 +1,6 @@
+#include "WireCellAux/DftTools.h"
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/PluginManager.h"
 
 #include "WireCellUtil/Response.h"
 #include "WireCellUtil/Waveform.h"
@@ -67,6 +70,10 @@ std::vector<TH1F*> plot_wave(TCanvas& canvas, int padnum, std::string name, std:
 
 int main(int argc, char* argv[])
 {
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
+
     if (argc < 2) {
         std::cerr << "This test requires an Wire Cell Field Response input file." << std::endl;
         return 0;
@@ -126,16 +133,16 @@ int main(int argc, char* argv[])
             }
 
             // frequency space
-            Waveform::compseq_t charge_spectrum = Waveform::dft(electrons);
-            Waveform::compseq_t raw_response_spectrum = Waveform::dft(raw_response);
-            Waveform::compseq_t response_spectrum = Waveform::dft(response);
+            Waveform::compseq_t charge_spectrum = Aux::fwd_r2c(idft, electrons);
+            Waveform::compseq_t raw_response_spectrum = Aux::fwd_r2c(idft, raw_response);
+            Waveform::compseq_t response_spectrum = Aux::fwd_r2c(idft, response);
 
             // convolve
             Waveform::compseq_t conv_spectrum(nticks, Waveform::complex_t(0.0, 0.0));
             for (int ind = 0; ind < nticks; ++ind) {
                 conv_spectrum[ind] = response_spectrum[ind] * charge_spectrum[ind];
             }
-            Waveform::realseq_t conv = Waveform::idft(conv_spectrum);
+            Waveform::realseq_t conv = Aux::inv_c2r(idft, conv_spectrum);
             for (int ind = 0; ind < nticks; ++ind) {
                 conv[ind] /= nticks;
             }
diff --git a/root/test/test_convo_binning.cxx b/root/test/test_convo_binning.cxx
index 46c1dba69..3a2fed9c9 100644
--- a/root/test/test_convo_binning.cxx
+++ b/root/test/test_convo_binning.cxx
@@ -1,11 +1,18 @@
 // Test what happens with different choices of how we bin.
 
 #include "MultiPdf.h"
+
+#include "WireCellGen/RCResponse.h"
+
+#include "WireCellAux/DftTools.h"
+
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/PluginManager.h"
+
 #include "WireCellUtil/Units.h"
 #include "WireCellUtil/Waveform.h"
 #include "WireCellUtil/Binning.h"
 #include "WireCellUtil/Response.h"
-#include "WireCellGen/RCResponse.h"
 
 #include "TGraph.h"
 #include "TH1F.h"
@@ -75,6 +82,10 @@ struct Plotter {
 
 int main(int argc, char* argv[])
 {
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
+
     Test::MultiPdf mpdf(argv[0]);
     Plotter p(mpdf);
 
@@ -111,22 +122,22 @@ int main(int argc, char* argv[])
     p.draw(fce, fbin_short, "fce", "Fine CE");
 
     // convolve + rebin fine->coarse
-    auto fcc = linear_convolve(ffr, fce);
+    auto fcc = Aux::convolve(idft, ffr, fce);
     p.draw(fcc, fbin_long, "fcc", "Fine conv");
     auto ccc2 = rebin(fcc, rebinfactor);
     p.draw(ccc2, cbin_long, "ccc2", "Coarse rebin conv");
-    auto fccs = linear_convolve(ffrs, fce);
+    auto fccs = Aux::convolve(idft, ffrs, fce);
     p.draw(fccs, fbin_long, "fccs", "Fine conv shifted");
     auto cccs2 = rebin(fccs, rebinfactor);
     p.draw(cccs2, cbin_long, "cccs2", "Coarse rebin conv shifted");
 
     // rebin fine->coarse + convolve
-    auto ccc = linear_convolve(cfr, cce);
+    auto ccc = Aux::convolve(idft, cfr, cce);
     for (size_t ind=0; ind<ccc.size(); ++ind) {
         ccc[ind] *= rebinfactor;
     }
     p.draw(ccc, cbin_long, "ccc", "Coarse native conv");
-    auto cccs = linear_convolve(cfrs, cce);
+    auto cccs = Aux::convolve(idft, cfrs, cce);
     for (size_t ind=0; ind<ccc.size(); ++ind) {
         cccs[ind] *= rebinfactor;
     }
diff --git a/root/test/test_fft.cxx b/root/test/test_fft.cxx
index a0adc23c4..ca20e7900 100644
--- a/root/test/test_fft.cxx
+++ b/root/test/test_fft.cxx
@@ -1,3 +1,7 @@
+#include "WireCellAux/DftTools.h"
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/PluginManager.h"
+
 #include "WireCellUtil/Waveform.h"
 #include "WireCellUtil/Units.h"
 #include "WireCellUtil/Response.h"
@@ -20,10 +24,11 @@ using namespace WireCell::Test;
 // The preferred display units for gain.
 const double GUnit = units::mV / units::fC;
 
-void draw_time_freq(MultiPdf& pdf, Waveform::realseq_t& res, const std::string& title, const Binning& tbins)
+void draw_time_freq(MultiPdf& pdf, const IDFT::pointer& idft,
+                    Waveform::realseq_t& res, const std::string& title, const Binning& tbins)
 {
-    Waveform::compseq_t spec = Waveform::dft(res);
-    Waveform::realseq_t res2 = Waveform::idft(spec);
+    Waveform::compseq_t spec = Aux::fwd_r2c(idft, res);
+    Waveform::realseq_t res2 = Aux::inv_c2r(idft, spec);
 
     TH1F h_wave("response", title.c_str(), tbins.nbins(), tbins.min() / units::us, tbins.max() / units::us);
     TH1F h_wave2("response2", title.c_str(), tbins.nbins(), tbins.min() / units::us, tbins.max() / units::us);
@@ -106,6 +111,10 @@ void draw_time_freq(MultiPdf& pdf, Waveform::realseq_t& res, const std::string&
 
 int main(int argc, char* argv[])
 {
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
+
     const std::vector<double> gains = {7.8 * GUnit, 14.0 * GUnit};
     const std::vector<double> shapings = {1.0 * units::us, 2.0 * units::us};
 
@@ -123,7 +132,7 @@ int main(int argc, char* argv[])
 
         const double tshape_us = shapings[ind] / units::us;
         auto tit = Form("Cold Electronics Response at %.0fus peaking", tshape_us);
-        draw_time_freq(pdf, res, tit, tbins);
+        draw_time_freq(pdf, idft, res, tit, tbins);
     }
 
     // Look at RC filter
@@ -135,7 +144,7 @@ int main(int argc, char* argv[])
         Waveform::realseq_t res = rc.generate(tbins);
 
         auto tit = "RC Response at 1ms time constant";
-        draw_time_freq(pdf, res, tit, tbins);
+        draw_time_freq(pdf, idft, res, tit, tbins);
     }
     {
         Binning shifted(tbins.nbins(), tbins.min() + tick, tbins.max() + tick);
@@ -144,7 +153,7 @@ int main(int argc, char* argv[])
         Waveform::realseq_t res = rc.generate(shifted);
 
         auto tit = "RC Response at 1ms time constant (suppress delta)";
-        draw_time_freq(pdf, res, tit, tbins);
+        draw_time_freq(pdf, idft, res, tit, tbins);
     }
 
     // Look at SysResp (Gaussian smear)
@@ -152,7 +161,7 @@ int main(int argc, char* argv[])
         Response::SysResp gaus;
         Waveform::realseq_t res = gaus.generate(tbins);
         auto tit = "Response Gaussian smear by default";
-        draw_time_freq(pdf, res, tit, tbins);
+        draw_time_freq(pdf, idft, res, tit, tbins);
     }
     {
         double mag = 1.0;
@@ -163,7 +172,7 @@ int main(int argc, char* argv[])
         Response::SysResp gaus(tick, mag, smear);
         Waveform::realseq_t res = gaus.generate(ttt);
         auto tit = "Response Gaussian 2 us smear";
-        draw_time_freq(pdf, res, tit, ttt);
+        draw_time_freq(pdf, idft, res, tit, ttt);
     }
 
     // do timing tests
@@ -198,7 +207,7 @@ int main(int argc, char* argv[])
             double fwd_time = 0.0;
             for (int itry = 0; itry < ntries; ++itry) {
                 auto t1 = std::chrono::high_resolution_clock::now();
-                spec = Waveform::dft(res);
+                spec = Aux::fwd_r2c(idft, res);
                 auto t2 = std::chrono::high_resolution_clock::now();
                 fwd_time += std::chrono::duration_cast<std::chrono::nanoseconds>(t2 - t1).count();
             }
@@ -207,7 +216,7 @@ int main(int argc, char* argv[])
             double rev_time = 0.0;
             for (int itry = 0; itry < ntries; ++itry) {
                 auto t1 = std::chrono::high_resolution_clock::now();
-                res = Waveform::idft(spec);
+                res = Aux::inv_c2r(idft, spec);
                 auto t2 = std::chrono::high_resolution_clock::now();
                 rev_time += std::chrono::duration_cast<std::chrono::nanoseconds>(t2 - t1).count();
             }
diff --git a/root/test/test_fft_speed.cxx b/root/test/test_fft_speed.cxx
index 0dff0b06f..6ee66534c 100644
--- a/root/test/test_fft_speed.cxx
+++ b/root/test/test_fft_speed.cxx
@@ -1,3 +1,7 @@
+#include "WireCellAux/DftTools.h"
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/PluginManager.h"
+
 #include "WireCellUtil/Waveform.h"
 #include "WireCellUtil/Units.h"
 #include "WireCellUtil/Response.h"
@@ -25,6 +29,10 @@ const double GUnit = units::mV / units::fC;
 
 int main(int argc, char** argv)
 {
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
+
     int nInputs = 0;
     int nBegin = 0;
     int nEnd = 0;
@@ -123,7 +131,8 @@ int main(int argc, char** argv)
             // fwd_time /= ntries;
 
             auto t1 = std::chrono::high_resolution_clock::now();
-            Array::dft_cc(test_array, 0);
+            // Array::dft_cc(test_array, 0);
+            Aux::fwd(idft, test_array, 1);
             auto t2 = std::chrono::high_resolution_clock::now();
             fwd_time = std::chrono::duration_cast<std::chrono::nanoseconds>(t2 - t1).count() / ntries;
 
@@ -131,7 +140,9 @@ int main(int argc, char** argv)
             // for (int itry=0; itry<ntries; ++itry) {
             auto t3 = std::chrono::high_resolution_clock::now();
             // 	res = Waveform::idft(spec);
-            Array::idft_cc(test_array, 0);
+            // Array::idft_cc(test_array, 0);
+            Aux::inv(idft, test_array, 1);
+
             auto t4 = std::chrono::high_resolution_clock::now();
             rev_time = std::chrono::duration_cast<std::chrono::nanoseconds>(t4 - t3).count() / ntries;
             // }
diff --git a/root/test/test_fieldresp.cxx b/root/test/test_fieldresp.cxx
index 65e93102e..f0d133790 100644
--- a/root/test/test_fieldresp.cxx
+++ b/root/test/test_fieldresp.cxx
@@ -1,3 +1,5 @@
+#include "WireCellAux/DftTools.h"
+
 #include "WireCellUtil/Testing.h"
 #include "WireCellUtil/Logging.h"
 
@@ -34,13 +36,15 @@ int main(int argc, char* argv[])
     /// WCT internals, normally user code does not need this
     {
         PluginManager& pm = PluginManager::instance();
+        pm.add("WireCellAux");
+
         pm.add("WireCellSigProc");
         auto ifrcfg = Factory::lookup<IConfigurable>("FieldResponse");
         auto cfg = ifrcfg->default_configuration();
         cfg["filename"] = frfname;
         ifrcfg->configure(cfg);
     }
-
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
     auto ifr = Factory::find<IFieldResponse>("FieldResponse");
 
     // Get full, "fine-grained" field responses defined at impact
@@ -80,7 +84,7 @@ int main(int argc, char* argv[])
     Response::ColdElec ce(14.0 * units::mV / units::fC, 2.0 * units::microsecond);
     auto ewave = ce.generate(tbins);
     Waveform::scale(ewave, 1.2 * 4096 / 2000.);
-    elec = Waveform::dft(ewave);
+    elec = Aux::fwd_r2c(idft, ewave);
 
     std::complex<float> fine_period(fravg.period, 0);
 
@@ -105,7 +109,8 @@ int main(int argc, char* argv[])
         auto arr = Response::as_array(fravg.planes[ind]);
 
         // do FFT for response ...
-        Array::array_xxc c_data = Array::dft_rc(arr, 0);
+        // Array::array_xxc c_data = Array::dft_rc(arr, 0);
+        Array::array_xxc c_data = Aux::fwd(idft, arr.cast<IDFT::complex_t>(), 1);
         int nrows = c_data.rows();
         int ncols = c_data.cols();
 
@@ -115,7 +120,8 @@ int main(int argc, char* argv[])
             }
         }
 
-        arr = Array::idft_cr(c_data, 0);
+        // arr = Array::idft_cr(c_data, 0);
+        arr = Aux::inv(idft, c_data, 1).real();
 
         // figure out how to do fine ... shift (good ...)
         auto arr1 = arr.block(0, 0, nrows, 100);
diff --git a/root/test/test_impactresponse.cxx b/root/test/test_impactresponse.cxx
index 56e64faaa..e5cf76ee1 100644
--- a/root/test/test_impactresponse.cxx
+++ b/root/test/test_impactresponse.cxx
@@ -1,3 +1,9 @@
+#include "WireCellAux/DftTools.h"
+
+#include "WireCellIface/IConfigurable.h"
+#include "WireCellIface/IFieldResponse.h"
+#include "WireCellIface/IPlaneImpactResponse.h"
+
 #include "WireCellUtil/PluginManager.h"
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/Logging.h"
@@ -6,10 +12,6 @@
 #include "WireCellUtil/Testing.h"
 #include "WireCellUtil/Response.h"
 
-#include "WireCellIface/IConfigurable.h"
-#include "WireCellIface/IFieldResponse.h"
-#include "WireCellIface/IPlaneImpactResponse.h"
-
 #include "MultiPdf.h"  // local helper shared by a few tests
 #include "TH2F.h"
 #include "TLine.h"
@@ -28,7 +30,8 @@ using namespace std;
 using spdlog::debug;
 using spdlog::error;
 
-void plot_time(MultiPdf& mpdf, IPlaneImpactResponse::pointer pir, int iplane, Binning tbins, const std::string& name,
+void plot_time(MultiPdf& mpdf, const IDFT::pointer& idft,
+               IPlaneImpactResponse::pointer pir, int iplane, Binning tbins, const std::string& name,
                const std::string& title)
 {
     // only show bins where we think the response is
@@ -103,7 +106,8 @@ void plot_time(MultiPdf& mpdf, IPlaneImpactResponse::pointer pir, int iplane, Bi
         //     continue;
         // }
         auto spec = ir->spectrum();
-        auto wave = Waveform::idft(spec);
+        // auto wave = Waveform::idft(spec);
+        auto wave = Aux::inv_c2r(idft, spec);
         pitch += 0.001 * impact_dist;
         for (int ind = 0; ind < ntbins; ++ind) {
             const double time = tbins.center(ind);
@@ -146,8 +150,10 @@ int main(int argc, const char* argv[])
     Log::set_level("debug");
 
     PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
     pm.add("WireCellGen");
     pm.add("WireCellSigProc");
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
 
     const int nticks = 9595;
     const double tick = 0.5 * units::us;
@@ -234,10 +240,10 @@ int main(int argc, const char* argv[])
     MultiPdf mpdf(out_basename.c_str());
     for (int iplane = 0; iplane < 3; ++iplane) {
         auto pir = Factory::find_tn<IPlaneImpactResponse>(pir_tns[iplane]);
-        plot_time(mpdf, pir, iplane, tbins, "fr", "Field Response");
+        plot_time(mpdf, idft, pir, iplane, tbins, "fr", "Field Response");
 
         auto pir_ele = Factory::find_tn<IPlaneImpactResponse>(pir_ele_tns[iplane]);
-        plot_time(mpdf, pir_ele, iplane, tbins, "dr", "Detector Response");
+        plot_time(mpdf, idft, pir_ele, iplane, tbins, "dr", "Detector Response");
     }
 
     mpdf.close();
diff --git a/root/test/test_impactzipper.cxx b/root/test/test_impactzipper.cxx
deleted file mode 100644
index 68355cbc0..000000000
--- a/root/test/test_impactzipper.cxx
+++ /dev/null
@@ -1,421 +0,0 @@
-#include "WireCellGen/ImpactZipper.h"
-#include "WireCellGen/TrackDepos.h"
-#include "WireCellGen/BinnedDiffusion.h"
-#include "WireCellGen/TransportedDepo.h"
-#include "WireCellGen/PlaneImpactResponse.h"
-#include "WireCellUtil/ExecMon.h"
-#include "WireCellUtil/Point.h"
-#include "WireCellUtil/Binning.h"
-#include "WireCellUtil/Testing.h"
-#include "WireCellUtil/Response.h"
-
-#include "WireCellUtil/PluginManager.h"
-#include "WireCellUtil/NamedFactory.h"
-#include "WireCellIface/IRandom.h"
-#include "WireCellIface/IConfigurable.h"
-#include "WireCellIface/IFieldResponse.h"
-#include "WireCellIface/IPlaneImpactResponse.h"
-
-#include "TCanvas.h"
-#include "TFile.h"
-#include "TLine.h"
-#include "TStyle.h"
-#include "TH2F.h"
-
-#include <iostream>
-#include <string>
-
-using namespace WireCell;
-using namespace std;
-
-int main(const int argc, char* argv[])
-{
-    string track_types = "point";
-    if (argc > 1) {
-        track_types = argv[1];
-    }
-    cerr << "Using tracks type: \"" << track_types << "\"\n";
-
-    string response_file = "ub-10-half.json.bz2";
-    if (argc > 2) {
-        response_file = argv[2];
-        cerr << "Using Wire Cell field response file:\n" << response_file << endl;
-    }
-    else {
-        cerr << "No Wire Cell field response input file given, will try to use:\n" << response_file << endl;
-    }
-
-    string out_basename = argv[0];
-    if (argc > 3) {
-        out_basename = argv[3];
-    }
-
-    // here we do hard-wired configuration.  User code should NEVER do
-    // this.
-
-    PluginManager& pm = PluginManager::instance();
-    pm.add("WireCellGen");
-    pm.add("WireCellSigProc");
-    {
-        auto rngcfg = Factory::lookup<IConfigurable>("Random");
-        auto cfg = rngcfg->default_configuration();
-        rngcfg->configure(cfg);
-    }
-
-    const int nticks = 9595;
-    const double tick = 0.5 * units::us;
-    const double gain = 14.0 * units::mV / units::fC;
-    const double shaping = 2.0 * units::us;
-
-    const double t0 = 0.0 * units::s;
-    const double readout_time = nticks * tick;
-    const double drift_speed = 1.0 * units::mm / units::us;  // close, but not real
-
-    const std::string er_tn = "ColdElecResponse", rc_tn = "RCResponse";
-
-    {  // configure elecresponse
-        auto icfg = Factory::lookup_tn<IConfigurable>(er_tn);
-        auto cfg = icfg->default_configuration();
-        cfg["gain"] = gain;
-        cfg["shaping"] = shaping;
-        cfg["nticks"] = nticks;
-        cerr << "Setting: " << cfg["nticks"].asInt() << " ticks\n";
-        cfg["tick"] = tick;
-        cfg["start"] = t0;
-        icfg->configure(cfg);
-    }
-    {  // configure rc response
-        auto icfg = Factory::lookup_tn<IConfigurable>(rc_tn);
-        auto cfg = icfg->default_configuration();
-        cfg["nticks"] = nticks;
-        cfg["tick"] = tick;
-        cfg["start"] = t0;
-        icfg->configure(cfg);
-    }
-    {
-        auto icfg = Factory::lookup<IConfigurable>("FieldResponse");
-        auto cfg = icfg->default_configuration();
-        cfg["filename"] = response_file;
-        icfg->configure(cfg);
-    }
-
-    std::vector<std::string> pir_tns{"PlaneImpactResponse:U", "PlaneImpactResponse:V", "PlaneImpactResponse:W"};
-    {  // configure pirs
-        for (int iplane = 0; iplane < 3; ++iplane) {
-            auto icfg = Factory::lookup_tn<IConfigurable>(pir_tns[iplane]);
-            auto cfg = icfg->default_configuration();
-            cfg["plane"] = iplane;
-            cfg["nticks"] = nticks;
-            cfg["tick"] = tick;
-            cfg["other_responses"][0] = er_tn;
-            cfg["other_responses"][1] = rc_tn;  // double it so
-            cfg["other_responses"][2] = rc_tn;  // we get RC^2
-            icfg->configure(cfg);
-        }
-    }
-
-    WireCell::ExecMon em(out_basename);
-    auto ifr = Factory::find_tn<IFieldResponse>("FieldResponse");
-    auto fr = ifr->field_response();
-
-    em("loaded response");
-
-    const char* uvw = "UVW";
-
-    // 1D garfield wires are all parallel
-    const double angle = 60 * units::degree;
-    const Vector upitch(0, -sin(angle), cos(angle));
-    const Vector uwire(0, cos(angle), sin(angle));
-    const Vector vpitch(0, sin(angle), cos(angle));
-    const Vector vwire(0, cos(angle), -sin(angle));
-    const Vector wpitch(0, 0, 1);
-    const Vector wwire(0, 1, 0);
-
-    // FIXME: need to apply electronics response!
-
-    // Origin where drift and diffusion meets field response.
-    Point field_origin(fr.origin, 0, 0);
-    cerr << "Field response origin: " << field_origin / units::mm << "mm\n";
-
-    // Describe the W collection plane
-    const int nwires = 2001;
-    const double wire_pitch = 3 * units::mm;
-    const int nregion_bins = 10;  // fixme: this should come from the Response::Schema.
-    const double halfwireextent = wire_pitch * 0.5 * (nwires - 1);
-    cerr << "Max wire at pitch=" << halfwireextent << endl;
-
-    std::vector<Pimpos> uvw_pimpos{
-        Pimpos(nwires, -halfwireextent, halfwireextent, uwire, upitch, field_origin, nregion_bins),
-        Pimpos(nwires, -halfwireextent, halfwireextent, vwire, vpitch, field_origin, nregion_bins),
-        Pimpos(nwires, -halfwireextent, halfwireextent, wwire, wpitch, field_origin, nregion_bins)};
-
-    // Digitization and time
-    Binning tbins(nticks, t0, t0 + readout_time);
-
-    // Diffusion
-    const int ndiffision_sigma = 3.0;
-    bool fluctuate = false;  // note, "point" negates this below
-
-    // Generate some trivial tracks
-    const double stepsize = 0.003 * units::mm;
-    Gen::TrackDepos tracks(stepsize);
-
-    // This is the number of ionized electrons for a MIP assumed by MB noise paper.
-    // note: with option "point" this is overridden below.
-    const double dqdx = 16000 * units::eplus / (3 * units::mm);
-    const double charge_per_depo = -(dqdx) *stepsize;
-
-    const double event_time = t0 + 1 * units::ms;
-    const Point event_vertex(1.0 * units::m, 0 * units::m, 0 * units::mm);
-
-    // mostly "prolonged" track in X direction
-    if (track_types.find("prolong") < track_types.size()) {
-        tracks.add_track(event_time,
-                         Ray(event_vertex, event_vertex + Vector(1 * units::m, 0 * units::m, +10 * units::cm)),
-                         charge_per_depo);
-        tracks.add_track(event_time,
-                         Ray(event_vertex, event_vertex + Vector(1 * units::m, 0 * units::m, -10 * units::cm)),
-                         charge_per_depo);
-    }
-
-    // mostly "isochronous" track in Z direction, give spelling errors a break. :)
-    if (track_types.find("isoch") < track_types.size()) {
-        tracks.add_track(event_time, Ray(event_vertex, event_vertex + Vector(0, 0, 50 * units::mm)), charge_per_depo);
-    }
-    // "driftlike" track diagonal in space and drift time
-    if (track_types.find("driftlike") < track_types.size()) {
-        tracks.add_track(event_time,
-                         Ray(event_vertex, event_vertex + Vector(60 * units::cm, 0 * units::m, 10.0 * units::mm)),
-                         charge_per_depo);
-    }
-
-    // make a +
-    if (track_types.find("plus") < track_types.size()) {
-        tracks.add_track(event_time, Ray(event_vertex, event_vertex + Vector(0, 0, +1 * units::m)), charge_per_depo);
-        tracks.add_track(event_time, Ray(event_vertex, event_vertex + Vector(0, 0, -1 * units::m)), charge_per_depo);
-        tracks.add_track(event_time, Ray(event_vertex, event_vertex + Vector(0, +1 * units::m, 0)), charge_per_depo);
-        tracks.add_track(event_time, Ray(event_vertex, event_vertex + Vector(0, -1 * units::m, 0)), charge_per_depo);
-    }
-
-    // // make a .
-    if (track_types.find("point") < track_types.size()) {
-        fluctuate = false;
-        for (int i = 0; i < 6; i++) {
-            auto vt = event_vertex + Vector(0, 0, i * 0.06 * units::mm);
-            auto tt = event_time + i * 10.0 * units::us;
-            tracks.add_track(tt, Ray(vt, vt + Vector(0, 0, 0.1 * stepsize)),  // force 1 point
-                             -1.0 * units::eplus);
-        }
-
-        /* tracks.add_track(event_time, */
-        /*                  Ray(event_vertex, */
-        /*                      event_vertex + Vector(0, 0, 0.1*stepsize)), // force 1 point */
-        /*                  -1.0*units::eplus); */
-    }
-
-    em("made tracks");
-
-    // Get depos
-    auto depos = tracks.depos();
-
-    std::cerr << "got " << depos.size() << " depos from tracks\n";
-    em("made depos");
-
-    TFile* rootfile = TFile::Open(Form("%s-uvw.root", out_basename.c_str()), "recreate");
-    TCanvas* canvas = new TCanvas("c", "canvas", 1000, 1000);
-    gStyle->SetOptStat(0);
-
-    std::string pdfname = argv[0];
-    pdfname += ".pdf";
-    canvas->Print((pdfname + "[").c_str(), "pdf");
-
-    IRandom::pointer rng = nullptr;
-    if (fluctuate) {
-        rng = Factory::lookup<IRandom>("Random");
-    }
-
-    for (int plane_id = 0; plane_id < 3; ++plane_id) {
-        em("start loop over planes");
-        Pimpos& pimpos = uvw_pimpos[plane_id];
-
-        // add deposition to binned diffusion
-        Gen::BinnedDiffusion bindiff(
-            pimpos, tbins, ndiffision_sigma, rng,
-            Gen::BinnedDiffusion::ImpactDataCalculationStrategy::constant);  // default is constant interpolation
-        em("made BinnedDiffusion");
-        for (auto depo : depos) {
-            auto drifted = std::make_shared<Gen::TransportedDepo>(depo, field_origin.x(), drift_speed);
-
-            // In the real simulation these sigma are a function of
-            // drift time.  Hard coded here with small values the
-            // resulting voltage peak due to "point" source should
-            // correspond to what is also shown on a per-impact
-            // "Detector Response" from util's test_impactresponse.
-            // Peak response of a delta function of current
-            // integrating over time to one electron charge would give
-            // 1eplus * 14mV/fC = 2.24 microvolt.
-            const double sigma_time = 1 * units::us;
-            const double sigma_pitch = 1.5 * units::mm;
-
-            bool ok = bindiff.add(drifted, sigma_time, sigma_pitch);
-            if (!ok) {
-                std::cerr << "failed to add: t=" << drifted->time() / units::us << ", pt=" << drifted->pos() / units::mm
-                          << std::endl;
-            }
-            Assert(ok);
-
-            std::cerr << "depo:"
-                      << " q=" << drifted->charge() / units::eplus << "ele"
-                      << " time-T0=" << (drifted->time() - t0) / units::us << "us +/- " << sigma_time / units::us
-                      << " us "
-                      << " pt=" << drifted->pos() / units::mm << " mm\n";
-        }
-        em("added track depositions");
-
-        auto ipir = Factory::find_tn<IPlaneImpactResponse>(pir_tns[plane_id]);
-
-        em("looked up " + pir_tns[plane_id]);
-        {
-            const Response::Schema::PlaneResponse* pr = fr.plane(plane_id);
-            const double pmax = 0.5 * ipir->pitch_range();
-            const double pstep = std::abs(pr->paths[1].pitchpos - pr->paths[0].pitchpos);
-            const int npbins = 2.0 * pmax / pstep;
-            const int ntbins = pr->paths[0].current.size();
-
-            const double tmin = fr.tstart;
-            const double tmax = fr.tstart + fr.period * ntbins;
-            TH2F* hpir = new TH2F(Form("hfr%d", plane_id), Form("Field Response %c-plane", uvw[plane_id]), ntbins, tmin,
-                                  tmax, npbins, -pmax, pmax);
-            for (auto& path : pr->paths) {
-                const double cpitch = path.pitchpos;
-                for (size_t ic = 0; ic < path.current.size(); ++ic) {
-                    const double ctime = fr.tstart + ic * fr.period;
-                    const double charge = path.current[ic] * fr.period;
-                    hpir->Fill(ctime, cpitch, -1 * charge / units::eplus);
-                }
-            }
-            hpir->SetZTitle("Induced charge [eles]");
-            hpir->Write();
-
-            hpir->Draw("colz");
-            if (track_types.find("point") < track_types.size()) {
-                hpir->GetXaxis()->SetRangeUser(70. * units::us, 100. * units::us);
-                hpir->GetYaxis()->SetRangeUser(-10. * units::mm, 10. * units::mm);
-            }
-            canvas->Update();
-            // canvas->Print(Form("%s_%c_resp.png", out_basename.c_str(), uvw[plane_id]));
-            canvas->Print(pdfname.c_str(), "pdf");
-        }
-        em("wrote and leaked response hist");
-
-        Gen::ImpactZipper zipper(ipir, bindiff);
-        em("made ImpactZipper");
-
-        // Set pitch range for plot y-axis
-        auto rbins = pimpos.region_binning();
-        auto pmm = bindiff.pitch_range(ndiffision_sigma);
-        const int wbin0 = max(0, rbins.bin(pmm.first) - 40);
-        const int wbinf = min(rbins.nbins() - 1, rbins.bin(pmm.second) + 40);
-        const int nwbins = 1 + wbinf - wbin0;
-
-        // Dead reckon
-        const int tbin0 = 3500, tbinf = 5500;
-        const int ntbins = tbinf - tbin0;
-
-        std::map<int, Waveform::realseq_t> frame;
-        double tottot = 0.0;
-        for (int iwire = wbin0; iwire <= wbinf; ++iwire) {
-            auto wave = zipper.waveform(iwire);
-            auto tot = Waveform::sum(wave);
-            if (tot != 0.0) {
-                auto mm = std::minmax_element(wave.begin(), wave.end());
-                cerr << "^ Wire " << iwire << " tot=" << tot / units::uV << " uV"
-                     << " mm=[" << (*mm.first) / units::uV << "," << (*mm.second) / units::uV << "] uV " << endl;
-            }
-
-            tottot += tot;
-            if (std::abs(iwire - 1000) <= 1) {  // central wires for "point"
-                auto mm = std::minmax_element(wave.begin(), wave.end());
-                std::cerr << "central wire: " << iwire << " mm=[" << (*mm.first) / units::microvolt << ","
-                          << (*mm.second) / units::microvolt << "] uV\n";
-            }
-            frame[iwire] = wave;
-        }
-        em("zipped through wires");
-        cerr << "Tottot = " << tottot << endl;
-        Assert(tottot != 0.0);
-
-        TH2F* hist = new TH2F(Form("h%d", plane_id), Form("Wire vs Tick %c-plane", uvw[plane_id]), ntbins, tbin0,
-                              tbin0 + ntbins, nwbins, wbin0, wbin0 + nwbins);
-        hist->SetXTitle("tick");
-        hist->SetYTitle("wire");
-        hist->SetZTitle("Voltage [-#muV]");
-
-        std::cerr << nwbins << " wires: [" << wbin0 << "," << wbinf << "], " << ntbins << " ticks: [" << tbin0 << ","
-                  << tbinf << "]\n";
-
-        em("created TH2F");
-        for (auto wire : frame) {
-            const int iwire = wire.first;
-            Assert(rbins.inbounds(iwire));
-            const Waveform::realseq_t& wave = wire.second;
-            // auto tot = Waveform::sum(wave);
-            // std::cerr << iwire << " tot=" << tot << std::endl;
-            for (int itick = tbin0; itick <= tbinf; ++itick) {
-                hist->Fill(itick + 0.1, iwire + 0.1, -1.0 * wave[itick] / units::microvolt);
-            }
-        }
-
-        if (track_types.find("point") < track_types.size()) {
-            hist->GetXaxis()->SetRangeUser(3950, 4100);
-            hist->GetYaxis()->SetRangeUser(996, 1004);
-        }
-        if (track_types.find("isoch") < track_types.size()) {
-            hist->GetXaxis()->SetRangeUser(3900, 4000);
-            hist->GetYaxis()->SetRangeUser(995, 1020);
-        }
-        em("filled TH2F");
-        hist->Write();
-        em("wrote TH2F");
-        hist->Draw("colz");
-        canvas->SetRightMargin(0.15);
-        em("drew TH2F");
-        std::vector<TLine*> lines;
-        auto trqs = tracks.tracks();
-        for (size_t iline = 0; iline < trqs.size(); ++iline) {
-            auto trq = trqs[iline];
-            const double time = get<0>(trq);
-            const Ray ray = get<1>(trq);
-
-            // this need to subtract off the fr.origin is I think a bug,
-            // or at least a bookkeeping detail to ensconce somewhere.  I
-            // think FR is taking the start of the path as the time
-            // origin.  Something to check...
-            const int tick1 = tbins.bin(time + (ray.first.x() - fr.origin) / drift_speed);
-            const int tick2 = tbins.bin(time + (ray.second.x() - fr.origin) / drift_speed);
-
-            const int wire1 = rbins.bin(pimpos.distance(ray.first));
-            const int wire2 = rbins.bin(pimpos.distance(ray.second));
-
-            cerr << "digitrack: t=" << time << " ticks=[" << tick1 << "," << tick2 << "] wires=[" << wire1 << ","
-                 << wire2 << "]\n";
-
-            const int fudge = 0;
-            TLine* line = new TLine(tick1 - fudge, wire1, tick2 - fudge, wire2);
-            line->Write(Form("l%c%d", uvw[plane_id], (int) iline));
-            line->Draw();
-            // canvas->Print(Form("%s_%c.png", out_basename.c_str(), uvw[plane_id]));
-            canvas->Print(pdfname.c_str(), "pdf");
-        }
-        em("printed PNG canvases");
-        em("end of PIR scope");
-
-        // canvas->Print("test_impactzipper.pdf","pdf");
-    }
-    rootfile->Close();
-    canvas->Print((pdfname + "]").c_str(), "pdf");
-    em("done");
-
-    // cerr << em.summary() << endl;
-    return 0;
-}
diff --git a/root/test/test_misconfigure.cxx b/root/test/test_misconfigure.cxx
index 1c7ea3af9..428dac9f7 100644
--- a/root/test/test_misconfigure.cxx
+++ b/root/test/test_misconfigure.cxx
@@ -1,4 +1,6 @@
+#include "WireCellAux/DftTools.h"
 #include "WireCellIface/IFrameFilter.h"
+#include "WireCellIface/IDFT.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/SimpleFrame.h"
 #include "WireCellIface/SimpleTrace.h"
@@ -117,9 +119,13 @@ TH2F* plot_frame(MultiPdf& pdf, IFrame::pointer frame, std::string name, double
 int main(int argc, char* argv[])
 {
     PluginManager& pm = PluginManager::instance();
+    auto aux_pi = pm.add("WireCellAux");
+    assert(aux_pi);
     pm.add("WireCellGen");
     pm.add("WireCellRoot");
 
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
+
     int nsamples = 50;
     double gain, shaping, tick;
     {
@@ -140,9 +146,9 @@ int main(int argc, char* argv[])
     auto resp = ce.generate(Binning(200, 0, 200 * tick));
     auto resp2 = ce.generate(Binning(400, 0, 400 * tick));
     auto resp3 = ce.generate(Binning(50, 0, 50 * tick));
-    auto resp_spec = Waveform::dft(resp);
-    auto resp_spec2 = Waveform::dft(resp2);
-    auto resp_spec3 = Waveform::dft(resp3);
+    auto resp_spec = Aux::fwd_r2c(idft, resp);
+    auto resp_spec2 = Aux::fwd_r2c(idft, resp2);
+    auto resp_spec3 = Aux::fwd_r2c(idft, resp3);
 
     ITrace::vector q_traces;
     ITrace::vector out_traces;
@@ -163,10 +169,10 @@ int main(int argc, char* argv[])
         q_traces.push_back(std::make_shared<SimpleTrace>(qchannel++, 0, q3));
         q_traces.push_back(std::make_shared<SimpleTrace>(qchannel++, 0, q4));
 
-        auto e1 = linear_convolve(q1, resp);
-        auto e2 = linear_convolve(q2, resp);
-        auto e3 = linear_convolve(q3, resp);
-        auto e4 = linear_convolve(q4, resp);
+        auto e1 = Aux::convolve(idft, q1, resp);
+        auto e2 = Aux::convolve(idft, q2, resp);
+        auto e3 = Aux::convolve(idft, q3, resp);
+        auto e4 = Aux::convolve(idft, q4, resp);
 
         out_traces.push_back(std::make_shared<SimpleTrace>(channel++, 0, e1));
         out_traces.push_back(std::make_shared<SimpleTrace>(channel++, 0, e2));
diff --git a/root/test/test_rcresponse.cxx b/root/test/test_rcresponse.cxx
index fb6f63127..1e65c08a9 100644
--- a/root/test/test_rcresponse.cxx
+++ b/root/test/test_rcresponse.cxx
@@ -1,6 +1,11 @@
 // Test RCResponse
+
 #include "MultiPdf.h"  // local helper shared by a few tests
 
+#include "WireCellAux/DftTools.h"
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/PluginManager.h"
+
 #include "WireCellUtil/Units.h"
 #include "WireCellUtil/Waveform.h"
 #include "WireCellGen/RCResponse.h"
@@ -12,6 +17,9 @@ using namespace WireCell;
 
 int main(int argc, char* argv[])
 {
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
     Test::MultiPdf mpdf(argv[0]);
 
     const double tick = 0.5*units::us;
@@ -28,7 +36,7 @@ int main(int argc, char* argv[])
     const auto& wavep1 = rcr.waveform_samples();
     // skip first which holds delta
     Waveform::realseq_t wave(wavep1.begin()+1, wavep1.end());
-    auto spec = Waveform::dft(wave);
+    auto spec = Aux::fwd_r2c(idft, wave);
     auto mag = Waveform::magnitude(spec);
 
     TGraph* g = new TGraph(wave.size());
diff --git a/sig/inc/WireCellSig/Decon2DFilter.h b/sig/inc/WireCellSig/Decon2DFilter.h
index 45d59a423..746f20491 100644
--- a/sig/inc/WireCellSig/Decon2DFilter.h
+++ b/sig/inc/WireCellSig/Decon2DFilter.h
@@ -6,6 +6,8 @@
 
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/ITensorSetFilter.h"
+#include "WireCellIface/IDFT.h"
+
 #include "WireCellUtil/Logging.h"
 
 namespace WireCell {
@@ -25,8 +27,9 @@ namespace WireCell {
            private:
             Log::logptr_t log;
             Configuration m_cfg;  /// copy of configuration
+            IDFT::pointer m_dft;
         };
     }  // namespace Sig
 }  // namespace WireCell
 
-#endif  // WIRECELLSIG_DECON2DFILTER
\ No newline at end of file
+#endif  // WIRECELLSIG_DECON2DFILTER
diff --git a/sig/inc/WireCellSig/Decon2DResponse.h b/sig/inc/WireCellSig/Decon2DResponse.h
index 8e741f60d..f4cccce60 100644
--- a/sig/inc/WireCellSig/Decon2DResponse.h
+++ b/sig/inc/WireCellSig/Decon2DResponse.h
@@ -9,6 +9,8 @@
 #include "WireCellIface/IAnodePlane.h"
 #include "WireCellIface/IChannelResponse.h"
 #include "WireCellIface/IFieldResponse.h"
+#include "WireCellIface/IDFT.h"
+
 #include "WireCellUtil/Logging.h"
 
 namespace WireCell {
@@ -37,8 +39,10 @@ namespace WireCell {
             IChannelResponse::pointer m_cresp;
 
             IFieldResponse::pointer m_fresp;
+
+            IDFT::pointer m_dft;
         };
     }  // namespace Sig
 }  // namespace WireCell
 
-#endif  // WIRECELLSIG_DECON2DRESPONSE
\ No newline at end of file
+#endif  // WIRECELLSIG_DECON2DRESPONSE
diff --git a/sig/src/Decon2DFilter.cxx b/sig/src/Decon2DFilter.cxx
index c3e23b833..5529446ff 100644
--- a/sig/src/Decon2DFilter.cxx
+++ b/sig/src/Decon2DFilter.cxx
@@ -1,6 +1,15 @@
 #include "WireCellSig/Decon2DFilter.h"
 #include "WireCellSig/Util.h"
 
+#include "WireCellAux/SimpleTensorSet.h"
+#include "WireCellAux/SimpleTensor.h"
+#include "WireCellAux/Util.h"
+#include "WireCellAux/TensUtil.h"
+#include "WireCellAux/DftTools.h"
+
+#include "WireCellIface/ITensorSet.h"
+#include "WireCellIface/IFilterWaveform.h"
+
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/String.h"
 #include "WireCellUtil/Array.h"
@@ -8,14 +17,6 @@
 #include "WireCellUtil/FFTBestLength.h"
 #include "WireCellUtil/Exceptions.h"
 
-#include "WireCellIface/ITensorSet.h"
-#include "WireCellIface/IFilterWaveform.h"
-
-#include "WireCellAux/SimpleTensorSet.h"
-#include "WireCellAux/SimpleTensor.h"
-#include "WireCellAux/Util.h"
-#include "WireCellAux/TensUtil.h"
-
 WIRECELL_FACTORY(Decon2DFilter, WireCell::Sig::Decon2DFilter, WireCell::ITensorSetFilter, WireCell::IConfigurable)
 
 using namespace WireCell;
@@ -28,11 +29,17 @@ Sig::Decon2DFilter::Decon2DFilter()
 Configuration Sig::Decon2DFilter::default_configuration() const
 {
     Configuration cfg;
-
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     return cfg;
 }
 
-void Sig::Decon2DFilter::configure(const WireCell::Configuration &cfg) { m_cfg = cfg; }
+void Sig::Decon2DFilter::configure(const WireCell::Configuration &cfg)
+{
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
+    m_cfg = cfg;
+}
 
 bool Sig::Decon2DFilter::operator()(const ITensorSet::pointer &in, ITensorSet::pointer &out)
 {
@@ -111,7 +118,9 @@ bool Sig::Decon2DFilter::operator()(const ITensorSet::pointer &in, ITensorSet::p
     }
 
     // do the second round of inverse FFT on wire
-    Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
+
     Array::array_xxf r_data = tm_r_data.block(m_pad_nwires, 0, m_nwires, m_nticks);
     Sig::restore_baseline(r_data);
 
@@ -162,4 +171,4 @@ bool Sig::Decon2DFilter::operator()(const ITensorSet::pointer &in, ITensorSet::p
     log->debug("Decon2DFilter: end");
 
     return true;
-}
\ No newline at end of file
+}
diff --git a/sig/src/Decon2DResponse.cxx b/sig/src/Decon2DResponse.cxx
index 7b3fd8f4a..7fc52bd89 100644
--- a/sig/src/Decon2DResponse.cxx
+++ b/sig/src/Decon2DResponse.cxx
@@ -1,5 +1,14 @@
 #include "WireCellSig/Decon2DResponse.h"
 
+#include "WireCellAux/SimpleTensorSet.h"
+#include "WireCellAux/SimpleTensor.h"
+#include "WireCellAux/Util.h"
+#include "WireCellAux/TensUtil.h"
+#include "WireCellAux/DftTools.h"
+
+#include "WireCellIface/ITensorSet.h"
+#include "WireCellIface/IFilterWaveform.h"
+
 #include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/String.h"
 #include "WireCellUtil/Array.h"
@@ -7,13 +16,6 @@
 #include "WireCellUtil/FFTBestLength.h"
 #include "WireCellUtil/Exceptions.h"
 
-#include "WireCellIface/ITensorSet.h"
-#include "WireCellIface/IFilterWaveform.h"
-
-#include "WireCellAux/SimpleTensorSet.h"
-#include "WireCellAux/SimpleTensor.h"
-#include "WireCellAux/Util.h"
-#include "WireCellAux/TensUtil.h"
 
 WIRECELL_FACTORY(Decon2DResponse, WireCell::Sig::Decon2DResponse, WireCell::ITensorSetFilter, WireCell::IConfigurable)
 
@@ -27,7 +29,7 @@ Sig::Decon2DResponse::Decon2DResponse()
 Configuration Sig::Decon2DResponse::default_configuration() const
 {
     Configuration cfg;
-
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     return cfg;
 }
 
@@ -56,6 +58,9 @@ void Sig::Decon2DResponse::configure(const WireCell::Configuration &cfg)
     if (!m_fresp) {
         THROW(ValueError() << errmsg{"Sig::Decon2DResponse::configure !m_fresp"});
     }
+
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
 }
 
 namespace {
@@ -121,7 +126,8 @@ std::vector<Waveform::realseq_t> Sig::Decon2DResponse::init_overall_response(con
     Response::ColdElec ce(m_gain, m_shaping_time);
     auto ewave = ce.generate(tbins);
     Waveform::scale(ewave, m_inter_gain * m_ADC_mV * (-1));
-    elec = Waveform::dft(ewave);
+    // elec = Waveform::dft(ewave);
+    elec = Aux::fwd_r2c(m_dft, ewave);
 
     std::complex<float> fine_period(fravg.period, 0);
 
@@ -144,7 +150,10 @@ std::vector<Waveform::realseq_t> Sig::Decon2DResponse::init_overall_response(con
     auto arr = Response::as_array(fravg.planes[iplane], fine_nwires, fine_nticks);
 
     // do FFT for response ...
-    Array::array_xxc c_data = Array::dft_rc(arr, 0);
+    // Array::array_xxc c_data = Array::dft_rc(arr, 0);
+    Array::array_xxc c_data = arr.cast<IDFT::complex_t>();
+    c_data = Aux::fwd(m_dft, c_data, 1);
+
     int nrows = c_data.rows();
     int ncols = c_data.cols();
 
@@ -154,7 +163,8 @@ std::vector<Waveform::realseq_t> Sig::Decon2DResponse::init_overall_response(con
         }
     }
 
-    arr = Array::idft_cr(c_data, 0);
+    // arr = Array::idft_cr(c_data, 0);
+    arr = Aux::inv(m_dft, c_data, 1).real();
 
     // figure out how to do fine ... shift (good ...)
     int fine_time_shift = m_fine_time_offset / fravg.period;
@@ -262,7 +272,9 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
     log->debug("r_data: {} {}", r_data.rows(), r_data.cols());
 
     // first round of FFT on time
-    auto c_data = Array::dft_rc(r_data, 0);
+    // auto c_data = Array::dft_rc(r_data, 0);
+    WireCell::Array::array_xxc c_data = r_data.cast<IDFT::complex_t>();
+    c_data = Aux::fwd(m_dft, c_data, 1);
 
     if (m_cresp) {
         log->debug("Decon2DResponse: applying ch-by-ch electronics response correction");
@@ -275,12 +287,14 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
         Response::ColdElec ce(m_gain, m_shaping_time);
 
         const auto ewave = ce.generate(tbins);
-        const WireCell::Waveform::compseq_t elec = Waveform::dft(ewave);
+        // const WireCell::Waveform::compseq_t elec = Waveform::dft(ewave);
+        const WireCell::Waveform::compseq_t elec = Aux::fwd_r2c(m_dft, ewave);
 
         for (int irow = 0; irow != c_data.rows(); irow++) {
             Waveform::realseq_t tch_resp = m_cresp->channel_response(ch_arr[irow]);
             tch_resp.resize(m_fft_nticks, 0);
-            const WireCell::Waveform::compseq_t ch_elec = Waveform::dft(tch_resp);
+            // const WireCell::Waveform::compseq_t ch_elec = Waveform::dft(tch_resp);
+            const WireCell::Waveform::compseq_t ch_elec = Aux::fwd_r2c(m_dft, tch_resp);
 
             // FIXME figure this out
             // const int irow = och.wire + m_pad_nwires;
@@ -298,7 +312,8 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
     log->trace("TRACE {}", __LINE__);
 
     // second round of FFT on wire
-    c_data = Array::dft_cc(c_data, 1);
+    // c_data = Array::dft_cc(c_data, 1);
+    c_data = Aux::fwd(m_dft, c_data, 0);
 
     // response part ...
     Array::array_xxf r_resp = Array::array_xxf::Zero(r_data.rows(), m_fft_nticks);
@@ -310,9 +325,12 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
     log->trace("TRACE {}", __LINE__);
 
     // do first round FFT on the resposne on time
-    Array::array_xxc c_resp = Array::dft_rc(r_resp, 0);
+    //Array::array_xxc c_resp = Array::dft_rc(r_resp, 0);
     // do second round FFT on the response on wire
-    c_resp = Array::dft_cc(c_resp, 1);
+    //c_resp = Array::dft_cc(c_resp, 1);
+
+    Array::array_xxc c_resp = r_resp.cast<IDFT::complex_t>();
+    c_resp = Aux::fwd(m_dft, c_resp);
 
     // make ratio to the response and apply wire filter
     c_data = c_data / c_resp;
@@ -337,10 +355,11 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
     log->trace("TRACE {}", __LINE__);
 
     // do the first round of inverse FFT on wire
-    c_data = Array::idft_cc(c_data, 1);
-
+    // c_data = Array::idft_cc(c_data, 1);
     // do the second round of inverse FFT on time
-    r_data = Array::idft_cr(c_data, 0);
+    // r_data = Array::idft_cr(c_data, 0);
+    c_data = Aux::inv(m_dft, c_data);
+    r_data = c_data.real();
 
     // do the shift in wire
     const int nrows = r_data.rows();
@@ -364,7 +383,9 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
         r_data.block(0, 0, nrows, time_shift) = arr2;
         r_data.block(0, time_shift, nrows, ncols - time_shift) = arr1;
     }
-    c_data = Array::dft_rc(r_data, 0);
+    // c_data = Array::dft_rc(r_data, 0);
+    c_data = Aux::fwd(m_dft, r_data.cast<IDFT::complex_t>(), 1);
+
     log->trace("TRACE {}", __LINE__);
 
     // Eigen to TensorSet
@@ -398,4 +419,4 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
     log->debug("Decon2DResponse: end");
 
     return true;
-}
\ No newline at end of file
+}
diff --git a/sigproc/inc/WireCellSigProc/L1SPFilter.h b/sigproc/inc/WireCellSigProc/L1SPFilter.h
index bedaf7823..4ebe78751 100644
--- a/sigproc/inc/WireCellSigProc/L1SPFilter.h
+++ b/sigproc/inc/WireCellSigProc/L1SPFilter.h
@@ -8,9 +8,11 @@
 
 #include "WireCellIface/IFrameFilter.h"
 #include "WireCellIface/IConfigurable.h"
+#include "WireCellIface/IDFT.h"
 
-#include "WireCellUtil/Interpolate.h"
 #include "WireCellIface/SimpleTrace.h"
+#include "WireCellUtil/Interpolate.h"
+
 
 namespace WireCell {
     namespace SigProc {
@@ -38,6 +40,7 @@ namespace WireCell {
 
            private:
             Configuration m_cfg;
+            IDFT::pointer m_dft;
 
             double m_gain;
             double m_shaping;
diff --git a/sigproc/inc/WireCellSigProc/Microboone.h b/sigproc/inc/WireCellSigProc/Microboone.h
index 8e286870b..a15b1d067 100644
--- a/sigproc/inc/WireCellSigProc/Microboone.h
+++ b/sigproc/inc/WireCellSigProc/Microboone.h
@@ -4,14 +4,16 @@
 #ifndef WIRECELLSIGPROC_MICROBOONE
 #define WIRECELLSIGPROC_MICROBOONE
 
-#include "WireCellUtil/Waveform.h"
-#include "WireCellUtil/Bits.h"
+#include "WireCellSigProc/Diagnostics.h"
+
 #include "WireCellIface/IChannelFilter.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IChannelNoiseDatabase.h"
 #include "WireCellIface/IAnodePlane.h"
+#include "WireCellIface/IDFT.h"
 
-#include "WireCellSigProc/Diagnostics.h"
+#include "WireCellUtil/Waveform.h"
+#include "WireCellUtil/Bits.h"
 
 namespace WireCell {
     namespace SigProc {
@@ -26,14 +28,18 @@ namespace WireCell {
             bool NoisyFilterAlg(WireCell::Waveform::realseq_t& spec, float min_rms, float max_rms);
 
             std::vector<std::vector<int> > SignalProtection(WireCell::Waveform::realseq_t& sig,
-                                                            const WireCell::Waveform::compseq_t& respec, int res_offset,
+                                                            const WireCell::Waveform::compseq_t& respec,
+                                                            const IDFT::pointer& dft,
+                                                            int res_offset,
                                                             int pad_f, int pad_b, float upper_decon_limit = 0.02,
                                                             float decon_lf_cutoff = 0.08, float upper_adc_limit = 15,
                                                             float protection_factor = 5.0, float min_adc_limit = 50);
             bool Subtract_WScaling(WireCell::IChannelFilter::channel_signals_t& chansig,
                                    const WireCell::Waveform::realseq_t& medians,
                                    const WireCell::Waveform::compseq_t& respec, int res_offset,
-                                   std::vector<std::vector<int> >& rois, float upper_decon_limit1 = 0.08,
+                                   std::vector<std::vector<int> >& rois,
+                                   const IDFT::pointer& dft,
+                                   float upper_decon_limit1 = 0.08,
                                    float roi_min_max_ratio = 0.8, float rms_threshold = 0.);
 
             // hold common config stuff
@@ -54,6 +60,7 @@ namespace WireCell {
                 std::string m_anode_tn, m_noisedb_tn;
                 IAnodePlane::pointer m_anode;
                 IChannelNoiseDatabase::pointer m_noisedb;
+                IDFT::pointer m_dft;
             };
 
             /** Microboone style coherent noise subtraction.
@@ -135,6 +142,7 @@ namespace WireCell {
                private:
                 std::string m_anode_tn;
                 IAnodePlane::pointer m_anode;
+                IDFT::pointer m_dft;
                 double m_threshold;
                 int m_window;
                 int m_nbins;
diff --git a/sigproc/inc/WireCellSigProc/OmniChannelNoiseDB.h b/sigproc/inc/WireCellSigProc/OmniChannelNoiseDB.h
index 38154a367..bec3bbc4a 100644
--- a/sigproc/inc/WireCellSigProc/OmniChannelNoiseDB.h
+++ b/sigproc/inc/WireCellSigProc/OmniChannelNoiseDB.h
@@ -4,6 +4,7 @@
 #include "WireCellIface/IChannelNoiseDatabase.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IAnodePlane.h"
+#include "WireCellIface/IDFT.h"
 #include "WireCellIface/IFieldResponse.h"
 #include "WireCellIface/WirePlaneId.h"
 
@@ -167,6 +168,7 @@ namespace WireCell {
             std::unordered_map<int, shared_filter_t> m_response_cache;
 
             Log::logptr_t log;
+            IDFT::pointer m_dft;
         };
     }  // namespace SigProc
 
diff --git a/sigproc/inc/WireCellSigProc/OmnibusSigProc.h b/sigproc/inc/WireCellSigProc/OmnibusSigProc.h
index 4c597621b..34a40f2cd 100644
--- a/sigproc/inc/WireCellSigProc/OmnibusSigProc.h
+++ b/sigproc/inc/WireCellSigProc/OmnibusSigProc.h
@@ -1,13 +1,17 @@
 #ifndef WIRECELLSIGPROC_OMNIBUSSIGPROC
 #define WIRECELLSIGPROC_OMNIBUSSIGPROC
 
+#include "WireCellAux/Logger.h"
+
 #include "WireCellIface/IFrameFilter.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IAnodePlane.h"
+#include "WireCellIface/IDFT.h"
 #include "WireCellIface/IWaveform.h"
+
 #include "WireCellUtil/Waveform.h"
 #include "WireCellUtil/Array.h"
-#include "WireCellAux/Logger.h"
+
 
 #include <list>
 
@@ -230,6 +234,7 @@ namespace WireCell {
 
             size_t m_count{0};
 
+            IDFT::pointer m_dft;
         };
     }  // namespace SigProc
 }  // namespace WireCell
@@ -237,5 +242,5 @@ namespace WireCell {
 #endif
 // Local Variables:
 // mode: c++
-// c-basic-offset: 2
+// c-basic-offset: 4
 // End:
diff --git a/sigproc/inc/WireCellSigProc/Protodune.h b/sigproc/inc/WireCellSigProc/Protodune.h
index fbb607e00..f83f7b06b 100644
--- a/sigproc/inc/WireCellSigProc/Protodune.h
+++ b/sigproc/inc/WireCellSigProc/Protodune.h
@@ -5,14 +5,16 @@
 #ifndef WIRECELLSIGPROC_PROTODUNE
 #define WIRECELLSIGPROC_PROTODUNE
 
-#include "WireCellUtil/Waveform.h"
-#include "WireCellUtil/Bits.h"
+#include "WireCellSigProc/Diagnostics.h"
+
 #include "WireCellIface/IChannelFilter.h"
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IChannelNoiseDatabase.h"
 #include "WireCellIface/IAnodePlane.h"
+#include "WireCellIface/IDFT.h"
 
-#include "WireCellSigProc/Diagnostics.h"
+#include "WireCellUtil/Waveform.h"
+#include "WireCellUtil/Bits.h"
 
 namespace WireCell {
     namespace SigProc {
@@ -20,10 +22,13 @@ namespace WireCell {
 
             bool LinearInterpSticky(WireCell::Waveform::realseq_t& signal, std::vector<std::pair<int, int> >& st_ranges,
                                     float stky_sig_like_val, float stky_sig_like_rms);
-            bool FftInterpSticky(WireCell::Waveform::realseq_t& signal, std::vector<std::pair<int, int> >& st_ranges);
-            bool FftShiftSticky(WireCell::Waveform::realseq_t& signal, double toffset,
+            bool FftInterpSticky(const IDFT::pointer& dft,
+                                 WireCell::Waveform::realseq_t& signal, std::vector<std::pair<int, int> >& st_ranges);
+            bool FftShiftSticky(const IDFT::pointer& dft,
+                                WireCell::Waveform::realseq_t& signal, double toffset,
                                 std::vector<std::pair<int, int> >& st_ranges);
-            bool FftScaling(WireCell::Waveform::realseq_t& signal, int nsamples);
+            bool FftScaling(const IDFT::pointer& dft,
+                            WireCell::Waveform::realseq_t& signal, int nsamples);
 
             // hold common config stuff
             class ConfigFilterBase : public WireCell::IConfigurable {
@@ -43,6 +48,7 @@ namespace WireCell {
                 std::string m_anode_tn, m_noisedb_tn;
                 IAnodePlane::pointer m_anode;
                 IChannelNoiseDatabase::pointer m_noisedb;
+                IDFT::pointer m_dft;
             };
 
             /** Microboone/ProtoDUNE style noise subtraction.
@@ -77,6 +83,7 @@ namespace WireCell {
                 std::string m_anode_tn, m_noisedb_tn;
                 IAnodePlane::pointer m_anode;
                 IChannelNoiseDatabase::pointer m_noisedb;
+                IDFT::pointer m_dft;
 
                 std::map<int, std::vector<short int> > m_extra_stky;  // ch to extra sticky codes
                 float m_stky_sig_like_val;
diff --git a/sigproc/inc/WireCellSigProc/SimpleChannelNoiseDB.h b/sigproc/inc/WireCellSigProc/SimpleChannelNoiseDB.h
index ae75db9e3..5efef1834 100644
--- a/sigproc/inc/WireCellSigProc/SimpleChannelNoiseDB.h
+++ b/sigproc/inc/WireCellSigProc/SimpleChannelNoiseDB.h
@@ -2,6 +2,8 @@
 #define WIRECELLSIGPROC_SIMPLECHANNELNOISEDB
 
 #include "WireCellIface/IChannelNoiseDatabase.h"
+#include "WireCellIface/IConfigurable.h"
+#include "WireCellIface/IDFT.h"
 
 #include "WireCellUtil/Waveform.h"
 #include "WireCellUtil/Units.h"
@@ -14,7 +16,8 @@
 namespace WireCell {
     namespace SigProc {
 
-        class SimpleChannelNoiseDB : public WireCell::IChannelNoiseDatabase {
+        class SimpleChannelNoiseDB : public WireCell::IConfigurable, 
+                                     public WireCell::IChannelNoiseDatabase {
            public:
             /// Create a simple channel noise DB for digitized waveforms
             /// with the given size and number of samples.  Default is for
@@ -22,6 +25,10 @@ namespace WireCell {
             SimpleChannelNoiseDB(double tick = 0.5 * units::us, int nsamples = 9600);
             virtual ~SimpleChannelNoiseDB();
 
+            /// IConfigurable
+            virtual void configure(const WireCell::Configuration& config);
+            virtual WireCell::Configuration default_configuration() const;
+
             // IChannelNoiseDatabase
             virtual double sample_time() const { return m_tick; }
 
@@ -143,6 +150,8 @@ namespace WireCell {
 
             std::vector<channel_group_t> m_channel_groups;
             channel_group_t m_bad_channels;
+
+            IDFT::pointer m_dft;
         };
     }  // namespace SigProc
 
diff --git a/sigproc/src/L1SPFilter.cxx b/sigproc/src/L1SPFilter.cxx
index a021d7c2a..89bd736af 100644
--- a/sigproc/src/L1SPFilter.cxx
+++ b/sigproc/src/L1SPFilter.cxx
@@ -1,13 +1,16 @@
 #include "WireCellSigProc/L1SPFilter.h"
 
+#include "WireCellAux/DftTools.h"
+#include "WireCellAux/FrameTools.h"
+
 #include "WireCellIface/SimpleFrame.h"
 #include "WireCellIface/IFieldResponse.h"
 
-#include "WireCellUtil/NamedFactory.h"
-#include "WireCellAux/FrameTools.h"
-
 #include "WireCellRess/LassoModel.h"
 #include "WireCellRess/ElasticNetModel.h"
+
+#include "WireCellUtil/NamedFactory.h"
+
 #include <Eigen/Dense>
 
 #include <numeric>
@@ -54,7 +57,8 @@ void L1SPFilter::init_resp()
         Response::ColdElec ce(m_gain, m_shaping);
         auto ewave = ce.generate(tbins);
         Waveform::scale(ewave, m_postgain * m_ADC_mV * (-1));  // ADC to electron ...
-        elec = Waveform::dft(ewave);
+        //elec = Waveform::dft(ewave);
+        elec = Aux::fwd_r2c(m_dft, ewave); 
 
         std::complex<float> fine_period(fravg.period, 0);
 
@@ -62,8 +66,10 @@ void L1SPFilter::init_resp()
         WireCell::Waveform::realseq_t resp_V = fravg.planes[1].paths[0].current;
         WireCell::Waveform::realseq_t resp_W = fravg.planes[2].paths[0].current;
 
-        auto spectrum_V = WireCell::Waveform::dft(resp_V);
-        auto spectrum_W = WireCell::Waveform::dft(resp_W);
+        // auto spectrum_V = WireCell::Waveform::dft(resp_V);
+        auto spectrum_V = Aux::fwd_r2c(m_dft, resp_V);
+        // auto spectrum_W = WireCell::Waveform::dft(resp_W);
+        auto spectrum_W = Aux::fwd_r2c(m_dft, resp_W);
 
         WireCell::Waveform::scale(spectrum_V, elec);
         WireCell::Waveform::scale(spectrum_W, elec);
@@ -72,8 +78,10 @@ void L1SPFilter::init_resp()
         WireCell::Waveform::scale(spectrum_W, fine_period);
 
         // Now this response is ADC for 1 electron .
-        resp_V = WireCell::Waveform::idft(spectrum_V);
-        resp_W = WireCell::Waveform::idft(spectrum_W);
+        // resp_V = WireCell::Waveform::idft(spectrum_V);
+        resp_V = Aux::inv_c2r(m_dft, spectrum_V);
+        // resp_W = WireCell::Waveform::idft(spectrum_W);
+        resp_W = Aux::inv_c2r(m_dft, spectrum_W);
 
         // convolute with V and Y average responses ...
         double intrinsic_time_offset = fravg.origin / fravg.speed;
@@ -153,6 +161,8 @@ WireCell::Configuration L1SPFilter::default_configuration() const
     cfg["fine_time_offset"] = m_fine_time_offset;
     cfg["coarse_time_offset"] = m_coarse_time_offset;
 
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
+
     return cfg;
 }
 
@@ -167,6 +177,9 @@ void L1SPFilter::configure(const WireCell::Configuration& cfg)
 
     m_fine_time_offset = get(cfg, "fine_time_offset", m_fine_time_offset);
     m_coarse_time_offset = get(cfg, "coarse_time_offset", m_coarse_time_offset);
+
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
 }
 
 bool L1SPFilter::operator()(const input_pointer& in, output_pointer& out)
@@ -197,19 +210,6 @@ bool L1SPFilter::operator()(const input_pointer& in, output_pointer& out)
     // l1_col_scale << " " << l1_ind_scale << std::endl;
     init_resp();
 
-    // std::cout << (*lin_V)(0*units::us) << " " << (*lin_W)(0*units::us) << std::endl;
-    // std::cout << (*lin_V)(1*units::us) << " " << (*lin_W)(1*units::us) << std::endl;
-    //    for (size_t i=0; i!=resp_V.size(); i++){
-    // std::cout << (i*fravg.period - intrinsic_time_offset - m_coarse_time_offset + m_fine_time_offset)/units::us << "
-    // " << resp_V.at(i) << " " << resp_W.at(i) << " " << ewave.at(i) << std::endl;
-    //}
-    // std::complex<float> fine_period(fravg.period,0);
-    // int fine_nticks = Response::as_array(fravg.planes[0]).cols();
-    //    Waveform::realseq_t ftbins(fine_nticks);
-    // for (int i=0;i!=fine_nticks;i++){
-    //  ftbins.at(i) = i * fravg.period;
-    //}
-
     auto adctraces = Aux::tagged_traces(in, adctag);
     auto sigtraces = Aux::tagged_traces(in, sigtag);
 
diff --git a/sigproc/src/Microboone.cxx b/sigproc/src/Microboone.cxx
index 52c45add5..3d44db947 100644
--- a/sigproc/src/Microboone.cxx
+++ b/sigproc/src/Microboone.cxx
@@ -5,6 +5,8 @@
 #include "WireCellSigProc/Microboone.h"
 #include "WireCellSigProc/Derivations.h"
 
+#include "WireCellAux/DftTools.h"
+
 #include "WireCellUtil/NamedFactory.h"
 
 #include <cmath>
@@ -48,7 +50,9 @@ double filter_low_loose(double freq) { return 1 - exp(-pow(freq / 0.005, 2)); }
 bool Microboone::Subtract_WScaling(WireCell::IChannelFilter::channel_signals_t& chansig,
                                    const WireCell::Waveform::realseq_t& medians,
                                    const WireCell::Waveform::compseq_t& respec, int res_offset,
-                                   std::vector<std::vector<int> >& rois, float decon_limit1, float roi_min_max_ratio,
+                                   std::vector<std::vector<int> >& rois,
+                                   const IDFT::pointer& dft,
+                                   float decon_limit1, float roi_min_max_ratio,
                                    float rms_threshold)
 {
     double ave_coef = 0;
@@ -134,7 +138,8 @@ bool Microboone::Subtract_WScaling(WireCell::IChannelFilter::channel_signals_t&
             }
 
             // do the deconvolution with a very loose low-frequency filter
-            WireCell::Waveform::compseq_t signal_roi_freq = WireCell::Waveform::dft(signal_roi);
+            // WireCell::Waveform::compseq_t signal_roi_freq = WireCell::Waveform::dft(signal_roi);
+            WireCell::Waveform::compseq_t signal_roi_freq = Aux::fwd_r2c(dft, signal_roi);
             WireCell::Waveform::shrink(signal_roi_freq, respec);
             for (size_t i = 0; i != signal_roi_freq.size(); i++) {
                 double freq;
@@ -148,7 +153,8 @@ bool Microboone::Subtract_WScaling(WireCell::IChannelFilter::channel_signals_t&
                 std::complex<float> factor = filter_time(freq) * filter_low_loose(freq);
                 signal_roi_freq.at(i) = signal_roi_freq.at(i) * factor;
             }
-            WireCell::Waveform::realseq_t signal_roi_decon = WireCell::Waveform::idft(signal_roi_freq);
+            // WireCell::Waveform::realseq_t signal_roi_decon = WireCell::Waveform::idft(signal_roi_freq);
+            WireCell::Waveform::realseq_t signal_roi_decon = Aux::inv_c2r(dft, signal_roi_freq);
 
             if (rms_threshold) {
                 std::pair<double, double> temp = Derivations::CalcRMS(signal_roi_decon);
@@ -267,7 +273,9 @@ bool Microboone::Subtract_WScaling(WireCell::IChannelFilter::channel_signals_t&
 }
 
 std::vector<std::vector<int> > Microboone::SignalProtection(WireCell::Waveform::realseq_t& medians,
-                                                            const WireCell::Waveform::compseq_t& respec, int res_offset,
+                                                            const WireCell::Waveform::compseq_t& respec,
+                                                            const IDFT::pointer& dft,
+                                                            int res_offset,
                                                             int pad_f, int pad_b, float upper_decon_limit,
                                                             float decon_lf_cutoff, float upper_adc_limit,
                                                             float protection_factor, float min_adc_limit)
@@ -342,7 +350,8 @@ std::vector<std::vector<int> > Microboone::SignalProtection(WireCell::Waveform::
     if (respec.size() > 0 && (respec.at(0).real() != 1 || respec.at(0).imag() != 0) && res_offset != 0) {
         // std::cout << nbin << std::endl;
 
-        WireCell::Waveform::compseq_t medians_freq = WireCell::Waveform::dft(medians);
+        // WireCell::Waveform::compseq_t medians_freq = WireCell::Waveform::dft(medians);
+        WireCell::Waveform::compseq_t medians_freq = Aux::fwd_r2c(dft, medians);
         WireCell::Waveform::shrink(medians_freq, respec);
 
         for (size_t i = 0; i != medians_freq.size(); i++) {
@@ -357,7 +366,8 @@ std::vector<std::vector<int> > Microboone::SignalProtection(WireCell::Waveform::
             std::complex<float> factor = filter_time(freq) * filter_low(freq, decon_lf_cutoff);
             medians_freq.at(i) = medians_freq.at(i) * factor;
         }
-        WireCell::Waveform::realseq_t medians_decon = WireCell::Waveform::idft(medians_freq);
+        // WireCell::Waveform::realseq_t medians_decon = WireCell::Waveform::idft(medians_freq);
+        WireCell::Waveform::realseq_t medians_decon = Aux::inv_c2r(dft, medians_freq);
 
         temp = Derivations::CalcRMS(medians_decon);
         mean = temp.first;
@@ -394,58 +404,6 @@ std::vector<std::vector<int> > Microboone::SignalProtection(WireCell::Waveform::
                 }
             }
         }
-
-        // // second-level decon ...
-        // medians_freq = WireCell::Waveform::dft(medians);
-        // WireCell::Waveform::realseq_t  respec_time = WireCell::Waveform::idft(respec);
-        // for (size_t i=0;i!=respec_time.size();i++){
-        //     if (respec_time.at(i)<0) respec_time.at(i) = 0;
-        // }
-        // WireCell::Waveform::compseq_t respec_freq = WireCell::Waveform::dft(respec_time);
-        // WireCell::Waveform::shrink(medians_freq,respec_freq);
-        // for (size_t i=0;i!=medians_freq.size();i++){
-        //     double freq;
-        //     // assuming 2 MHz digitization
-        //     if (i <medians_freq.size()/2.){
-        // 	freq = i/(1.*medians_freq.size())*2.;
-        //     }else{
-        // 	freq = (medians_freq.size() - i)/(1.*medians_freq.size())*2.;
-        //     }
-        //     std::complex<float> factor = filter_time(freq)*filter_low(freq, decon_lf_cutoff);
-        //     medians_freq.at(i) = medians_freq.at(i) * factor;
-        // }
-        // medians_decon = WireCell::Waveform::idft(medians_freq);
-
-        // temp = Derivations::CalcRMS(medians_decon);
-        // mean = temp.first;
-        // rms = temp.second;
-
-        // //	if (protection_factor*rms > upper_decon_limit){
-        // limit = protection_factor*rms;
-        // // }else{
-        // //     limit = upper_decon_limit;
-        // // }
-
-        // for (int j=0;j!=nbin;j++) {
-        //     float content = medians_decon.at(j);
-        //     if ((content-mean)>limit){
-        // 	int time_bin = j + res_offset;
-        // 	if (time_bin >= nbin) time_bin -= nbin;
-        // 	//	medians.at(time_bin) = 0;
-        // 	signalsBool.at(time_bin) = true;
-        // 	// add the front and back padding
-        // 	for (int k=0;k!=pad_b;k++){
-        // 	    int bin = time_bin+k+1;
-        // 	    if (bin > nbin-1) bin = nbin-1;
-        // 	    signalsBool.at(bin) = true;
-        // 	}
-        // 	for (int k=0;k!=pad_f;k++){
-        // 	    int bin = time_bin-k-1;
-        // 	    if (bin <0) { bin = 0; }
-        // 	    signalsBool.at(bin) = true;
-        // 	}
-        //     }
-        // }
     }
 
     // {
@@ -483,75 +441,6 @@ std::vector<std::vector<int> > Microboone::SignalProtection(WireCell::Waveform::
         }
     }
 
-    //     // use ROI to get a new waveform
-    //     WireCell::Waveform::realseq_t medians_roi(nbin,0);
-    //     for (auto roi: rois){
-    // 	const int bin0 = std::max(roi.front()-1, 0);
-    // 	const int binf = std::min(roi.back()+1, nbin-1);
-    // 	const double m0 = medians[bin0];
-    // 	const double mf = medians[binf];
-    // 	const double roi_run = binf - bin0;
-    // 	const double roi_rise = mf - m0;
-    // 	for (auto bin : roi) {
-    // 	    const double m = m0 + (bin - bin0)/roi_run*roi_rise;
-    // 	    medians_roi.at(bin) = medians.at(bin) - m;
-    // 	}
-    //     }
-    //     // do the deconvolution with a very loose low-frequency filter
-    //     WireCell::Waveform::compseq_t medians_roi_freq = WireCell::Waveform::dft(medians_roi);
-    //     WireCell::Waveform::shrink(medians_roi_freq,respec);
-    //     for (size_t i=0;i!=medians_roi_freq.size();i++){
-    // 	double freq;
-    // 	// assuming 2 MHz digitization
-    // 	if (i <medians_roi_freq.size()/2.){
-    // 	    freq = i/(1.*medians_roi_freq.size())*2.;
-    // 	}else{
-    // 	    freq = (medians_roi_freq.size() - i)/(1.*medians_roi_freq.size())*2.;
-    // 	}
-    // 	std::complex<float> factor = filter_time(freq)*filter_low_loose(freq);
-    // 	medians_roi_freq.at(i) = medians_roi_freq.at(i) * factor;
-    //     }
-    //     WireCell::Waveform::realseq_t medians_roi_decon = WireCell::Waveform::idft(medians_roi_freq);
-
-    //     // judge if a roi is good or not ...
-    //     //shift things back properly
-    //     for (auto roi: rois){
-    //     	const int bin0 = std::max(roi.front()-1, 0);
-    //     	const int binf = std::min(roi.back()+1, nbin-1);
-    //     	flag_replace[roi.front()] = false;
-
-    // 	double max_val = 0;
-    // 	double min_val = 0;
-    // 	// double max_adc_val=0;
-    // 	// double min_adc_val=0;
-
-    // 	for (int i=bin0; i<=binf; i++){
-    //     	    int time_bin = i-res_offset;
-    //     	    if (time_bin <0) time_bin += nbin;
-    // 	    if (time_bin >=nbin) time_bin -= nbin;
-
-    // 	    if (i==bin0){
-    // 		max_val = medians_roi_decon.at(time_bin);
-    // 		min_val = medians_roi_decon.at(time_bin);
-    // 		// max_adc_val = medians.at(i);
-    // 		// min_adc_val = medians.at(i);
-    // 	    }else{
-    // 		if (medians_roi_decon.at(time_bin) > max_val) max_val = medians_roi_decon.at(time_bin);
-    // 		if (medians_roi_decon.at(time_bin) < min_val) min_val = medians_roi_decon.at(time_bin);
-    // 		// if (medians.at(i) > max_adc_val) max_adc_val = medians.at(i);
-    // 		// if (medians.at(i) < min_adc_val) min_adc_val = medians.at(i);
-    // 	    }
-    //     	}
-
-    // 	//std::cout << "Xin: " << upper_decon_limit1 << std::endl;
-    // 	//	if ( max_val > upper_decon_limit1)
-    // 	//	if ( max_val > 0.04 && fabs(min_val) < 0.6*max_val)
-    // 	//if (max_val > 0.06 && fabs(min_val) < 0.6*max_val)
-    // 	if (max_val > 0.06)
-    // 	    flag_replace[roi.front()] = true;
-    //     }
-    // }
-
     // Replace medians for above regions with interpolation on values
     // just outside each region.
     for (auto roi : rois) {
@@ -885,6 +774,9 @@ void Microboone::ConfigFilterBase::configure(const WireCell::Configuration& cfg)
     m_anode = Factory::find_tn<IAnodePlane>(m_anode_tn);
     m_noisedb_tn = get(cfg, "noisedb", m_noisedb_tn);
     m_noisedb = Factory::find_tn<IChannelNoiseDatabase>(m_noisedb_tn);
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     // std::cerr << "ConfigFilterBase: \n" << cfg << "\n";
 }
 WireCell::Configuration Microboone::ConfigFilterBase::default_configuration() const
@@ -892,6 +784,7 @@ WireCell::Configuration Microboone::ConfigFilterBase::default_configuration() co
     Configuration cfg;
     cfg["anode"] = m_anode_tn;
     cfg["noisedb"] = m_noisedb_tn;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     return cfg;
 }
 
@@ -945,7 +838,8 @@ WireCell::Waveform::ChannelMaskMap Microboone::CoherentNoiseSub::apply(channel_s
 
     // do the signal protection and adaptive baseline
     std::vector<std::vector<int> > rois =
-        Microboone::SignalProtection(medians, respec, res_offset, pad_f, pad_b, decon_limit, decon_lf_cutoff, adc_limit,
+        Microboone::SignalProtection(medians, respec, m_dft,
+                                     res_offset, pad_f, pad_b, decon_limit, decon_lf_cutoff, adc_limit,
                                      protection_factor, min_adc_limit);
 
     // if (achannel == 3840){
@@ -959,7 +853,9 @@ WireCell::Waveform::ChannelMaskMap Microboone::CoherentNoiseSub::apply(channel_s
     // << medians.at(101) << std::endl;
 
     // calculate the scaling coefficient and subtract
-    Microboone::Subtract_WScaling(chansig, medians, respec, res_offset, rois, decon_limit1, roi_min_max_ratio,
+    Microboone::Subtract_WScaling(chansig, medians, respec, res_offset, rois, 
+                                  m_dft,
+                                  decon_limit1, roi_min_max_ratio,
                                   m_rms_threshold);
 
     // WireCell::IChannelFilter::signal_t& signal = chansig.begin()->second;
@@ -1045,7 +941,8 @@ WireCell::Waveform::ChannelMaskMap Microboone::OneChannelNoise::apply(int ch, si
         }
     }
 
-    auto spectrum = WireCell::Waveform::dft(signal);
+    // auto spectrum = WireCell::Waveform::dft(signal);
+    auto spectrum = Aux::fwd_r2c(m_dft, signal);
     // std::cerr << "OneChannelNoise: "<<ch<<" dft spectral sum="<<Waveform::sum(spectrum)<<"\n";
 
     bool is_partial = m_check_partial(spectrum);  // Xin's "IS_RC()"
@@ -1089,7 +986,8 @@ WireCell::Waveform::ChannelMaskMap Microboone::OneChannelNoise::apply(int ch, si
 
     // remove the DC component
     spectrum.front() = 0;
-    signal = WireCell::Waveform::idft(spectrum);
+    // signal = WireCell::Waveform::idft(spectrum);
+    signal = Aux::inv_c2r(m_dft, spectrum);
 
     // std::cerr << "OneChannelNoise: "<<ch<<" after dft: sigsum="<<Waveform::sum(signal)<<"\n";
 
@@ -1339,6 +1237,8 @@ void Microboone::OneChannelStatus::configure(const WireCell::Configuration& cfg)
     if (!m_anode) {
         THROW(KeyError() << errmsg{"failed to get IAnodePlane: " + m_anode_tn});
     }
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
     // std::cerr << "OneChannelStatus: \n" << cfg << "\n";
 }
 WireCell::Configuration Microboone::OneChannelStatus::default_configuration() const
@@ -1349,6 +1249,7 @@ WireCell::Configuration Microboone::OneChannelStatus::default_configuration() co
     cfg["Nbins"] = m_nbins;
     cfg["Cut"] = m_cut;
     cfg["anode"] = m_anode_tn;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     return cfg;
 }
 
@@ -1414,7 +1315,8 @@ bool Microboone::OneChannelStatus::ID_lf_noisy(signal_t& sig) const
     //     temp_sig.at(i)=i;
     // }
     // do FFT
-    Waveform::compseq_t sig_freq = Waveform::dft(temp_sig);
+    // Waveform::compseq_t sig_freq = Waveform::dft(temp_sig);
+    Waveform::compseq_t sig_freq = Aux::fwd_r2c(m_dft, temp_sig);    
     for (int i = 0; i != m_nbins; i++) {
         content += abs(sig_freq.at(i + 1));
     }
diff --git a/sigproc/src/OmniChannelNoiseDB.cxx b/sigproc/src/OmniChannelNoiseDB.cxx
index 2435d3a4d..c2907e489 100644
--- a/sigproc/src/OmniChannelNoiseDB.cxx
+++ b/sigproc/src/OmniChannelNoiseDB.cxx
@@ -1,4 +1,5 @@
 #include "WireCellSigProc/OmniChannelNoiseDB.h"
+#include "WireCellAux/DftTools.h"
 #include "WireCellUtil/Response.h"
 #include "WireCellUtil/NamedFactory.h"
 
@@ -63,6 +64,7 @@ WireCell::Configuration OmniChannelNoiseDB::default_configuration() const
     /// These must be provided
     cfg["groups"] = Json::arrayValue;
     cfg["channel_info"] = Json::arrayValue;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
 
     return cfg;
 }
@@ -181,7 +183,9 @@ OmniChannelNoiseDB::shared_filter_t OmniChannelNoiseDB::parse_rcrc(Json::Value j
     // auto signal = rcres.generate(WireCell::Binning(m_nsamples, 0, m_nsamples*m_tick));
     auto signal = rcres.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
 
-    Waveform::compseq_t spectrum = Waveform::dft(signal);
+    // Waveform::compseq_t spectrum = Waveform::dft(signal);
+    Waveform::compseq_t spectrum = Aux::fwd_r2c(m_dft, signal);
+
     // get the square of it because there are two RC filters
     Waveform::compseq_t spectrum2 = spectrum;
     // Waveform::scale(spectrum2,spectrum);
@@ -255,8 +259,10 @@ OmniChannelNoiseDB::shared_filter_t OmniChannelNoiseDB::get_reconfig(double from
     auto to_sig = to_ce.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
     auto from_sig = from_ce.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
 
-    auto to_filt = Waveform::dft(to_sig);
-    auto from_filt = Waveform::dft(from_sig);
+    // auto to_filt = Waveform::dft(to_sig);
+    auto to_filt = Aux::fwd_r2c(m_dft, to_sig);
+    // auto from_filt = Waveform::dft(from_sig);
+    auto from_filt = Aux::fwd_r2c(m_dft, from_sig);
 
     // auto from_filt_sum = Waveform::sum(from_filt);
     // auto to_filt_sum   = Waveform::sum(to_filt);
@@ -316,7 +322,8 @@ OmniChannelNoiseDB::shared_filter_t OmniChannelNoiseDB::parse_response(Json::Val
                 waveform[ind] += current[ind];
             }
         }
-        auto spectrum = WireCell::Waveform::dft(waveform);
+        // auto spectrum = WireCell::Waveform::dft(waveform);
+        auto spectrum = Aux::fwd_r2c(m_dft, waveform);
         auto ret = std::make_shared<filter_t>(spectrum);
         m_response_cache[wpid.ident()] = ret;
         return ret;
@@ -338,7 +345,8 @@ OmniChannelNoiseDB::shared_filter_t OmniChannelNoiseDB::parse_response(Json::Val
             waveform[ind] = jwave[ind].asFloat();
         }
 
-        auto spectrum = WireCell::Waveform::dft(waveform);
+        // auto spectrum = WireCell::Waveform::dft(waveform);
+        auto spectrum = Aux::fwd_r2c(m_dft, waveform);
         auto ret = std::make_shared<filter_t>(spectrum);
         m_waveform_cache[id] = ret;
         return ret;
@@ -579,6 +587,9 @@ void OmniChannelNoiseDB::configure(const WireCell::Configuration& cfg)
     std::string fr_tn = get<std::string>(cfg, "field_response", "FieldResponse");
     m_fr = Factory::find_tn<IFieldResponse>(fr_tn);
 
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     // WARNING: this assumes channel numbers count from 0 with no gaps!
     // int nchans = m_anode->channels().size();
     // std::cerr << "noise database with " << nchans << " channels\n";
diff --git a/sigproc/src/OmnibusSigProc.cxx b/sigproc/src/OmnibusSigProc.cxx
index ef1b5f490..6f2fa85ee 100644
--- a/sigproc/src/OmnibusSigProc.cxx
+++ b/sigproc/src/OmnibusSigProc.cxx
@@ -1,10 +1,9 @@
+#include "ROI_formation.h"
+#include "ROI_refinement.h"
+
 #include "WireCellSigProc/OmnibusSigProc.h"
 
-#include "WireCellUtil/NamedFactory.h"
-#include "WireCellUtil/Exceptions.h"
-#include "WireCellUtil/String.h"
-#include "WireCellUtil/FFTBestLength.h"
-#include "WireCellUtil/Waveform.h"
+#include "WireCellAux/DftTools.h"
 
 #include "WireCellIface/SimpleFrame.h"
 #include "WireCellIface/SimpleTrace.h"
@@ -13,8 +12,11 @@
 #include "WireCellIface/IFilterWaveform.h"
 #include "WireCellIface/IChannelResponse.h"
 
-#include "ROI_formation.h"
-#include "ROI_refinement.h"
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/Exceptions.h"
+#include "WireCellUtil/String.h"
+#include "WireCellUtil/FFTBestLength.h"
+#include "WireCellUtil/Waveform.h"
 
 #include "WireCellUtil/NamedFactory.h"
 
@@ -121,6 +123,9 @@ void OmnibusSigProc::configure(const WireCell::Configuration& config)
     m_coarse_time_offset = get(config, "ctoffset", m_coarse_time_offset);
     m_anode_tn = get(config, "anode", m_anode_tn);
 
+    std::string dft_tn = get<std::string>(config, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     // m_nticks = get(config,"nticks",m_nticks);
     if (!config["nticks"].isNull()) {
         log->warn("no setting \"nticks\", ignoring value {}", config["nticks"].asInt());
@@ -262,6 +267,7 @@ WireCell::Configuration OmnibusSigProc::default_configuration() const
 {
     Configuration cfg;
     cfg["anode"] = m_anode_tn;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     cfg["ftoffset"] = m_fine_time_offset;
     cfg["ctoffset"] = m_coarse_time_offset;
     // cfg["nticks"] = m_nticks;
@@ -756,7 +762,8 @@ void OmnibusSigProc::init_overall_response(IFrame::pointer frame)
     // auto ewave = ce.generate(tbins);
     auto ewave = (*m_elecresponse).waveform_samples(tbins);
     Waveform::scale(ewave, m_inter_gain * m_ADC_mV * (-1));
-    elec = Waveform::dft(ewave);
+    // elec = Waveform::dft(ewave);
+    elec = Aux::fwd_r2c(m_dft, ewave);
 
     std::complex<float> fine_period(fravg.period, 0);
 
@@ -782,18 +789,29 @@ void OmnibusSigProc::init_overall_response(IFrame::pointer frame)
     for (int iplane = 0; iplane < 3; ++iplane) {
         auto arr = Response::as_array(fravg.planes[iplane], fine_nwires, fine_nticks);
 
+
+        int nrows = 0;
+        int ncols = 0;
+
         // do FFT for response ...
-        Array::array_xxc c_data = Array::dft_rc(arr, 0);
-        int nrows = c_data.rows();
-        int ncols = c_data.cols();
+        // Array::array_xxc c_data = Array::dft_rc(arr, 0);
+        {
+            Array::array_xxc c_data = arr.cast<IDFT::complex_t>();
+            c_data = Aux::fwd(m_dft, c_data, 1);
 
-        for (int irow = 0; irow < nrows; ++irow) {
-            for (int icol = 0; icol < ncols; ++icol) {
-                c_data(irow, icol) = c_data(irow, icol) * elec.at(icol) * fine_period;
+            nrows = c_data.rows();
+            ncols = c_data.cols();
+
+            for (int irow = 0; irow < nrows; ++irow) {
+                for (int icol = 0; icol < ncols; ++icol) {
+                    c_data(irow, icol) = c_data(irow, icol) * elec.at(icol) * fine_period;
+                }
             }
-        }
 
-        arr = Array::idft_cr(c_data, 0);
+            // arr = Array::idft_cr(c_data, 0);
+            c_data = Aux::inv(m_dft, c_data, 1);
+            arr = c_data.real();
+        }
 
         // figure out how to do fine ... shift (good ...)
         int fine_time_shift = m_fine_time_offset / fravg.period;
@@ -883,7 +901,8 @@ void OmnibusSigProc::decon_2D_init(int plane)
 {
     // data part ...
     // first round of FFT on time
-    m_c_data[plane] = Array::dft_rc(m_r_data[plane], 0);
+    // m_c_data[plane] = Array::dft_rc(m_r_data[plane], 0);
+    m_c_data[plane] = Aux::fwd(m_dft, m_r_data[plane].cast<IDFT::complex_t>(), 1);
 
     // now apply the ch-by-ch response ...
     if (!m_per_chan_resp.empty()) {
@@ -909,13 +928,15 @@ void OmnibusSigProc::decon_2D_init(int plane)
 
         // const auto ewave = ce.generate(tbins);
         auto ewave = (*m_elecresponse).waveform_samples(tbins);
-        const WireCell::Waveform::compseq_t elec = Waveform::dft(ewave);
+        // const WireCell::Waveform::compseq_t elec = Waveform::dft(ewave);
+        const WireCell::Waveform::compseq_t elec = Aux::fwd_r2c(m_dft, ewave);
 
         for (auto och : m_channel_range[plane]) {
             // const auto& ch_resp = cr->channel_response(och.ident);
             Waveform::realseq_t tch_resp = cr->channel_response(och.ident);
             tch_resp.resize(m_fft_nticks, 0);
-            const WireCell::Waveform::compseq_t ch_elec = Waveform::dft(tch_resp);
+            // const WireCell::Waveform::compseq_t ch_elec = Waveform::dft(tch_resp);
+            const WireCell::Waveform::compseq_t ch_elec = Aux::fwd_r2c(m_dft, tch_resp);
 
             const int irow = och.wire + m_pad_nwires[plane];
             for (int icol = 0; icol != m_c_data[plane].cols(); icol++) {
@@ -931,7 +952,8 @@ void OmnibusSigProc::decon_2D_init(int plane)
     }
 
     // second round of FFT on wire
-    m_c_data[plane] = Array::dft_cc(m_c_data[plane], 1);
+    // m_c_data[plane] = Array::dft_cc(m_c_data[plane], 1);
+    m_c_data[plane] = Aux::fwd(m_dft, m_c_data[plane], 0);
 
     // response part ...
     Array::array_xxf r_resp = Array::array_xxf::Zero(m_r_data[plane].rows(), m_fft_nticks);
@@ -942,9 +964,11 @@ void OmnibusSigProc::decon_2D_init(int plane)
     }
 
     // do first round FFT on the resposne on time
-    Array::array_xxc c_resp = Array::dft_rc(r_resp, 0);
+    // Array::array_xxc c_resp = Array::dft_rc(r_resp, 0);
     // do second round FFT on the response on wire
-    c_resp = Array::dft_cc(c_resp, 1);
+    // c_resp = Array::dft_cc(c_resp, 1);
+    Array::array_xxc c_resp = r_resp.cast<IDFT::complex_t>();
+    Aux::fwd(m_dft, c_resp);
 
     // make ratio to the response and apply wire filter
     m_c_data[plane] = m_c_data[plane] / c_resp;
@@ -968,10 +992,10 @@ void OmnibusSigProc::decon_2D_init(int plane)
     }
 
     // do the first round of inverse FFT on wire
-    m_c_data[plane] = Array::idft_cc(m_c_data[plane], 1);
-
+    //m_c_data[plane] = Array::idft_cc(m_c_data[plane], 1);
     // do the second round of inverse FFT on time
-    m_r_data[plane] = Array::idft_cr(m_c_data[plane], 0);
+    //m_r_data[plane] = Array::idft_cr(m_c_data[plane], 0);
+    m_r_data[plane] = Aux::inv(m_dft, m_c_data[plane]).real();
 
     // do the shift in wire
     const int nrows = m_r_data[plane].rows();
@@ -995,7 +1019,9 @@ void OmnibusSigProc::decon_2D_init(int plane)
         m_r_data[plane].block(0, 0, nrows, time_shift) = arr2;
         m_r_data[plane].block(0, time_shift, nrows, ncols - time_shift) = arr1;
     }
-    m_c_data[plane] = Array::dft_rc(m_r_data[plane], 0);
+    // m_c_data[plane] = Array::dft_rc(m_r_data[plane], 0);
+    m_c_data[plane] = Aux::fwd(m_dft, m_r_data[plane].cast<IDFT::complex_t>(), 1);
+
 }
 
 void OmnibusSigProc::decon_2D_ROI_refine(int plane)
@@ -1016,7 +1042,9 @@ void OmnibusSigProc::decon_2D_ROI_refine(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
+
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
     restore_baseline(m_r_data[plane]);
 }
@@ -1057,7 +1085,9 @@ void OmnibusSigProc::decon_2D_tightROI(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
+
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
     restore_baseline(m_r_data[plane]);
 }
@@ -1099,7 +1129,9 @@ void OmnibusSigProc::decon_2D_tighterROI(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
+
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
     restore_baseline(m_r_data[plane]);
 }
@@ -1176,7 +1208,9 @@ void OmnibusSigProc::decon_2D_looseROI(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
+
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
     restore_baseline(m_r_data[plane]);
 }
@@ -1221,7 +1255,9 @@ void OmnibusSigProc::decon_2D_looseROI_debug_mode(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
+
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
     restore_baseline(m_r_data[plane]);
 }
@@ -1282,7 +1318,8 @@ void OmnibusSigProc::decon_2D_hits(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
     if (plane == 2) {
         restore_baseline(m_r_data[plane]);
@@ -1315,7 +1352,8 @@ void OmnibusSigProc::decon_2D_charge(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
+    Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
     if (plane == 2) {
         restore_baseline(m_r_data[plane]);
@@ -1571,5 +1609,5 @@ bool OmnibusSigProc::operator()(const input_pointer& in, output_pointer& out)
 
 // Local Variables:
 // mode: c++
-// c-basic-offset: 2
+// c-basic-offset: 4
 // End:
diff --git a/sigproc/src/Protodune.cxx b/sigproc/src/Protodune.cxx
index 7e69a8e2a..4eece13a8 100644
--- a/sigproc/src/Protodune.cxx
+++ b/sigproc/src/Protodune.cxx
@@ -13,6 +13,8 @@
 #include "WireCellSigProc/Protodune.h"
 #include "WireCellSigProc/Derivations.h"
 
+#include "WireCellAux/DftTools.h"
+
 #include "WireCellUtil/NamedFactory.h"
 
 #include <cmath>
@@ -166,25 +168,6 @@ int LedgeIdentify1(WireCell::Waveform::realseq_t& signal, double baseline, int L
             }
         }
 
-        // // // find the sharp start edge
-        // if(ledge == 1&&StartOfLastLedgeCandidate>30){
-        // //   int edge = 0;
-        // //   int i = StartOfLastLedgeCandidate/UNIT-1;
-        // //   if(averaged.at(i)>averaged.at(i-1)&&averaged.at(i-1)>averaged.at(i-2)){ // find a edge
-        // //           edge = 1;
-        // //   }
-        // // if(edge == 0) ledge = 0; // if no edge, this is not ledge
-        // // if((averaged.at(i)-averaged.at(i-2)<10*UNIT)&&(averaged.at(i)-averaged.at(i-3)<10*UNIT)) // slope cut
-        // //         ledge = 0;
-        // // if(averaged.at(StartOfLastLedgeCandidate/UNIT)-baseline*UNIT>150*UNIT) ledge = 0; // ledge is close to the
-        // baseline
-
-        // // if(signal.at(tempLedgeEnd) - baseline > 100) ledge=0; // [wgu] ledge end is close to the baseline
-        //     if(averaged.at(tempLedgeEnd/UNIT)-baseline*UNIT>5.*UNIT) ledge = 0;
-        // // cout << "averaged.at(StartOfLastLedgeCandidate/UNIT) - baseline*UNIT = " <<
-        // averaged.at(StartOfLastLedgeCandidate/UNIT)-baseline*UNIT << std::endl;
-        // }
-
         if (ledge == 1) {  // ledge is close to the baseline
             if (averaged.at(tempLedgeEnd / UNIT) - baseline * UNIT > 5. * UNIT) ledge = 0;
 
@@ -273,14 +256,6 @@ bool LedgeIdentify(WireCell::Waveform::realseq_t& signal /*TH1F* h2*/, double ba
     }
     // find the sharp start edge
     if (ledge && LedgeStart > 30) {
-        // int edge = 0;
-        // int i = LedgeStart/UNIT-1;
-        // if(averaged.at(i)>averaged.at(i-1)&&averaged.at(i-1)>averaged.at(i-2)){ // find a edge
-        //         edge = 1;
-        // }
-        // if(edge == 0) ledge = false; // if no edge, this is not ledge
-        // if((averaged.at(i)-averaged.at(i-2)<10*UNIT)&&(averaged.at(i)-averaged.at(i-3)<10*UNIT)) // slope cut
-        //         ledge = false;
         if (averaged.at(LedgeStart / UNIT) - baseline * UNIT > 150 * UNIT)
             ledge = false;  // ledge is close to the baseline
     }
@@ -288,9 +263,6 @@ bool LedgeIdentify(WireCell::Waveform::realseq_t& signal /*TH1F* h2*/, double ba
     if (ledge && LedgeStart > 20) {
         double height = 0;
         if (LedgeStart < 5750) {  // calculate the height of edge
-            // double tempHeight = h2 ->GetBinContent(LedgeStart+1+200) +  h2 ->GetBinContent(LedgeStart+1+220) +  h2
-            // ->GetBinContent(LedgeStart+1+180) +  h2 ->GetBinContent(LedgeStart+1+240); height = h2
-            // ->GetBinContent(LedgeStart+1) - tempHeight/4;
             double tempHeight = signal.at(LedgeStart + 200) + signal.at(LedgeStart + 220) +
                                 signal.at(LedgeStart + 180) + signal.at(LedgeStart + 240);
             height = signal.at(LedgeStart) - tempHeight / 4;
@@ -302,11 +274,6 @@ bool LedgeIdentify(WireCell::Waveform::realseq_t& signal /*TH1F* h2*/, double ba
         if (height < 0) height = 80;             // norminal value
         if (height > 30 && LedgeStart < 5900) {  // test the decay with a relatively large height
             double height50 = 0, height100 = 0;
-            // height50 =  h2 ->GetBinContent(LedgeStart+51);
-            // height100 =  h2 ->GetBinContent(LedgeStart+101);
-            // double height50Pre =   h2 ->GetBinContent(LedgeStart+1)- height*(1-exp(-50/100.)); // minimum 100 ticks
-            // decay time double height100Pre =   h2 ->GetBinContent(LedgeStart+1) - height*(1-exp(-100./100)); //
-            // minimum 100 ticks decay time
 
             height50 = signal.at(LedgeStart + 50);
             height100 = signal.at(LedgeStart + 100);
@@ -350,44 +317,9 @@ bool LedgeIdentify(WireCell::Waveform::realseq_t& signal /*TH1F* h2*/, double ba
         }
         if (LedgeEnd == 0) LedgeEnd = 6000;
     }
-    // done, release the memory
-    // vector<int>(averaged).swap(averaged); // is it necessary?
     return ledge;
 }
 
-// adapted from WCP
-// int judgePlateau(int channel, TH1F* h2,double baseline, double & PlateauStart, double & PlateauStartEnd){
-//         int continueN = 0;
-//         int threshold = 200;
-//         int maximumF  = 50;
-//         int maxBin = h2->GetMaximumBin();
-//         for(int i=maxBin+10;i<5880&&i<maxBin+500;i++){
-//                 int plateau = 1;
-//                 int max = 0, min = 10000;
-//                 for(int j=i;j<i+20;j++){
-//                         int binC = h2->GetBinContent(j+1);
-//                         if(binC<baseline+threshold||binC>h2->GetMaximum()-500) {
-//                                 plateau = 0;
-//                                 break;
-//                         }
-//                         if(binC>max) max = binC;
-//                         if(binC<min) min = binC;
-//                 }
-//                 if(plateau==1&&max-min<maximumF){ // plateau found
-//                         PlateauStart = i;
-//                         PlateauStartEnd = i+20;
-//                         for(int k = i+20; k<6000;k++){
-//                                 if( h2->GetBinContent(k+1)<baseline+threshold){
-//                                         PlateauStartEnd = k-1;
-//                                         break;
-//                                 }
-//                         }
-//                         return 1;
-//                 }
-//         }
-//         return 0;
-// }
-
 bool Protodune::LinearInterpSticky(WireCell::Waveform::realseq_t& signal, WireCell::Waveform::BinRangeList& rng_list,
                                    float stky_sig_like_val, float stky_sig_like_rms)
 {
@@ -459,7 +391,8 @@ bool Protodune::LinearInterpSticky(WireCell::Waveform::realseq_t& signal, WireCe
     return true;
 }
 
-bool Protodune::FftInterpSticky(WireCell::Waveform::realseq_t& signal, WireCell::Waveform::BinRangeList& rng_list)
+bool Protodune::FftInterpSticky(const IDFT::pointer& dft,
+                                WireCell::Waveform::realseq_t& signal, WireCell::Waveform::BinRangeList& rng_list)
 {
     ;
     const int nsiglen = signal.size();
@@ -476,7 +409,8 @@ bool Protodune::FftInterpSticky(WireCell::Waveform::realseq_t& signal, WireCell:
     }
 
     // dft resampling for "even", see example in test_zero_padding.cxx
-    auto tran_even = WireCell::Waveform::dft(signal_even);
+    // auto tran_even = WireCell::Waveform::dft(signal_even);
+    auto tran_even = Aux::fwd_r2c(dft, signal_even);
     tran_even.resize(nsublen * 2);
     if (nsublen % 2 == 0) {
         std::rotate(tran_even.begin() + nsublen / 2, tran_even.begin() + nsublen, tran_even.end());
@@ -485,12 +419,14 @@ bool Protodune::FftInterpSticky(WireCell::Waveform::realseq_t& signal, WireCell:
         std::rotate(tran_even.begin() + (nsublen + 1) / 2, tran_even.begin() + nsublen, tran_even.end());
     }
     // inverse FFT
-    auto signal_even_fc = WireCell::Waveform::idft(tran_even);
+    // auto signal_even_fc = WireCell::Waveform::idft(tran_even);
+    auto signal_even_fc = Aux::inv_c2r(dft, tran_even);
     float scale = tran_even.size() / nsublen;
     WireCell::Waveform::scale(signal_even_fc, scale);
 
     // similar for "odd"
-    auto tran_odd = WireCell::Waveform::dft(signal_odd);
+    // auto tran_odd = WireCell::Waveform::dft(signal_odd);
+    auto tran_odd = Aux::fwd_r2c(dft, signal_odd);
     tran_odd.resize(nsublen2 * 2);
     if (nsublen2 % 2 == 0) {
         std::rotate(tran_odd.begin() + nsublen2 / 2, tran_odd.begin() + nsublen2, tran_odd.end());
@@ -498,7 +434,8 @@ bool Protodune::FftInterpSticky(WireCell::Waveform::realseq_t& signal, WireCell:
     else {
         std::rotate(tran_odd.begin() + (nsublen2 + 1) / 2, tran_odd.begin() + nsublen2, tran_odd.end());
     }
-    auto signal_odd_fc = WireCell::Waveform::idft(tran_odd);
+    // auto signal_odd_fc = WireCell::Waveform::idft(tran_odd);
+    auto signal_odd_fc = Aux::inv_c2r(dft, tran_odd);
     float scale2 = tran_odd.size() / nsublen2;
     WireCell::Waveform::scale(signal_odd_fc, scale2);
 
@@ -521,7 +458,8 @@ bool Protodune::FftInterpSticky(WireCell::Waveform::realseq_t& signal, WireCell:
     return true;
 }
 
-bool Protodune::FftShiftSticky(WireCell::Waveform::realseq_t& signal, double toffset,
+bool Protodune::FftShiftSticky(const IDFT::pointer& dft,
+                               WireCell::Waveform::realseq_t& signal, double toffset,
                                std::vector<std::pair<int, int> >& st_ranges)
 {
     const int nsiglen = signal.size();
@@ -538,7 +476,8 @@ bool Protodune::FftShiftSticky(WireCell::Waveform::realseq_t& signal, double tof
     }
 
     // dft shift for "even"
-    auto tran_even = WireCell::Waveform::dft(signal_even);
+    // auto tran_even = WireCell::Waveform::dft(signal_even);
+    auto tran_even = Aux::fwd_r2c(dft, signal_even);
     double f0 = 1. / nsublen;
     const double PI = std::atan(1.0) * 4;
     for (size_t i = 0; i < tran_even.size(); i++) {
@@ -550,12 +489,12 @@ bool Protodune::FftShiftSticky(WireCell::Waveform::realseq_t& signal, double tof
         tran_even.at(i) = z * std::exp(z1);
     }
     // inverse FFT
-    auto signal_even_fc = WireCell::Waveform::idft(tran_even);
-    // float scale = 1./tran_even.size();
-    // WireCell::Waveform::scale(signal_even_fc, 1./nsublen);
+    // auto signal_even_fc = WireCell::Waveform::idft(tran_even);
+    auto signal_even_fc = Aux::inv_c2r(dft, tran_even);
 
     // similar to "odd"
-    auto tran_odd = WireCell::Waveform::dft(signal_odd);
+    // auto tran_odd = WireCell::Waveform::dft(signal_odd);
+    auto tran_odd = Aux::fwd_r2c(dft, signal_odd);
     f0 = 1. / nsublen2;
     for (size_t i = 0; i < tran_odd.size(); i++) {
         double fi = i * f0;
@@ -566,7 +505,9 @@ bool Protodune::FftShiftSticky(WireCell::Waveform::realseq_t& signal, double tof
         tran_odd.at(i) = z * std::exp(z1);
     }
     //
-    auto signal_odd_fc = WireCell::Waveform::idft(tran_odd);
+    // auto signal_odd_fc = WireCell::Waveform::idft(tran_odd);
+    auto signal_odd_fc = Aux::inv_c2r(dft, tran_odd);
+    
     // float scale = 1./tran_odd.size();
     // WireCell::Waveform::scale(signal_odd_fc, 1./nsublen2);
 
@@ -593,10 +534,12 @@ bool Protodune::FftShiftSticky(WireCell::Waveform::realseq_t& signal, double tof
     return true;
 }
 
-bool Protodune::FftScaling(WireCell::Waveform::realseq_t& signal, int nsamples)
+bool Protodune::FftScaling(const IDFT::pointer& dft,
+                           WireCell::Waveform::realseq_t& signal, int nsamples)
 {
     const int nsiglen = signal.size();
-    auto tran = WireCell::Waveform::dft(signal);
+    // auto tran = WireCell::Waveform::dft(signal);
+    auto tran = Aux::fwd_r2c(dft, signal);
     tran.resize(nsamples);
     if (nsiglen % 2 == 0) {  // ref test_zero_padding.cxx
         std::rotate(tran.begin() + nsiglen / 2, tran.begin() + nsiglen, tran.end());
@@ -605,7 +548,9 @@ bool Protodune::FftScaling(WireCell::Waveform::realseq_t& signal, int nsamples)
         std::rotate(tran.begin() + (nsiglen + 1) / 2, tran.begin() + nsiglen, tran.end());
     }
     // inverse FFT
-    auto signal_fc = WireCell::Waveform::idft(tran);
+    // auto signal_fc = WireCell::Waveform::idft(tran);
+    auto signal_fc = Aux::inv_c2r(dft, tran);
+
     WireCell::Waveform::scale(signal_fc, nsamples / nsiglen);
     signal = signal_fc;
 
@@ -631,6 +576,10 @@ void Protodune::ConfigFilterBase::configure(const WireCell::Configuration& cfg)
     m_anode = Factory::find_tn<IAnodePlane>(m_anode_tn);
     m_noisedb_tn = get(cfg, "noisedb", m_noisedb_tn);
     m_noisedb = Factory::find_tn<IChannelNoiseDatabase>(m_noisedb_tn);
+
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     // std::cerr << "ConfigFilterBase: \n" << cfg << "\n";
 }
 WireCell::Configuration Protodune::ConfigFilterBase::default_configuration() const
@@ -638,6 +587,7 @@ WireCell::Configuration Protodune::ConfigFilterBase::default_configuration() con
     Configuration cfg;
     cfg["anode"] = m_anode_tn;
     cfg["noisedb"] = m_noisedb_tn;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     return cfg;
 }
 
@@ -664,6 +614,9 @@ void Protodune::StickyCodeMitig::configure(const WireCell::Configuration& cfg)
     m_noisedb_tn = get(cfg, "noisedb", m_noisedb_tn);
     m_noisedb = Factory::find_tn<IChannelNoiseDatabase>(m_noisedb_tn);
 
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     m_extra_stky.clear();
     auto jext = cfg["extra_stky"];
     if (!jext.isNull()) {
@@ -701,6 +654,7 @@ WireCell::Configuration Protodune::StickyCodeMitig::default_configuration() cons
     cfg["stky_sig_like_val"] = m_stky_sig_like_val;
     cfg["stky_sig_like_rms"] = m_stky_sig_like_rms;
     cfg["stky_max_len"] = m_stky_max_len;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     return cfg;
 }
 
@@ -745,11 +699,8 @@ WireCell::Waveform::ChannelMaskMap Protodune::StickyCodeMitig::apply(int ch, sig
     }
     // std::cerr << "[wgu] ch: " << ch << " long_stkylen: " << long_stkylen << std::endl;
 
-    // auto signal_lc = signal; // copy, need to keep original signal
     LinearInterpSticky(signal, sticky_rng_list, m_stky_sig_like_val, m_stky_sig_like_rms);
-    FftInterpSticky(signal, sticky_rng_list);
-    // FftShiftSticky(signal_lc, 0.5, st_ranges); // alternative approach, shift by 0.5 tick
-    // signal = signal_lc;
+    FftInterpSticky(m_dft, signal, sticky_rng_list);
 
     // Now calculate the baseline ...
     std::pair<double, double> temp = WireCell::Waveform::mean_rms(signal);
@@ -846,19 +797,13 @@ WireCell::Waveform::ChannelMaskMap Protodune::OneChannelNoise::apply(int ch, sig
         int smpin = m_resmp.at(ch);
         int smpout = signal.size();
         signal.resize(smpin);
-        FftScaling(signal, smpout);
+        FftScaling(m_dft, signal, smpout);
         // std::cerr << "[wgu] ch: " << ch << " smpin: " << smpin << " smpout: " << smpout << std::endl;
     }
-    // if( (ch>=2128 && ch<=2175) // W plane
-    // ||  (ch>=1520 && ch<=1559) // V plane
-    // ||  (ch>=440  && ch<=479)  // U plane
-    // ){
-    // 	signal.resize(5996);
-    // 	FftScaling(signal, 6000);
-    // }
 
     // correct rc undershoot
-    auto spectrum = WireCell::Waveform::dft(signal);
+    // auto spectrum = WireCell::Waveform::dft(signal);
+    auto spectrum = Aux::fwd_r2c(m_dft, signal);
     bool is_partial = m_check_partial(spectrum);  // Xin's "IS_RC()"
 
     if (!is_partial) {
@@ -876,12 +821,6 @@ WireCell::Waveform::ChannelMaskMap Protodune::OneChannelNoise::apply(int ch, sig
         Microboone::RawAdapativeBaselineAlg(mag);  // subtract "linear" background in spectrum
 
         auto const& spec = m_noisedb->noise(ch);
-        // std::cout << "[wgu] " << spec.at(10).real() << std::endl;
-        // std::cout << "[wgu] " << spec.at(148).real() << std::endl;
-        // std::cout << "[wgu] " << spec.at(149).real() << std::endl;
-        // std::cout << "[wgu] " << spec.at(160).real() << std::endl;
-        // std::cout << "[wgu] " << spec.at(161).real() << std::endl;
-        // WireCell::Waveform::scale(spectrum, spec);
 
         // spec -> freqBins;
         std::vector<std::pair<int, int> > freqBins;
@@ -916,12 +855,6 @@ WireCell::Waveform::ChannelMaskMap Protodune::OneChannelNoise::apply(int ch, sig
                 int nslice = iend - istart;
                 // std::cout << "hibin: " << iend << " lobin: " << istart << std::endl;
 
-                // }
-
-                // for(int i=0; i<57; i++){ // 150 - 3000th freq bin
-                //     int nslice = 50;
-                //     int istart = 150 + nslice*i;
-                //     int iend = istart + nslice;
                 // std::cerr << istart << " " << iend << std::endl;
                 WireCell::Waveform::realseq_t mag_slice(nslice);  // slice of magnitude spectrum
                 std::copy(mag.begin() + istart, mag.begin() + iend, mag_slice.begin());
@@ -931,9 +864,7 @@ WireCell::Waveform::ChannelMaskMap Protodune::OneChannelNoise::apply(int ch, sig
                 if (istart > 1050) {  // if(i>17){
                     cut = stat.first + 3 * stat.second;
                 }
-                // if(stat.second>1300){
-                //     cut = stat.first + stat.second;
-                // }
+
                 for (int j = istart; j < iend; j++) {
                     float content = mag.at(j);
                     if (content > cut) {
@@ -946,28 +877,6 @@ WireCell::Waveform::ChannelMaskMap Protodune::OneChannelNoise::apply(int ch, sig
                         n_harmonic++;
                     }
                 }
-
-                // for(int j=0; j<nslice; j++){
-                //     float content = mag_slice.at(j) - stat.first;
-
-                //     if(iend<1000){
-                //         if(content>2000 && content>5.*stat.second){
-                //         int tbin = istart + j;
-                //         spectrum.at(tbin).real(0);
-                //         spectrum.at(tbin).imag(0);
-                //         spectrum.at(6000+1-tbin).real(0); // FIXME: assuming 6000 ticks
-                //         spectrum.at(6000+1-tbin).imag(0);
-                //         // std::cerr << "[wgu] chan: " << ch << " , freq tick: " << tbin << " , amp: " << content <<
-                //         std::endl;
-                //         }
-                //     }
-                //     else if(content>250 && content>10.*stat.second){
-                //         spectrum.at(j).real(0);
-                //         spectrum.at(j).imag(0);
-                //         spectrum.at(6000+1-j).real(0); // FIXME: assuming 6000 ticks
-                //         spectrum.at(6000+1-j).imag(0);
-                //     }
-                // }
             }
         }
 
@@ -981,7 +890,8 @@ WireCell::Waveform::ChannelMaskMap Protodune::OneChannelNoise::apply(int ch, sig
 
     // remove the DC component
     spectrum.front() = 0;
-    signal = WireCell::Waveform::idft(spectrum);
+    // signal = WireCell::Waveform::idft(spectrum);
+    signal = Aux::inv_c2r(m_dft, spectrum);
 
     // Now calculate the baseline ...
     std::pair<double, double> temp = WireCell::Waveform::mean_rms(signal);
diff --git a/sigproc/src/SimpleChannelNoiseDB.cxx b/sigproc/src/SimpleChannelNoiseDB.cxx
index 97c4240db..8aaf68975 100644
--- a/sigproc/src/SimpleChannelNoiseDB.cxx
+++ b/sigproc/src/SimpleChannelNoiseDB.cxx
@@ -1,4 +1,5 @@
 #include "WireCellSigProc/SimpleChannelNoiseDB.h"
+#include "WireCellAux/DftTools.h"
 #include "WireCellUtil/Response.h"
 #include "WireCellUtil/Binning.h"
 
@@ -31,6 +32,20 @@ SimpleChannelNoiseDB::SimpleChannelNoiseDB(double tick, int nsamples)
 }
 SimpleChannelNoiseDB::~SimpleChannelNoiseDB() {}
 
+void SimpleChannelNoiseDB::configure(const WireCell::Configuration& cfg)
+{
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+}
+
+WireCell::Configuration SimpleChannelNoiseDB::default_configuration() const
+{
+    Configuration cfg;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
+    return cfg;
+}
+
+
 double SimpleChannelNoiseDB::nominal_baseline(int channel) const
 {
     const int ind = chind(channel);
@@ -240,7 +255,8 @@ void SimpleChannelNoiseDB::set_rcrc_constant(const std::vector<int>& channels, d
     //    auto signal = rcres.generate(WireCell::Binning(m_nsamples, 0, m_nsamples*m_tick));
     auto signal = rcres.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
 
-    Waveform::compseq_t spectrum = Waveform::dft(signal);
+    // Waveform::compseq_t spectrum = Waveform::dft(signal);
+    Waveform::compseq_t spectrum = Aux::fwd_r2c(m_dft, signal);
 
     // std::cout << rcrc << " " << m_tick << " " << m_nsamples << " " << signal.front() << " " << signal.at(1) << " " <<
     // signal.at(2) << std::endl;
@@ -295,8 +311,11 @@ void SimpleChannelNoiseDB::set_gains_shapings(const std::vector<int>& channels,
     auto to_sig = to_ce.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
     auto from_sig = from_ce.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
 
-    auto to_filt = Waveform::dft(to_sig);
-    auto from_filt = Waveform::dft(from_sig);
+    // auto to_filt = Waveform::dft(to_sig);
+    auto to_filt = Aux::fwd_r2c(m_dft, to_sig);
+
+    // auto from_filt = Waveform::dft(from_sig);
+    auto from_filt = Aux::fwd_r2c(m_dft, from_sig);
 
     // auto from_filt_sum = Waveform::sum(from_filt);
     // auto to_filt_sum   = Waveform::sum(to_filt);
diff --git a/sigproc/test/test_partial.cxx b/sigproc/test/test_partial.cxx
index 3756d297b..3fc539077 100644
--- a/sigproc/test/test_partial.cxx
+++ b/sigproc/test/test_partial.cxx
@@ -1,5 +1,9 @@
 #include "WireCellSigProc/Diagnostics.h"
-#include "WireCellUtil/Waveform.h"
+
+#include "WireCellAux/DftTools.h"
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/PluginManager.h"
+
 #include "WireCellUtil/Testing.h"
 
 #include <iostream>
@@ -16,7 +20,11 @@ using namespace WireCell::SigProc;
 
 int main(int argc, char* argv[])
 {
-    auto spectrum = Waveform::dft(horig);
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
+
+    auto spectrum = Aux::fwd_r2c(idft, horig);
     Diagnostics::Partial m_check_partial;
     bool is_partial = m_check_partial(spectrum);
     Assert(is_partial);
diff --git a/sigproc/test/test_simple_channel_noisedb.cxx b/sigproc/test/test_simple_channel_noisedb.cxx
index 59c9a9880..c03c5b852 100644
--- a/sigproc/test/test_simple_channel_noisedb.cxx
+++ b/sigproc/test/test_simple_channel_noisedb.cxx
@@ -1,6 +1,9 @@
 #include "WireCellUtil/Testing.h"
 
 #include "WireCellSigProc/SimpleChannelNoiseDB.h"
+
+#include "WireCellUtil/PluginManager.h"
+#include "WireCellUtil/NamedFactory.h"
 #include "WireCellUtil/Units.h"
 
 #include <iostream>
@@ -11,10 +14,15 @@ using namespace WireCell::SigProc;
 
 int main()
 {
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+    Factory::lookup_tn<IDFT>("FftwDFT");
+
     const int nsamples = 5432;
     const double tick = 1.0 * units::ms;
 
     SimpleChannelNoiseDB cndb(tick, nsamples);
+    cndb.configure(cndb.default_configuration());
 
     Assert(cndb.sample_time() == tick);
     Assert(cndb.nominal_baseline(0) == 0.0);
diff --git a/sigproc/test/test_zero_padding.cxx b/sigproc/test/test_zero_padding.cxx
index c8d82d775..2182cbc27 100644
--- a/sigproc/test/test_zero_padding.cxx
+++ b/sigproc/test/test_zero_padding.cxx
@@ -1,6 +1,10 @@
 // Example for FFT resampling with zero-padding tricks
 #include "WireCellUtil/Waveform.h"
 
+#include "WireCellAux/DftTools.h"
+#include "WireCellUtil/NamedFactory.h"
+#include "WireCellUtil/PluginManager.h"
+
 #include <algorithm>
 
 // for FFT
@@ -14,10 +18,14 @@ using namespace WireCell;
 
 int main()
 {
+    PluginManager& pm = PluginManager::instance();
+    pm.add("WireCellAux");
+    auto idft = Factory::lookup_tn<IDFT>("FftwDFT");
+
     std::vector<float> a = {1, 2, 3, 2, 1};
     // can be sampled to 10 ticks: 1 , 1.35279 , 2 , 2.69443 , 3 , 2.69443 , 2 , 1.35279 , 1 , 0.905573
 
-    auto tran = WireCell::Waveform::dft(a);
+    auto tran = Aux::fwd_r2c(idft, a);
 
     std::cout << " tran = " << std::endl;
     std::cout << tran.size() << std::endl;
@@ -48,7 +56,7 @@ int main()
     std::cout << std::endl;
 
     // inverse FFT
-    auto b = WireCell::Waveform::idft(tran);
+    auto b = Aux::inv_c2r(idft, tran);
     float scale = tran.size() / inSmps;
     //
     std::cout << " b = " << std::endl;
diff --git a/util/inc/WireCellUtil/Array.h b/util/inc/WireCellUtil/Array.h
index 2b30a272e..2a01dd368 100644
--- a/util/inc/WireCellUtil/Array.h
+++ b/util/inc/WireCellUtil/Array.h
@@ -68,8 +68,8 @@ namespace WireCell {
 
             const_shared_array_xxf arr2 = idft(*spec);
          */
-        array_xxc dft(const array_xxf& arr);
-        array_xxf idft(const array_xxc& arr);
+        // array_xxc dft(const array_xxf& arr);
+        // array_xxf idft(const array_xxc& arr);
 
         /** Partial, 1D DFT and inverse DFT along one dimension of an
          * array.  Each row is transformed if dim=0, each column if
@@ -102,10 +102,10 @@ namespace WireCell {
          *     auto tmp = idft_cc(xxc, 1);
          *     auto xxf = idft_rc(tmp, 0);
          */
-        array_xxc dft_rc(const array_xxf& arr, int dim = 0);
-        array_xxc dft_cc(const array_xxc& arr, int dim = 1);
-        array_xxc idft_cc(const array_xxc& arr, int dim = 1);
-        array_xxf idft_cr(const array_xxc& arr, int dim = 0);
+        // array_xxc dft_rc(const array_xxf& arr, int dim = 0);
+        // array_xxc dft_cc(const array_xxc& arr, int dim = 1);
+        // array_xxc idft_cc(const array_xxc& arr, int dim = 1);
+        // array_xxf idft_cr(const array_xxc& arr, int dim = 0);
 
         /** Perform 2D deconvolution.
 
@@ -115,7 +115,7 @@ namespace WireCell {
             perform an 2D inverse DFT.
 
          */
-        array_xxf deconv(const array_xxf& arr, const array_xxc& filter);
+        // array_xxf deconv(const array_xxf& arr, const array_xxc& filter);
 
         /** downsample a 2D array along one axis by k
          *  simple average of all numbers in a bin
diff --git a/util/inc/WireCellUtil/Waveform.h b/util/inc/WireCellUtil/Waveform.h
index f2ed89cc0..96fe3ad9c 100644
--- a/util/inc/WireCellUtil/Waveform.h
+++ b/util/inc/WireCellUtil/Waveform.h
@@ -11,8 +11,8 @@
 
 // FIXME: remove the hard-wired Eigen::FFT related in favor of dynamic
 // DFT with Aux/DftTools.h.
-#include <Eigen/Core>
-#include <unsupported/Eigen/FFT>
+// #include <Eigen/Core>
+// #include <unsupported/Eigen/FFT>
 
 namespace WireCell {
 
@@ -193,49 +193,49 @@ namespace WireCell {
 
         /// Discrete Fourier transform of real sequence.  Returns full
         /// spectrum.  No normalization scaling applied
-        compseq_t dft(realseq_t seq);
+        // compseq_t dft(realseq_t seq);
 
         // Linear convolution, returns in1.size()+in2.size()-1.  If
         // truncate is false then the returned sequence will be
         // truncated to length that of the first input.  Otherwise the
         // function is symmetric between the two inputs.
-        realseq_t linear_convolve(Waveform::realseq_t in1, Waveform::realseq_t in2, bool truncate = true);
+        // realseq_t linear_convolve(Waveform::realseq_t in1, Waveform::realseq_t in2, bool truncate = true);
 
         // Replace old response in wave with new response.  If
         // truncate is false then the returned sequence will be the
         // length required for linear convolution.  This is the sum of
         // the sizes of all input less one and less the smallest.
-        realseq_t replace_convolve(Waveform::realseq_t wave, Waveform::realseq_t newres, Waveform::realseq_t oldres,
-                                   bool truncate = true);
+        // realseq_t replace_convolve(Waveform::realseq_t wave, Waveform::realseq_t newres, Waveform::realseq_t oldres,
+        //                            bool truncate = true);
 
         /// Inverse, discrete Fourier transform.  Expects full
         /// spectrum (twice Nyquist frequency).  Applies the
         /// 1/Nsamples normalization.
-        realseq_t idft(compseq_t spec);
+        // realseq_t idft(compseq_t spec);
 
         /// Return the smallest, most frequent value to appear in vector.
         short most_frequent(const std::vector<short>& vals);
 
-        class FFT {
-           public:
-            FFT() {}
-            inline compseq_t dft(realseq_t wave)
-            {
-                auto v = Eigen::Map<Eigen::VectorXf>(wave.data(), wave.size());
-                Eigen::VectorXcf ret = trans.fwd(v);
-                return compseq_t(ret.data(), ret.data() + ret.size());
-            }
-            inline realseq_t idft(compseq_t spec)
-            {
-                auto v = Eigen::Map<Eigen::VectorXcf>(spec.data(), spec.size());
-                Eigen::VectorXf ret;
-                trans.inv(ret, v);
-                return realseq_t(ret.data(), ret.data() + ret.size());
-            }
-
-           private:
-            Eigen::FFT<Waveform::real_t> trans;
-        };
+        // class FFT {
+        //    public:
+        //     FFT() {}
+        //     inline compseq_t dft(realseq_t wave)
+        //     {
+        //         auto v = Eigen::Map<Eigen::VectorXf>(wave.data(), wave.size());
+        //         Eigen::VectorXcf ret = trans.fwd(v);
+        //         return compseq_t(ret.data(), ret.data() + ret.size());
+        //     }
+        //     inline realseq_t idft(compseq_t spec)
+        //     {
+        //         auto v = Eigen::Map<Eigen::VectorXcf>(spec.data(), spec.size());
+        //         Eigen::VectorXf ret;
+        //         trans.inv(ret, v);
+        //         return realseq_t(ret.data(), ret.data() + ret.size());
+        //     }
+
+        //    private:
+        //     Eigen::FFT<Waveform::real_t> trans;
+        // };
 
     }  // namespace Waveform
 }  // namespace WireCell
diff --git a/util/src/Array.cxx b/util/src/Array.cxx
index e9609ca5b..c36560c72 100644
--- a/util/src/Array.cxx
+++ b/util/src/Array.cxx
@@ -1,7 +1,7 @@
 #include "WireCellUtil/Array.h"
 #include "WireCellUtil/Exceptions.h"
 
-#include <unsupported/Eigen/FFT>
+// #include <unsupported/Eigen/FFT>
 
 #include <algorithm>
 #include <complex>
@@ -12,210 +12,210 @@ using namespace WireCell::Array;
 // Need to use different planner for different input/output
 // https://eigen.tuxfamily.org/dox/unsupported/ei__fftw__impl_8h_source.html
 
-thread_local static Eigen::FFT<float> gEigenFFT_dft_1d;      // c2c fwd and inv
-thread_local static Eigen::FFT<float> gEigenFFT_dft_r2c_1d;  // r2c fwd
-thread_local static Eigen::FFT<float> gEigenFFT_dft_c2r_1d;  // c2r inv
+// thread_local static Eigen::FFT<float> gEigenFFT_dft_1d;      // c2c fwd and inv
+// thread_local static Eigen::FFT<float> gEigenFFT_dft_r2c_1d;  // r2c fwd
+// thread_local static Eigen::FFT<float> gEigenFFT_dft_c2r_1d;  // c2r inv
 
 // http://stackoverflow.com/a/33636445
 
-WireCell::Array::array_xxc WireCell::Array::dft(const WireCell::Array::array_xxf& arr)
-{
-    const int nrows = arr.rows();
-    const int ncols = arr.cols();
-
-    Eigen::MatrixXcf matc(nrows, ncols);
-
-    for (int irow = 0; irow < nrows; ++irow) {
-        Eigen::VectorXcf fspec(ncols);  // frequency spectrum
-        // gEigenFFT wants vectors, also input arr is const
-        Eigen::VectorXf tmp = arr.row(irow);
-        gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
-        matc.row(irow) = fspec;
-    }
-
-    for (int icol = 0; icol < ncols; ++icol) {
-        Eigen::VectorXcf pspec(nrows);                // periodicity spectrum
-        gEigenFFT_dft_1d.fwd(pspec, matc.col(icol));  // c2c
-        matc.col(icol) = pspec;
-    }
-
-    return matc;
-}
-
-WireCell::Array::array_xxc WireCell::Array::dft_rc(const WireCell::Array::array_xxf& arr, int dim)
-{
-    const int nrows = arr.rows();
-    const int ncols = arr.cols();
-
-    Eigen::MatrixXcf matc(nrows, ncols);
-
-    if (dim == 0) {
-        for (int irow = 0; irow < nrows; ++irow) {
-            Eigen::VectorXcf fspec(ncols);
-            Eigen::VectorXf tmp = arr.row(irow);
-            gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
-            matc.row(irow) = fspec;
-        }
-    }
-    else if (dim == 1) {
-        for (int icol = 0; icol < ncols; ++icol) {
-            Eigen::VectorXcf fspec(nrows);
-            Eigen::VectorXf tmp = arr.col(icol);
-            gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
-            matc.col(icol) = fspec;
-        }
-    }
-    return matc;
-}
-
-WireCell::Array::array_xxc WireCell::Array::dft_cc(const WireCell::Array::array_xxc& arr, int dim)
-{
-    const int nrows = arr.rows();
-    const int ncols = arr.cols();
-
-    Eigen::MatrixXcf matc(nrows, ncols);
-
-    matc = arr.matrix();
-
-    if (dim == 0) {
-        for (int irow = 0; irow < nrows; ++irow) {
-            Eigen::VectorXcf pspec(ncols);
-            gEigenFFT_dft_1d.fwd(pspec, matc.row(irow));  // c2c
-            matc.row(irow) = pspec;
-        }
-    }
-    else {
-        for (int icol = 0; icol < ncols; ++icol) {
-            Eigen::VectorXcf pspec(nrows);
-            gEigenFFT_dft_1d.fwd(pspec, matc.col(icol));  // c2c
-            matc.col(icol) = pspec;
-        }
-    }
-    return matc;
-}
-
-WireCell::Array::array_xxf WireCell::Array::idft(const WireCell::Array::array_xxc& arr)
-{
-    const int nrows = arr.rows();
-    const int ncols = arr.cols();
-
-    // gEigenFFT works on matrices, not arrays, also don't step on const input
-    Eigen::MatrixXcf partial(nrows, ncols);
-    partial = arr.matrix();
-
-    for (int icol = 0; icol < ncols; ++icol) {
-        Eigen::VectorXcf pspec(nrows);                   // wire spectrum
-        gEigenFFT_dft_1d.inv(pspec, partial.col(icol));  // c2c
-        partial.col(icol) = pspec;
-    }
-
-    // shared_array_xxf ret = std::make_shared<array_xxf> (nrows, ncols);
-    array_xxf ret(nrows, ncols);
-
-    for (int irow = 0; irow < nrows; ++irow) {
-        Eigen::VectorXf wave(ncols);                        // back to real-valued time series
-        gEigenFFT_dft_c2r_1d.inv(wave, partial.row(irow));  // c2r
-        ret.row(irow) = wave;
-    }
-
-    return ret;
-}
-
-WireCell::Array::array_xxc WireCell::Array::idft_cc(const WireCell::Array::array_xxc& arr, int dim)
-{
-    const int nrows = arr.rows();
-    const int ncols = arr.cols();
-
-    // gEigenFFT works on matrices, not arrays, also don't step on const input
-    Eigen::MatrixXcf ret(nrows, ncols);
-    ret = arr.matrix();
-
-    if (dim == 1) {
-        for (int icol = 0; icol < ncols; ++icol) {
-            Eigen::VectorXcf pspec(nrows);
-            gEigenFFT_dft_1d.inv(pspec, ret.col(icol));  // c2c
-            ret.col(icol) = pspec;
-        }
-    }
-    else if (dim == 0) {
-        for (int irow = 0; irow < nrows; ++irow) {
-            Eigen::VectorXcf pspec(ncols);
-            gEigenFFT_dft_1d.inv(pspec, ret.row(irow));  // c2c
-            ret.row(irow) = pspec;
-        }
-    }
-    return ret;
-}
-
-WireCell::Array::array_xxf WireCell::Array::idft_cr(const WireCell::Array::array_xxc& arr, int dim)
-{
-    const int nrows = arr.rows();
-    const int ncols = arr.cols();
-
-    // gEigenFFT works on matrices, not arrays, also don't step on const input
-    Eigen::MatrixXcf partial(nrows, ncols);
-    partial = arr.matrix();
-
-    array_xxf ret(nrows, ncols);
-
-    if (dim == 0) {
-        for (int irow = 0; irow < nrows; ++irow) {
-            Eigen::VectorXf wave(ncols);                        // back to real-valued time series
-            gEigenFFT_dft_c2r_1d.inv(wave, partial.row(irow));  // c2r
-            ret.row(irow) = wave;
-        }
-    }
-    else if (dim == 1) {
-        for (int icol = 0; icol < ncols; ++icol) {
-            Eigen::VectorXf wave(nrows);
-            gEigenFFT_dft_c2r_1d.inv(wave, partial.col(icol));  // c2r
-            ret.col(icol) = wave;
-        }
-    }
-    return ret;
-}
-
-// this is a cut-and-paste mashup of dft() and idft() in order to avoid temporaries.
-WireCell::Array::array_xxf WireCell::Array::deconv(const WireCell::Array::array_xxf& arr,
-                                                   const WireCell::Array::array_xxc& filter)
-{
-    const int nrows = arr.rows();
-    const int ncols = arr.cols();
-
-    Eigen::MatrixXcf matc(nrows, ncols);
-    for (int irow = 0; irow < nrows; ++irow) {
-        Eigen::VectorXcf fspec(ncols);  // frequency spectrum
-        // gEigenFFT wants vectors, also input arr is const
-        Eigen::VectorXf tmp = arr.row(irow);
-        gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
-        matc.row(irow) = fspec;
-    }
-
-    for (int icol = 0; icol < ncols; ++icol) {
-        Eigen::VectorXcf pspec(nrows);                // periodicity spectrum
-        gEigenFFT_dft_1d.fwd(pspec, matc.col(icol));  // c2c
-        matc.col(icol) = pspec;
-    }
-
-    // deconvolution via multiplication in frequency space
-    Eigen::MatrixXcf filt = matc.array() * filter;
-
-    for (int icol = 0; icol < ncols; ++icol) {
-        Eigen::VectorXcf pspec(nrows);                // wire spectrum
-        gEigenFFT_dft_1d.inv(pspec, filt.col(icol));  // c2c
-        filt.col(icol) = pspec;
-    }
-
-    array_xxf ret(nrows, ncols);
-
-    for (int irow = 0; irow < nrows; ++irow) {
-        Eigen::VectorXf wave(ncols);                     // back to real-valued time series
-        gEigenFFT_dft_c2r_1d.inv(wave, filt.row(irow));  // c2r
-        ret.row(irow) = wave;
-    }
-
-    return ret;
-}
+// WireCell::Array::array_xxc WireCell::Array::dft(const WireCell::Array::array_xxf& arr)
+// {
+//     const int nrows = arr.rows();
+//     const int ncols = arr.cols();
+
+//     Eigen::MatrixXcf matc(nrows, ncols);
+
+//     for (int irow = 0; irow < nrows; ++irow) {
+//         Eigen::VectorXcf fspec(ncols);  // frequency spectrum
+//         // gEigenFFT wants vectors, also input arr is const
+//         Eigen::VectorXf tmp = arr.row(irow);
+//         gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
+//         matc.row(irow) = fspec;
+//     }
+
+//     for (int icol = 0; icol < ncols; ++icol) {
+//         Eigen::VectorXcf pspec(nrows);                // periodicity spectrum
+//         gEigenFFT_dft_1d.fwd(pspec, matc.col(icol));  // c2c
+//         matc.col(icol) = pspec;
+//     }
+
+//     return matc;
+// }
+
+// WireCell::Array::array_xxc WireCell::Array::dft_rc(const WireCell::Array::array_xxf& arr, int dim)
+// {
+//     const int nrows = arr.rows();
+//     const int ncols = arr.cols();
+
+//     Eigen::MatrixXcf matc(nrows, ncols);
+
+//     if (dim == 0) {
+//         for (int irow = 0; irow < nrows; ++irow) {
+//             Eigen::VectorXcf fspec(ncols);
+//             Eigen::VectorXf tmp = arr.row(irow);
+//             gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
+//             matc.row(irow) = fspec;
+//         }
+//     }
+//     else if (dim == 1) {
+//         for (int icol = 0; icol < ncols; ++icol) {
+//             Eigen::VectorXcf fspec(nrows);
+//             Eigen::VectorXf tmp = arr.col(icol);
+//             gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
+//             matc.col(icol) = fspec;
+//         }
+//     }
+//     return matc;
+// }
+
+// WireCell::Array::array_xxc WireCell::Array::dft_cc(const WireCell::Array::array_xxc& arr, int dim)
+// {
+//     const int nrows = arr.rows();
+//     const int ncols = arr.cols();
+
+//     Eigen::MatrixXcf matc(nrows, ncols);
+
+//     matc = arr.matrix();
+
+//     if (dim == 0) {
+//         for (int irow = 0; irow < nrows; ++irow) {
+//             Eigen::VectorXcf pspec(ncols);
+//             gEigenFFT_dft_1d.fwd(pspec, matc.row(irow));  // c2c
+//             matc.row(irow) = pspec;
+//         }
+//     }
+//     else {
+//         for (int icol = 0; icol < ncols; ++icol) {
+//             Eigen::VectorXcf pspec(nrows);
+//             gEigenFFT_dft_1d.fwd(pspec, matc.col(icol));  // c2c
+//             matc.col(icol) = pspec;
+//         }
+//     }
+//     return matc;
+// }
+
+// WireCell::Array::array_xxf WireCell::Array::idft(const WireCell::Array::array_xxc& arr)
+// {
+//     const int nrows = arr.rows();
+//     const int ncols = arr.cols();
+
+//     // gEigenFFT works on matrices, not arrays, also don't step on const input
+//     Eigen::MatrixXcf partial(nrows, ncols);
+//     partial = arr.matrix();
+
+//     for (int icol = 0; icol < ncols; ++icol) {
+//         Eigen::VectorXcf pspec(nrows);                   // wire spectrum
+//         gEigenFFT_dft_1d.inv(pspec, partial.col(icol));  // c2c
+//         partial.col(icol) = pspec;
+//     }
+
+//     // shared_array_xxf ret = std::make_shared<array_xxf> (nrows, ncols);
+//     array_xxf ret(nrows, ncols);
+
+//     for (int irow = 0; irow < nrows; ++irow) {
+//         Eigen::VectorXf wave(ncols);                        // back to real-valued time series
+//         gEigenFFT_dft_c2r_1d.inv(wave, partial.row(irow));  // c2r
+//         ret.row(irow) = wave;
+//     }
+
+//     return ret;
+// }
+
+// WireCell::Array::array_xxc WireCell::Array::idft_cc(const WireCell::Array::array_xxc& arr, int dim)
+// {
+//     const int nrows = arr.rows();
+//     const int ncols = arr.cols();
+
+//     // gEigenFFT works on matrices, not arrays, also don't step on const input
+//     Eigen::MatrixXcf ret(nrows, ncols);
+//     ret = arr.matrix();
+
+//     if (dim == 1) {
+//         for (int icol = 0; icol < ncols; ++icol) {
+//             Eigen::VectorXcf pspec(nrows);
+//             gEigenFFT_dft_1d.inv(pspec, ret.col(icol));  // c2c
+//             ret.col(icol) = pspec;
+//         }
+//     }
+//     else if (dim == 0) {
+//         for (int irow = 0; irow < nrows; ++irow) {
+//             Eigen::VectorXcf pspec(ncols);
+//             gEigenFFT_dft_1d.inv(pspec, ret.row(irow));  // c2c
+//             ret.row(irow) = pspec;
+//         }
+//     }
+//     return ret;
+// }
+
+// WireCell::Array::array_xxf WireCell::Array::idft_cr(const WireCell::Array::array_xxc& arr, int dim)
+// {
+//     const int nrows = arr.rows();
+//     const int ncols = arr.cols();
+
+//     // gEigenFFT works on matrices, not arrays, also don't step on const input
+//     Eigen::MatrixXcf partial(nrows, ncols);
+//     partial = arr.matrix();
+
+//     array_xxf ret(nrows, ncols);
+
+//     if (dim == 0) {
+//         for (int irow = 0; irow < nrows; ++irow) {
+//             Eigen::VectorXf wave(ncols);                        // back to real-valued time series
+//             gEigenFFT_dft_c2r_1d.inv(wave, partial.row(irow));  // c2r
+//             ret.row(irow) = wave;
+//         }
+//     }
+//     else if (dim == 1) {
+//         for (int icol = 0; icol < ncols; ++icol) {
+//             Eigen::VectorXf wave(nrows);
+//             gEigenFFT_dft_c2r_1d.inv(wave, partial.col(icol));  // c2r
+//             ret.col(icol) = wave;
+//         }
+//     }
+//     return ret;
+// }
+
+// // this is a cut-and-paste mashup of dft() and idft() in order to avoid temporaries.
+// WireCell::Array::array_xxf WireCell::Array::deconv(const WireCell::Array::array_xxf& arr,
+//                                                    const WireCell::Array::array_xxc& filter)
+// {
+//     const int nrows = arr.rows();
+//     const int ncols = arr.cols();
+
+//     Eigen::MatrixXcf matc(nrows, ncols);
+//     for (int irow = 0; irow < nrows; ++irow) {
+//         Eigen::VectorXcf fspec(ncols);  // frequency spectrum
+//         // gEigenFFT wants vectors, also input arr is const
+//         Eigen::VectorXf tmp = arr.row(irow);
+//         gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
+//         matc.row(irow) = fspec;
+//     }
+
+//     for (int icol = 0; icol < ncols; ++icol) {
+//         Eigen::VectorXcf pspec(nrows);                // periodicity spectrum
+//         gEigenFFT_dft_1d.fwd(pspec, matc.col(icol));  // c2c
+//         matc.col(icol) = pspec;
+//     }
+
+//     // deconvolution via multiplication in frequency space
+//     Eigen::MatrixXcf filt = matc.array() * filter;
+
+//     for (int icol = 0; icol < ncols; ++icol) {
+//         Eigen::VectorXcf pspec(nrows);                // wire spectrum
+//         gEigenFFT_dft_1d.inv(pspec, filt.col(icol));  // c2c
+//         filt.col(icol) = pspec;
+//     }
+
+//     array_xxf ret(nrows, ncols);
+
+//     for (int irow = 0; irow < nrows; ++irow) {
+//         Eigen::VectorXf wave(ncols);                     // back to real-valued time series
+//         gEigenFFT_dft_c2r_1d.inv(wave, filt.row(irow));  // c2r
+//         ret.row(irow) = wave;
+//     }
+
+//     return ret;
+// }
 
 WireCell::Array::array_xxf WireCell::Array::downsample(const Array::array_xxf& in, const unsigned int k, const int dim)
 {
@@ -287,4 +287,4 @@ WireCell::Array::array_xxf WireCell::Array::baseline_subtraction(const Array::ar
         }
     }
     return ret;
-}
\ No newline at end of file
+}
diff --git a/util/src/Waveform.cxx b/util/src/Waveform.cxx
index 7817740e5..fcdee5e3e 100644
--- a/util/src/Waveform.cxx
+++ b/util/src/Waveform.cxx
@@ -155,80 +155,80 @@ std::pair<int, int> WireCell::Waveform::edge(const realseq_t& wave)
     return std::make_pair(imin, imax);
 }
 
-thread_local static Eigen::FFT<Waveform::real_t> gEigenFFT;
-
-Waveform::compseq_t WireCell::Waveform::dft(realseq_t wave)
-{
-    auto v = Eigen::Map<Eigen::VectorXf>(wave.data(), wave.size());
-    Eigen::VectorXcf ret = gEigenFFT.fwd(v);
-    return compseq_t(ret.data(), ret.data() + ret.size());
-}
-
-Waveform::realseq_t WireCell::Waveform::idft(compseq_t spec)
-{
-    auto v = Eigen::Map<Eigen::VectorXcf>(spec.data(), spec.size());
-    Eigen::VectorXf ret;
-    gEigenFFT.inv(ret, v);
-    return realseq_t(ret.data(), ret.data() + ret.size());
-}
-
-// Linear convolution, returns in1.size()+in2.size()-1.
-Waveform::realseq_t WireCell::Waveform::linear_convolve(Waveform::realseq_t in1, Waveform::realseq_t in2, bool truncate)
-{
-    size_t n1_orig = in1.size(), n2_orig = in2.size();
-    size_t n_out = n1_orig + n2_orig - 1;
-
-    in1.resize(n_out, 0);
-    in2.resize(n_out, 0);
-
-    auto v1 = Eigen::Map<Eigen::VectorXf>(in1.data(), in1.size());
-    auto v2 = Eigen::Map<Eigen::VectorXf>(in2.data(), in2.size());
-
-    Eigen::FFT<Waveform::real_t> trans;
-
-    Eigen::VectorXcf s1 = trans.fwd(v1);
-    Eigen::VectorXcf s2 = trans.fwd(v2);
-    Eigen::VectorXcf s12 = (s1.array() * s2.array()).matrix();
-    Eigen::VectorXf vret;
-    trans.inv(vret, s12);
-    realseq_t ret(vret.data(), vret.data() + vret.size());
-    if (truncate) {
-        ret.resize(n1_orig);
-    }
-    return ret;
-}
-
-// Replace old response in wave with new response.
-Waveform::realseq_t WireCell::Waveform::replace_convolve(Waveform::realseq_t wave, Waveform::realseq_t newres,
-                                                         Waveform::realseq_t oldres, bool truncate)
-{
-    size_t sizes[3] = {wave.size(), newres.size(), oldres.size()};
-    size_t n_out = sizes[0] + sizes[1] + sizes[2] - *std::min_element(sizes, sizes + 3) - 1;
-
-    wave.resize(n_out, 0);
-    newres.resize(n_out, 0);
-    oldres.resize(n_out, 0);
-
-    auto v1 = Eigen::Map<Eigen::VectorXf>(wave.data(), wave.size());
-    auto v2 = Eigen::Map<Eigen::VectorXf>(newres.data(), newres.size());
-    auto v3 = Eigen::Map<Eigen::VectorXf>(oldres.data(), oldres.size());
-
-    Eigen::FFT<Waveform::real_t> trans;
-
-    Eigen::VectorXcf s1 = trans.fwd(v1);
-    Eigen::VectorXcf s2 = trans.fwd(v2);
-    Eigen::VectorXcf s3 = trans.fwd(v3);
-
-    Eigen::VectorXcf s123 = (s1.array() * s2.array() / s3.array()).matrix();
-
-    Eigen::VectorXf vret;
-    trans.inv(vret, s123);
-    realseq_t ret(vret.data(), vret.data() + vret.size());
-    if (truncate) {
-        ret.resize(sizes[0]);
-    }
-    return ret;
-}
+// thread_local static Eigen::FFT<Waveform::real_t> gEigenFFT;
+
+// Waveform::compseq_t WireCell::Waveform::dft(realseq_t wave)
+// {
+//     auto v = Eigen::Map<Eigen::VectorXf>(wave.data(), wave.size());
+//     Eigen::VectorXcf ret = gEigenFFT.fwd(v);
+//     return compseq_t(ret.data(), ret.data() + ret.size());
+// }
+
+// Waveform::realseq_t WireCell::Waveform::idft(compseq_t spec)
+// {
+//     auto v = Eigen::Map<Eigen::VectorXcf>(spec.data(), spec.size());
+//     Eigen::VectorXf ret;
+//     gEigenFFT.inv(ret, v);
+//     return realseq_t(ret.data(), ret.data() + ret.size());
+// }
+
+// // Linear convolution, returns in1.size()+in2.size()-1.
+// Waveform::realseq_t WireCell::Waveform::linear_convolve(Waveform::realseq_t in1, Waveform::realseq_t in2, bool truncate)
+// {
+//     size_t n1_orig = in1.size(), n2_orig = in2.size();
+//     size_t n_out = n1_orig + n2_orig - 1;
+
+//     in1.resize(n_out, 0);
+//     in2.resize(n_out, 0);
+
+//     auto v1 = Eigen::Map<Eigen::VectorXf>(in1.data(), in1.size());
+//     auto v2 = Eigen::Map<Eigen::VectorXf>(in2.data(), in2.size());
+
+//     Eigen::FFT<Waveform::real_t> trans;
+
+//     Eigen::VectorXcf s1 = trans.fwd(v1);
+//     Eigen::VectorXcf s2 = trans.fwd(v2);
+//     Eigen::VectorXcf s12 = (s1.array() * s2.array()).matrix();
+//     Eigen::VectorXf vret;
+//     trans.inv(vret, s12);
+//     realseq_t ret(vret.data(), vret.data() + vret.size());
+//     if (truncate) {
+//         ret.resize(n1_orig);
+//     }
+//     return ret;
+// }
+
+// // Replace old response in wave with new response.
+// Waveform::realseq_t WireCell::Waveform::replace_convolve(Waveform::realseq_t wave, Waveform::realseq_t newres,
+//                                                          Waveform::realseq_t oldres, bool truncate)
+// {
+//     size_t sizes[3] = {wave.size(), newres.size(), oldres.size()};
+//     size_t n_out = sizes[0] + sizes[1] + sizes[2] - *std::min_element(sizes, sizes + 3) - 1;
+
+//     wave.resize(n_out, 0);
+//     newres.resize(n_out, 0);
+//     oldres.resize(n_out, 0);
+
+//     auto v1 = Eigen::Map<Eigen::VectorXf>(wave.data(), wave.size());
+//     auto v2 = Eigen::Map<Eigen::VectorXf>(newres.data(), newres.size());
+//     auto v3 = Eigen::Map<Eigen::VectorXf>(oldres.data(), oldres.size());
+
+//     Eigen::FFT<Waveform::real_t> trans;
+
+//     Eigen::VectorXcf s1 = trans.fwd(v1);
+//     Eigen::VectorXcf s2 = trans.fwd(v2);
+//     Eigen::VectorXcf s3 = trans.fwd(v3);
+
+//     Eigen::VectorXcf s123 = (s1.array() * s2.array() / s3.array()).matrix();
+
+//     Eigen::VectorXf vret;
+//     trans.inv(vret, s123);
+//     realseq_t ret(vret.data(), vret.data() + vret.size());
+//     if (truncate) {
+//         ret.resize(sizes[0]);
+//     }
+//     return ret;
+// }
 
 WireCell::Waveform::BinRangeList WireCell::Waveform::merge(const WireCell::Waveform::BinRangeList& brl)
 {
diff --git a/util/test/test_array.cxx b/util/test/test_array.cxx
index 85846ee00..888711022 100644
--- a/util/test/test_array.cxx
+++ b/util/test/test_array.cxx
@@ -69,88 +69,88 @@ bool same(const arrtype& a1, const arrtype& a2, double eps = 1.0e-6)
     return (diff <= eps);
 }
 
-void test_partial(ExecMon& em)
-{
-    const int nrows = 300;
-    const int ncols = 1000;
-
-    auto arr = my_great_array(em, nrows, ncols);
-    em("test_partial: make array");
-
-    auto spec = dft(arr);
-    auto spec_rc = dft_rc(arr);
-    auto spec_cc = dft_cc(spec_rc);
-    em("test_partial: forward");
-
-    auto arr2 = idft(spec);
-    auto arr2_cc = idft_cc(spec_cc);
-    auto arr2_cr = idft_cr(arr2_cc);
-    em("test_partial: reverse");
-
-    Assert(same(spec, spec_cc));
-    Assert(same(arr, arr2));
-    Assert(same(arr2, arr2_cr));
-
-    const int nrounds = 100;
-
-    for (int count = 0; count < nrounds; ++count) {
-        auto spec = dft(arr);
-        auto orig = idft(spec);
-    }
-    em("test_partial: direct round trip");
-    for (int count = 0; count < nrounds; ++count) {
-        auto spec_rc = dft_rc(arr);
-        auto spec_cc = dft_cc(spec_rc);
-        auto arr2_cc = idft_cc(spec_cc);
-        auto arr2_cr = idft_cr(arr2_cc);
-    }
-    em("test_partial: partial round trip");
-}
-
-void test_dft(ExecMon& em)
-{
-    const int nrows = 300;
-    const int ncols = 1000;
-
-    const int nrounds = 100;
-
-    auto arr = my_great_array(em, nrows, ncols);
-    em("dft: make array");
-    for (int count = 0; count < nrounds; ++count) {
-        auto spec = dft(arr);
-        auto orig = idft(spec);
-    }
-    em("dft with floats");
-#ifdef WCT_HACK_FOR_FFTW_NO_SP
-    for (int count = 0; count < nrounds; ++count) {
-        auto spec = dftd(arr);
-        auto orig = idftd(spec);
-    }
-    em("dft up/down cast through doubles");
-#endif
-}
-
-void test_deconv(ExecMon& em)
-{
-    const int nrows = 300;
-    const int ncols = 1000;
-
-    em("deconv: start");
-    auto arr = my_great_array(em, nrows, ncols);
-    em("deconv: got array");
-    array_xxc filt = Eigen::ArrayXXcf::Zero(nrows, ncols) + 1.0;
-    em("deconv: got filter");
-    auto deco = deconv(arr, filt);
-    em("deconv: done");  // 38ms opt, 274 debug
-
-    array_xxf diff = arr - deco;
-    em("deconv: diff");
-
-    double norm = diff.matrix().norm();
-    em("deconv: norm");
-    cerr << "got norm of diff " << norm << endl;
-    Assert(norm < 0.001);
-}
+// void test_partial(ExecMon& em)
+// {
+//     const int nrows = 300;
+//     const int ncols = 1000;
+
+//     auto arr = my_great_array(em, nrows, ncols);
+//     em("test_partial: make array");
+
+//     auto spec = dft(arr);
+//     auto spec_rc = dft_rc(arr);
+//     auto spec_cc = dft_cc(spec_rc);
+//     em("test_partial: forward");
+
+//     auto arr2 = idft(spec);
+//     auto arr2_cc = idft_cc(spec_cc);
+//     auto arr2_cr = idft_cr(arr2_cc);
+//     em("test_partial: reverse");
+
+//     Assert(same(spec, spec_cc));
+//     Assert(same(arr, arr2));
+//     Assert(same(arr2, arr2_cr));
+
+//     const int nrounds = 100;
+
+//     for (int count = 0; count < nrounds; ++count) {
+//         auto spec = dft(arr);
+//         auto orig = idft(spec);
+//     }
+//     em("test_partial: direct round trip");
+//     for (int count = 0; count < nrounds; ++count) {
+//         auto spec_rc = dft_rc(arr);
+//         auto spec_cc = dft_cc(spec_rc);
+//         auto arr2_cc = idft_cc(spec_cc);
+//         auto arr2_cr = idft_cr(arr2_cc);
+//     }
+//     em("test_partial: partial round trip");
+// }
+
+// void test_dft(ExecMon& em)
+// {
+//     const int nrows = 300;
+//     const int ncols = 1000;
+
+//     const int nrounds = 100;
+
+//     auto arr = my_great_array(em, nrows, ncols);
+//     em("dft: make array");
+//     for (int count = 0; count < nrounds; ++count) {
+//         auto spec = dft(arr);
+//         auto orig = idft(spec);
+//     }
+//     em("dft with floats");
+// #ifdef WCT_HACK_FOR_FFTW_NO_SP
+//     for (int count = 0; count < nrounds; ++count) {
+//         auto spec = dftd(arr);
+//         auto orig = idftd(spec);
+//     }
+//     em("dft up/down cast through doubles");
+// #endif
+// }
+
+// void test_deconv(ExecMon& em)
+// {
+//     const int nrows = 300;
+//     const int ncols = 1000;
+
+//     em("deconv: start");
+//     auto arr = my_great_array(em, nrows, ncols);
+//     em("deconv: got array");
+//     array_xxc filt = Eigen::ArrayXXcf::Zero(nrows, ncols) + 1.0;
+//     em("deconv: got filter");
+//     auto deco = deconv(arr, filt);
+//     em("deconv: done");  // 38ms opt, 274 debug
+
+//     array_xxf diff = arr - deco;
+//     em("deconv: diff");
+
+//     double norm = diff.matrix().norm();
+//     em("deconv: norm");
+//     cerr << "got norm of diff " << norm << endl;
+//     Assert(norm < 0.001);
+// }
 
 void test_division(ExecMon& em)
 {
@@ -200,11 +200,11 @@ int main()
 {
     WireCell::ExecMon em;
 
-    test_partial(em);
+    // test_partial(em);
     test_copy(em);
     test_return(em);
-    test_dft(em);
-    test_deconv(em);
+    // test_dft(em);
+    // test_deconv(em);
     test_division(em);
     test_division_complex(em);
 
diff --git a/util/test/test_waveform.cxx b/util/test/test_waveform.cxx
index 23b30ed2c..ed7c230a6 100644
--- a/util/test/test_waveform.cxx
+++ b/util/test/test_waveform.cxx
@@ -40,29 +40,6 @@ void test_mean_rms()
     cerr << us.first << " +/- " << us.second << " med=" << m << endl;
 }
 
-void test_fft()
-{
-    Waveform::realseq_t s;
-    const int nbins = 360;
-    for (int ind = 0; ind < nbins; ++ind) {
-        double phi = ind * 3.1415 / 180.0;
-        Waveform::real_t val = sin(phi) + sin(11.0 / 7.0 * phi);
-        s.push_back(val);
-    }
-
-    auto spec = Waveform::dft(s);
-    for (int ind = 0; ind < nbins; ++ind) {
-        auto c = spec[ind];
-        cerr << ind << "\ts=" << s[ind] << "\tc=" << c << "\tmag=" << std::abs(c) << "\tphi=" << std::arg(c) << endl;
-    }
-    cerr << s.size() << " " << spec.size() << endl;
-}
-
-void test_complex()
-{
-    Waveform::compseq_t cv{{1.1, 2.2}, {-3.3, 4.4}, {0, 0}, {1, 0}, {0, 1}, {-1, 0}, {0, -1}};
-    auto bogus = Waveform::idft(cv);
-}
 
 void test_arithmetic()
 {
@@ -94,8 +71,6 @@ void test_arithmetic()
 int main(int argc, char* argv[])
 {
     test_transform();
-    test_fft();
-    test_complex();
     test_mean_rms();
     test_arithmetic();
 

From 927d8ef9d40c5bad2b9c5e1ae9a28268f4732fa0 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 29 Nov 2021 12:27:09 -0500
Subject: [PATCH 28/46] Fix lack of storing device name.

---
 gen/inc/WireCellGen/PlaneImpactResponse.h  | 1 +
 pytorch/inc/WireCellPytorch/TorchContext.h | 2 +-
 pytorch/src/DNNROIFinding.cxx              | 3 ++-
 pytorch/src/TorchContext.cxx               | 1 +
 pytorch/src/TorchService.cxx               | 9 +++++----
 5 files changed, 10 insertions(+), 6 deletions(-)

diff --git a/gen/inc/WireCellGen/PlaneImpactResponse.h b/gen/inc/WireCellGen/PlaneImpactResponse.h
index ec304c865..d1cb968e9 100644
--- a/gen/inc/WireCellGen/PlaneImpactResponse.h
+++ b/gen/inc/WireCellGen/PlaneImpactResponse.h
@@ -33,6 +33,7 @@ namespace WireCell {
                            const Waveform::realseq_t& wf, int waveform_pad,
                            const Waveform::realseq_t& long_wf, int long_waveform_pad)
               : m_impact(impact)
+              , m_spectrum(spectrum)
               , m_waveform(wf)
               , m_waveform_pad(waveform_pad)
               , m_long_waveform(long_wf)
diff --git a/pytorch/inc/WireCellPytorch/TorchContext.h b/pytorch/inc/WireCellPytorch/TorchContext.h
index 66979a1c5..6df72d090 100644
--- a/pytorch/inc/WireCellPytorch/TorchContext.h
+++ b/pytorch/inc/WireCellPytorch/TorchContext.h
@@ -38,7 +38,7 @@ namespace WireCell::Pytorch {
       private:
 
         torch::Device m_dev{torch::kCPU};
-        std::string m_devname;
+        std::string m_devname{""};
         ISemaphore::pointer m_sem;
      };
 
diff --git a/pytorch/src/DNNROIFinding.cxx b/pytorch/src/DNNROIFinding.cxx
index c875f9714..f3fda52df 100644
--- a/pytorch/src/DNNROIFinding.cxx
+++ b/pytorch/src/DNNROIFinding.cxx
@@ -234,7 +234,8 @@ bool Pytorch::DNNROIFinding::operator()(const IFrame::pointer& inframe, IFrame::
     std::vector<torch::jit::IValue> inputs;
     inputs.push_back(batch);
 
-    log->debug(tk(fmt::format("call={} calling model", m_save_count)));
+    log->debug(tk(fmt::format("call={} calling model \"{}\"",
+                              m_save_count, m_cfg.forward)));
 
     // Execute the model and turn its output into a tensor.
     auto iitens = Pytorch::to_itensor(inputs);
diff --git a/pytorch/src/TorchContext.cxx b/pytorch/src/TorchContext.cxx
index ed219f93b..72262f24b 100644
--- a/pytorch/src/TorchContext.cxx
+++ b/pytorch/src/TorchContext.cxx
@@ -27,6 +27,7 @@ void TorchContext::connect(const std::string& devname,
         }
         m_dev = torch::Device(torch::kCUDA, devnum);
     }
+    m_devname = devname;
 
     std::string s_tn = "Semaphore:torch-" + devname;
     if (not semname.empty()) {
diff --git a/pytorch/src/TorchService.cxx b/pytorch/src/TorchService.cxx
index b78a3a8d0..c09243657 100644
--- a/pytorch/src/TorchService.cxx
+++ b/pytorch/src/TorchService.cxx
@@ -49,19 +49,20 @@ void Pytorch::TorchService::configure(const WireCell::Configuration& cfg)
         m_module = torch::jit::load(model_path, m_ctx.device());
     }
     catch (const c10::Error& e) {
-        log->critical("error loading model: {} to {}: {}",
+        log->critical("error loading model: \"{}\" to device \"{}\": {}",
                       model_path, dev, e.what());
         throw;                  // rethrow
     }
 
-    log->debug("loaded model {} to {}", model_path, dev);
+    log->debug("loaded model \"{}\" to device \"{}\"",
+               model_path, m_ctx.devname());
 }
 
 ITensorSet::pointer Pytorch::TorchService::forward(const ITensorSet::pointer& in) const
 {
     TorchSemaphore sem(m_ctx);
 
-    log->debug("running model on {}", m_ctx.devname());
+    log->debug("running model on device: \"{}\"", m_ctx.devname());
 
     torch::NoGradGuard no_grad;
 
@@ -72,7 +73,7 @@ ITensorSet::pointer Pytorch::TorchService::forward(const ITensorSet::pointer& in
         oival = m_module.forward(iival);
     }
     catch (const std::runtime_error& err) {
-        log->error("error running model on {}: {}",
+        log->error("error running model on device \"{}\": {}",
                    m_ctx.devname(), err.what());
         return nullptr;
     }

From fedd276c00b8e286b3c810f5b381c3d3c9e21ea9 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 29 Nov 2021 12:28:13 -0500
Subject: [PATCH 29/46] Fix the ignored base class config methods by
 removing/moving the base code into the one and only subclass

---
 sigproc/inc/WireCellSigProc/Protodune.h | 35 ++++-----------------
 sigproc/src/Protodune.cxx               | 42 +++++--------------------
 2 files changed, 13 insertions(+), 64 deletions(-)

diff --git a/sigproc/inc/WireCellSigProc/Protodune.h b/sigproc/inc/WireCellSigProc/Protodune.h
index f83f7b06b..2fa443b00 100644
--- a/sigproc/inc/WireCellSigProc/Protodune.h
+++ b/sigproc/inc/WireCellSigProc/Protodune.h
@@ -30,35 +30,8 @@ namespace WireCell {
             bool FftScaling(const IDFT::pointer& dft,
                             WireCell::Waveform::realseq_t& signal, int nsamples);
 
-            // hold common config stuff
-            class ConfigFilterBase : public WireCell::IConfigurable {
-               public:
-                ConfigFilterBase(const std::string& anode = "AnodePlane",
-                                 const std::string& noisedb = "OmniChannelNoiseDB");
-                virtual ~ConfigFilterBase();
-
-                // IConfigurable configuration interface
-                virtual void configure(const WireCell::Configuration& config);
-                virtual WireCell::Configuration default_configuration() const;
-
-                // FIXME: this method needs to die.
-                void set_channel_noisedb(WireCell::IChannelNoiseDatabase::pointer ndb) { m_noisedb = ndb; }
-
-               protected:
-                std::string m_anode_tn, m_noisedb_tn;
-                IAnodePlane::pointer m_anode;
-                IChannelNoiseDatabase::pointer m_noisedb;
-                IDFT::pointer m_dft;
-            };
-
-            /** Microboone/ProtoDUNE style noise subtraction.
+            /** ProtoDUNE style noise subtraction.
              *
-             * Fixme: in principle, this class could be general purpose
-             * for other detectors.  However, it uses the functions above
-             * which hard code microboone-isms.  If those
-             * microboone/protodune-specific parameters can be pulled out to a
-             * higher layer then this class can become generic and move
-             * outside of this file.
              */
 
             class StickyCodeMitig : public WireCell::IChannelFilter, public WireCell::IConfigurable {
@@ -91,7 +64,7 @@ namespace WireCell {
                 int m_stky_max_len;
             };
 
-            class OneChannelNoise : public WireCell::IChannelFilter, public ConfigFilterBase {
+            class OneChannelNoise : public WireCell::IChannelFilter, public WireCell::IConfigurable {
                public:
                 OneChannelNoise(const std::string& anode_tn = "AnodePlane",
                                 const std::string& noisedb = "OmniChannelNoiseDB");
@@ -109,8 +82,12 @@ namespace WireCell {
                 WireCell::Configuration default_configuration() const;
 
                private:
+                std::string m_anode_tn, m_noisedb_tn;
                 Diagnostics::Partial m_check_partial;  // at least need to expose them to configuration
                 std::map<int, int> m_resmp;            // ch => orignal smp input
+                IAnodePlane::pointer m_anode;
+                IChannelNoiseDatabase::pointer m_noisedb;
+                IDFT::pointer m_dft;
             };
 
             // A relative gain correction based on David Adam's pulse area calibration
diff --git a/sigproc/src/Protodune.cxx b/sigproc/src/Protodune.cxx
index 4eece13a8..05cabbf9f 100644
--- a/sigproc/src/Protodune.cxx
+++ b/sigproc/src/Protodune.cxx
@@ -561,36 +561,6 @@ bool Protodune::FftScaling(const IDFT::pointer& dft,
  * Classes
  */
 
-/*
- * Configuration base class used for a couple filters
- */
-Protodune::ConfigFilterBase::ConfigFilterBase(const std::string& anode, const std::string& noisedb)
-  : m_anode_tn(anode)
-  , m_noisedb_tn(noisedb)
-{
-}
-Protodune::ConfigFilterBase::~ConfigFilterBase() {}
-void Protodune::ConfigFilterBase::configure(const WireCell::Configuration& cfg)
-{
-    m_anode_tn = get(cfg, "anode", m_anode_tn);
-    m_anode = Factory::find_tn<IAnodePlane>(m_anode_tn);
-    m_noisedb_tn = get(cfg, "noisedb", m_noisedb_tn);
-    m_noisedb = Factory::find_tn<IChannelNoiseDatabase>(m_noisedb_tn);
-
-    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
-    m_dft = Factory::find_tn<IDFT>(dft_tn);
-
-    // std::cerr << "ConfigFilterBase: \n" << cfg << "\n";
-}
-WireCell::Configuration Protodune::ConfigFilterBase::default_configuration() const
-{
-    Configuration cfg;
-    cfg["anode"] = m_anode_tn;
-    cfg["noisedb"] = m_noisedb_tn;
-    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
-    return cfg;
-}
-
 Protodune::StickyCodeMitig::StickyCodeMitig(const std::string& anode, const std::string& noisedb,
                                             float stky_sig_like_val, float stky_sig_like_rms, int stky_max_len)
   : m_anode_tn(anode)
@@ -745,8 +715,10 @@ WireCell::Waveform::ChannelMaskMap Protodune::StickyCodeMitig::apply(channel_sig
     return WireCell::Waveform::ChannelMaskMap();
 }
 
+
 Protodune::OneChannelNoise::OneChannelNoise(const std::string& anode, const std::string& noisedb)
-  : ConfigFilterBase(anode, noisedb)
+  : m_anode_tn(anode)
+  , m_noisedb_tn(noisedb)
   , m_check_partial()  // fixme, here too.
   , m_resmp()
 {
@@ -757,13 +729,12 @@ void Protodune::OneChannelNoise::configure(const WireCell::Configuration& cfg)
 {
     m_anode_tn = get(cfg, "anode", m_anode_tn);
     m_anode = Factory::find_tn<IAnodePlane>(m_anode_tn);
-    if (!m_anode) {
-        THROW(KeyError() << errmsg{"failed to get IAnodePlane: " + m_anode_tn});
-    }
-
     m_noisedb_tn = get(cfg, "noisedb", m_noisedb_tn);
     m_noisedb = Factory::find_tn<IChannelNoiseDatabase>(m_noisedb_tn);
 
+    std::string dft_tn = get<std::string>(cfg, "dft", "FftwDFT");
+    m_dft = Factory::find_tn<IDFT>(dft_tn);
+
     m_resmp.clear();
     auto jext = cfg["resmp"];
     if (!jext.isNull()) {
@@ -781,6 +752,7 @@ WireCell::Configuration Protodune::OneChannelNoise::default_configuration() cons
     Configuration cfg;
     cfg["anode"] = m_anode_tn;
     cfg["noisedb"] = m_noisedb_tn;
+    cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
     return cfg;
 }
 

From 28af34979ff808400c29d42fd140409ed164ff01 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Mon, 29 Nov 2021 12:29:31 -0500
Subject: [PATCH 30/46] Measure first exec+plan separate from subsequent execs

---
 root/test/test_fft.cxx | 158 +++++++++++++++++++++++++++++------------
 1 file changed, 113 insertions(+), 45 deletions(-)

diff --git a/root/test/test_fft.cxx b/root/test/test_fft.cxx
index ca20e7900..e5c63a6e7 100644
--- a/root/test/test_fft.cxx
+++ b/root/test/test_fft.cxx
@@ -178,25 +178,30 @@ int main(int argc, char* argv[])
     // do timing tests
     {
         TGraph* timings[4] = {new TGraph, new TGraph, new TGraph, new TGraph};
+        TGraph* timings_1st[4] = {new TGraph, new TGraph, new TGraph, new TGraph};
 
         // Some popular choices with powers-of-two sprinkled in
-        std::vector<int> nsampleslist{128,   256,  400,  480,  // protoDUNE U/V and W channels per plane
-                                      512,
-                                      800,  // protoDUNE, sum of U or V channels for both faces
-                                      960,  // protoDUNE, sum of W channels (or wires) for both faces
-                                      1024,
-                                      1148,  // N wires in U/V plane for protodune
-                                      2048,
-                                      2400,  // number of channels in U or V in microboone
-                                      2560,  // DUNE, total APA channels
-                                      3456,  // number of channels in microboone's W
-                                      4096,
-                                      6000,  // one choice of nticks for protoDUNE
-                                      8192,
-                                      8256,                     // total microboone channels
-                                      9592,  9594, 9595, 9600,  // various microboone readout lengths
-                                      10000,                    // 5 ms at 2MHz readout
-                                      10240, 16384};
+        std::vector<int> nsampleslist{
+            128, 256,        // small powers of 2
+            400, 480,        // protoDUNE U/V and W channels per plane
+            512,
+            800,                // protoDUNE, all U or V channels
+            960,                // protoDUNE, all W channels
+            1024,
+            1148,               // what's this?
+            2000,  // iceberg
+            2048,
+            2400,  // number of channels in U or V in microboone
+            2560,  // DUNE, total APA channels
+            3456,  // number of channels in microboone's W
+            4096,
+            6000,  // one choice of nticks for protoDUNE
+            8192,
+            8256,                     // total microboone channels
+            9587,                     // prime near MB nticks
+            9592,  9594, 9595, 9600,  // various MB nticks
+            10000,                    // 5 ms at 2MHz readout
+            10240, 16384};
         const int ntries = 1000;
         for (auto nsamps : nsampleslist) {
             Response::ColdElec ce(gains[1], shapings[1]);
@@ -204,6 +209,14 @@ int main(int argc, char* argv[])
             Waveform::realseq_t res = ce.generate(bins);
             Waveform::compseq_t spec;
 
+
+            double fwd_time_1st = 0.0;
+            {
+                auto t1 = std::chrono::high_resolution_clock::now();
+                spec = Aux::fwd_r2c(idft, res);
+                auto t2 = std::chrono::high_resolution_clock::now();
+                fwd_time_1st += std::chrono::duration_cast<std::chrono::nanoseconds>(t2 - t1).count();
+            }
             double fwd_time = 0.0;
             for (int itry = 0; itry < ntries; ++itry) {
                 auto t1 = std::chrono::high_resolution_clock::now();
@@ -213,6 +226,13 @@ int main(int argc, char* argv[])
             }
             fwd_time /= ntries;
 
+            double rev_time_1st = 0.0;
+            {
+                auto t1 = std::chrono::high_resolution_clock::now();
+                res = Aux::inv_c2r(idft, spec);
+                auto t2 = std::chrono::high_resolution_clock::now();
+                rev_time_1st = std::chrono::duration_cast<std::chrono::nanoseconds>(t2 - t1).count();
+            }
             double rev_time = 0.0;
             for (int itry = 0; itry < ntries; ++itry) {
                 auto t1 = std::chrono::high_resolution_clock::now();
@@ -233,45 +253,93 @@ int main(int argc, char* argv[])
             timings[1]->SetPoint(timings[1]->GetN(), nsamps, fwd_time / nsamps);
             timings[2]->SetPoint(timings[2]->GetN(), nsamps, rev_time);
             timings[3]->SetPoint(timings[3]->GetN(), nsamps, rev_time / nsamps);
+
+            timings_1st[0]->SetPoint(timings_1st[0]->GetN(), nsamps, fwd_time_1st);
+            timings_1st[1]->SetPoint(timings_1st[1]->GetN(), nsamps, fwd_time_1st / (fwd_time));
+            timings_1st[2]->SetPoint(timings_1st[2]->GetN(), nsamps, rev_time_1st);
+            timings_1st[3]->SetPoint(timings_1st[3]->GetN(), nsamps, rev_time_1st / (rev_time));
+
         }
 
         pdf.canvas.Clear();
         pdf.canvas.Divide(1, 2);
 
-        auto text = new TText;
         {
-            auto pad = pdf.canvas.cd(1);
-            pad->SetGridx();
-            pad->SetGridy();
-            pad->SetLogx();
-            auto graph = timings[0];
-            auto frame = graph->GetHistogram();
-            frame->SetTitle("Fwd/rev DFT timing (absolute)");
-            frame->GetXaxis()->SetTitle("number of samples");
-            frame->GetYaxis()->SetTitle("time (ns)");
-            timings[0]->Draw("AL");
-            timings[2]->Draw("L");
-            for (int ind = 0; ind < graph->GetN(); ++ind) {
-                auto x = graph->GetX()[ind];
-                auto y = graph->GetY()[ind];
-                text->DrawText(x, y, Form("%.0f", x));
+            auto text = new TText;
+            {
+                auto pad = pdf.canvas.cd(1);
+                pad->SetGridx();
+                pad->SetGridy();
+                pad->SetLogx();
+                pad->SetLogy();
+                auto graph = timings[0];
+                auto frame = graph->GetHistogram();
+                frame->SetTitle("Fwd/rev DFT timing (absolute)");
+                frame->GetXaxis()->SetTitle("number of samples");
+                frame->GetYaxis()->SetTitle("time [ns]");
+                timings[0]->Draw("AL");
+                timings[2]->Draw("L");
+                for (int ind = 0; ind < graph->GetN(); ++ind) {
+                    auto x = graph->GetX()[ind];
+                    auto y = graph->GetY()[ind];
+                    text->DrawText(x, y, Form("%.0f", x));
+                }
+            }
+
+            {
+                auto pad = pdf.canvas.cd(2);
+                pad->SetGridx();
+                pad->SetGridy();
+                pad->SetLogx();
+                auto frame = timings[1]->GetHistogram();
+                frame->SetTitle("Fwd/rev DFT timing (relative to size)");
+                frame->GetXaxis()->SetTitle("number of samples");
+                frame->GetYaxis()->SetTitle("time per sample [ns/samp]");
+                timings[1]->Draw("AL");
+                timings[3]->Draw("L");
             }
+            pdf();
         }
 
+        pdf.canvas.Clear();
+        pdf.canvas.Divide(1, 2);
+
         {
-            auto pad = pdf.canvas.cd(2);
-            pad->SetGridx();
-            pad->SetGridy();
-            pad->SetLogx();
-            auto frame = timings[1]->GetHistogram();
-            frame->SetTitle("Fwd/rev DFT timing (relative)");
-            frame->GetXaxis()->SetTitle("number of samples");
-            frame->GetYaxis()->SetTitle("time per sample (ns/samp)");
-            timings[1]->Draw("AL");
-            timings[3]->Draw("L");
+            auto text = new TText;
+            {
+                auto pad = pdf.canvas.cd(1);
+                pad->SetGridx();
+                pad->SetGridy();
+                pad->SetLogx();
+                pad->SetLogy();
+                auto graph = timings_1st[0];
+                auto frame = graph->GetHistogram();
+                frame->SetTitle("fwd/rev DFT timing, ''cold'' (plan+exec) (absolute time)");
+                frame->GetXaxis()->SetTitle("number of samples");
+                frame->GetYaxis()->SetTitle("time [ns]");
+                timings_1st[0]->Draw("AL");
+                timings_1st[2]->Draw("L");
+                for (int ind = 0; ind < graph->GetN(); ++ind) {
+                    auto x = graph->GetX()[ind];
+                    auto y = graph->GetY()[ind];
+                    text->DrawText(x, y, Form("%.0f", x));
+                }
+            }
+
+            {
+                auto pad = pdf.canvas.cd(2);
+                pad->SetGridx();
+                pad->SetGridy();
+                pad->SetLogx();
+                auto frame = timings_1st[1]->GetHistogram();
+                frame->SetTitle("Fwd/rev DFT timing (cold/warm relative)");
+                frame->GetXaxis()->SetTitle("number of samples");
+                frame->GetYaxis()->SetTitle("relative time [ns / ns]");
+                timings_1st[1]->Draw("AL");
+                timings_1st[3]->Draw("L");
+            }
+            pdf();
         }
-        pdf();
     }
-
     return 0;
 }

From 3411d424945f97b60e744c82afb98e9a7a54c709 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 30 Nov 2021 16:18:28 -0500
Subject: [PATCH 31/46] Add single precision complex float

---
 util/inc/custard/pigenc.hpp | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/util/inc/custard/pigenc.hpp b/util/inc/custard/pigenc.hpp
index 6c5b29773..1633ba4e0 100644
--- a/util/inc/custard/pigenc.hpp
+++ b/util/inc/custard/pigenc.hpp
@@ -10,6 +10,7 @@
 #include <ostream>
 #include <string>
 #include <regex>
+#include <complex>
 
 #include "nlohmann/json.hpp"
 
@@ -111,6 +112,7 @@ namespace pigenc {
     template<> inline std::string dtype<int64_t>()  { return "<i8"; }
     template<> inline std::string dtype<uint64_t>() { return "<u8"; }
     template<> inline std::string dtype<float>()    { return "<f4"; }
+    template<> inline std::string dtype<std::complex<float>>()    { return "<c8"; }
     template<> inline std::string dtype<double>()   { return "<f8"; }
 
     // This assumes string like "...NN" where NN is number of bytes.

From f31dcaabac1d8e301c5d6900b9719d239e219bc0 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Tue, 30 Nov 2021 16:19:07 -0500
Subject: [PATCH 32/46] A start on a correctness test for IDFT

---
 aux/inc/WireCellAux/DftTools.h           |   1 -
 aux/test/aux_test_dft_helpers.h          |  11 +-
 aux/test/check_idft.cxx                  | 223 +++++++++++++++++++++++
 cfg/pgrapher/common/helpers/aux.jsonnet  |   3 +
 cfg/pgrapher/common/helpers/gen.jsonnet  |  20 +-
 cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet |   3 +
 6 files changed, 249 insertions(+), 12 deletions(-)
 create mode 100644 aux/test/check_idft.cxx

diff --git a/aux/inc/WireCellAux/DftTools.h b/aux/inc/WireCellAux/DftTools.h
index b072fc684..d4b988806 100644
--- a/aux/inc/WireCellAux/DftTools.h
+++ b/aux/inc/WireCellAux/DftTools.h
@@ -54,7 +54,6 @@ namespace WireCell::Aux {
         std::transform(cvec.begin(), cvec.end(), rvec.begin(),
                        [](const Aux::complex_t& c) { return std::real(c); });
         return rvec;
-        
     }
 
     // 1D high-level interface
diff --git a/aux/test/aux_test_dft_helpers.h b/aux/test/aux_test_dft_helpers.h
index 240d5b667..d91fdfa69 100644
--- a/aux/test/aux_test_dft_helpers.h
+++ b/aux/test/aux_test_dft_helpers.h
@@ -102,6 +102,7 @@ namespace WireCell::Aux::Test {
         std::string pi{"WireCellAux"};
         std::string cfg_name{""};
         std::string output{""};
+        std::vector<std::string> positional;
         Configuration cfg;
     };        
 
@@ -110,13 +111,15 @@ namespace WireCell::Aux::Test {
     {
         CLI::App app{"wct dft test"};
         app.add_option("-o,--output", args.output,
-                   "Output file")->type_size(1)->allow_extra_args(false);
+                       "Output file")->type_size(1)->allow_extra_args(false);
         app.add_option("-p,--plugin", args.pi,
-                   "Plugin")->type_size(1)->allow_extra_args(false);
+                       "Plugin")->type_size(1)->allow_extra_args(false);
         app.add_option("-t,--typename", args.tn,
-                   "Type or Type:Name of IDFT imp")->type_size(1)->allow_extra_args(false);
+                       "Type or Type:Name of IDFT imp")->type_size(1)->allow_extra_args(false);
         app.add_option("-c,--config", args.cfg_name,
-                   "Config file for IDFT imp")->type_size(1)->allow_extra_args(false);
+                       "Config file for IDFT imp")->type_size(1)->allow_extra_args(false);
+        app.add_option("arguments", args.positional,
+                       "Any positional arguments");
         CLI11_PARSE(app, argc, argv);
 
         if (not args.cfg_name.empty()) {
diff --git a/aux/test/check_idft.cxx b/aux/test/check_idft.cxx
new file mode 100644
index 000000000..3e71a4dfa
--- /dev/null
+++ b/aux/test/check_idft.cxx
@@ -0,0 +1,223 @@
+/** Run IDFT operations on input array, write result
+
+    Usage:
+
+    check_idft -c cfg.[json|jsonnet] -o out.tar.bz2 [-p pi -t tn] in.tar.bz2 ...
+
+    The configuration file should be a sequence of objects describing
+    transformations.  Each object with these keys:
+
+    - src : source array name 
+    - dst : destination array name
+    - op : operator name, see below.
+
+    The operator is given as a keyword which encodes 
+
+    - DIR : the direction of the transform, one in {fwd, inv}
+    - R : the rank of the transform (not array), on in {1, 2}
+    - V : a variant of "batched" ("b") or full dimensional ("d")
+    - A : an optional "axis" number in {0,1} for bached
+    - C : an optional conversion between real and complex, in {"r2c", "c2r"}
+
+    Some examples:
+
+    All complex input and complex output:
+
+    - fwd1d :: 1D forward transform on a 1D array
+    - inv2d :: 2D transform on a 2D array
+    - fwd1b1 :: 1D forward transform on axis=1 (each row is transformed) on a 2D array
+
+    Mixed real/complex
+
+    - fwd1d_r2c :: fwd1d on 1D real array producing complex array
+    - inv2d_c2r :: inv2d on 2D complex array producing real array
+
+ */
+
+
+#include "aux_test_dft_helpers.h"
+#include "WireCellUtil/Stream.h"
+#include "WireCellAux/DftTools.h"
+
+#include <boost/iostreams/filtering_stream.hpp>
+
+#include <map>
+#include <string>
+#include <complex>
+#include <algorithm>
+
+using namespace WireCell;
+using namespace WireCell::Stream;
+using namespace WireCell::Aux::Test;
+
+using array_xxf = Eigen::Array<float, Eigen::Dynamic, Eigen::Dynamic>;
+using complex_t = std::complex<float>;
+using array_xxc = Eigen::Array<complex_t, Eigen::Dynamic, Eigen::Dynamic>;
+
+// may hold any dtype and shape
+using pig_array = pigenc::File;
+using array_store = std::map<std::string, pig_array>;
+
+using dft_op = std::function<pig_array(pig_array)>;
+using op_lu_t = std::map<std::string, dft_op>;
+
+using vector_xf = std::vector<float>;
+using vector_xc = std::vector<complex_t>;
+
+
+static
+vector_xf v_c2r(const vector_xc& cvec)
+{
+    vector_xf ret(cvec.size());
+    std::transform(cvec.begin(), cvec.end(), ret.begin(),
+                   [](complex_t c) { return std::real(c); });
+    return ret;
+}
+static
+vector_xc v_c2r(const vector_xf& rvec)
+{
+    vector_xc cret(rvec.size());
+    std::transform(rvec.begin(), rvec.end(), cret.begin(),
+                   [](float re) { return complex_t(re, 0); });
+    return cret;
+}
+
+
+template<typename Scalar>
+static std::vector<Scalar> p2v(const pig_array& pa)
+{
+    auto vec = pa.as_vec<Scalar>();
+    if (vec.empty()) {
+        throw std::runtime_error("p2v type mismatch");
+    }
+    return vec;
+}
+template<typename Scalar>
+pig_array v2p(const std::vector<Scalar>& vec)
+{
+    std::vector<char> data((const char*)vec.data(),
+                           (const char*)vec.data() + sizeof(Scalar)*vec.size());
+    pig_array pa;
+    pa.set<complex_t>(data, {vec.size()});
+    return pa;
+}
+
+
+template<typename Scalar>
+Eigen::Array<Scalar, Eigen::Dynamic, Eigen::Dynamic> p2a(const pig_array& pa)
+{
+    Eigen::Array<Scalar, Eigen::Dynamic, Eigen::Dynamic> arr;
+    bool ok = pigenc::eigen::load(pa, arr);
+    if (!ok) {
+        throw std::runtime_error("p2a type mismatch");
+    }
+    return arr;
+}
+template<typename Scalar>
+pig_array a2p(const Eigen::Array<Scalar, Eigen::Dynamic, Eigen::Dynamic>& arr)
+{
+    pig_array pa;
+    pigenc::eigen::dump(pa, arr);
+    return pa;
+}
+
+
+pig_array dispatch(const IDFT::pointer& dft, const pig_array& pa, const std::string& op)
+{
+    if (op == "fwd1d") 
+        return v2p<complex_t>(Aux::fwd(dft, p2v<complex_t>(pa)));
+
+    if (op == "inv1d") 
+        return v2p<complex_t>(Aux::fwd(dft, p2v<complex_t>(pa)));
+            
+    if (op == "fwd1d_r2c") 
+        return v2p<complex_t>(Aux::fwd_r2c(dft, p2v<float>(pa)));
+
+    if (op == "inv1d_c2r") 
+        return v2p<float>(Aux::inv_c2r(dft, p2v<complex_t>(pa)));
+
+}
+
+int main(int argc, char* argv[])
+{
+    DftArgs args;
+    int rc = make_dft_args(args, argc, argv);
+    if (rc) { return rc; }
+
+    if (args.positional.empty()) {
+        std::cerr << "need at least one input file" << std::endl;
+        return 0;
+    }
+    if (args.output.empty()) {
+        std::cerr << "need output file" << std::endl;
+        return 0;
+    }
+    if (args.cfg.empty()) {
+        std::cerr << "need configuration" << std::endl;
+        return 0;
+    }
+    std::cerr << args.cfg << std::endl;
+    
+    auto idft = make_dft(args.tn, args.pi, args.cfg);
+
+    array_store arrs;
+
+    // Slurp in arrays.
+    for (const auto& sname : args.positional) {
+        boost::iostreams::filtering_istream ins;
+        std::cerr << "openning: "<<sname<<"\n";
+        ins.clear();
+        input_filters(ins, sname);
+        if (ins.size() < 2) {     // expect bz2 + tar filters + file source.
+            std::cerr << "Unexpected file format with: "<<sname<<"\n";
+            return 1;
+        }
+            
+        std::string fname{""};
+        size_t fsize{0};
+        custard::read(ins, fname, fsize);
+        if (ins.eof()) {
+            std::cerr << "EOF on custard head read\n";
+            break;
+        }
+        if (!ins) {
+            std::cerr << "ERROR unpacking tar header " << strerror(errno) << std::endl;
+            return -1;
+        }
+        std::cerr << "Unpacking " << fname << " " << fsize << std::endl;
+        
+        pigenc::File pig;
+        pig.read(ins);
+        if (!ins) {
+            std::cerr << "ERROR unpacking pig " << strerror(errno) << std::endl;
+            return -1;
+        }
+        std::cerr << "Read in " << fname << " with dtype=" << pig.header().dtype() << std::endl;
+
+        arrs[fname] = pig;
+    }
+
+    for (auto one : args.cfg) {
+        auto src = one["src"].asString();
+        auto it = arrs.find(src);
+        if (it == arrs.end()) {
+            std::cerr << "no src array: " << src << std::endl;
+            continue;
+        }
+
+        auto op = one["op"].asString();
+        auto darr = dispatch(idft, it->second, op);
+
+        auto dst = one["dst"];
+        if (darr.header().array_size() == 0) {
+            std::cerr << "failed: " << op <<  "(" << src << ") -> " << dst << "\n";
+            continue;
+        }
+
+        // write dst
+        std::cerr << "fixme: not (yet) writing: " << dst << std::endl;
+
+    }
+
+    return 0;
+}
diff --git a/cfg/pgrapher/common/helpers/aux.jsonnet b/cfg/pgrapher/common/helpers/aux.jsonnet
index 0aa977a4a..e83b444c3 100644
--- a/cfg/pgrapher/common/helpers/aux.jsonnet
+++ b/cfg/pgrapher/common/helpers/aux.jsonnet
@@ -6,6 +6,9 @@
 local wc = import "wirecell.jsonnet";
 
 {
+    // Default DFT uses FFTW3
+    dft : { type: "FftwDFT" },
+
     // Configure "wire" geometry and channel map to load from file
     wires(filename) :: {
         type:"WireSchemaFile",
diff --git a/cfg/pgrapher/common/helpers/gen.jsonnet b/cfg/pgrapher/common/helpers/gen.jsonnet
index 9bbaa6611..6ba78e335 100644
--- a/cfg/pgrapher/common/helpers/gen.jsonnet
+++ b/cfg/pgrapher/common/helpers/gen.jsonnet
@@ -4,6 +4,8 @@
 local wc = import "wirecell.jsonnet";
 local pg = import "pgraph.jsonnet";
 local u = import "utils.jsonnet";
+local aux = import "aux.jsonnet";
+
 
 {
     default_seeds: [0, 1, 2, 3, 4],
@@ -75,7 +77,7 @@ local u = import "utils.jsonnet";
     // fr is a field response object (see fr() above).
     // srs is list of "short response" config objects, eg cer()
     // lrs is list of "long response" config objects, eg rc()
-    pirs(fr, srs, lrs) :: [ {
+    pirs(fr, srs, lrs, dft=aux.dft) :: [ {
         type: "PlaneImpactResponse",
         name : std.toString(plane),
         data : {
@@ -87,12 +89,13 @@ local u = import "utils.jsonnet";
             long_responses: [wc.tn(r) for r in lrs],
             // this needs to be big enough to convolve RC
             long_padding: 1.5*wc.ms,
+            dft: wc.tn(dft),
         },
-        uses: [fr] + srs + lrs,
+        uses: [dft, fr] + srs + lrs,
     } for plane in [0,1,2]],
 
     // signal simulation
-    signal(anode, pirs, daq, lar, rnd=$.random()) ::
+    signal(anode, pirs, daq, lar, rnd=$.random(), dft=aux.dft) ::
         pg.pipeline([
             pg.pnode({
                 type:'DepoTransform',
@@ -108,8 +111,9 @@ local u = import "utils.jsonnet";
                     start_time: 0,
                     tick: daq.tick,
                     nsigma: 3,
+                    dft: wc.tn(dft),
                 },
-            }, nin=1, nout=1, uses=pirs + [anode, rnd]),
+            }, nin=1, nout=1, uses=pirs + [anode, rnd, dft]),
 
             pg.pnode({
                 type: 'Reframer',
@@ -126,7 +130,7 @@ local u = import "utils.jsonnet";
 
 
     // Return a frame filter config that will add in noise.
-    noise(anode, filename, daq, chstat=null, rnd=$.random()) ::
+    noise(anode, filename, daq, chstat=null, rnd=$.random(), dft=aux.dft) ::
         local cs = if std.type(chstat) == "null"
                    then {tn:"", uses:[]}
                    else {tn:wc.tn(chstat), uses:[chstat]};
@@ -140,8 +144,9 @@ local u = import "utils.jsonnet";
                 nsamples: daq.nticks,
                 period: daq.tick,
                 wire_length_scale: 1.0*wc.cm, // optimization binning
+                dft: wc.tn(dft),
             },
-            uses: [anode] + cs.uses,
+            uses: [anode, dft] + cs.uses,
         };
 
         pg.pnode({
@@ -152,7 +157,8 @@ local u = import "utils.jsonnet";
                 model: wc.tn(noise_model),
                 nsamples: daq.nticks,
                 replacement_percentage: 0.02, // random optimization
-            }}, nin=1, nout=1, uses=[rnd, noise_model]),
+                dft: wc.tn(dft),
+            }}, nin=1, nout=1, uses=[rnd, noise_model, dft]),
 
 
     // digitizer simulation
diff --git a/cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet b/cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet
index 631dcd2e7..aa268e325 100644
--- a/cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet
+++ b/cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet
@@ -11,6 +11,9 @@ local hs = import "pgrapher/common/helpers.jsonnet";
 local wires = hs.aux.wires(params.files.wires);
 local anodes = hs.aux.anodes(wires, params.det.volumes);
 
+// IDFT
+local dft = {type: 'FftwDFT'};
+
 // simulation
 
 // kinematics: ideal line source

From b7746792667900d579ac3850fa9cc5fe20cdc4de Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Wed, 1 Dec 2021 11:29:05 -0500
Subject: [PATCH 33/46] Add r2c and c2r helpers

---
 aux/inc/WireCellAux/DftTools.h | 16 ++++++++++++++--
 aux/src/DftTools.cxx           | 11 +++++++++++
 2 files changed, 25 insertions(+), 2 deletions(-)

diff --git a/aux/inc/WireCellAux/DftTools.h b/aux/inc/WireCellAux/DftTools.h
index d4b988806..9530bb3ef 100644
--- a/aux/inc/WireCellAux/DftTools.h
+++ b/aux/inc/WireCellAux/DftTools.h
@@ -86,8 +86,9 @@ namespace WireCell::Aux {
 
     // Eigen array based functions
 
-    /// A complex, 2D array.  Use Array::cast<type>() if you need to
-    /// convert to/from real.
+    /// 2D array types.  Note, use Array::cast<complex_t>() if you
+    /// need to convert rom real or arr.real() to convert to real.
+    using real_array_t = Eigen::ArrayXXf;
     using complex_array_t = Eigen::ArrayXXcf;
     
     // 2D with Eigen arrays.  Use eg arr.cast<complex_>() to provde
@@ -97,6 +98,12 @@ namespace WireCell::Aux {
     complex_array_t fwd(const IDFT::pointer& dft, const complex_array_t& arr);
     complex_array_t inv(const IDFT::pointer& dft, const complex_array_t& arr);
 
+    // As above but internally convert input or output.  These are
+    // just syntactic sugar hiding a .cast<complex_t>() or a .real()
+    // call.
+    complex_array_t fwd_r2c(const IDFT::pointer& dft, const real_array_t& arr);
+    real_array_t inv_c2r(const IDFT::pointer& dft, const complex_array_t& arr);
+
     // Transform a 2D array along one axis.
     //
     // The axis identifies the logical array "dimension" over which
@@ -113,6 +120,11 @@ namespace WireCell::Aux {
     complex_array_t fwd(const IDFT::pointer& dft, const complex_array_t& arr, int axis);
     complex_array_t inv(const IDFT::pointer& dft, const complex_array_t& arr, int axis);
 
+
+    // Fixme: possible additions
+    // - superposition of 2 reals for 2x speedup
+    // - r2c / c2r for 1b
+
 }
 
 #endif
diff --git a/aux/src/DftTools.cxx b/aux/src/DftTools.cxx
index e0eb83e2c..1194c1aad 100644
--- a/aux/src/DftTools.cxx
+++ b/aux/src/DftTools.cxx
@@ -118,6 +118,17 @@ Aux::complex_array_t Aux::inv(const IDFT::pointer& dft,
     return ret;
 }
 
+Aux::complex_array_t Aux::fwd_r2c(const IDFT::pointer& dft,
+                                  const real_array_t& arr)
+{
+    return Aux::fwd(dft, arr.cast<Aux::complex_t>());
+}
+Aux::real_array_t Aux::inv_c2r(const IDFT::pointer& dft,
+                               const complex_array_t& arr)
+{
+    return Aux::inv(dft, arr).real();
+}
+
 
 Aux::real_vector_t Aux::convolve(const IDFT::pointer& dft,
                                  const Aux::real_vector_t& in1,

From e89f0c99e059e1f11a30060a68d2b2da7544fe68 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Wed, 1 Dec 2021 11:29:38 -0500
Subject: [PATCH 34/46] Replace cli11 with boost po and get checker fleshed out

---
 aux/test/aux_test_dft_helpers.h |  63 ++++++++++----
 aux/test/check_idft.cxx         | 143 +++++++++++++++++++++-----------
 2 files changed, 139 insertions(+), 67 deletions(-)

diff --git a/aux/test/aux_test_dft_helpers.h b/aux/test/aux_test_dft_helpers.h
index d91fdfa69..33d9564ec 100644
--- a/aux/test/aux_test_dft_helpers.h
+++ b/aux/test/aux_test_dft_helpers.h
@@ -5,11 +5,12 @@
 #include "WireCellUtil/PluginManager.h"
 #include "WireCellUtil/Exceptions.h"
 #include "WireCellUtil/Persist.h"
-#include "WireCellUtil/CLI11.hpp"
 
 #include "WireCellIface/IConfigurable.h"
 #include "WireCellIface/IDFT.h"
 
+#include <boost/program_options.hpp>
+
 #include <ctime>                // std::clock
 #include <chrono>
 
@@ -109,23 +110,49 @@ namespace WireCell::Aux::Test {
     // remove command name from main()'s argc/argv[0]
     int make_dft_args(DftArgs& args, int argc, char** argv) 
     {
-        CLI::App app{"wct dft test"};
-        app.add_option("-o,--output", args.output,
-                       "Output file")->type_size(1)->allow_extra_args(false);
-        app.add_option("-p,--plugin", args.pi,
-                       "Plugin")->type_size(1)->allow_extra_args(false);
-        app.add_option("-t,--typename", args.tn,
-                       "Type or Type:Name of IDFT imp")->type_size(1)->allow_extra_args(false);
-        app.add_option("-c,--config", args.cfg_name,
-                       "Config file for IDFT imp")->type_size(1)->allow_extra_args(false);
-        app.add_option("arguments", args.positional,
-                       "Any positional arguments");
-        CLI11_PARSE(app, argc, argv);
-
-        if (not args.cfg_name.empty()) {
-            // Either we get directly a "data" object 
+        // compilation times: po:19s, cli11:26s
+        namespace po = boost::program_options;
+
+        po::options_description desc("Options");
+        desc.add_options()("help,h", "IDFT tests [options] [arguments]")
+            ("output,o", po::value< std::string >(), "output file")
+            ("plugin,p", po::value< std::string >(), "plugin holding a IDFT")
+            ("typename,t", po::value< std::string >(), "type[:name] of the IDFT to use")
+            ("config,c",  po::value< std::string >(), "configuration file")
+            ("args",  po::value< std::vector<std::string> >(), "positional arguments")
+            ;
+        po::positional_options_description pos_desc;
+        pos_desc.add("args", -1);
+
+        auto parsed = po::command_line_parser(argc, argv)
+            .options(desc)
+            .positional(pos_desc)
+            .run();
+        po::variables_map opts;
+        po::store(parsed, opts);
+        po::notify(opts);
+
+        if (opts.count("help")) {
+            std::cout << desc << "\n";
+            return 1;
+        }
+        
+        if (opts.count("output")) {
+            args.output = opts["output"].as< std::string> ();
+        }
+        if (opts.count("plugin") ) {
+            args.pi = opts["plugin"].as< std::string >();
+        }
+        if (opts.count("typename")) {
+            args.tn = opts["typename"].as< std::string> ();
+        }
+        if (opts.count("args")) {
+            args.positional = opts["args"].as< std::vector<std::string> >();
+        }
+        if (opts.count("config")) {
+            args.cfg_name = opts["config"].as< std::string> ();
             auto cfg = Persist::load(args.cfg_name);
-            // or we go searching a list for matching type/name.
+
             if (cfg.isArray()) {
                 for (auto one : cfg) {
                     std::string tn = get<std::string>(one, "type");
@@ -140,7 +167,7 @@ namespace WireCell::Aux::Test {
                 }
             }
             args.cfg = cfg;
-        }
+        }        
         return 0;
     }
 
diff --git a/aux/test/check_idft.cxx b/aux/test/check_idft.cxx
index 3e71a4dfa..b013591f4 100644
--- a/aux/test/check_idft.cxx
+++ b/aux/test/check_idft.cxx
@@ -50,8 +50,9 @@ using namespace WireCell;
 using namespace WireCell::Stream;
 using namespace WireCell::Aux::Test;
 
-using array_xxf = Eigen::Array<float, Eigen::Dynamic, Eigen::Dynamic>;
-using complex_t = std::complex<float>;
+using scalar_t = float;
+using array_xxf = Eigen::Array<scalar_t, Eigen::Dynamic, Eigen::Dynamic>;
+using complex_t = std::complex<scalar_t>;
 using array_xxc = Eigen::Array<complex_t, Eigen::Dynamic, Eigen::Dynamic>;
 
 // may hold any dtype and shape
@@ -61,31 +62,15 @@ using array_store = std::map<std::string, pig_array>;
 using dft_op = std::function<pig_array(pig_array)>;
 using op_lu_t = std::map<std::string, dft_op>;
 
-using vector_xf = std::vector<float>;
+using vector_xf = std::vector<scalar_t>;
 using vector_xc = std::vector<complex_t>;
 
-
-static
-vector_xf v_c2r(const vector_xc& cvec)
-{
-    vector_xf ret(cvec.size());
-    std::transform(cvec.begin(), cvec.end(), ret.begin(),
-                   [](complex_t c) { return std::real(c); });
-    return ret;
-}
-static
-vector_xc v_c2r(const vector_xf& rvec)
-{
-    vector_xc cret(rvec.size());
-    std::transform(rvec.begin(), rvec.end(), cret.begin(),
-                   [](float re) { return complex_t(re, 0); });
-    return cret;
-}
-
-
 template<typename Scalar>
 static std::vector<Scalar> p2v(const pig_array& pa)
 {
+    if (pa.header().shape().size() != 1) {
+        throw std::runtime_error("p2v rank mismatch");
+    }
     auto vec = pa.as_vec<Scalar>();
     if (vec.empty()) {
         throw std::runtime_error("p2v type mismatch");
@@ -106,6 +91,9 @@ pig_array v2p(const std::vector<Scalar>& vec)
 template<typename Scalar>
 Eigen::Array<Scalar, Eigen::Dynamic, Eigen::Dynamic> p2a(const pig_array& pa)
 {
+    if (pa.header().shape().size() != 2) {
+        throw std::runtime_error("p2a rank mismatch");
+    }
     Eigen::Array<Scalar, Eigen::Dynamic, Eigen::Dynamic> arr;
     bool ok = pigenc::eigen::load(pa, arr);
     if (!ok) {
@@ -122,8 +110,11 @@ pig_array a2p(const Eigen::Array<Scalar, Eigen::Dynamic, Eigen::Dynamic>& arr)
 }
 
 
+
 pig_array dispatch(const IDFT::pointer& dft, const pig_array& pa, const std::string& op)
 {
+    // vector
+
     if (op == "fwd1d") 
         return v2p<complex_t>(Aux::fwd(dft, p2v<complex_t>(pa)));
 
@@ -131,11 +122,38 @@ pig_array dispatch(const IDFT::pointer& dft, const pig_array& pa, const std::str
         return v2p<complex_t>(Aux::fwd(dft, p2v<complex_t>(pa)));
             
     if (op == "fwd1d_r2c") 
-        return v2p<complex_t>(Aux::fwd_r2c(dft, p2v<float>(pa)));
+        return v2p<complex_t>(Aux::fwd_r2c(dft, p2v<scalar_t>(pa)));
 
     if (op == "inv1d_c2r") 
-        return v2p<float>(Aux::inv_c2r(dft, p2v<complex_t>(pa)));
+        return v2p<scalar_t>(Aux::inv_c2r(dft, p2v<complex_t>(pa)));
+
+    // array
+
+    if (op == "fwd2d")
+        return a2p<complex_t>(Aux::fwd(dft, p2a<complex_t>(pa)));
+
+    if (op == "inv2d")
+        return a2p<complex_t>(Aux::inv(dft, p2a<complex_t>(pa)));
 
+    if (op == "fwd2d_r2c")
+        return a2p<complex_t>(Aux::fwd_r2c(dft, p2a<scalar_t>(pa)));
+
+    if (op == "inv2d_c2r")
+        return a2p<scalar_t>(Aux::inv_c2r(dft, p2a<complex_t>(pa)));
+
+    if (op == "fwd1b0")
+        return a2p<complex_t>(Aux::fwd(dft, p2a<complex_t>(pa), 0));
+
+    if (op == "fwd1b1")
+        return a2p<complex_t>(Aux::fwd(dft, p2a<complex_t>(pa), 1));
+
+    if (op == "inv1b0")
+        return a2p<complex_t>(Aux::inv(dft, p2a<complex_t>(pa), 0));
+
+    if (op == "inv1b1")
+        return a2p<complex_t>(Aux::inv(dft, p2a<complex_t>(pa), 1));
+
+    return pig_array();
 }
 
 int main(int argc, char* argv[])
@@ -166,35 +184,45 @@ int main(int argc, char* argv[])
     for (const auto& sname : args.positional) {
         boost::iostreams::filtering_istream ins;
         std::cerr << "openning: "<<sname<<"\n";
-        ins.clear();
+
         input_filters(ins, sname);
         if (ins.size() < 2) {     // expect bz2 + tar filters + file source.
             std::cerr << "Unexpected file format with: "<<sname<<"\n";
             return 1;
         }
             
-        std::string fname{""};
-        size_t fsize{0};
-        custard::read(ins, fname, fsize);
-        if (ins.eof()) {
-            std::cerr << "EOF on custard head read\n";
-            break;
+        while (true) {
+            std::string fname{""};
+            size_t fsize{0};
+            custard::read(ins, fname, fsize);
+            if (ins.eof()) {
+                break;
+            }
+            if (!ins) {
+                std::cerr << "ERROR unpacking tar header " << strerror(errno) << std::endl;
+                return -1;
+            }
+
+            pigenc::File pig;
+            pig.read(ins);
+            if (!ins) {
+                std::cerr << "ERROR unpacking pig " << strerror(errno) << std::endl;
+                return -1;
+            }
+            auto npy = fname.find(".npy");
+            if (npy != std::string::npos) {
+                fname = fname.substr(0, npy);
+            }
+            std::cerr << "\tread " << fname << " with dtype=" << pig.header().dtype() << std::endl;
+
+            arrs[fname] = pig;
         }
-        if (!ins) {
-            std::cerr << "ERROR unpacking tar header " << strerror(errno) << std::endl;
-            return -1;
-        }
-        std::cerr << "Unpacking " << fname << " " << fsize << std::endl;
-        
-        pigenc::File pig;
-        pig.read(ins);
-        if (!ins) {
-            std::cerr << "ERROR unpacking pig " << strerror(errno) << std::endl;
-            return -1;
-        }
-        std::cerr << "Read in " << fname << " with dtype=" << pig.header().dtype() << std::endl;
+    }
 
-        arrs[fname] = pig;
+    boost::iostreams::filtering_ostream outs;
+    output_filters(outs, args.output);
+    if (outs.size() < 2) {     // must have at least get tar filter + file sink.
+        std::cerr << "Unexpected file format: " << args.output << "\n";
     }
 
     for (auto one : args.cfg) {
@@ -206,18 +234,35 @@ int main(int argc, char* argv[])
         }
 
         auto op = one["op"].asString();
+        auto dst = one["dst"].asString();
+        std::cerr << op << "(" << src << ") -> " << dst << std::endl;
         auto darr = dispatch(idft, it->second, op);
 
-        auto dst = one["dst"];
-        if (darr.header().array_size() == 0) {
+        auto siz = darr.header().array_size();
+        if (siz == 0) {
             std::cerr << "failed: " << op <<  "(" << src << ") -> " << dst << "\n";
             continue;
         }
 
-        // write dst
-        std::cerr << "fixme: not (yet) writing: " << dst << std::endl;
 
+        auto fsiz = darr.header().file_size();
+        auto npy = dst.find(".npy");
+        if (npy == std::string::npos) {
+            dst = dst + ".npy";
+        }
+        std::cerr << "writing: " << dst << "(" << fsiz << " B) to " << args.output << std::endl;
+        custard::write(outs, dst, fsiz);
+        if (!outs) {
+            std::cerr << "failed to write " << dst
+                      << "(" << fsiz << ") to "
+                      << args.output << std::endl;
+            continue;
+        }
+        darr.write(outs);
+        outs.flush();
     }
 
+    outs.pop();
+
     return 0;
 }

From df869f306e396e147141136635173f6237daf919 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Wed, 1 Dec 2021 15:58:53 -0500
Subject: [PATCH 35/46] Fix row/col-wise monkeys

---
 aux/src/DftTools.cxx    | 84 +++++++++++++++++++----------------------
 aux/test/check_idft.cxx | 19 ++++++++--
 2 files changed, 55 insertions(+), 48 deletions(-)

diff --git a/aux/src/DftTools.cxx b/aux/src/DftTools.cxx
index 1194c1aad..a8b80e2e5 100644
--- a/aux/src/DftTools.cxx
+++ b/aux/src/DftTools.cxx
@@ -1,6 +1,8 @@
 #include "WireCellAux/DftTools.h"
 #include <algorithm>
 
+#include <iostream>             // debugging
+
 
 using namespace WireCell;
 using namespace WireCell::Aux;
@@ -18,26 +20,18 @@ using COLM = Eigen::Array<Aux::complex_t, Eigen::Dynamic, Eigen::Dynamic, Eigen:
 template<typename trans>
 Aux::complex_array_t doit(const Aux::complex_array_t& arr, trans func)
 {
-    // Nominally, eigen storage memory is in column-major order
     const Aux::complex_t* in_data = arr.data();
-    int ncols = arr.rows();
-    int nrows = arr.cols();
-
-    // except when it isn't
-    bool flipped = arr.IsRowMajor;
-    if (flipped) {
-        ncols = arr.cols();
-        nrows = arr.rows();
-    }
+    Aux::complex_vector_t out_vec(arr.rows()*arr.cols());
 
-    Aux::complex_vector_t out_vec(nrows*ncols);
-    func(in_data, out_vec.data(), nrows, ncols);
+    std::cerr << "dft::doit: (" << arr.rows() << "," << arr.cols() << ") IsRowMajor:" << arr.IsRowMajor << std::endl;
 
-    if (flipped) {
+    if (arr.IsRowMajor) {
+        func(in_data, out_vec.data(), arr.cols(), arr.rows());
         return Eigen::Map<ROWM>(out_vec.data(), arr.rows(), arr.cols());
     }
-    return Eigen::Map<COLM>(out_vec.data(), arr.rows(), arr.cols());
 
+    func(in_data, out_vec.data(), arr.rows(), arr.cols());
+    return Eigen::Map<COLM>(out_vec.data(), arr.rows(), arr.cols());
 }
 
 Aux::complex_array_t Aux::fwd(const IDFT::pointer& dft, const Aux::complex_array_t& arr)
@@ -58,38 +52,38 @@ Aux::complex_array_t Aux::inv(const IDFT::pointer& dft, const Aux::complex_array
     });
 }
 
-template<typename trans>
-Aux::complex_array_t doit1b(const Aux::complex_array_t& arr, int axis, trans func)
-{
-    // We must provide a flat array with storage order such with
-    // logical axis-major ordering.
-    const Aux::complex_t* in_data = arr.data();
-    const int nrows = arr.rows(); // "logical"
-    const int ncols = arr.cols(); // shape
-
-    // If storage order matches "axis-major"
-    if ( (axis == 1 and arr.IsRowMajor)
-         or
-         (axis == 0 and not arr.IsRowMajor) ) {
-        Aux::complex_vector_t out_vec(nrows*ncols);
-        func(in_data, out_vec.data(), ncols, nrows);
-        if (arr.IsRowMajor) {
-            // note, returning makes a copy and will perform an actual
-            // storage order transpose.
-            return Eigen::Map<ROWM>(out_vec.data(), nrows, ncols);
-        }
-        return Eigen::Map<COLM>(out_vec.data(), nrows, ncols);
-    }
+// template<typename trans>
+// Aux::complex_array_t doit1b(const Aux::complex_array_t& arr, int axis, trans func)
+// {
+//     // We must provide a flat array with storage order such with
+//     // logical axis-major ordering.
+//     const Aux::complex_t* in_data = arr.data();
+//     const int nrows = arr.rows(); // "logical"
+//     const int ncols = arr.cols(); // shape
+
+//     // If storage order matches "axis-major"
+//     if ( (axis == 1 and arr.IsRowMajor)
+//          or
+//          (axis == 0 and not arr.IsRowMajor) ) {
+//         Aux::complex_vector_t out_vec(nrows*ncols);
+//         func(in_data, out_vec.data(), ncols, nrows);
+//         if (arr.IsRowMajor) {
+//             // note, returning makes a copy and will perform an actual
+//             // storage order transpose.
+//             return Eigen::Map<ROWM>(out_vec.data(), nrows, ncols);
+//         }
+//         return Eigen::Map<COLM>(out_vec.data(), nrows, ncols);
+//     }
     
-    // Either we have row-major and want column-major storage order or
-    // vice versa.
-
-    // Here, we must copy and not use "auto" to get actual storage
-    // order transpose and avoid the IsRowMajor flip optimization.
-    COLM flipped = arr.transpose();
-    COLM got = doit1b(flipped, (axis+1)%2, func);
-    return got.transpose();
-}
+//     // Either we have row-major and want column-major storage order or
+//     // vice versa.
+
+//     // Here, we must copy and not use "auto" to get actual storage
+//     // order transpose and avoid the IsRowMajor flip optimization.
+//     COLM flipped = arr.transpose();
+//     COLM got = doit1b(flipped, (axis+1)%2, func);
+//     return got.transpose();
+// }
 
 // Implementation notes for fwd()/inv():
 //
diff --git a/aux/test/check_idft.cxx b/aux/test/check_idft.cxx
index b013591f4..86266a503 100644
--- a/aux/test/check_idft.cxx
+++ b/aux/test/check_idft.cxx
@@ -153,7 +153,7 @@ pig_array dispatch(const IDFT::pointer& dft, const pig_array& pa, const std::str
     if (op == "inv1b1")
         return a2p<complex_t>(Aux::inv(dft, p2a<complex_t>(pa), 1));
 
-    return pig_array();
+    return pa;
 }
 
 int main(int argc, char* argv[])
@@ -213,7 +213,13 @@ int main(int argc, char* argv[])
             if (npy != std::string::npos) {
                 fname = fname.substr(0, npy);
             }
-            std::cerr << "\tread " << fname << " with dtype=" << pig.header().dtype() << std::endl;
+            std::cerr << "\tread " << fname
+                      << " with dtype=" << pig.header().dtype()
+                      << " shape: (";
+            for (auto dim : pig.header().shape()) {
+                std::cerr << " " << dim;
+            }
+            std::cerr << " )" << std::endl;
 
             arrs[fname] = pig;
         }
@@ -250,7 +256,14 @@ int main(int argc, char* argv[])
         if (npy == std::string::npos) {
             dst = dst + ".npy";
         }
-        std::cerr << "writing: " << dst << "(" << fsiz << " B) to " << args.output << std::endl;
+        std::cerr << "\twrite " << dst
+                  << " with dtype=" << darr.header().dtype()
+                  << " shape: (";
+        for (auto dim : darr.header().shape()) {
+            std::cerr << " " << dim;
+        }
+        std::cerr << " ) to " << args.output << std::endl;
+
         custard::write(outs, dst, fsiz);
         if (!outs) {
             std::cerr << "failed to write " << dst

From 81607008125a25427f7db3031667a5d263ea0a8b Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Wed, 1 Dec 2021 15:59:10 -0500
Subject: [PATCH 36/46] More eigen row/col-wise testing

---
 util/test/test_eigen_rowcol2.cxx | 44 ++++++++++++++++++++++++++++++++
 1 file changed, 44 insertions(+)
 create mode 100644 util/test/test_eigen_rowcol2.cxx

diff --git a/util/test/test_eigen_rowcol2.cxx b/util/test/test_eigen_rowcol2.cxx
new file mode 100644
index 000000000..809c0b1ea
--- /dev/null
+++ b/util/test/test_eigen_rowcol2.cxx
@@ -0,0 +1,44 @@
+#include <Eigen/Core>
+#include <cassert>
+
+using Scalar = int;
+using COLM = Eigen::Array<Scalar, Eigen::Dynamic, Eigen::Dynamic, Eigen::ColMajor>;
+using ROWM = Eigen::Array<Scalar, Eigen::Dynamic, Eigen::Dynamic, Eigen::RowMajor>;
+
+int main()
+{
+    const int data[8] = {0,1,2,3,4,5,6,7};
+    const int shape[2] = {2,4};
+
+    COLM c2c = Eigen::Map<const COLM>(data, shape[0], shape[1]);
+    COLM r2c = Eigen::Map<const ROWM>(data, shape[0], shape[1]);
+    ROWM c2r = Eigen::Map<const COLM>(data, shape[0], shape[1]);
+    ROWM r2r = Eigen::Map<const ROWM>(data, shape[0], shape[1]);
+
+    assert(c2c.rows() == shape[0]);
+    assert(c2r.rows() == shape[0]);
+    assert(r2c.rows() == shape[0]);
+    assert(r2r.rows() == shape[0]);
+
+    assert(c2c.cols() == shape[1]);
+    assert(c2r.cols() == shape[1]);
+    assert(r2c.cols() == shape[1]);
+    assert(r2r.cols() == shape[1]);
+
+    assert(c2c(0,0) == 0);
+    assert(r2c(0,0) == 0);
+    assert(c2r(0,0) == 0);
+    assert(r2r(0,0) == 0);
+
+    assert(c2c(1,0) == 1);
+    assert(c2r(1,0) == 1);
+    assert(r2c(0,1) == 1);
+    assert(r2r(0,1) == 1);
+
+    assert(c2c(1,1) == 3);
+    assert(c2r(1,1) == 3);
+    assert(r2c(0,3) == 3);
+    assert(r2r(0,3) == 3);
+
+    return 0;
+}

From db16d5485d21cb0b3e748d7b076406e5926417be Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 2 Dec 2021 13:31:23 -0500
Subject: [PATCH 37/46] Fix one wrong conversion to IDFT, improve logging along
 the way to finding the problem

---
 sigproc/inc/WireCellSigProc/OmnibusSigProc.h |  16 +-
 sigproc/src/OmnibusSigProc.cxx               | 248 ++++++++++++-------
 2 files changed, 165 insertions(+), 99 deletions(-)

diff --git a/sigproc/inc/WireCellSigProc/OmnibusSigProc.h b/sigproc/inc/WireCellSigProc/OmnibusSigProc.h
index 34a40f2cd..23d77f48e 100644
--- a/sigproc/inc/WireCellSigProc/OmnibusSigProc.h
+++ b/sigproc/inc/WireCellSigProc/OmnibusSigProc.h
@@ -65,9 +65,18 @@ namespace WireCell {
 
             void decon_2D_looseROI_debug_mode(int plane);
 
-            // save data into the out frame and collect the indices
-            void save_data(ITrace::vector& itraces, IFrame::trace_list_t& indices, int plane,
-                           const std::vector<float>& perwire_rmses, IFrame::trace_summary_t& threshold);
+            // for debugging, check current state of working data
+            void check_data(int plane, const std::string& loglabel);
+
+            // Copy elements from m_r_data, mess with them, and store
+            // result into traces.  Update indices.  Fixme: best if we
+            // were to factor saving and munging!
+            void save_data(ITrace::vector& itraces,
+                           IFrame::trace_list_t& indices,
+                           int plane,
+                           const std::vector<float>& perwire_rmses,
+                           IFrame::trace_summary_t& threshold,
+                           const std::string& loglabel);
 
             // save ROI into the out frame (set use_roi_debug_mode=true)
             void save_roi(ITrace::vector& itraces, IFrame::trace_list_t& indices, int plane,
@@ -233,6 +242,7 @@ namespace WireCell {
             bool m_sparse;
 
             size_t m_count{0};
+            int m_verbose{0};
 
             IDFT::pointer m_dft;
         };
diff --git a/sigproc/src/OmnibusSigProc.cxx b/sigproc/src/OmnibusSigProc.cxx
index 6f2fa85ee..0eec9ad02 100644
--- a/sigproc/src/OmnibusSigProc.cxx
+++ b/sigproc/src/OmnibusSigProc.cxx
@@ -125,20 +125,21 @@ void OmnibusSigProc::configure(const WireCell::Configuration& config)
 
     std::string dft_tn = get<std::string>(config, "dft", "FftwDFT");
     m_dft = Factory::find_tn<IDFT>(dft_tn);
+    m_verbose = get(config, "verbose", 0);
 
     // m_nticks = get(config,"nticks",m_nticks);
     if (!config["nticks"].isNull()) {
-        log->warn("no setting \"nticks\", ignoring value {}", config["nticks"].asInt());
+        log->warn("config: no setting \"nticks\", ignoring value {}", config["nticks"].asInt());
     }
     // m_period = get(config,"period",m_period);
     if (!config["period"].isNull()) {
-        log->warn("no setting \"period\", ignoring value {}", config["period"].asDouble());
+        log->warn("config: no setting \"period\", ignoring value {}", config["period"].asDouble());
     }
 
     m_fft_flag = get(config, "fft_flag", m_fft_flag);
     if (m_fft_flag) {
       m_fft_flag = 0;
-      log->warn("fft_flag option is broken, will use native array sizes");
+      log->warn("config: fft_flag option is broken, will use native array sizes");
     }
     m_elecresponse_tn = get(config, "elecresponse", m_elecresponse_tn);
     m_gain = get(config, "gain", m_gain);
@@ -218,7 +219,7 @@ void OmnibusSigProc::configure(const WireCell::Configuration& config)
     // but we have plane-major order so make a temporary collection.
     IChannel::vector plane_channels[3];
     std::stringstream ss;
-    ss << "internal channel map for tags: gauss:\"" << m_gauss_tag << "\", wiener:\"" << m_wiener_tag
+    ss << "config: internal channel map for tags: gauss:\"" << m_gauss_tag << "\", wiener:\"" << m_wiener_tag
        << "\", frame:\"" << m_frame_tag << "\"\n";
 
     // fixme: this loop is now available as Aux::plane_channels()
@@ -268,6 +269,7 @@ WireCell::Configuration OmnibusSigProc::default_configuration() const
     Configuration cfg;
     cfg["anode"] = m_anode_tn;
     cfg["dft"] = "FftwDFT";     // type-name for the DFT to use
+    cfg["verbose"] = 0;         // larger is more more logging 
     cfg["ftoffset"] = m_fine_time_offset;
     cfg["ctoffset"] = m_coarse_time_offset;
     // cfg["nticks"] = m_nticks;
@@ -363,7 +365,8 @@ void OmnibusSigProc::load_data(const input_pointer& in, int plane)
         auto const& charges = trace->charge();
         const int ntbins = std::min((int) charges.size(), m_nticks);
         for (int qind = 0; qind < ntbins; ++qind) {
-            m_r_data[plane](och.wire + m_pad_nwires[plane], tbin + qind) = charges[qind];
+            const float q = charges[qind];
+            m_r_data[plane](och.wire + m_pad_nwires[plane], tbin + qind) = q;
         }
 
         // ensure dead channels are indeed dead ...
@@ -380,19 +383,42 @@ void OmnibusSigProc::load_data(const input_pointer& in, int plane)
             }
         }
     }
-    log->debug("plane index: {} input data identifies {} bad regions", plane, nbad);
+    log->debug("call={} load plane index: {}, ntraces={}, input bad regions: {}",
+               m_count, plane, traces->size(), nbad);
+    check_data(plane, "load data");
 }
 
 // used in sparsifying below.  Could use C++17 lambdas....
 static bool ispositive(float x) { return x > 0.0; }
 static bool isZero(float x) { return x == 0.0; }
 
-void OmnibusSigProc::save_data(ITrace::vector& itraces, IFrame::trace_list_t& indices, int plane,
-                               const std::vector<float>& perwire_rmses, IFrame::trace_summary_t& threshold)
+void OmnibusSigProc::check_data(int iplane, const std::string& loglabel)
 {
+    if (!m_verbose) { return; }
+
+    std::stringstream ss;
+    auto& arr = m_r_data[iplane];
+    
+    log->debug("data: plane={}, sum={}, mean={}, min={}, max={} \"{}\"",
+               iplane,
+               arr.sum(), arr.mean(), arr.minCoeff(), arr.maxCoeff(), 
+               loglabel);
+}
+
+void OmnibusSigProc::save_data(
+    ITrace::vector& itraces,
+    IFrame::trace_list_t& indices,
+    int plane,
+    const std::vector<float>& perwire_rmses,
+    IFrame::trace_summary_t& threshold,
+    const std::string& loglabel)
+{
+    check_data(plane, loglabel + " before save");
+
     // reuse this temporary vector to hold charge for a channel.
     ITrace::ChargeSequence charge(m_nticks, 0.0);
 
+    double qloss = 0.0;
     double qtot = 0.0;
     for (auto och : m_channel_range[plane]) {  // ordered by osp channel
 
@@ -402,10 +428,18 @@ void OmnibusSigProc::save_data(ITrace::vector& itraces, IFrame::trace_list_t& in
             const float q = m_r_data[plane](och.wire, itick);
             // charge.at(itick) = q > 0.0 ? q : 0.0;
             // charge.at(itick) = q ;
-            if (m_use_roi_debug_mode)
+            if (m_use_roi_debug_mode) {
                 charge.at(itick) = q;  // debug mode: save all decons
-            else
-                charge.at(itick) = q > 0.0 ? q : 0.0;  // default mode: only save positive
+            }
+            else {              // nominal: threshold at zero.
+                if (q > 0.0) {
+                    charge.at(itick) = q;
+                }
+                else {
+                    charge.at(itick) = 0.0;
+                    qloss += q;
+                }
+            }
         }
         {
             auto& bad = m_cmm["bad"];
@@ -413,6 +447,7 @@ void OmnibusSigProc::save_data(ITrace::vector& itraces, IFrame::trace_list_t& in
             if (badit != bad.end()) {
                 for (auto bad : badit->second) {
                     for (int itick = bad.first; itick < bad.second; ++itick) {
+                        qloss += charge.at(itick);
                         charge.at(itick) = 0.0;
                     }
                 }
@@ -460,15 +495,17 @@ void OmnibusSigProc::save_data(ITrace::vector& itraces, IFrame::trace_list_t& in
 
     // debug
     if (indices.empty()) {
-        log->debug("save_data plane index: {} empty", plane);
+        log->debug("call={} {} save plane index: {} empty",
+                   m_count, loglabel, plane);
     }
     else {
-        const int nadded = indices.back() - indices.front() + 1;
-        log->debug("save_data plane index: {}, Qtot={} "
-                   "added {} traces to total {} indices:[{},{}]",
-                   plane, qtot,
-                   nadded, indices.size(), indices.front(), indices.back());
+        log->debug("call={} save plane index: {}, Qtot={} Qloss={}, "
+                   "{} indices spanning [{},{}] \"{}\"",
+                   m_count, plane, qtot, qloss,
+                   indices.size(), indices.front(), indices.back(),
+                   loglabel);
     }
+    check_data(plane, loglabel + " after save");
 }
 
 // save ROI into the out frame
@@ -717,14 +754,14 @@ void OmnibusSigProc::init_overall_response(IFrame::pointer frame)
         int tbinmin = *mme.first;
         int tbinmax = *mme.second;
         m_nticks = tbinmax - tbinmin;
-        log->debug("OmnibusSigProc: nticks={} tbinmin={} tbinmax={}", m_nticks, tbinmin, tbinmax);
+        log->debug("call={} init nticks={} tbinmin={} tbinmax={}", m_count, m_nticks, tbinmin, tbinmax);
 
         if (m_fft_flag == 0) {
             m_fft_nticks = m_nticks;
         }
         else {
             m_fft_nticks = fft_best_length(m_nticks);
-            log->debug("OmnibusSigProc: enlarge window from {} to {}", m_nticks, m_fft_nticks);
+            log->debug("call={} init enlarge window from {} to {}", m_count, m_nticks, m_fft_nticks);
         }
         //
 
@@ -746,7 +783,8 @@ void OmnibusSigProc::init_overall_response(IFrame::pointer frame)
         }
         else {
             m_fft_nwires[i] = fft_best_length(m_nwires[i] + fravg.planes[0].paths.size() - 1, 1);
-            log->debug("OmnibusSigProc: enlarge wire number in plane {} from {} to {}", i, m_nwires[i],
+            log->debug("call={} init enlarge wire number in plane {} from {} to {}",
+                       m_count, i, m_nwires[i],
                        m_fft_nwires[i]);
         }
         m_pad_nwires[i] = (m_fft_nwires[i] - m_nwires[i]) / 2;
@@ -901,32 +939,20 @@ void OmnibusSigProc::decon_2D_init(int plane)
 {
     // data part ...
     // first round of FFT on time
-    // m_c_data[plane] = Array::dft_rc(m_r_data[plane], 0);
     m_c_data[plane] = Aux::fwd(m_dft, m_r_data[plane].cast<IDFT::complex_t>(), 1);
 
     // now apply the ch-by-ch response ...
     if (!m_per_chan_resp.empty()) {
-        log->debug("OmnibusSigProc: applying ch-by-ch electronics response correction");
+        log->debug("call={} applying ch-by-ch electronics response correction", m_count);
         auto cr = Factory::find_tn<IChannelResponse>(m_per_chan_resp);
         auto cr_bins = cr->channel_response_binning();
         if (cr_bins.binsize() != m_period) {
-            log->critical("OmnibusSigProc::decon_2D_init: channel response size mismatch");
+            log->critical("call={} decon_2D_init: channel response size mismatch", m_count);
             THROW(ValueError() << errmsg{"OmnibusSigProc::decon_2D_init: channel response size mismatch"});
         }
-        // starndard electronics response ...
-        // WireCell::Binning tbins(m_nticks, 0-m_period/2., m_nticks*m_period-m_period/2.);
-        // Response::ColdElec ce(m_gain, m_shaping_time);
 
-        // temporary hack ...
-        // float scaling = 1./(1e-9*0.5/1.13312);
-        // WireCell::Binning tbins(m_nticks, (-5-0.5)*m_period, (m_nticks-5-0.5)*m_period-m_period);
-        // Response::ColdElec ce(m_gain*scaling, m_shaping_time);
-        //// this is moved into wirecell.sigproc.main production of
-        //// microboone-channel-responses-v1.json.bz2
         WireCell::Binning tbins(m_fft_nticks, cr_bins.min(), cr_bins.min() + m_fft_nticks * m_period);
-        // Response::ColdElec ce(m_gain, m_shaping_time);
 
-        // const auto ewave = ce.generate(tbins);
         auto ewave = (*m_elecresponse).waveform_samples(tbins);
         // const WireCell::Waveform::compseq_t elec = Waveform::dft(ewave);
         const WireCell::Waveform::compseq_t elec = Aux::fwd_r2c(m_dft, ewave);
@@ -968,7 +994,7 @@ void OmnibusSigProc::decon_2D_init(int plane)
     // do second round FFT on the response on wire
     // c_resp = Array::dft_cc(c_resp, 1);
     Array::array_xxc c_resp = r_resp.cast<IDFT::complex_t>();
-    Aux::fwd(m_dft, c_resp);
+    c_resp = Aux::fwd(m_dft, c_resp);
 
     // make ratio to the response and apply wire filter
     m_c_data[plane] = m_c_data[plane] / c_resp;
@@ -1395,7 +1421,7 @@ bool OmnibusSigProc::operator()(const input_pointer& in, output_pointer& out)
 
     ITrace::vector* itraces = new ITrace::vector;  // will become shared_ptr.
     IFrame::trace_summary_t thresholds;
-    IFrame::trace_list_t wiener_traces, gauss_traces, perframe_traces[3];
+    IFrame::trace_list_t wiener_traces, gauss_traces;
     // here are some trace lists for debug mode
     IFrame::trace_list_t tight_lf_traces, loose_lf_traces, cleanup_roi_traces, break_roi_loop1_traces,
         break_roi_loop2_traces, shrink_roi_traces, extend_roi_traces;
@@ -1426,6 +1452,7 @@ bool OmnibusSigProc::operator()(const input_pointer& in, output_pointer& out)
         load_data(in, iplane);  // load into a large matrix
         // initial decon ...
         decon_2D_init(iplane);  // decon in large matrix
+        check_data(iplane, "after 2D init");
 
         // Form tight ROIs
         if (iplane != 2) {  // induction wire planes
@@ -1441,17 +1468,20 @@ bool OmnibusSigProc::operator()(const input_pointer& in, output_pointer& out)
             decon_2D_tightROI(iplane);
             roi_form.find_ROI_by_decon_itself(iplane, m_r_data[iplane]);
         }
+        check_data(iplane, "after 2D tight ROI");
 
         // [wgu] save decon result after tight LF
         std::vector<double> dummy;
-        if (m_use_roi_debug_mode and m_use_roi_refinement) save_data(*itraces, tight_lf_traces, iplane, perwire_rmses, dummy);
+        if (m_use_roi_debug_mode and m_use_roi_refinement) {
+            save_data(*itraces, tight_lf_traces, iplane, perwire_rmses, dummy, "tight_lf");
+        }
 
         // Form loose ROIs
         if (iplane != 2) {
             // [wgu] save decon result after loose LF
             if (m_use_roi_debug_mode) {
                 decon_2D_looseROI_debug_mode(iplane);
-                save_data(*itraces, loose_lf_traces, iplane, perwire_rmses, dummy);
+                save_data(*itraces, loose_lf_traces, iplane, perwire_rmses, dummy, "loose_lf");
             }
 
             if (m_use_roi_refinement) {
@@ -1463,7 +1493,11 @@ bool OmnibusSigProc::operator()(const input_pointer& in, output_pointer& out)
 
         // [wgu] collection plane does not need loose LF
         // but save something to be consistent
-        if (m_use_roi_debug_mode and iplane == 2) save_data(*itraces, loose_lf_traces, iplane, perwire_rmses, dummy);
+        if (m_use_roi_debug_mode and iplane == 2) {
+            save_data(*itraces, loose_lf_traces, iplane, perwire_rmses, dummy, "loose_lf");
+        }
+
+        check_data(iplane, "after 2D ROI refine");
 
         // Refine ROIs
         if (m_use_roi_refinement) roi_refine.load_data(iplane, m_r_data[iplane], roi_form);
@@ -1474,81 +1508,103 @@ bool OmnibusSigProc::operator()(const input_pointer& in, output_pointer& out)
     }
 
     if (m_use_roi_refinement) {
-    for (int iplane = 0; iplane != 3; ++iplane) {
-        auto it = std::find(m_process_planes.begin(), m_process_planes.end(), iplane);
-        if (it == m_process_planes.end()) continue;
+        for (int iplane = 0; iplane != 3; ++iplane) {
+            auto it = std::find(m_process_planes.begin(), m_process_planes.end(), iplane);
+            if (it == m_process_planes.end()) continue;
 
-        // roi_refine.refine_data(iplane, roi_form);
+            // roi_refine.refine_data(iplane, roi_form);
 
-        roi_refine.CleanUpROIs(iplane);
-        roi_refine.generate_merge_ROIs(iplane);
+            roi_refine.CleanUpROIs(iplane);
+            roi_refine.generate_merge_ROIs(iplane);
 
-        if (m_use_roi_debug_mode) {
-            save_roi(*itraces, cleanup_roi_traces, iplane, roi_refine.get_rois_by_plane(iplane));
-        }
+            if (m_use_roi_debug_mode) {
+                save_roi(*itraces, cleanup_roi_traces, iplane, roi_refine.get_rois_by_plane(iplane));
+            }
 
-        if (m_use_multi_plane_protection) {
-            roi_refine.MultiPlaneProtection(iplane, m_anode, m_roi_ch_ch_ident, roi_form, 1000, m_anode->ident() % 2);
-            save_mproi(*itraces, mp3_roi_traces, iplane, roi_refine.get_mp3_rois());
-            roi_refine.MultiPlaneROI(iplane, m_anode, m_roi_ch_ch_ident, roi_form, 1000, m_anode->ident() % 2);
-            save_mproi(*itraces, mp2_roi_traces, iplane, roi_refine.get_mp2_rois());
+            if (m_use_multi_plane_protection) {
+                roi_refine.MultiPlaneProtection(iplane, m_anode, m_roi_ch_ch_ident, roi_form, 1000, m_anode->ident() % 2);
+                save_mproi(*itraces, mp3_roi_traces, iplane, roi_refine.get_mp3_rois());
+                roi_refine.MultiPlaneROI(iplane, m_anode, m_roi_ch_ch_ident, roi_form, 1000, m_anode->ident() % 2);
+                save_mproi(*itraces, mp2_roi_traces, iplane, roi_refine.get_mp2_rois());
+            }
         }
-    }
 
-    for (int iplane = 0; iplane != 3; ++iplane) {
-        auto it = std::find(m_process_planes.begin(), m_process_planes.end(), iplane);
-        if (it == m_process_planes.end()) continue;
+        for (int iplane = 0; iplane != 3; ++iplane) {
+            auto it = std::find(m_process_planes.begin(), m_process_planes.end(), iplane);
+            if (it == m_process_planes.end()) continue;
 
-        const std::vector<float>& perwire_rmses = *perplane_thresholds[iplane];
+            const std::vector<float>& perwire_rmses = *perplane_thresholds[iplane];
 
-        for (int qx = 0; qx != m_r_break_roi_loop; qx++) {
-            roi_refine.BreakROIs(iplane, roi_form);
+            for (int qx = 0; qx != m_r_break_roi_loop; qx++) {
+                roi_refine.BreakROIs(iplane, roi_form);
+                roi_refine.CheckROIs(iplane, roi_form);
+                roi_refine.CleanUpROIs(iplane);
+                if (m_use_roi_debug_mode) {
+                    if (qx == 0) {
+                        save_roi(*itraces, break_roi_loop1_traces, iplane, roi_refine.get_rois_by_plane(iplane));
+                    }
+                    if (qx == 1) {
+                        save_roi(*itraces, break_roi_loop2_traces, iplane, roi_refine.get_rois_by_plane(iplane));
+                    }
+                }
+            }
+
+            roi_refine.ShrinkROIs(iplane, roi_form);
+            check_data(iplane, "after roi refine shrink");
             roi_refine.CheckROIs(iplane, roi_form);
+            check_data(iplane, "after roi refine check");
             roi_refine.CleanUpROIs(iplane);
             if (m_use_roi_debug_mode) {
-                if (qx == 0) save_roi(*itraces, break_roi_loop1_traces, iplane, roi_refine.get_rois_by_plane(iplane));
-                if (qx == 1) save_roi(*itraces, break_roi_loop2_traces, iplane, roi_refine.get_rois_by_plane(iplane));
+                save_roi(*itraces, shrink_roi_traces, iplane, roi_refine.get_rois_by_plane(iplane));
             }
-        }
 
-        roi_refine.ShrinkROIs(iplane, roi_form);
-        roi_refine.CheckROIs(iplane, roi_form);
-        roi_refine.CleanUpROIs(iplane);
-        if (m_use_roi_debug_mode) {
-            save_roi(*itraces, shrink_roi_traces, iplane, roi_refine.get_rois_by_plane(iplane));
-        }
+            if (iplane == 2) {
+                roi_refine.CleanUpCollectionROIs();
+            }
+            else {
+                roi_refine.CleanUpInductionROIs(iplane);
+            }
+            check_data(iplane, "after roi refine cleanup");
 
-        if (iplane == 2) {
-            roi_refine.CleanUpCollectionROIs();
-        }
-        else {
-            roi_refine.CleanUpInductionROIs(iplane);
-        }
-        roi_refine.ExtendROIs(iplane);
+            roi_refine.ExtendROIs(iplane);
+            check_data(iplane, "after roi refine extend");
 
-        if (m_use_roi_debug_mode) {
-            save_ext_roi(*itraces, extend_roi_traces, iplane, roi_refine.get_rois_by_plane(iplane));
-        }
+            if (m_use_roi_debug_mode) {
+                save_ext_roi(*itraces, extend_roi_traces, iplane, roi_refine.get_rois_by_plane(iplane));
+            }
+
+            // merge results ...
+            decon_2D_hits(iplane);
+            check_data(iplane, "after decon 2D hits");
+            roi_refine.apply_roi(iplane, m_r_data[iplane]);
+            check_data(iplane, "after roi refine apply");
+            // roi_form.apply_roi(iplane, m_r_data[plane],1);
+            {
+                // We only use an intermediate index list here to give
+                // some clarity to log msg about range added
+                IFrame::trace_list_t perframe;
+                save_data(*itraces, perframe, iplane, perwire_rmses, thresholds, "wiener");
+                wiener_traces.insert(wiener_traces.end(), perframe.begin(), perframe.end());
+            }
 
-        // merge results ...
-        decon_2D_hits(iplane);
-        roi_refine.apply_roi(iplane, m_r_data[iplane]);
-        // roi_form.apply_roi(iplane, m_r_data[plane],1);
-        save_data(*itraces, perframe_traces[iplane], iplane, perwire_rmses, thresholds);
-        wiener_traces.insert(wiener_traces.end(), perframe_traces[iplane].begin(), perframe_traces[iplane].end());
+            decon_2D_charge(iplane);
+            std::vector<double> dummy_thresholds;
+            if (m_use_roi_debug_mode) {
+                save_data(*itraces, decon_charge_traces, iplane, perwire_rmses, thresholds, "decon");
+            }
+            roi_refine.apply_roi(iplane, m_r_data[iplane]);
+            // roi_form.apply_roi(iplane, m_r_data[plane],1);
+            {
+                // We only use an intermediate index list here to give
+                // some clarity to log msg about range added
+                IFrame::trace_list_t perframe;
+                save_data(*itraces, perframe, iplane, perwire_rmses, dummy_thresholds, "gauss");
+                gauss_traces.insert(gauss_traces.end(), perframe.begin(), perframe.end());
+            }
 
-        decon_2D_charge(iplane);
-        std::vector<double> dummy_thresholds;
-        if (m_use_roi_debug_mode) {
-            save_data(*itraces, decon_charge_traces, iplane, perwire_rmses, thresholds);
+            m_c_data[iplane].resize(0, 0);  // clear memory
+            m_r_data[iplane].resize(0, 0);  // clear memory
         }
-        roi_refine.apply_roi(iplane, m_r_data[iplane]);
-        // roi_form.apply_roi(iplane, m_r_data[plane],1);
-        save_data(*itraces, gauss_traces, iplane, perwire_rmses, dummy_thresholds);
-
-        m_c_data[iplane].resize(0, 0);  // clear memory
-        m_r_data[iplane].resize(0, 0);  // clear memory
-    }
     }
 
     SimpleFrame* sframe = new SimpleFrame(in->ident(), in->time(), ITrace::shared_vector(itraces), in->tick(), m_cmm);

From 07d8a3d076d5d65d9de106dd95dc397adb6b02d8 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 2 Dec 2021 13:32:22 -0500
Subject: [PATCH 38/46] Remove noisy

---
 aux/src/DftTools.cxx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/aux/src/DftTools.cxx b/aux/src/DftTools.cxx
index a8b80e2e5..d9ebadac3 100644
--- a/aux/src/DftTools.cxx
+++ b/aux/src/DftTools.cxx
@@ -23,7 +23,7 @@ Aux::complex_array_t doit(const Aux::complex_array_t& arr, trans func)
     const Aux::complex_t* in_data = arr.data();
     Aux::complex_vector_t out_vec(arr.rows()*arr.cols());
 
-    std::cerr << "dft::doit: (" << arr.rows() << "," << arr.cols() << ") IsRowMajor:" << arr.IsRowMajor << std::endl;
+    // std::cerr << "dft::doit: (" << arr.rows() << "," << arr.cols() << ") IsRowMajor:" << arr.IsRowMajor << std::endl;
 
     if (arr.IsRowMajor) {
         func(in_data, out_vec.data(), arr.cols(), arr.rows());

From a9e7eb8a268c5b93ef14e67ce62c25004f43311d Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 2 Dec 2021 13:32:46 -0500
Subject: [PATCH 39/46] Fix typo in dispatch

---
 aux/test/check_idft.cxx | 15 ++++++++++-----
 1 file changed, 10 insertions(+), 5 deletions(-)

diff --git a/aux/test/check_idft.cxx b/aux/test/check_idft.cxx
index 86266a503..68ed81b0b 100644
--- a/aux/test/check_idft.cxx
+++ b/aux/test/check_idft.cxx
@@ -83,7 +83,7 @@ pig_array v2p(const std::vector<Scalar>& vec)
     std::vector<char> data((const char*)vec.data(),
                            (const char*)vec.data() + sizeof(Scalar)*vec.size());
     pig_array pa;
-    pa.set<complex_t>(data, {vec.size()});
+    pa.set<Scalar>(data, {vec.size()});
     return pa;
 }
 
@@ -119,7 +119,7 @@ pig_array dispatch(const IDFT::pointer& dft, const pig_array& pa, const std::str
         return v2p<complex_t>(Aux::fwd(dft, p2v<complex_t>(pa)));
 
     if (op == "inv1d") 
-        return v2p<complex_t>(Aux::fwd(dft, p2v<complex_t>(pa)));
+        return v2p<complex_t>(Aux::inv(dft, p2v<complex_t>(pa)));
             
     if (op == "fwd1d_r2c") 
         return v2p<complex_t>(Aux::fwd_r2c(dft, p2v<scalar_t>(pa)));
@@ -153,7 +153,11 @@ pig_array dispatch(const IDFT::pointer& dft, const pig_array& pa, const std::str
     if (op == "inv1b1")
         return a2p<complex_t>(Aux::inv(dft, p2a<complex_t>(pa), 1));
 
-    return pa;
+    if (op == "" or op == "noop" or op == "no-op") {
+        return pa;
+    }
+
+    throw std::runtime_error("unsupported op: " + op);
 }
 
 int main(int argc, char* argv[])
@@ -246,7 +250,7 @@ int main(int argc, char* argv[])
 
         auto siz = darr.header().array_size();
         if (siz == 0) {
-            std::cerr << "failed: " << op <<  "(" << src << ") -> " << dst << "\n";
+            std::cerr << "failed: " << op <<  "(" << src << ") -> " << dst << " (zero size)\n";
             continue;
         }
 
@@ -266,9 +270,10 @@ int main(int argc, char* argv[])
 
         custard::write(outs, dst, fsiz);
         if (!outs) {
+            std::cerr << "stream error: " << strerror(errno) << std::endl;
             std::cerr << "failed to write " << dst
                       << "(" << fsiz << ") to "
-                      << args.output << std::endl;
+                      << args.output << "\n" << one << std::endl;
             continue;
         }
         darr.write(outs);

From 5cf456b28b528acc5c39b5d08b85754cd38f0357 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 2 Dec 2021 13:33:07 -0500
Subject: [PATCH 40/46] Allow passing dft config down

---
 cfg/pgrapher/common/helpers/sp.jsonnet | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/cfg/pgrapher/common/helpers/sp.jsonnet b/cfg/pgrapher/common/helpers/sp.jsonnet
index 38728d496..5327e6e84 100644
--- a/cfg/pgrapher/common/helpers/sp.jsonnet
+++ b/cfg/pgrapher/common/helpers/sp.jsonnet
@@ -3,6 +3,7 @@
 
 local wc = import "wirecell.jsonnet";
 local pg = import "pgraph.jsonnet";
+local aux = import "aux.jsonnet";
 
 
 // Signal processing.
@@ -10,7 +11,7 @@ local pg = import "pgraph.jsonnet";
 // Note, spfilt are a list of filter objects which MUST match
 // hard-wired names in the C++, sorry.  See, eg
 // pgrapher/experiment/pdsp/sp-filters.jsonnet.
-function(anode, fieldresp, elecresp, spfilt, adcpermv, perchan=null, override={}) 
+function(anode, fieldresp, elecresp, spfilt, adcpermv, perchan=null, dft=aux.dft, override={}) 
     local apaid = anode.data.ident;
 
     // if perchan file name is given we need to add this to a
@@ -35,6 +36,7 @@ function(anode, fieldresp, elecresp, spfilt, adcpermv, perchan=null, override={}
                 *  Associated tuning in sp-filters.jsonnet
                 */
             anode: wc.tn(anode),
+            dft: wc.tn(dft),
             field_response: wc.tn(fieldresp),
             elecresponse: wc.tn(elecresp),
             ftoffset: 0.0, // default 0.0
@@ -81,4 +83,4 @@ function(anode, fieldresp, elecresp, spfilt, adcpermv, perchan=null, override={}
             isWrapped: false,
             // process_planes: [0, 2],
         } + override
-    }, nin=1, nout=1, uses=[anode, fieldresp, elecresp] + pc.uses + spfilt)
+    }, nin=1, nout=1, uses=[anode, dft, fieldresp, elecresp] + pc.uses + spfilt)

From f4f02c4eb1f7d26b2df23f8a7751e64c5ca80c03 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 2 Dec 2021 14:00:14 -0500
Subject: [PATCH 41/46] More passing down of IDFT

---
 cfg/pgrapher/common/helpers/nf.jsonnet        |   6 +-
 cfg/pgrapher/experiment/pdsp/nf.jsonnet       | 139 +++++++++---------
 .../experiment/pdsp/ocndb-perfect.jsonnet     |   7 +-
 cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet      |  16 +-
 cfg/test/test-pdsp-sim-sp.jsonnet             |  84 +++++++++++
 cfg/test/test-pdsp-sim.jsonnet                | 108 ++++++++++++++
 6 files changed, 281 insertions(+), 79 deletions(-)
 create mode 100644 cfg/test/test-pdsp-sim-sp.jsonnet
 create mode 100644 cfg/test/test-pdsp-sim.jsonnet

diff --git a/cfg/pgrapher/common/helpers/nf.jsonnet b/cfg/pgrapher/common/helpers/nf.jsonnet
index 9c666f1b1..e86562396 100644
--- a/cfg/pgrapher/common/helpers/nf.jsonnet
+++ b/cfg/pgrapher/common/helpers/nf.jsonnet
@@ -2,13 +2,17 @@ local wc = import "wirecell.jsonnet";
 local pg = import "pgraph.jsonnet";
 local u = import "utils.jsonnet";
 
-function(anode, fr, chndb, nsamples, tick=0.5*wc.us, rms_cuts=[])
+local default_dft = { type: 'FftwDFT' };
+
+function(anode, fr, chndb, nsamples, tick=0.5*wc.us, rms_cuts=[], dft=default_dft)
     local single = {
         type: 'pdOneChannelNoise',
         name: u.idents(anode),
+        uses: [dft],
         data: {
             noisedb: wc.tn(chndb),
             anode: wc.tn(anode),
+            dft: wc.tn(dft),
             resmp: [
             ],
         },
diff --git a/cfg/pgrapher/experiment/pdsp/nf.jsonnet b/cfg/pgrapher/experiment/pdsp/nf.jsonnet
index c9945ed2d..8f8345580 100644
--- a/cfg/pgrapher/experiment/pdsp/nf.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/nf.jsonnet
@@ -4,87 +4,90 @@ local g = import 'pgraph.jsonnet';
 local wc = import 'wirecell.jsonnet';
 local gainmap = import 'pgrapher/experiment/pdsp/chndb-rel-gain.jsonnet';
 
-function(params, anode, chndbobj, n, name='')
-  {
+local default_dft = { type: 'FftwDFT' };
+
+function(params, anode, chndbobj, n, name='', dft=default_dft) {
     local single = {
-      type: 'pdOneChannelNoise',
-      name: name,
-      data: {
-        noisedb: wc.tn(chndbobj),
-        anode: wc.tn(anode),
-        resmp: [
-          {channels: std.range(2128, 2175), sample_from: 5996},
-          {channels: std.range(1520, 1559), sample_from: 5996},
-          {channels: std.range( 440,  479), sample_from: 5996},
-        ],
-      },
+        type: 'pdOneChannelNoise',
+        name: name,
+        uses: [dft],
+        data: {
+            noisedb: wc.tn(chndbobj),
+            anode: wc.tn(anode),
+            dft: wc.tn(dft),
+            resmp: [
+                {channels: std.range(2128, 2175), sample_from: 5996},
+                {channels: std.range(1520, 1559), sample_from: 5996},
+                {channels: std.range( 440,  479), sample_from: 5996},
+            ],
+        },
     },
     local grouped = {
-      type: 'mbCoherentNoiseSub',
-      name: name,
-      data: {
-        noisedb: wc.tn(chndbobj),
-        anode: wc.tn(anode),
-        rms_threshold: 0.0,
-      },
+        type: 'mbCoherentNoiseSub',
+        name: name,
+        data: {
+            noisedb: wc.tn(chndbobj),
+            anode: wc.tn(anode),
+            rms_threshold: 0.0,
+        },
     },
     local sticky = {
-      type: 'pdStickyCodeMitig',
-      name: name,
-      data: {
-        extra_stky: [
-          {channels: std.range(n * 2560, (n + 1) * 2560 - 1), bits: [0,1,63]},
-          {channels: [4], bits: [6]  },
-          {channels: [159], bits: [6]  },
-          {channels: [164], bits: [36] },
-          {channels: [168], bits: [7]  },
-          {channels: [323], bits: [24] },
-          {channels: [451], bits: [25] },
-        ],
-        noisedb: wc.tn(chndbobj),
-        anode: wc.tn(anode),
-        stky_sig_like_val: 15.0,
-        stky_sig_like_rms: 2.0,
-        stky_max_len: 10,
-      },
+        type: 'pdStickyCodeMitig',
+        name: name,
+        data: {
+            extra_stky: [
+                {channels: std.range(n * 2560, (n + 1) * 2560 - 1), bits: [0,1,63]},
+                {channels: [4], bits: [6]  },
+                {channels: [159], bits: [6]  },
+                {channels: [164], bits: [36] },
+                {channels: [168], bits: [7]  },
+                {channels: [323], bits: [24] },
+                {channels: [451], bits: [25] },
+            ],
+            noisedb: wc.tn(chndbobj),
+            anode: wc.tn(anode),
+            stky_sig_like_val: 15.0,
+            stky_sig_like_rms: 2.0,
+            stky_max_len: 10,
+        },
     },
     local gaincalib = {
-      type: 'pdRelGainCalib',
-      name: name,
-      data: {
-        noisedb: wc.tn(chndbobj),
-        anode: wc.tn(anode),
-        rel_gain: gainmap.rel_gain,
-      },
+        type: 'pdRelGainCalib',
+        name: name,
+        data: {
+            noisedb: wc.tn(chndbobj),
+            anode: wc.tn(anode),
+            rel_gain: gainmap.rel_gain,
+        },
     },
 
     local obnf = g.pnode({
-      type: 'OmnibusNoiseFilter',
-      name: name,
-      data: {
+        type: 'OmnibusNoiseFilter',
+        name: name,
+        data: {
 
-        // Nonzero forces the number of ticks in the waveform
-        nticks: 0,
+            // Nonzero forces the number of ticks in the waveform
+            nticks: 0,
 
-        // channel bin ranges are ignored
-        // only when the channelmask is merged to `bad`
-        maskmap: {sticky: "bad", ledge: "bad", noisy: "bad"},
-        channel_filters: [
-          // wc.tn(sticky),
-          wc.tn(single),
-          // wc.tn(gaincalib),
-        ],
-        grouped_filters: [
-          // wc.tn(grouped),
-        ],
-        channel_status_filters: [
-        ],
-        noisedb: wc.tn(chndbobj),
-        intraces: 'orig%d' % n,  // frame tag get all traces
-        outtraces: 'raw%d' % n,
-      },
+            // channel bin ranges are ignored
+            // only when the channelmask is merged to `bad`
+            maskmap: {sticky: "bad", ledge: "bad", noisy: "bad"},
+            channel_filters: [
+                // wc.tn(sticky),
+                wc.tn(single),
+                // wc.tn(gaincalib),
+            ],
+            grouped_filters: [
+                // wc.tn(grouped),
+            ],
+            channel_status_filters: [
+            ],
+            noisedb: wc.tn(chndbobj),
+            intraces: 'orig%d' % n,  // frame tag get all traces
+            outtraces: 'raw%d' % n,
+        },
     }, uses=[chndbobj, anode, sticky, single, grouped, gaincalib], nin=1, nout=1),
 
 
     pipe: g.pipeline([obnf], name=name),
-  }.pipe
+}.pipe
diff --git a/cfg/pgrapher/experiment/pdsp/ocndb-perfect.jsonnet b/cfg/pgrapher/experiment/pdsp/ocndb-perfect.jsonnet
index 05fe99752..7a048d84a 100644
--- a/cfg/pgrapher/experiment/pdsp/ocndb-perfect.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/ocndb-perfect.jsonnet
@@ -3,18 +3,21 @@
 
 local wc = import "wirecell.jsonnet";
 
+local default_dft = { type: 'FftwDFT' };
+
 // The "perfect noise" database is one that is free of any
 // "special" considerations such as per channel variability.  The
 // "official" perfect chndb depends on the official "chndb-base"
 // and that seems to be adulterated with specific settings.  We
 // try to start fresh here.
-function(anode, fr, nsamples, tick=0.5*wc.us) {
+function(anode, fr, nsamples, tick=0.5*wc.us, dft=default_dft) {
     local apaid = anode.data.ident,
     type:'OmniChannelNoiseDB',
     name: std.toString(apaid),
-    uses: [anode, fr],
+    uses: [anode, fr, dft],
     data: {
         anode: wc.tn(anode),
+        dft: wc.tn(dft),
         field_response: wc.tn(fr),
         tick: tick,
         nsamples: nsamples,
diff --git a/cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet b/cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet
index aa268e325..427fa7419 100644
--- a/cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet
+++ b/cfg/test/test-pdsp-sim-sp-dnnroi.jsonnet
@@ -12,7 +12,8 @@ local wires = hs.aux.wires(params.files.wires);
 local anodes = hs.aux.anodes(wires, params.det.volumes);
 
 // IDFT
-local dft = {type: 'FftwDFT'};
+//local dft = {type: 'FftwDFT'};
+local dft = {type: 'TorchDFT', data: { device: 'cpu' }};
 
 // simulation
 
@@ -38,7 +39,7 @@ local er = hs.aux.cer(params.elec.shaping, params.elec.gain,
                       params.elec.postgain,
                       params.daq.nticks, params.daq.tick);
 local rc = hs.aux.rc(1.0*wc.ms, params.daq.nticks, params.daq.tick);
-local pirs = hs.gen.pirs(sim_fr, [er], [rc]);
+local pirs = hs.gen.pirs(sim_fr, [er], [rc], dft=dft);
 
 // sp fr may differ from sim fr (as it does from real fr)
 local sp_fr = hs.aux.fr(if std.length(params.files.fields)>1
@@ -48,7 +49,7 @@ local sp_fr = hs.aux.fr(if std.length(params.files.fields)>1
 local sp_filters = import "pgrapher/experiment/pdsp/sp-filters.jsonnet";
 local adcpermv = hs.utils.adcpermv(params.adc);
 local chndbf = import "pgrapher/experiment/pdsp/ocndb-perfect.jsonnet";
-local chndb(anode) = chndbf(anode, sp_fr, params.nf.nsamples);
+local chndb(anode) = chndbf(anode, sp_fr, params.nf.nsamples, dft=dft);
 local dnnroi_override = {
     sparse: true,
     use_roi_debug_mode: true,
@@ -82,15 +83,14 @@ local out(anode, prefix, tag_pats, digitize=false, cap=false) =
 
 local anode_pipeline(anode, prefix) = pg.pipeline([
     // sim
-    hs.gen.signal(anode, pirs, params.daq, params.lar, rnd=random),
-    hs.gen.noise(anode, params.files.noise, params.daq, rnd=random),
+    hs.gen.signal(anode, pirs, params.daq, params.lar, rnd=random, dft=dft),
+    hs.gen.noise(anode, params.files.noise, params.daq, rnd=random, dft=dft),
     hs.gen.digi(anode, params.adc),
     out(anode, prefix, ["orig"], true),
         
     // nf+sp
-    hs.nf(anode, sp_fr, chndb(anode), params.nf.nsamples, params.daq.tick),
-    hs.sp(anode, sp_fr, er, sp_filters, adcpermv,
-          override=dnnroi_override),
+    hs.nf(anode, sp_fr, chndb(anode), params.nf.nsamples, params.daq.tick, dft=dft),
+    hs.sp(anode, sp_fr, er, sp_filters, adcpermv, override=dnnroi_override, dft=dft),
     out(anode, prefix, ["wiener","gauss"]),
 
     // // dnnroi
diff --git a/cfg/test/test-pdsp-sim-sp.jsonnet b/cfg/test/test-pdsp-sim-sp.jsonnet
new file mode 100644
index 000000000..9dbb19bf6
--- /dev/null
+++ b/cfg/test/test-pdsp-sim-sp.jsonnet
@@ -0,0 +1,84 @@
+// This provides a main wire-cell config file to exercise
+// sim+sigproc (no dnnroi).  When run it will produce tar files of frames
+// data as numpy arrays.  Ionization pattern is from ideal line
+// source.
+
+local wc = import "wirecell.jsonnet";
+local pg = import "pgraph.jsonnet";
+local params = import "pgrapher/experiment/pdsp/simparams.jsonnet";
+local hs = import "pgrapher/common/helpers.jsonnet";
+
+local wires = hs.aux.wires(params.files.wires);
+local anodes = hs.aux.anodes(wires, params.det.volumes);
+
+// IDFT
+local dft = {type: 'FftwDFT'};
+
+// simulation
+
+// kinematics: ideal line source
+local tracklist = [
+   {
+       time: 0,
+       charge: -5000,         
+       ray: params.det.bounds,
+   },
+];
+local depos = pg.pipeline([
+    hs.gen.track_depos(tracklist),
+    hs.gen.bagger(params.daq),
+]);
+
+local random = hs.gen.random();
+local drifter = hs.gen.drifter(params.det.volumes,params.lar,random);
+
+// responses
+local sim_fr = hs.aux.fr(params.files.fields[0]);
+local er = hs.aux.cer(params.elec.shaping, params.elec.gain,
+                      params.elec.postgain,
+                      params.daq.nticks, params.daq.tick);
+local rc = hs.aux.rc(1.0*wc.ms, params.daq.nticks, params.daq.tick);
+local pirs = hs.gen.pirs(sim_fr, [er], [rc]);
+
+// sp fr may differ from sim fr (as it does from real fr)
+local sp_fr = hs.aux.fr(if std.length(params.files.fields)>1
+                        then params.files.fields[1]
+                        else params.files.fields[0]);
+                        
+local sp_filters = import "pgrapher/experiment/pdsp/sp-filters.jsonnet";
+local adcpermv = hs.utils.adcpermv(params.adc);
+local chndbf = import "pgrapher/experiment/pdsp/ocndb-perfect.jsonnet";
+local chndb(anode) = chndbf(anode, sp_fr, params.nf.nsamples);
+
+// little function to return a frame file tap or sink (if cap is
+// true).  This bakes in PDSP-specific array bounds!
+local out(anode, prefix, tag_pats, digitize=false, cap=false) = 
+    local tags = [tp + std.toString(anode.data.ident)
+                  for tp in tag_pats];
+    local fname = prefix + "-"
+                  + std.join("-", tags) + ".tar.bz2";
+    local dense = hs.io.frame_bounds(2560, 6000,
+                                     2560 * anode.data.ident);
+    if cap
+    then hs.io.frame_file_sink(fname, tags, digitize, dense)
+    else hs.io.frame_file_tap(fname, tags, digitize, dense);
+                         
+
+local anode_pipeline(anode, prefix) = pg.pipeline([
+    // sim
+    hs.gen.signal(anode, pirs, params.daq, params.lar, rnd=random),
+    hs.gen.noise(anode, params.files.noise, params.daq, rnd=random),
+    hs.gen.digi(anode, params.adc),
+    out(anode, prefix, ["orig"], true),
+        
+    // nf+sp
+    hs.nf(anode, sp_fr, chndb(anode), params.nf.nsamples, params.daq.tick),
+    hs.sp(anode, sp_fr, er, sp_filters, adcpermv),
+    out(anode, prefix, ["wiener","gauss"], cap=true),
+]);
+
+function(prefix="test-pdsp-ssd") 
+    local pipes = [ anode_pipeline(a, prefix) for a in anodes];
+    local body = pg.fan.fanout('DepoSetFanout', pipes);
+    local graph = pg.pipeline([depos, drifter, body]);
+    hs.utils.main(graph, 'TbbFlow', ['WireCellPytorch'])
diff --git a/cfg/test/test-pdsp-sim.jsonnet b/cfg/test/test-pdsp-sim.jsonnet
new file mode 100644
index 000000000..d28b355b3
--- /dev/null
+++ b/cfg/test/test-pdsp-sim.jsonnet
@@ -0,0 +1,108 @@
+// This provides a main wire-cell config file to exercise
+// sim+sigproc+dnnroi.  When run it will produce tar files of frames
+// data as numpy arrays.  Ionization pattern is from ideal line
+// source.
+
+local wc = import "wirecell.jsonnet";
+local pg = import "pgraph.jsonnet";
+local params = import "pgrapher/experiment/pdsp/simparams.jsonnet";
+local hs = import "pgrapher/common/helpers.jsonnet";
+
+local wires = hs.aux.wires(params.files.wires);
+local anodes = hs.aux.anodes(wires, params.det.volumes);
+
+// IDFT
+local dft = {type: 'FftwDFT'};
+
+// simulation
+
+// kinematics: ideal line source
+local tracklist = [
+   {
+       time: 0,
+       charge: -5000,         
+       ray: params.det.bounds,
+   },
+];
+local depos = pg.pipeline([
+    hs.gen.track_depos(tracklist),
+    hs.gen.bagger(params.daq),
+]);
+
+local random = hs.gen.random();
+local drifter = hs.gen.drifter(params.det.volumes,params.lar,random);
+
+// responses
+local sim_fr = hs.aux.fr(params.files.fields[0]);
+local er = hs.aux.cer(params.elec.shaping, params.elec.gain,
+                      params.elec.postgain,
+                      params.daq.nticks, params.daq.tick);
+local rc = hs.aux.rc(1.0*wc.ms, params.daq.nticks, params.daq.tick);
+local pirs = hs.gen.pirs(sim_fr, [er], [rc]);
+
+// sp fr may differ from sim fr (as it does from real fr)
+local sp_fr = hs.aux.fr(if std.length(params.files.fields)>1
+                        then params.files.fields[1]
+                        else params.files.fields[0]);
+                        
+local sp_filters = import "pgrapher/experiment/pdsp/sp-filters.jsonnet";
+local adcpermv = hs.utils.adcpermv(params.adc);
+local chndbf = import "pgrapher/experiment/pdsp/ocndb-perfect.jsonnet";
+local chndb(anode) = chndbf(anode, sp_fr, params.nf.nsamples);
+local dnnroi_override = {
+    sparse: true,
+    use_roi_debug_mode: true,
+    use_multi_plane_protection: true,
+    process_planes: [0, 1, 2]
+};
+
+local ts = {
+    type: "TorchService",
+    name: "dnnroi",
+    data: {
+        model: "unet-l23-cosmic500-e50.ts",
+        device: "cpu",
+        concurrency: 1,
+    },
+};
+
+// little function to return a frame file tap or sink (if cap is
+// true).  This bakes in PDSP-specific array bounds!
+local out(anode, prefix, tag_pats, digitize=false, cap=false) = 
+    local tags = [tp + std.toString(anode.data.ident)
+                  for tp in tag_pats];
+    local fname = prefix + "-"
+                  + std.join("-", tags) + ".tar.bz2";
+    local dense = hs.io.frame_bounds(2560, 6000,
+                                     2560 * anode.data.ident);
+    if cap
+    then hs.io.frame_file_sink(fname, tags, digitize, dense)
+    else hs.io.frame_file_tap(fname, tags, digitize, dense);
+                         
+
+local anode_pipeline(anode, prefix) = pg.pipeline([
+    // sim
+    hs.gen.signal(anode, pirs, params.daq, params.lar, rnd=random),
+    // hs.gen.noise(anode, params.files.noise, params.daq, rnd=random),
+    hs.gen.digi(anode, params.adc),
+    out(anode, prefix, ["orig"], true),
+        
+    // // nf+sp
+    // hs.nf(anode, sp_fr, chndb(anode), params.nf.nsamples, params.daq.tick),
+    // hs.sp(anode, sp_fr, er, sp_filters, adcpermv,
+    //       override=dnnroi_override),
+    // out(anode, prefix, ["wiener","gauss"]),
+
+    // // // dnnroi
+    // hs.dnnroi(anode, ts, output_scale=1.2),
+    // out(anode, prefix, ["dnnsp"], cap=true),
+]);
+
+function(prefix="test-pdsp-ssd") 
+    local pipes = [ anode_pipeline(a, prefix) for a in anodes];
+    local body = pg.fan.fanout('DepoSetFanout', pipes);
+    local graph = pg.pipeline([depos, drifter, body]);
+    hs.utils.main(graph, 'TbbFlow', ['WireCellPytorch'])
+
+    
+

From f58127498bb66635802081f69b406797932b1186 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Fri, 3 Dec 2021 11:23:02 -0500
Subject: [PATCH 42/46] Add DFT throughout config.

---
 cfg/pgrapher/common/helpers/gen.jsonnet       |  2 +-
 cfg/pgrapher/common/params.jsonnet            | 21 ++++++++++--------
 cfg/pgrapher/common/sim/nodes.jsonnet         |  8 ++++---
 cfg/pgrapher/common/tools.jsonnet             | 22 ++++++++++++++++---
 cfg/pgrapher/experiment/dune-vd/sim.jsonnet   |  6 +++--
 cfg/pgrapher/experiment/dune-vd/sp.jsonnet    |  3 ++-
 .../experiment/dune-vd/wcls-nf-sp.jsonnet     |  6 ++---
 .../dune-vd/wcls-sim-drift-simchannel.jsonnet |  4 ++--
 .../experiment/dune10kt-1x2x6/nf.jsonnet      |  6 ++---
 .../experiment/dune10kt-1x2x6/sim.jsonnet     |  6 +++--
 .../experiment/dune10kt-1x2x6/sp.jsonnet      |  3 ++-
 .../wcls-blip-sim-drift-simchannel.jsonnet    |  4 ++--
 .../dune10kt-1x2x6/wcls-nf-sp.jsonnet         |  4 ++--
 .../wcls-sim-drift-simchannel.jsonnet         |  4 ++--
 .../experiment/dune10kt-1x2x6/wcls-sp.jsonnet |  4 ++--
 .../dune10kt-1x2x6/wct-sim-check.jsonnet      |  4 ++--
 cfg/pgrapher/experiment/icarus/nf.jsonnet     |  8 ++++++-
 cfg/pgrapher/experiment/icarus/sim.jsonnet    |  6 +++--
 cfg/pgrapher/experiment/icarus/sp.jsonnet     |  3 ++-
 .../icarus/wcls-decode-to-sig.jsonnet         |  4 ++--
 ...pc-sim-drift-simchannel-omit-noise.jsonnet |  4 ++--
 ...wcls-multitpc-sim-drift-simchannel.jsonnet | 13 ++++++-----
 .../icarus/wcls-sim-drift-simchannel.jsonnet  |  6 +++--
 .../icarus/wct-coherent-noise.jsonnet         | 10 +++++----
 .../experiment/icarus/wct-sim-check.jsonnet   | 10 +++++----
 cfg/pgrapher/experiment/iceberg/nf.jsonnet    |  6 ++---
 cfg/pgrapher/experiment/iceberg/sim.jsonnet   |  6 +++--
 cfg/pgrapher/experiment/iceberg/sp.jsonnet    |  3 ++-
 .../experiment/iceberg/wcls-nf-sp.jsonnet     |  4 ++--
 .../experiment/iceberg/wcls-sp.jsonnet        |  4 ++--
 cfg/pgrapher/experiment/pdsp/chndb.jsonnet    |  4 ++--
 cfg/pgrapher/experiment/pdsp/nf.jsonnet       |  7 +++++-
 cfg/pgrapher/experiment/pdsp/sim.jsonnet      |  6 +++--
 cfg/pgrapher/experiment/pdsp/sp.jsonnet       |  3 ++-
 .../experiment/pdsp/wcls-nf-sp.jsonnet        |  4 ++--
 .../experiment/pdsp/wcls-raw-to-sig.jsonnet   |  4 ++--
 .../pdsp/wcls-sim-drift-simchannel.jsonnet    |  4 ++--
 cfg/pgrapher/experiment/pdsp/wcls-sp.jsonnet  |  4 ++--
 .../experiment/pdsp/wct-sim-check.jsonnet     |  4 ++--
 cfg/pgrapher/experiment/sbnd/chndb.jsonnet    |  4 ++--
 cfg/pgrapher/experiment/sbnd/nf.jsonnet       | 10 ++++++++-
 cfg/pgrapher/experiment/sbnd/sim.jsonnet      |  6 +++--
 cfg/pgrapher/experiment/sbnd/sp.jsonnet       |  3 ++-
 .../experiment/sbnd/wcls-nf-sp.jsonnet        |  4 ++--
 .../sbnd/wcls-sim-drift-simchannel.jsonnet    |  4 ++--
 .../experiment/sbnd/wct-sim-check.jsonnet     |  4 ++--
 cfg/pgrapher/experiment/uboone/chndb.jsonnet  |  4 ++--
 cfg/pgrapher/experiment/uboone/nf.jsonnet     | 18 ++++++++++-----
 cfg/pgrapher/experiment/uboone/nodes.jsonnet  | 10 +++++----
 cfg/pgrapher/experiment/uboone/sim.jsonnet    |  6 +++--
 cfg/pgrapher/experiment/uboone/sp.jsonnet     | 17 +++++++++-----
 cfg/test/test_multiductor.jsonnet             |  6 ++++-
 52 files changed, 208 insertions(+), 122 deletions(-)

diff --git a/cfg/pgrapher/common/helpers/gen.jsonnet b/cfg/pgrapher/common/helpers/gen.jsonnet
index 6ba78e335..c9313ffa2 100644
--- a/cfg/pgrapher/common/helpers/gen.jsonnet
+++ b/cfg/pgrapher/common/helpers/gen.jsonnet
@@ -102,6 +102,7 @@ local aux = import "aux.jsonnet";
                 name: u.idents(anode),
                 data: {
                     rng: wc.tn(rnd),
+                    dft: wc.tn(dft),
                     anode: wc.tn(anode),
                     pirs: [wc.tn(p) for p in pirs],
                     fluctuate: true,
@@ -111,7 +112,6 @@ local aux = import "aux.jsonnet";
                     start_time: 0,
                     tick: daq.tick,
                     nsigma: 3,
-                    dft: wc.tn(dft),
                 },
             }, nin=1, nout=1, uses=pirs + [anode, rnd, dft]),
 
diff --git a/cfg/pgrapher/common/params.jsonnet b/cfg/pgrapher/common/params.jsonnet
index 92ba7c797..d83fd95a2 100644
--- a/cfg/pgrapher/common/params.jsonnet
+++ b/cfg/pgrapher/common/params.jsonnet
@@ -1,19 +1,22 @@
-// This file is part of wire-cell-cfg.
+// This file is part of wire-cell-toolkit/cfg/.
 //
 // This file provides a base data structure to define parameters that
 // span all currently supported WCT functionality.  Not every
-// parameter will be used and not all value here is valid.  The
-// parameters are named and factored into sub-objects in order to be
-// sympathetic to how the C++ components are structured and name their
-// configuration paramters.  As such it's often possible to build a
-// component configuration object by inheriting from one or more
-// sub-objects in the parameter structure.  For most jobs, this
-// structure should be derived and overriden before being passed to
-// functions that produce other configuration structures.
+// parameter will be used and not every value here may be valid for
+// your use and should be overridden.  The parameters are named and
+// factored into sub-objects in order to be sympathetic to how the C++
+// components are structured and name their configuration paramters.
+// As such it's often possible to build a component configuration
+// object by inheriting from one or more sub-objects in the parameter
+// structure.  For most jobs, this structure should be derived and
+// overriden before being passed to functions that produce other
+// configuration structures.
+//
 
 local wc = import "wirecell.jsonnet";
 
 {
+
     // Parameters relevant to the bulk liquid argon volume.
     lar : {
         // Longitudinal diffusion constant
diff --git a/cfg/pgrapher/common/sim/nodes.jsonnet b/cfg/pgrapher/common/sim/nodes.jsonnet
index ee34b45b1..db30192e6 100644
--- a/cfg/pgrapher/common/sim/nodes.jsonnet
+++ b/cfg/pgrapher/common/sim/nodes.jsonnet
@@ -69,6 +69,7 @@ function(params, tools)
         name:name,
         data: {
             rng: wc.tn(tools.random),
+            dft: wc.tn(tools.dft),
             anode: wc.tn(anode),
             pirs: std.map(function(pir) wc.tn(pir), pirs),
             fluctuate: params.sim.fluctuate,
@@ -79,7 +80,7 @@ function(params, tools)
             tick: params.daq.tick,
             nsigma: 3,
         },
-    }, nin=1, nout=1, uses=[anode, tools.random] + pirs),
+    }, nin=1, nout=1, uses=[anode, tools.random, tools.dft] + pirs),
 
     // This may look similar to above but above is expected to diverge
     make_depozipper :: function(name, anode, pirs) g.pnode({
@@ -261,9 +262,10 @@ function(params, tools)
 
                 // fixme: these should probably be set from params.
                 nsamples: 50,   // number of samples of the response
-                truncate:true // result is extended by nsamples, tuncate clips that off
+                truncate:true, // result is extended by nsamples, tuncate clips that off
+                dft: wc.tn(tools.dft),
             }
-        }, nin=1, nout=1),
+        }, nin=1, nout=1, uses[tools.dft]),
 
         local merge = g.pnode({
             type: "FrameMerger",
diff --git a/cfg/pgrapher/common/tools.jsonnet b/cfg/pgrapher/common/tools.jsonnet
index cd9a6e4e5..734b93403 100644
--- a/cfg/pgrapher/common/tools.jsonnet
+++ b/cfg/pgrapher/common/tools.jsonnet
@@ -1,13 +1,22 @@
-
 // This file provides a function which takes a params object (see
 // ../params/) and returns a data structure with a number of
 // sub-objects that may configure various WCT "tool" type componets
 // which are not INodes.
 
+// Some attributes are merely default and you may wish to override
+// them.  For example, the default IDFT FftwDFT and to instead ues
+// TorchDFT you may do something like:
+//
+// local default_tools = tools_maker(params)
+// local tools = std.mergePatch(default_tools,
+//   {dft: {type: "TorchDFT", data: {device: "gpu"}}});
+// 
+
 local wc = import "wirecell.jsonnet";
 
 function(params)
 {
+    // The IRandom pRNG
     random : {
         type: "Random",
         data: {
@@ -15,6 +24,11 @@ function(params)
             seeds: [0,1,2,3,4],
         }
     },
+    // The IDFT FFT implementation 
+    dft : {
+        type: "FftwDFT",
+    }
+
 
     // One FR per field file.
     fields : std.mapWithIndex(function (n, fname) {
@@ -90,13 +104,15 @@ function(params)
     },
 
     // there is one trio of PIRs (one per wire plane in a face) for
-    // each field response.
+    // each field response.  WARNING/fixme: this sets the default DFT
+    // with no way to override!  This config structure needs a redo!
     pirs : std.mapWithIndex(function (n, fr) [
         {
             type: "PlaneImpactResponse",
             name : "PIR%splane%d" % [fr.name, plane],
             data : sim_response_binning {
                 plane: plane,
+                dft: wc.tn($.dft),
                 field_response: wc.tn(fr),
                 // note twice we give rc so we have rc^2 in the final convolution
                 short_responses: if params.sys_status == false
@@ -112,7 +128,7 @@ function(params)
         else [wc.tn($.rc_resp), wc.tn($.rc_resp)],
 		long_padding: 1.5*wc.ms,
 	    },
-            uses: [fr, $.elec_resp, $.rc_resp, $.sys_resp],
+            uses: [$.dft, fr, $.elec_resp, $.rc_resp, $.sys_resp],
         } for plane in [0,1,2]], $.fields),
 
     // One anode per detector "volume"
diff --git a/cfg/pgrapher/experiment/dune-vd/sim.jsonnet b/cfg/pgrapher/experiment/dune-vd/sim.jsonnet
index 4e5b043c5..e58622135 100644
--- a/cfg/pgrapher/experiment/dune-vd/sim.jsonnet
+++ b/cfg/pgrapher/experiment/dune-vd/sim.jsonnet
@@ -33,13 +33,14 @@ function(params, tools) {
         name: "empericalnoise%s"% anode.name,
         data: {
             anode: wc.tn(anode),
+            dft: wc.tn(tools.dft),
             chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
             spectra_file: params.files.noise,
             nsamples: params.daq.nticks,
             period: params.daq.tick,
             wire_length_scale: 1.0*wc.cm, // optimization binning
         },
-        uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+        uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
     },
     local noise_models = [make_noise_model(anode) for anode in tools.anodes],
 
@@ -49,10 +50,11 @@ function(params, tools) {
         name: "addnoise%s"%[model.name],
         data: {
             rng: wc.tn(tools.random),
+            dft: wc.tn(tools.dft),
             model: wc.tn(model),
 	    nsamples: params.daq.nticks,
             replacement_percentage: 0.02, // random optimization
-        }}, nin=1, nout=1, uses=[model]),
+        }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]),
 
     local noises = [add_noise(model) for model in noise_models],
 
diff --git a/cfg/pgrapher/experiment/dune-vd/sp.jsonnet b/cfg/pgrapher/experiment/dune-vd/sp.jsonnet
index 625ed9e99..5e5b708f8 100644
--- a/cfg/pgrapher/experiment/dune-vd/sp.jsonnet
+++ b/cfg/pgrapher/experiment/dune-vd/sp.jsonnet
@@ -47,6 +47,7 @@ function(params, tools, override = {}) {
        *  Associated tuning in sp-filters.jsonnet
        */
       anode: wc.tn(anode),
+      dft: wc.tn(tools.dft),
       field_response: wc.tn(tools.field),
       elecresponse: wc.tn(tools.elec_resp),
       ftoffset: 0.0, // default 0.0
@@ -77,6 +78,6 @@ function(params, tools, override = {}) {
       wiener_threshold_tag: 'threshold%d' % anode.data.ident,
       gauss_tag: 'gauss%d' % anode.data.ident,
     } + override,
-  }, nin=1, nout=1, uses=[anode, tools.field, tools.elec_resp] + pc.uses + spfilt),
+  }, nin=1, nout=1, uses=[anode, tools.dft, tools.field, tools.elec_resp] + pc.uses + spfilt),
 
 }
diff --git a/cfg/pgrapher/experiment/dune-vd/wcls-nf-sp.jsonnet b/cfg/pgrapher/experiment/dune-vd/wcls-nf-sp.jsonnet
index a0438bbf9..7a46327b5 100644
--- a/cfg/pgrapher/experiment/dune-vd/wcls-nf-sp.jsonnet
+++ b/cfg/pgrapher/experiment/dune-vd/wcls-nf-sp.jsonnet
@@ -131,9 +131,9 @@ local base = import 'chndb-base.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  // data: perfect(params, tools.anodes[n], tools.field, n),
-  data: base(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  // data: perfect(params, tools.anodes[n], tools.field, n) { dft:wc.tn(tools.dft) },
+  data: base(params, tools.anodes[n], tools.field, n) { dft:wc.tn(tools.dft) },
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 // local nf_maker = import 'pgrapher/experiment/dune10kt-1x2x6/nf.jsonnet';
diff --git a/cfg/pgrapher/experiment/dune-vd/wcls-sim-drift-simchannel.jsonnet b/cfg/pgrapher/experiment/dune-vd/wcls-sim-drift-simchannel.jsonnet
index 06aba27b3..59bf42d03 100644
--- a/cfg/pgrapher/experiment/dune-vd/wcls-sim-drift-simchannel.jsonnet
+++ b/cfg/pgrapher/experiment/dune-vd/wcls-sim-drift-simchannel.jsonnet
@@ -120,8 +120,8 @@ local perfect = import 'pgrapher/experiment/dune10kt-1x2x6/chndb-perfect.jsonnet
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n) {dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in anode_iota];
 
 //local chndb_maker = import 'pgrapher/experiment/pdsp/chndb.jsonnet';
diff --git a/cfg/pgrapher/experiment/dune10kt-1x2x6/nf.jsonnet b/cfg/pgrapher/experiment/dune10kt-1x2x6/nf.jsonnet
index 5dc74f593..8a24d3f4a 100644
--- a/cfg/pgrapher/experiment/dune10kt-1x2x6/nf.jsonnet
+++ b/cfg/pgrapher/experiment/dune10kt-1x2x6/nf.jsonnet
@@ -6,7 +6,7 @@ local wc = import 'wirecell.jsonnet';
 function(params, anode, chndbobj, n, name='')
   {
     local status = {
-      type: 'mbOneChannelStatus',
+      type: std.trace("Warning MB in DUNE?", 'mbOneChannelStatus'),
       name: name,
       data: {
         Threshold: 3.5,
@@ -17,7 +17,7 @@ function(params, anode, chndbobj, n, name='')
       },
     },
     local single = {
-      type: 'mbOneChannelNoise',
+      type: std.trace("Warning MB in DUNE?", 'mbOneChannelNoise'),
       name: name,
       data: {
         noisedb: wc.tn(chndbobj),
@@ -25,7 +25,7 @@ function(params, anode, chndbobj, n, name='')
       },
     },
     local grouped = {
-      type: 'mbCoherentNoiseSub',
+      type: std.trace("Warning MB in DUNE?", 'mbCoherentNoiseSub'),
       name: name,
       data: {
         noisedb: wc.tn(chndbobj),
diff --git a/cfg/pgrapher/experiment/dune10kt-1x2x6/sim.jsonnet b/cfg/pgrapher/experiment/dune10kt-1x2x6/sim.jsonnet
index 27bcefb35..97fb8f680 100644
--- a/cfg/pgrapher/experiment/dune10kt-1x2x6/sim.jsonnet
+++ b/cfg/pgrapher/experiment/dune10kt-1x2x6/sim.jsonnet
@@ -46,13 +46,14 @@ function(params, tools) {
         name: "empericalnoise%s"% anode.name,
         data: {
             anode: wc.tn(anode),
+            dft: wc.tn(tools.dft),
             chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
             spectra_file: params.files.noise,
             nsamples: params.daq.nticks,
             period: params.daq.tick,
             wire_length_scale: 1.0*wc.cm, // optimization binning
         },
-        uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+        uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
     },
     local noise_models = [make_noise_model(anode) for anode in tools.anodes],
 
@@ -62,10 +63,11 @@ function(params, tools) {
         name: "addnoise%s"%[model.name],
         data: {
             rng: wc.tn(tools.random),
+            dft: wc.tn(tools.dft),
             model: wc.tn(model),
 	    nsamples: params.daq.nticks,
             replacement_percentage: 0.02, // random optimization
-        }}, nin=1, nout=1, uses=[model]),
+        }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]),
 
     local noises = [add_noise(model) for model in noise_models],
     
diff --git a/cfg/pgrapher/experiment/dune10kt-1x2x6/sp.jsonnet b/cfg/pgrapher/experiment/dune10kt-1x2x6/sp.jsonnet
index 07cd43d63..a311f09ad 100644
--- a/cfg/pgrapher/experiment/dune10kt-1x2x6/sp.jsonnet
+++ b/cfg/pgrapher/experiment/dune10kt-1x2x6/sp.jsonnet
@@ -47,6 +47,7 @@ function(params, tools, override = {}) {
        *  Associated tuning in sp-filters.jsonnet
        */
       anode: wc.tn(anode),
+      dft: wc.tn(tools.dft),
       field_response: wc.tn(tools.field),
       elecresponse: wc.tn(tools.elec_resp),
       ftoffset: 0.0, // default 0.0
@@ -77,6 +78,6 @@ function(params, tools, override = {}) {
       wiener_threshold_tag: 'threshold%d' % anode.data.ident,
       gauss_tag: 'gauss%d' % anode.data.ident,
     } + override,
-  }, nin=1, nout=1, uses=[anode, tools.field, tools.elec_resp] + pc.uses + spfilt),
+  }, nin=1, nout=1, uses=[anode, tools.dft, tools.field, tools.elec_resp] + pc.uses + spfilt),
 
 }
diff --git a/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-blip-sim-drift-simchannel.jsonnet b/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-blip-sim-drift-simchannel.jsonnet
index d908a451f..3f28a734c 100644
--- a/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-blip-sim-drift-simchannel.jsonnet
+++ b/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-blip-sim-drift-simchannel.jsonnet
@@ -117,8 +117,8 @@ local perfect = import 'pgrapher/experiment/dune10kt-1x2x6/chndb-perfect.jsonnet
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],  // pnode extension
 } for n in anode_iota];
 
 //local chndb_maker = import 'pgrapher/experiment/pdsp/chndb.jsonnet';
diff --git a/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-nf-sp.jsonnet b/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-nf-sp.jsonnet
index 0132824a5..6df82186f 100644
--- a/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-nf-sp.jsonnet
+++ b/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-nf-sp.jsonnet
@@ -123,8 +123,8 @@ local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
   // data: perfect(params, tools.anodes[n], tools.field, n),
-  data: base(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: base(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 local nf_maker = import 'pgrapher/experiment/dune10kt-1x2x6/nf.jsonnet';
diff --git a/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-sim-drift-simchannel.jsonnet b/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-sim-drift-simchannel.jsonnet
index 0437e98dc..d26a1f131 100644
--- a/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-sim-drift-simchannel.jsonnet
+++ b/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-sim-drift-simchannel.jsonnet
@@ -116,8 +116,8 @@ local perfect = import 'pgrapher/experiment/dune10kt-1x2x6/chndb-perfect.jsonnet
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in anode_iota];
 
 //local chndb_maker = import 'pgrapher/experiment/pdsp/chndb.jsonnet';
diff --git a/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-sp.jsonnet b/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-sp.jsonnet
index 22969c7ba..fbdf79232 100644
--- a/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-sp.jsonnet
+++ b/cfg/pgrapher/experiment/dune10kt-1x2x6/wcls-sp.jsonnet
@@ -130,8 +130,8 @@ local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
   // data: perfect(params, tools.anodes[n], tools.field, n),
-  data: base(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: base(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 // local nf_maker = import 'pgrapher/experiment/pdsp/nf.jsonnet';
diff --git a/cfg/pgrapher/experiment/dune10kt-1x2x6/wct-sim-check.jsonnet b/cfg/pgrapher/experiment/dune10kt-1x2x6/wct-sim-check.jsonnet
index c8c9ba691..7f72cf3b3 100644
--- a/cfg/pgrapher/experiment/dune10kt-1x2x6/wct-sim-check.jsonnet
+++ b/cfg/pgrapher/experiment/dune10kt-1x2x6/wct-sim-check.jsonnet
@@ -77,8 +77,8 @@ local perfect = import 'chndb-perfect.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 //local chndb_maker = import 'pgrapher/experiment/pdsp/chndb.jsonnet';
diff --git a/cfg/pgrapher/experiment/icarus/nf.jsonnet b/cfg/pgrapher/experiment/icarus/nf.jsonnet
index c41cc9743..fc92dc1d7 100644
--- a/cfg/pgrapher/experiment/icarus/nf.jsonnet
+++ b/cfg/pgrapher/experiment/icarus/nf.jsonnet
@@ -3,23 +3,29 @@
 local g = import 'pgraph.jsonnet';
 local wc = import 'wirecell.jsonnet';
 
-function(params, anode, chndbobj, n, name='')
+local default_dft = { type: 'FftwDFT' };
+
+function(params, anode, chndbobj, n, name='', dft=default_dft)
   {
 
     local single = {
       type: 'pdOneChannelNoise',
       name: name,
+      uses: [dft, chndbobj, anode],
       data: {
         noisedb: wc.tn(chndbobj),
         anode: wc.tn(anode),
+        dft: wc.tn(dft),
       },
     },
     local grouped = {
       type: 'mbCoherentNoiseSub',
       name: name,
+      uses: [dft, chndbobj, anode],
       data: {
         noisedb: wc.tn(chndbobj),
         anode: wc.tn(anode),
+        dft: wc.tn(dft),
         rms_threshold: 0.0,
       },
     },
diff --git a/cfg/pgrapher/experiment/icarus/sim.jsonnet b/cfg/pgrapher/experiment/icarus/sim.jsonnet
index 2d88cf005..bd578ea57 100644
--- a/cfg/pgrapher/experiment/icarus/sim.jsonnet
+++ b/cfg/pgrapher/experiment/icarus/sim.jsonnet
@@ -46,13 +46,14 @@ function(params, tools) {
         name: "empericalnoise-" + anode.name,
         data: {
             anode: wc.tn(anode),
+            dft: wc.tn(tools.dft),
             chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
             spectra_file: params.files.noise,
             nsamples: params.daq.nticks,
             period: params.daq.tick,
             wire_length_scale: 1.0*wc.cm, // optimization binning
         },
-        uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+        uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
     },
     local noise_models = [make_noise_model(anode) for anode in tools.anodes],
 
@@ -62,10 +63,11 @@ function(params, tools) {
         name: "addnoise-" + model.name,
         data: {
             rng: wc.tn(tools.random),
+            dft: wc.tn(tools.dft),
             model: wc.tn(model),
 	    nsamples: params.daq.nticks,
             replacement_percentage: 0.02, // random optimization
-        }}, nin=1, nout=1, uses=[model]),
+        }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]),
 
     local noises = [add_noise(model) for model in noise_models],
     
diff --git a/cfg/pgrapher/experiment/icarus/sp.jsonnet b/cfg/pgrapher/experiment/icarus/sp.jsonnet
index 6e5c6871f..ab66d462c 100644
--- a/cfg/pgrapher/experiment/icarus/sp.jsonnet
+++ b/cfg/pgrapher/experiment/icarus/sp.jsonnet
@@ -21,6 +21,7 @@ function(params, tools, override = {}) {
     data: {
       // Many parameters omitted here.
       anode: wc.tn(anode),
+      dft: wc.tn(tools.dft),
       field_response: wc.tn(tools.field),
       ftoffset: 0.0, // default 0.0
       ctoffset: 0.0*wc.microsecond, // default -8.0
@@ -67,6 +68,6 @@ function(params, tools, override = {}) {
       process_planes: [0, util.anode_split(anode.data.ident)], // balance the left and right split
 
     } + override,
-  }, nin=1, nout=1, uses=[anode, tools.field, tools.elec_resp] + pc.uses + spfilt),
+  }, nin=1, nout=1, uses=[anode, tools.dft, tools.field, tools.elec_resp] + pc.uses + spfilt),
 
 }
diff --git a/cfg/pgrapher/experiment/icarus/wcls-decode-to-sig.jsonnet b/cfg/pgrapher/experiment/icarus/wcls-decode-to-sig.jsonnet
index a950670b2..bf7e838de 100644
--- a/cfg/pgrapher/experiment/icarus/wcls-decode-to-sig.jsonnet
+++ b/cfg/pgrapher/experiment/icarus/wcls-decode-to-sig.jsonnet
@@ -122,8 +122,8 @@ local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
   // data: perfect(params, tools.anodes[n], tools.field, n),
-  data: base(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: base(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 local nf_maker = import 'pgrapher/experiment/icarus/nf.jsonnet';
diff --git a/cfg/pgrapher/experiment/icarus/wcls-multitpc-sim-drift-simchannel-omit-noise.jsonnet b/cfg/pgrapher/experiment/icarus/wcls-multitpc-sim-drift-simchannel-omit-noise.jsonnet
index 6545f6d63..69c60da92 100644
--- a/cfg/pgrapher/experiment/icarus/wcls-multitpc-sim-drift-simchannel-omit-noise.jsonnet
+++ b/cfg/pgrapher/experiment/icarus/wcls-multitpc-sim-drift-simchannel-omit-noise.jsonnet
@@ -123,8 +123,8 @@ local perfect = import 'pgrapher/experiment/icarus/chndb-base.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in anode_iota];
 
 
diff --git a/cfg/pgrapher/experiment/icarus/wcls-multitpc-sim-drift-simchannel.jsonnet b/cfg/pgrapher/experiment/icarus/wcls-multitpc-sim-drift-simchannel.jsonnet
index 4817f0000..cc7949d39 100644
--- a/cfg/pgrapher/experiment/icarus/wcls-multitpc-sim-drift-simchannel.jsonnet
+++ b/cfg/pgrapher/experiment/icarus/wcls-multitpc-sim-drift-simchannel.jsonnet
@@ -123,8 +123,8 @@ local perfect = import 'pgrapher/experiment/icarus/chndb-base.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in anode_iota];
 
 
@@ -165,13 +165,14 @@ local make_noise_model = function(anode, csdb=null) {
     name: "empericalnoise-" + anode.name,
     data: {
         anode: wc.tn(anode),
+        dft: wc.tn(tools.dft),
         chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
         spectra_file: params.files.noise,
         nsamples: params.daq.nticks,
         period: params.daq.tick,
         wire_length_scale: 1.0*wc.cm, // optimization binning
     },
-    uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+    uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
 };
 local noise_model = make_noise_model(mega_anode);
 local add_noise = function(model, n) g.pnode({
@@ -179,10 +180,11 @@ local add_noise = function(model, n) g.pnode({
     name: "addnoise%d-" %n + model.name,
     data: {
         rng: wc.tn(tools.random),
+        dfg: wc.tn(tools.dft),
         model: wc.tn(model),
   nsamples: params.daq.nticks,
         replacement_percentage: 0.02, // random optimization
-    }}, nin=1, nout=1, uses=[model]);
+    }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]);
 local noises = [add_noise(noise_model, n) for n in std.range(0,3)];
 
 local add_coherent_noise = function(n) g.pnode({
@@ -191,11 +193,12 @@ local add_coherent_noise = function(n) g.pnode({
       data: {
           spectra_file: params.files.coherent_noise,
           rng: wc.tn(tools.random),
+          dft: wc.tn(tools.dft),
           nsamples: params.daq.nticks,
           random_fluctuation_amplitude: 0.1,
           period: params.daq.tick,
           normalization: 1
-      }}, nin=1, nout=1, uses=[]);
+      }}, nin=1, nout=1, uses=[tools.random, tools.dft]);
 local coherent_noises = [add_coherent_noise(n) for n in std.range(0,3)];
 
 // local digitizer = sim.digitizer(mega_anode, name="digitizer", tag="orig");
diff --git a/cfg/pgrapher/experiment/icarus/wcls-sim-drift-simchannel.jsonnet b/cfg/pgrapher/experiment/icarus/wcls-sim-drift-simchannel.jsonnet
index 68591c7bc..960e2666c 100644
--- a/cfg/pgrapher/experiment/icarus/wcls-sim-drift-simchannel.jsonnet
+++ b/cfg/pgrapher/experiment/icarus/wcls-sim-drift-simchannel.jsonnet
@@ -140,13 +140,14 @@ local make_noise_model = function(anode, csdb=null) {
     name: "empericalnoise-" + anode.name,
     data: {
         anode: wc.tn(anode),
+        dft: wc.tn(tools.dft),
         chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
         spectra_file: params.files.noise,
         nsamples: params.daq.nticks,
         period: params.daq.tick,
         wire_length_scale: 1.0*wc.cm, // optimization binning
     },
-    uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+    uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
 };
 local noise_model = make_noise_model(mega_anode);
 local add_noise = function(model, n) g.pnode({
@@ -154,10 +155,11 @@ local add_noise = function(model, n) g.pnode({
     name: "addnoise%d-" %n + model.name,
     data: {
         rng: wc.tn(tools.random),
+        dft: wc.tn(tools.dft),
         model: wc.tn(model),
   nsamples: params.daq.nticks,
         replacement_percentage: 0.02, // random optimization
-    }}, nin=1, nout=1, uses=[model]);
+    }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]);
 local noises = [add_noise(noise_model, n) for n in std.range(0,3)];
 
 // local digitizer = sim.digitizer(mega_anode, name="digitizer", tag="orig");
diff --git a/cfg/pgrapher/experiment/icarus/wct-coherent-noise.jsonnet b/cfg/pgrapher/experiment/icarus/wct-coherent-noise.jsonnet
index 29f0a5895..73f3cb66d 100644
--- a/cfg/pgrapher/experiment/icarus/wct-coherent-noise.jsonnet
+++ b/cfg/pgrapher/experiment/icarus/wct-coherent-noise.jsonnet
@@ -48,8 +48,8 @@ local perfect = import 'pgrapher/experiment/icarus/chndb-base.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in anode_iota];
 
 local nf_maker = import 'pgrapher/experiment/icarus/nf.jsonnet';
@@ -72,13 +72,14 @@ local make_noise_model = function(anode, csdb=null) {
     name: "empericalnoise-" + anode.name,
     data: {
         anode: wc.tn(anode),
+        dft: wc.tn(tools.dft),
         chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
         spectra_file: params.files.noise,
         nsamples: params.daq.nticks,
         period: params.daq.tick,
         wire_length_scale: 1.0*wc.cm, // optimization binning
     },
-    uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+    uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
 };
 local noise_model = make_noise_model(mega_anode);
 local add_noise = function(model, n) g.pnode({
@@ -98,11 +99,12 @@ local add_coherent_noise = function(n) g.pnode({
       data: {
           spectra_file: params.files.coherent_noise,
           rng: wc.tn(tools.random),
+          dft: wc.tn(tools.dft),
           nsamples: params.daq.nticks,
           random_fluctuation_amplitude: 0.1,
           period: params.daq.tick,
           normalization: 1
-      }}, nin=1, nout=1, uses=[]);
+      }}, nin=1, nout=1, uses=[tools.random, tools.dft]);
 local coherent_noises = [add_coherent_noise(n) for n in std.range(0,3)];
 
 // local digitizer = sim.digitizer(mega_anode, name="digitizer", tag="orig");
diff --git a/cfg/pgrapher/experiment/icarus/wct-sim-check.jsonnet b/cfg/pgrapher/experiment/icarus/wct-sim-check.jsonnet
index 82548c030..0bf8b74f1 100644
--- a/cfg/pgrapher/experiment/icarus/wct-sim-check.jsonnet
+++ b/cfg/pgrapher/experiment/icarus/wct-sim-check.jsonnet
@@ -48,8 +48,8 @@ local perfect = import 'pgrapher/experiment/icarus/chndb-base.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in anode_iota];
 
 local nf_maker = import 'pgrapher/experiment/icarus/nf.jsonnet';
@@ -73,13 +73,14 @@ local make_noise_model = function(anode, csdb=null) {
     name: "empericalnoise-" + anode.name,
     data: {
         anode: wc.tn(anode),
+        dft: wc.tn(tools.dft),
         chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
         spectra_file: params.files.noise,
         nsamples: params.daq.nticks,
         period: params.daq.tick,
         wire_length_scale: 1.0*wc.cm, // optimization binning
     },
-    uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+    uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
 };
 local noise_model = make_noise_model(mega_anode);
 local add_noise = function(model, n) g.pnode({
@@ -87,10 +88,11 @@ local add_noise = function(model, n) g.pnode({
     name: "addnoise%d-" %n + model.name,
     data: {
         rng: wc.tn(tools.random),
+        dft: wc.tn(tools.dft),
         model: wc.tn(model),
   nsamples: params.daq.nticks,
         replacement_percentage: 0.02, // random optimization
-    }}, nin=1, nout=1, uses=[model]);
+    }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]);
 local noises = [add_noise(noise_model, n) for n in std.range(0,3)];
 
 // local digitizer = sim.digitizer(mega_anode, name="digitizer", tag="orig");
diff --git a/cfg/pgrapher/experiment/iceberg/nf.jsonnet b/cfg/pgrapher/experiment/iceberg/nf.jsonnet
index 5dc74f593..8a24d3f4a 100644
--- a/cfg/pgrapher/experiment/iceberg/nf.jsonnet
+++ b/cfg/pgrapher/experiment/iceberg/nf.jsonnet
@@ -6,7 +6,7 @@ local wc = import 'wirecell.jsonnet';
 function(params, anode, chndbobj, n, name='')
   {
     local status = {
-      type: 'mbOneChannelStatus',
+      type: std.trace("Warning MB in DUNE?", 'mbOneChannelStatus'),
       name: name,
       data: {
         Threshold: 3.5,
@@ -17,7 +17,7 @@ function(params, anode, chndbobj, n, name='')
       },
     },
     local single = {
-      type: 'mbOneChannelNoise',
+      type: std.trace("Warning MB in DUNE?", 'mbOneChannelNoise'),
       name: name,
       data: {
         noisedb: wc.tn(chndbobj),
@@ -25,7 +25,7 @@ function(params, anode, chndbobj, n, name='')
       },
     },
     local grouped = {
-      type: 'mbCoherentNoiseSub',
+      type: std.trace("Warning MB in DUNE?", 'mbCoherentNoiseSub'),
       name: name,
       data: {
         noisedb: wc.tn(chndbobj),
diff --git a/cfg/pgrapher/experiment/iceberg/sim.jsonnet b/cfg/pgrapher/experiment/iceberg/sim.jsonnet
index 27bcefb35..97fb8f680 100644
--- a/cfg/pgrapher/experiment/iceberg/sim.jsonnet
+++ b/cfg/pgrapher/experiment/iceberg/sim.jsonnet
@@ -46,13 +46,14 @@ function(params, tools) {
         name: "empericalnoise%s"% anode.name,
         data: {
             anode: wc.tn(anode),
+            dft: wc.tn(tools.dft),
             chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
             spectra_file: params.files.noise,
             nsamples: params.daq.nticks,
             period: params.daq.tick,
             wire_length_scale: 1.0*wc.cm, // optimization binning
         },
-        uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+        uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
     },
     local noise_models = [make_noise_model(anode) for anode in tools.anodes],
 
@@ -62,10 +63,11 @@ function(params, tools) {
         name: "addnoise%s"%[model.name],
         data: {
             rng: wc.tn(tools.random),
+            dft: wc.tn(tools.dft),
             model: wc.tn(model),
 	    nsamples: params.daq.nticks,
             replacement_percentage: 0.02, // random optimization
-        }}, nin=1, nout=1, uses=[model]),
+        }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]),
 
     local noises = [add_noise(model) for model in noise_models],
     
diff --git a/cfg/pgrapher/experiment/iceberg/sp.jsonnet b/cfg/pgrapher/experiment/iceberg/sp.jsonnet
index ffd9fee47..717231089 100644
--- a/cfg/pgrapher/experiment/iceberg/sp.jsonnet
+++ b/cfg/pgrapher/experiment/iceberg/sp.jsonnet
@@ -43,6 +43,7 @@ function(params, tools, override = {}) {
        *  Associated tuning in sp-filters.jsonnet
        */
       anode: wc.tn(anode),
+      dft: wc.tn(tools.dft),
       field_response: wc.tn(tools.field),
       elecresponse: wc.tn(tools.elec_resp),
       ftoffset: 0.0, // default 0.0
@@ -73,6 +74,6 @@ function(params, tools, override = {}) {
       wiener_threshold_tag: 'threshold%d' % anode.data.ident,
       gauss_tag: 'gauss%d' % anode.data.ident,
     } + override,
-  }, nin=1, nout=1, uses=[anode, tools.field, tools.elec_resp] + pc.uses + spfilt),
+  }, nin=1, nout=1, uses=[anode, tools.dft, tools.field, tools.elec_resp] + pc.uses + spfilt),
 
 }
diff --git a/cfg/pgrapher/experiment/iceberg/wcls-nf-sp.jsonnet b/cfg/pgrapher/experiment/iceberg/wcls-nf-sp.jsonnet
index 7c4e4b70a..e8a82b5f6 100644
--- a/cfg/pgrapher/experiment/iceberg/wcls-nf-sp.jsonnet
+++ b/cfg/pgrapher/experiment/iceberg/wcls-nf-sp.jsonnet
@@ -120,8 +120,8 @@ local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
   // data: perfect(params, tools.anodes[n], tools.field, n),
-  data: base(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: base(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 local nf_maker = import 'pgrapher/experiment/iceberg/nf.jsonnet';
diff --git a/cfg/pgrapher/experiment/iceberg/wcls-sp.jsonnet b/cfg/pgrapher/experiment/iceberg/wcls-sp.jsonnet
index 31de7f7a7..c1ba88b98 100644
--- a/cfg/pgrapher/experiment/iceberg/wcls-sp.jsonnet
+++ b/cfg/pgrapher/experiment/iceberg/wcls-sp.jsonnet
@@ -126,8 +126,8 @@ local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
   // data: perfect(params, tools.anodes[n], tools.field, n),
-  data: base(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: base(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 // an empty omnibus noise filter
diff --git a/cfg/pgrapher/experiment/pdsp/chndb.jsonnet b/cfg/pgrapher/experiment/pdsp/chndb.jsonnet
index f8cafaa6b..5c7ce3a95 100644
--- a/cfg/pgrapher/experiment/pdsp/chndb.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/chndb.jsonnet
@@ -8,8 +8,8 @@ function(params, tools) {
     perfect(anode) :: {
         type:'OmniChannelNoiseDB',
         name: 'ocndbperfect-' + anode.name,
-        data: base(params, anode, tools.field, anode.data.ident),
-        uses: [anode, tools.field],
+        data: base(params, anode, tools.field, anode.data.ident){dft:wc.tn(tools.dft)},
+        uses: [anode, tools.field, tools.dft],
     },
 
 }
diff --git a/cfg/pgrapher/experiment/pdsp/nf.jsonnet b/cfg/pgrapher/experiment/pdsp/nf.jsonnet
index 8f8345580..aff05f7d7 100644
--- a/cfg/pgrapher/experiment/pdsp/nf.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/nf.jsonnet
@@ -10,7 +10,7 @@ function(params, anode, chndbobj, n, name='', dft=default_dft) {
     local single = {
         type: 'pdOneChannelNoise',
         name: name,
-        uses: [dft],
+        uses: [dft, chndbobj, anode],
         data: {
             noisedb: wc.tn(chndbobj),
             anode: wc.tn(anode),
@@ -25,15 +25,18 @@ function(params, anode, chndbobj, n, name='', dft=default_dft) {
     local grouped = {
         type: 'mbCoherentNoiseSub',
         name: name,
+        uses: [dft, chndbobj, anode],
         data: {
             noisedb: wc.tn(chndbobj),
             anode: wc.tn(anode),
+            dft: wc.tn(dft),
             rms_threshold: 0.0,
         },
     },
     local sticky = {
         type: 'pdStickyCodeMitig',
         name: name,
+        uses: [dft, chndbobj, anode],
         data: {
             extra_stky: [
                 {channels: std.range(n * 2560, (n + 1) * 2560 - 1), bits: [0,1,63]},
@@ -46,6 +49,7 @@ function(params, anode, chndbobj, n, name='', dft=default_dft) {
             ],
             noisedb: wc.tn(chndbobj),
             anode: wc.tn(anode),
+            dft: wc.tn(dft),
             stky_sig_like_val: 15.0,
             stky_sig_like_rms: 2.0,
             stky_max_len: 10,
@@ -54,6 +58,7 @@ function(params, anode, chndbobj, n, name='', dft=default_dft) {
     local gaincalib = {
         type: 'pdRelGainCalib',
         name: name,
+        uses: [chndbobj, anode],
         data: {
             noisedb: wc.tn(chndbobj),
             anode: wc.tn(anode),
diff --git a/cfg/pgrapher/experiment/pdsp/sim.jsonnet b/cfg/pgrapher/experiment/pdsp/sim.jsonnet
index d03dc5391..7ac5213ef 100644
--- a/cfg/pgrapher/experiment/pdsp/sim.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/sim.jsonnet
@@ -46,13 +46,14 @@ function(params, tools) {
         name: "empericalnoise-" + anode.name,
         data: {
             anode: wc.tn(anode),
+            dft: wc.tn(tools.dft),
             chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
             spectra_file: params.files.noise,
             nsamples: params.daq.nticks,
             period: params.daq.tick,
             wire_length_scale: 1.0*wc.cm, // optimization binning
         },
-        uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+        uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
     },
     local noise_models = [make_noise_model(anode) for anode in tools.anodes],
 
@@ -62,10 +63,11 @@ function(params, tools) {
         name: "addnoise-" + model.name,
         data: {
             rng: wc.tn(tools.random),
+            dft: wc.tn(tools.dft),
             model: wc.tn(model),
 	    nsamples: params.daq.nticks,
             replacement_percentage: 0.02, // random optimization
-        }}, nin=1, nout=1, uses=[model]),
+        }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]),
 
     local noises = [add_noise(model) for model in noise_models],
     
diff --git a/cfg/pgrapher/experiment/pdsp/sp.jsonnet b/cfg/pgrapher/experiment/pdsp/sp.jsonnet
index 2c9a30339..37559412f 100644
--- a/cfg/pgrapher/experiment/pdsp/sp.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/sp.jsonnet
@@ -47,6 +47,7 @@ function(params, tools, override = {}) {
        *  Associated tuning in sp-filters.jsonnet
        */
       anode: wc.tn(anode),
+      dft: wc.tn(tools.dft),
       field_response: wc.tn(tools.field),
       elecresponse: wc.tn(tools.elec_resp),
       ftoffset: 0.0, // default 0.0
@@ -95,6 +96,6 @@ function(params, tools, override = {}) {
       // process_planes: [0, 2],
 
     } + override,
-  }, nin=1, nout=1, uses=[anode, tools.field, tools.elec_resp] + pc.uses + spfilt),
+  }, nin=1, nout=1, uses=[anode, tools.dft, tools.field, tools.elec_resp] + pc.uses + spfilt),
 
 }
diff --git a/cfg/pgrapher/experiment/pdsp/wcls-nf-sp.jsonnet b/cfg/pgrapher/experiment/pdsp/wcls-nf-sp.jsonnet
index a0759b370..c427d5899 100644
--- a/cfg/pgrapher/experiment/pdsp/wcls-nf-sp.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/wcls-nf-sp.jsonnet
@@ -123,8 +123,8 @@ local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
   // data: perfect(params, tools.anodes[n], tools.field, n),
-  data: base(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: base(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 local nf_maker = import 'pgrapher/experiment/pdsp/nf.jsonnet';
diff --git a/cfg/pgrapher/experiment/pdsp/wcls-raw-to-sig.jsonnet b/cfg/pgrapher/experiment/pdsp/wcls-raw-to-sig.jsonnet
index 037db3ca4..1640a131a 100644
--- a/cfg/pgrapher/experiment/pdsp/wcls-raw-to-sig.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/wcls-raw-to-sig.jsonnet
@@ -88,8 +88,8 @@ local chndb = [{
     type: 'OmniChannelNoiseDB',
     name: 'ocndbperfect%d' % n,
     // data: perfect(params, tools.anodes[n], tools.field, n),
-    data: base(params, tools.anodes[n], tools.field, n),
-    uses: [tools.anodes[n], tools.field],  // pnode extension
+    data: base(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+    uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in anode_iota];
 
 local nf_maker = import 'pgrapher/experiment/pdsp/nf.jsonnet';
diff --git a/cfg/pgrapher/experiment/pdsp/wcls-sim-drift-simchannel.jsonnet b/cfg/pgrapher/experiment/pdsp/wcls-sim-drift-simchannel.jsonnet
index 9d4e3b714..ed4b755dc 100644
--- a/cfg/pgrapher/experiment/pdsp/wcls-sim-drift-simchannel.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/wcls-sim-drift-simchannel.jsonnet
@@ -105,8 +105,8 @@ local perfect = import 'pgrapher/experiment/pdsp/chndb-perfect.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in anode_iota];
 
 //local chndb_maker = import 'pgrapher/experiment/pdsp/chndb.jsonnet';
diff --git a/cfg/pgrapher/experiment/pdsp/wcls-sp.jsonnet b/cfg/pgrapher/experiment/pdsp/wcls-sp.jsonnet
index 328504c6e..c54b44405 100644
--- a/cfg/pgrapher/experiment/pdsp/wcls-sp.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/wcls-sp.jsonnet
@@ -129,8 +129,8 @@ local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
   // data: perfect(params, tools.anodes[n], tools.field, n),
-  data: base(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: base(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 // local nf_maker = import 'pgrapher/experiment/pdsp/nf.jsonnet';
diff --git a/cfg/pgrapher/experiment/pdsp/wct-sim-check.jsonnet b/cfg/pgrapher/experiment/pdsp/wct-sim-check.jsonnet
index ddef2ccb2..9872f4cd6 100644
--- a/cfg/pgrapher/experiment/pdsp/wct-sim-check.jsonnet
+++ b/cfg/pgrapher/experiment/pdsp/wct-sim-check.jsonnet
@@ -99,8 +99,8 @@ local perfect = import 'pgrapher/experiment/pdsp/chndb-base.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 //local chndb_maker = import 'pgrapher/experiment/pdsp/chndb.jsonnet';
diff --git a/cfg/pgrapher/experiment/sbnd/chndb.jsonnet b/cfg/pgrapher/experiment/sbnd/chndb.jsonnet
index f8cafaa6b..5c7ce3a95 100644
--- a/cfg/pgrapher/experiment/sbnd/chndb.jsonnet
+++ b/cfg/pgrapher/experiment/sbnd/chndb.jsonnet
@@ -8,8 +8,8 @@ function(params, tools) {
     perfect(anode) :: {
         type:'OmniChannelNoiseDB',
         name: 'ocndbperfect-' + anode.name,
-        data: base(params, anode, tools.field, anode.data.ident),
-        uses: [anode, tools.field],
+        data: base(params, anode, tools.field, anode.data.ident){dft:wc.tn(tools.dft)},
+        uses: [anode, tools.field, tools.dft],
     },
 
 }
diff --git a/cfg/pgrapher/experiment/sbnd/nf.jsonnet b/cfg/pgrapher/experiment/sbnd/nf.jsonnet
index 0b8d95072..af61fc6b7 100644
--- a/cfg/pgrapher/experiment/sbnd/nf.jsonnet
+++ b/cfg/pgrapher/experiment/sbnd/nf.jsonnet
@@ -4,14 +4,18 @@ local g = import 'pgraph.jsonnet';
 local wc = import 'wirecell.jsonnet';
 local gainmap = import 'pgrapher/experiment/sbnd/chndb-rel-gain.jsonnet';
 
-function(params, anode, chndbobj, n, name='')
+local default_dft = { type: 'FftwDFT' };
+
+function(params, anode, chndbobj, n, name='', dft=default_dft)
   {
     local single = {
       type: 'pdOneChannelNoise',
       name: name,
+      uses: [dft, chndbobj, anode],
       data: {
         noisedb: wc.tn(chndbobj),
         anode: wc.tn(anode),
+        dft: wc.tn(dft),
         resmp: [
           {channels: std.range(2128, 2175), sample_from: 5996},
           {channels: std.range(1520, 1559), sample_from: 5996},
@@ -22,15 +26,18 @@ function(params, anode, chndbobj, n, name='')
     local grouped = {
       type: 'mbCoherentNoiseSub',
       name: name,
+      uses: [dft, chndbobj, anode],
       data: {
         noisedb: wc.tn(chndbobj),
         anode: wc.tn(anode),
+        dft: wc.tn(dft),
         rms_threshold: 0.0,
       },
     },
     local sticky = {
       type: 'pdStickyCodeMitig',
       name: name,
+      uses: [dft, chndbobj, anode],
       data: {
         extra_stky: [
           {channels: std.range(n * 2560, (n + 1) * 2560 - 1), bits: [0,1,63]},
@@ -43,6 +50,7 @@ function(params, anode, chndbobj, n, name='')
         ],
         noisedb: wc.tn(chndbobj),
         anode: wc.tn(anode),
+        dft: wc.tn(dft),
         stky_sig_like_val: 15.0,
         stky_sig_like_rms: 2.0,
         stky_max_len: 10,
diff --git a/cfg/pgrapher/experiment/sbnd/sim.jsonnet b/cfg/pgrapher/experiment/sbnd/sim.jsonnet
index d03dc5391..7ac5213ef 100644
--- a/cfg/pgrapher/experiment/sbnd/sim.jsonnet
+++ b/cfg/pgrapher/experiment/sbnd/sim.jsonnet
@@ -46,13 +46,14 @@ function(params, tools) {
         name: "empericalnoise-" + anode.name,
         data: {
             anode: wc.tn(anode),
+            dft: wc.tn(tools.dft),
             chanstat: if std.type(csdb) == "null" then "" else wc.tn(csdb),
             spectra_file: params.files.noise,
             nsamples: params.daq.nticks,
             period: params.daq.tick,
             wire_length_scale: 1.0*wc.cm, // optimization binning
         },
-        uses: [anode] + if std.type(csdb) == "null" then [] else [csdb],
+        uses: [anode, tools.dft] + if std.type(csdb) == "null" then [] else [csdb],
     },
     local noise_models = [make_noise_model(anode) for anode in tools.anodes],
 
@@ -62,10 +63,11 @@ function(params, tools) {
         name: "addnoise-" + model.name,
         data: {
             rng: wc.tn(tools.random),
+            dft: wc.tn(tools.dft),
             model: wc.tn(model),
 	    nsamples: params.daq.nticks,
             replacement_percentage: 0.02, // random optimization
-        }}, nin=1, nout=1, uses=[model]),
+        }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]),
 
     local noises = [add_noise(model) for model in noise_models],
     
diff --git a/cfg/pgrapher/experiment/sbnd/sp.jsonnet b/cfg/pgrapher/experiment/sbnd/sp.jsonnet
index fd767ced4..f6bfe4fe7 100644
--- a/cfg/pgrapher/experiment/sbnd/sp.jsonnet
+++ b/cfg/pgrapher/experiment/sbnd/sp.jsonnet
@@ -47,6 +47,7 @@ function(params, tools, override = {}) {
        *  Associated tuning in sp-filters.jsonnet
        */
       anode: wc.tn(anode),
+      dft: wc.tn(tools.dft),
       field_response: wc.tn(tools.field),
       elecresponse: wc.tn(tools.elec_resp),
       ftoffset: 0.0, // default 0.0
@@ -95,6 +96,6 @@ function(params, tools, override = {}) {
       // process_planes: [0, 2],
 
     } + override,
-  }, nin=1, nout=1, uses=[anode, tools.field, tools.elec_resp] + pc.uses + spfilt),
+  }, nin=1, nout=1, uses=[anode, tools.dft, tools.field, tools.elec_resp] + pc.uses + spfilt),
 
 }
diff --git a/cfg/pgrapher/experiment/sbnd/wcls-nf-sp.jsonnet b/cfg/pgrapher/experiment/sbnd/wcls-nf-sp.jsonnet
index 9b5dbcde8..fc79aa23a 100644
--- a/cfg/pgrapher/experiment/sbnd/wcls-nf-sp.jsonnet
+++ b/cfg/pgrapher/experiment/sbnd/wcls-nf-sp.jsonnet
@@ -123,8 +123,8 @@ local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
   // data: perfect(params, tools.anodes[n], tools.field, n),
-  data: base(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: base(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 // local nf_maker = import 'pgrapher/experiment/pdsp/nf.jsonnet';
diff --git a/cfg/pgrapher/experiment/sbnd/wcls-sim-drift-simchannel.jsonnet b/cfg/pgrapher/experiment/sbnd/wcls-sim-drift-simchannel.jsonnet
index f9754299c..8d9aec3c6 100644
--- a/cfg/pgrapher/experiment/sbnd/wcls-sim-drift-simchannel.jsonnet
+++ b/cfg/pgrapher/experiment/sbnd/wcls-sim-drift-simchannel.jsonnet
@@ -100,8 +100,8 @@ local perfect = import 'pgrapher/experiment/sbnd/chndb-perfect.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in anode_iota];
 
 //local chndb_maker = import 'pgrapher/experiment/sbnd/chndb.jsonnet';
diff --git a/cfg/pgrapher/experiment/sbnd/wct-sim-check.jsonnet b/cfg/pgrapher/experiment/sbnd/wct-sim-check.jsonnet
index ca40e10b1..24216ec06 100644
--- a/cfg/pgrapher/experiment/sbnd/wct-sim-check.jsonnet
+++ b/cfg/pgrapher/experiment/sbnd/wct-sim-check.jsonnet
@@ -58,8 +58,8 @@ local perfect = import 'pgrapher/experiment/sbnd/chndb-base.jsonnet';
 local chndb = [{
   type: 'OmniChannelNoiseDB',
   name: 'ocndbperfect%d' % n,
-  data: perfect(params, tools.anodes[n], tools.field, n),
-  uses: [tools.anodes[n], tools.field],  // pnode extension
+  data: perfect(params, tools.anodes[n], tools.field, n){dft:wc.tn(tools.dft)},
+  uses: [tools.anodes[n], tools.field, tools.dft],
 } for n in std.range(0, std.length(tools.anodes) - 1)];
 
 //local chndb_maker = import 'pgrapher/experiment/sbnd/chndb.jsonnet';
diff --git a/cfg/pgrapher/experiment/uboone/chndb.jsonnet b/cfg/pgrapher/experiment/uboone/chndb.jsonnet
index 209559aab..ddbc73640 100644
--- a/cfg/pgrapher/experiment/uboone/chndb.jsonnet
+++ b/cfg/pgrapher/experiment/uboone/chndb.jsonnet
@@ -11,11 +11,11 @@ function(params, tools)
     wct: function(epoch="before") {
         type: "OmniChannelNoiseDB",
         name: "ocndb%s"%epoch,
-        data :
+        data : {dft: wc.tn(tools.dft)}
         if epoch == "perfect"
         then perfect(params, tools.anode, tools.field)
         else base(params, tools.anode, tools.field, rms_cuts[epoch]),
-        uses: [tools.anode, tools.field],    // pnode extension
+        uses: [tools.anode, tools.field, tools.dft],
     },
 
     wcls: function(epoch="before") {
diff --git a/cfg/pgrapher/experiment/uboone/nf.jsonnet b/cfg/pgrapher/experiment/uboone/nf.jsonnet
index a030091a3..081f9e7c5 100644
--- a/cfg/pgrapher/experiment/uboone/nf.jsonnet
+++ b/cfg/pgrapher/experiment/uboone/nf.jsonnet
@@ -23,24 +23,30 @@ function(params, tools, chndbobj, name="")
             Window: 5,
             Nbins: 250,
             Cut: 14,
-            anode: wc.tn(tools.anode)
-        },            
+            anode: wc.tn(tools.anode),
+            dft: wc.tn(tools.dft),
+        },
+        uses: [tools.anode, tools.dft],
     },
     local single = {
         type: "mbOneChannelNoise",
         name:name,
         data: {
             noisedb: wc.tn(chndbobj),
-            anode: wc.tn(tools.anode)
-        }
+            anode: wc.tn(tools.anode),
+            dft: wc.tn(tools.dft),
+        },
+        uses: [tools.anode, tools.dft, chndbobj],
     },
     local grouped = {
         type: "mbCoherentNoiseSub",
         name:name,
         data: {
             noisedb: wc.tn(chndbobj),
-            anode: wc.tn(tools.anode)
-        }
+            anode: wc.tn(tools.anode),
+            dft: wc.tn(tools.dft),
+        },
+        uses: [tools.anode, tools.dft, chndbobj],
     },
 
     local obnf = g.pnode({
diff --git a/cfg/pgrapher/experiment/uboone/nodes.jsonnet b/cfg/pgrapher/experiment/uboone/nodes.jsonnet
index 4386e02f3..83de781d7 100644
--- a/cfg/pgrapher/experiment/uboone/nodes.jsonnet
+++ b/cfg/pgrapher/experiment/uboone/nodes.jsonnet
@@ -98,18 +98,19 @@ local g = import "pgraph.jsonnet";
 
         
     // Make a noise model bound to an anode and a channel status
-    local make_noise_model = function(anode, csdb) {
+    local make_noise_model = function(anode, csdb, dft={type:"FftwDFT"}) {
         type: "EmpiricalNoiseModel",
         name: "empericalnoise%s"% csdb.name,
         data: {
             anode: wc.tn(anode),
+            dft: wc.tn(dft),
             chanstat: wc.tn(csdb),
             spectra_file: params.files.noise,
             nsamples: params.daq.nticks,
             period: params.daq.tick,
             wire_length_scale: 1.0*wc.cm, // optimization binning
         },
-        uses: [anode, csdb],
+        uses: [anode, dft, csdb],
     },
 
 
@@ -118,7 +119,8 @@ local g = import "pgraph.jsonnet";
         type: "NoiseSource",
         name: "%s%s"%[anode.name, model.name],
         data: params.daq {
-            rng: wc.tn(tools.random),
+            rng: wc.tn(tools.random), // this is going to fail, is this file even used?
+            dft: wc.tn(dft),
             model: wc.tn(model),
 	    anode: wc.tn(anode),
 
@@ -127,7 +129,7 @@ local g = import "pgraph.jsonnet";
             readout_time: params.daq.readout_time,
             sample_period: params.daq.tick,
             first_frame_number: params.daq.first_frame_number,
-        }}, nin=0, nout=1, uses=[anode, model]),
+        }}, nin=0, nout=1, uses=[anode, model, dft]),
 
 
     local noise_summer = g.pnode({
diff --git a/cfg/pgrapher/experiment/uboone/sim.jsonnet b/cfg/pgrapher/experiment/uboone/sim.jsonnet
index 45d9b15c4..1a46178c8 100644
--- a/cfg/pgrapher/experiment/uboone/sim.jsonnet
+++ b/cfg/pgrapher/experiment/uboone/sim.jsonnet
@@ -82,13 +82,14 @@ function(params, tools)
         name: "empericalnoise%s"% csdb.name,
         data: {
             anode: wc.tn(anode),
+            dft: wc.tn(tools.dft),
             chanstat: wc.tn(csdb),
             spectra_file: params.files.noise,
             nsamples: params.daq.nticks,
             period: params.daq.tick,
             wire_length_scale: 1.0*wc.cm, // optimization binning
         },
-        uses: [anode, csdb],
+        uses: [anode, csdb, tools.dft],
     },
 
 
@@ -98,10 +99,11 @@ function(params, tools)
         name: "addnoise%s"%[model.name],
         data: {
             rng: wc.tn(tools.random),
+            dft: wc.tn(tools.dft),
             model: wc.tn(model),
 	    nsamples: params.daq.nticks,
 	    replacement_percentage: 0.02, // random optimization
-        }}, nin=1, nout=1, uses=[model]),
+        }}, nin=1, nout=1, uses=[tools.random, tools.dft, model]),
 
     ret: {
         signal : signal,
diff --git a/cfg/pgrapher/experiment/uboone/sp.jsonnet b/cfg/pgrapher/experiment/uboone/sp.jsonnet
index 03a4ac0eb..697289547 100644
--- a/cfg/pgrapher/experiment/uboone/sp.jsonnet
+++ b/cfg/pgrapher/experiment/uboone/sp.jsonnet
@@ -15,6 +15,7 @@ function(params, tools) {
             // codes a slew of SP filter component names which MUST
             // correctly match what is provided in sp-filters.jsonnet.
             anode: wc.tn(tools.anode),
+            dft: wc.tn(tools.dft),
             field_response: wc.tn(tools.field),
             elecresponse: wc.tn(tools.elec_resp),
             postgain: 1,  // default 1.2
@@ -22,11 +23,13 @@ function(params, tools) {
             per_chan_resp: wc.tn(tools.perchanresp),
 	    fft_flag: 0,   // 1 is faster but higher memory, 0 is slightly slower but lower memory
         }
-    }, nin=1,nout=1, uses=[tools.anode, tools.field, tools.elec_resp, tools.perchanresp] + import "sp-filters.jsonnet"),
-local sigproc_uniform = g.pnode({
+    }, nin=1,nout=1, uses=[tools.anode, tools.dft, tools.field, tools.elec_resp, tools.perchanresp] + import "sp-filters.jsonnet"),
+
+    local sigproc_uniform = g.pnode({
         type: "OmnibusSigProc",
         data: {
             anode: wc.tn(tools.anode),
+            dft: wc.tn(tools.dft),
             field_response: wc.tn(tools.field),
             elecresponse: wc.tn(tools.elec_resp),
             postgain: 1,  // default 1.2
@@ -37,9 +40,10 @@ local sigproc_uniform = g.pnode({
 	    // r_fake_signal_low_th: 300,
 	    // r_fake_signal_high_th: 600,
         }
-    }, nin=1,nout=1,uses=[tools.anode, tools.field, tools.elec_resp] + import "sp-filters.jsonnet"),
-// ch-by-ch response correction in SP turn off by setting null input
-local sigproc = if std.type(params.files.chresp)=='null'
+    }, nin=1,nout=1,uses=[tools.anode, tools.dft, tools.field, tools.elec_resp] + import "sp-filters.jsonnet"),
+
+    // ch-by-ch response correction in SP turn off by setting null input
+    local sigproc = if std.type(params.files.chresp)=='null'
                     then sigproc_uniform
                     else sigproc_perchan,
 
@@ -72,6 +76,7 @@ local sigproc = if std.type(params.files.chresp)=='null'
     local l1spfilter = g.pnode({
         type: "L1SPFilter",
         data: {
+            dft: wc.tn(tools.dft),
             fields: wc.tn(tools.field),
             filter: [0.000305453, 0.000978027, 0.00277049, 0.00694322, 0.0153945,
                      0.0301973, 0.0524048, 0.0804588, 0.109289, 0.131334, 0.139629,
@@ -103,7 +108,7 @@ local sigproc = if std.type(params.files.chresp)=='null'
             sigtag: "gauss",                           // trace tag of input signal
             outtag: "l1sp",                            // trace tag for output signal
         }
-    }, nin=1, nout=1, uses=[tools.field]),
+    }, nin=1, nout=1, uses=[tools.dft, tools.field]),
 
     // merge the split output from NF ("raw" tag) and just the "gauss"
     // from normal SP for input to L1SP
diff --git a/cfg/test/test_multiductor.jsonnet b/cfg/test/test_multiductor.jsonnet
index c90f3e7d4..f170ca358 100644
--- a/cfg/test/test_multiductor.jsonnet
+++ b/cfg/test/test_multiductor.jsonnet
@@ -4,6 +4,8 @@
 
 local wc = import "wirecell.jsonnet";
 
+local dft = {type:'FftwDFT'};
+
 
 // special wire-cell command line configuration just to save us typing.
 local cmdline = {
@@ -144,10 +146,12 @@ local noise_model = {
         // fixme: replace this with various models for DUNE, for now,
         // just pretend to be microboone.
         anode: wc.tn(anode_nominal),
+        dft: dft,
         spectra_file: "microboone-noise-spectra-v2.json.bz2",
         chanstat: "StaticChannelStatus",
         nsamples: params.daq.ticks_per_readout,
-    }
+    },
+    uses: [dft],
 };
 local noise_source = {
     type: "NoiseSource",

From 1f282d5a635340d91ce288bf45314b3d79c23b06 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Fri, 3 Dec 2021 11:51:50 -0500
Subject: [PATCH 43/46] Remove previously commented-out old-style dft()/idft()
 calls

---
 gen/src/AddCoherentNoise.cxx         |   1 -
 gen/src/EmpiricalNoiseModel.cxx      |  18 ---
 gen/src/ImpactData.cxx               |   2 -
 gen/src/ImpactTransform.cxx          |  26 +---
 gen/src/Noise.cxx                    |   2 -
 gen/src/PlaneImpactResponse.cxx      |   4 -
 gen/src/TruthTraceID.cxx             |   2 -
 sig/src/Decon2DFilter.cxx            |   1 -
 sig/src/Decon2DResponse.cxx          |  13 --
 sigproc/src/L1SPFilter.cxx           |   5 -
 sigproc/src/Microboone.cxx           |   7 -
 sigproc/src/OmniChannelNoiseDB.cxx   |   5 -
 sigproc/src/OmnibusSigProc.cxx       |  18 ---
 sigproc/src/Protodune.cxx            |  12 --
 sigproc/src/SimpleChannelNoiseDB.cxx |   3 -
 util/inc/WireCellUtil/Array.h        |  63 --------
 util/inc/WireCellUtil/Waveform.h     |  47 ------
 util/src/Array.cxx                   | 209 ---------------------------
 util/src/Waveform.cxx                |  79 ----------
 19 files changed, 2 insertions(+), 515 deletions(-)

diff --git a/gen/src/AddCoherentNoise.cxx b/gen/src/AddCoherentNoise.cxx
index cd2c7e7bd..9c6a02082 100644
--- a/gen/src/AddCoherentNoise.cxx
+++ b/gen/src/AddCoherentNoise.cxx
@@ -147,7 +147,6 @@ bool Gen::AddCoherentNoise::operator()(const input_pointer& inframe, output_poin
             noise_freq[i] = tc;
         }
 
-        // Waveform::realseq_t wave = WireCell::Waveform::idft(noise_freq);
         auto wave = Waveform::real(Aux::inv(m_dft, noise_freq));
 
         // Add signal (be careful to double counting with the incoherent noise)
diff --git a/gen/src/EmpiricalNoiseModel.cxx b/gen/src/EmpiricalNoiseModel.cxx
index 79db5a957..cfc87dc19 100644
--- a/gen/src/EmpiricalNoiseModel.cxx
+++ b/gen/src/EmpiricalNoiseModel.cxx
@@ -48,8 +48,6 @@ Gen::EmpiricalNoiseModel::~EmpiricalNoiseModel() {}
 
 void Gen::EmpiricalNoiseModel::gen_elec_resp_default()
 {
-    // double shaping[5]={1,1.1,2,2.2,3}; // us
-
     // calculate the frequencies ...
     m_elec_resp_freq.resize(m_fft_length, 0);
     for (unsigned int i = 0; i != m_elec_resp_freq.size(); i++) {
@@ -61,21 +59,7 @@ void Gen::EmpiricalNoiseModel::gen_elec_resp_default()
             m_elec_resp_freq.at(i) = (m_elec_resp_freq.size() - i) / (m_elec_resp_freq.size() * 1.0) * 1. /
                                      m_period;  // the second half is useless ...
         }
-
-        // if (m_elec_resp_freq.at(i) > 1./m_period / 2.){
-        //   m_elec_resp_freq.resize(i);
-        //   break;
-        // }
     }
-
-    // for (int i=0;i!=5;i++){
-    //   Response::ColdElec elec_resp(1, shaping[i]); // default at 1 mV/fC
-    //   auto sig   =   elec_resp.generate(WireCell::Waveform::Domain(0, m_fft_length*m_period), m_fft_length);
-    //   auto filt   = Waveform::dft(sig);
-    //   int nconfig = shaping[i]/ 0.1;
-    //   auto ele_resp_amp = Waveform::magnitude(filt);
-    //   m_elec_resp_cache[nconfig] = ele_resp_amp;
-    // }
 }
 
 WireCell::Configuration Gen::EmpiricalNoiseModel::default_configuration() const
@@ -358,7 +342,6 @@ const IChannelSpectrum::amplitude_t& Gen::EmpiricalNoiseModel::operator()(int ch
         if (resp1 == m_elec_resp_cache.end()) {
             Response::ColdElec elec_resp(10, ch_shaping);  // default at 1 mV/fC
             auto sig = elec_resp.generate(WireCell::Waveform::Domain(0, m_fft_length * m_period), m_fft_length);
-            //auto filt = Waveform::dft(sig);
             auto filt = Aux::fwd_r2c(m_dft, sig);
             auto ele_resp_amp = Waveform::magnitude(filt);
 
@@ -372,7 +355,6 @@ const IChannelSpectrum::amplitude_t& Gen::EmpiricalNoiseModel::operator()(int ch
         if (resp2 == m_elec_resp_cache.end()) {
             Response::ColdElec elec_resp(10, db_shaping);  // default at 1 mV/fC
             auto sig = elec_resp.generate(WireCell::Waveform::Domain(0, m_fft_length * m_period), m_fft_length);
-            // auto filt = Waveform::dft(sig);
             auto filt = Aux::fwd_r2c(m_dft, sig);
             auto ele_resp_amp = Waveform::magnitude(filt);
 
diff --git a/gen/src/ImpactData.cxx b/gen/src/ImpactData.cxx
index 89191abc8..09c8c093a 100644
--- a/gen/src/ImpactData.cxx
+++ b/gen/src/ImpactData.cxx
@@ -56,9 +56,7 @@ void Gen::ImpactData::calculate(const IDFT::pointer& dft, int nticks) const
         }
     }
 
-    // m_spectrum = Waveform::dft(m_waveform);
     m_spectrum = Aux::fwd_r2c(dft, m_waveform);
-    // m_weight_spectrum = Waveform::dft(m_weights);
     m_weight_spectrum = Aux::fwd_r2c(dft, m_weights);
 }
 
diff --git a/gen/src/ImpactTransform.cxx b/gen/src/ImpactTransform.cxx
index abcebfc21..183a44fc8 100644
--- a/gen/src/ImpactTransform.cxx
+++ b/gen/src/ImpactTransform.cxx
@@ -142,9 +142,7 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
         m_vec_vec_charge.at(ii).shrink_to_fit();
 
         // Do FFT on time
-        // c_data = Array::dft_cc(c_data, 0);
         // Do FFT on wire
-        // c_data = Array::dft_cc(c_data, 1);
         c_data = Aux::fwd(m_dft, c_data);
 
         // std::cout << i << std::endl;
@@ -154,7 +152,6 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             {
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[0]->spectrum();
                 // do a inverse FFT
-                // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
                 Waveform::realseq_t rs1_t = Aux::inv_c2r(m_dft, rs1);
                 // pick the first xxx ticks
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
@@ -163,7 +160,6 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                     rs1_reduced.at(icol) = rs1_t[icol];
                 }
                 // do a FFT
-                // rs1 = Waveform::dft(rs1_reduced);
                 rs1 = Aux::fwd_r2c(m_dft, rs1_reduced);
 
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
@@ -173,24 +169,20 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
 
             for (int irow = 0; irow != m_num_pad_wire; irow++) {
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[irow + 1]->spectrum();
-                // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
                 Waveform::realseq_t rs1_t = Aux::inv_c2r(m_dft, rs1);
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs1_t.size())) break;
                     rs1_reduced.at(icol) = rs1_t[icol];
                 }
-                // rs1 = Waveform::dft(rs1_reduced);
                 rs1 = Aux::fwd_r2c(m_dft, rs1_reduced);
                 Waveform::compseq_t rs2 = m_vec_map_resp.at(i)[-irow - 1]->spectrum();
-                // Waveform::realseq_t rs2_t = Waveform::idft(rs2);
                 Waveform::realseq_t rs2_t = Aux::inv_c2r(m_dft, rs2);
                 Waveform::realseq_t rs2_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs2_t.size())) break;
                     rs2_reduced.at(icol) = rs2_t[icol];
                 }
-                //rs2 = Waveform::dft(rs2_reduced);
                 rs2 = Aux::fwd_r2c(m_dft, rs2_reduced);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     resp_f_w(irow + 1, icol) = rs1[icol];
@@ -200,7 +192,7 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             // std::cout << i << std::endl;
 
             // Do FFT on wire for response // slight larger
-            // resp_f_w = Array::dft_cc(resp_f_w, 1);  // Now becomes the f and f in both time and wire domain ...
+            // Now becomes the f and f in both time and wire domain ...
             resp_f_w = Aux::fwd(m_dft, resp_f_w, 0);
 
             // multiply them together
@@ -208,7 +200,6 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
         }
 
         // Do inverse FFT on wire
-        // c_data = Array::idft_cc(c_data, 1);
         c_data = Aux::inv(m_dft, c_data, 0);
 
         // Add to wire result in frequency
@@ -238,9 +229,7 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             m_vec_vec_charge.at(i).shrink_to_fit();
 
             // Do FFT on time
-            // data_f_w = Array::dft_rc(data_t_w, 0);
             // Do FFT on wire
-            // data_f_w = Array::dft_cc(data_f_w, 1);
             data_f_w = data_t_w.cast<IDFT::complex_t>();
             data_f_w = Aux::fwd(m_dft, data_f_w);
 
@@ -254,7 +243,6 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[0]->spectrum();
 
                 // do a inverse FFT
-                // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
                 Waveform::realseq_t rs1_t = Aux::inv_c2r(m_dft, rs1);
                 // pick the first xxx ticks
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
@@ -265,7 +253,6 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                     //  std::cout << icol << " " << rs1_t[icol] << std::endl;
                 }
                 // do a FFT
-                // rs1 = Waveform::dft(rs1_reduced);
                 rs1 = Aux::fwd_r2c(m_dft, rs1_reduced);
 
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
@@ -275,24 +262,20 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
             }
             for (int irow = 0; irow != m_num_pad_wire; irow++) {
                 Waveform::compseq_t rs1 = m_vec_map_resp.at(i)[irow + 1]->spectrum();
-                // Waveform::realseq_t rs1_t = Waveform::idft(rs1);
                 Waveform::realseq_t rs1_t = Aux::inv_c2r(m_dft, rs1);
                 Waveform::realseq_t rs1_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs1_t.size())) break;
                     rs1_reduced.at(icol) = rs1_t[icol];
                 }
-                // rs1 = Waveform::dft(rs1_reduced);
                 rs1 = Aux::fwd_r2c(m_dft, rs1_reduced);
                 Waveform::compseq_t rs2 = m_vec_map_resp.at(i)[-irow - 1]->spectrum();
-                // Waveform::realseq_t rs2_t = Waveform::idft(rs2);
                 Waveform::realseq_t rs2_t = Aux::inv_c2r(m_dft, rs2);
                 Waveform::realseq_t rs2_reduced(m_end_tick - m_start_tick, 0);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     if (icol >= int(rs2_t.size())) break;
                     rs2_reduced.at(icol) = rs2_t[icol];
                 }
-                // rs2 = Waveform::dft(rs2_reduced);
                 rs2 = Aux::fwd_r2c(m_dft, rs2_reduced);
                 for (int icol = 0; icol != m_end_tick - m_start_tick; icol++) {
                     resp_f_w(irow + 1, icol) = rs1[icol];
@@ -300,21 +283,19 @@ Gen::ImpactTransform::ImpactTransform(IPlaneImpactResponse::pointer pir,
                 }
             }
             // Do FFT on wire for response // slight larger
-            // resp_f_w = Array::dft_cc(resp_f_w, 1);  // Now becomes the f and f in both time and wire domain ...
+            // Now becomes the f and f in both time and wire domain ...
             resp_f_w = Aux::fwd(m_dft, resp_f_w, 0);
             // multiply them together
             data_f_w = data_f_w * resp_f_w;
         }
 
         // Do inverse FFT on wire
-        // data_f_w = Array::idft_cc(data_f_w, 1);
         data_f_w = Aux::inv(m_dft, data_f_w, 0);
 
         // Add to wire result in frequency
         acc_data_f_w += data_f_w;
     }
 
-    // acc_data_f_w = Array::idft_cc(acc_data_f_w, 0);
     acc_data_f_w = Aux::inv(m_dft, acc_data_f_w, 1); 
     Array::array_xxf real_m_decon_data = acc_data_f_w.real();
     Array::array_xxf img_m_decon_data = acc_data_f_w.imag().colwise().reverse();
@@ -348,14 +329,11 @@ Waveform::realseq_t Gen::ImpactTransform::waveform(int iwire) const
             wf.resize(nlength, 0);
             Waveform::realseq_t long_resp = m_pir->closest(0)->long_aux_waveform();
             long_resp.resize(nlength, 0);
-            // Waveform::compseq_t spec = Waveform::dft(wf);
             Waveform::compseq_t spec = Aux::fwd_r2c(m_dft, wf);
-            // Waveform::compseq_t long_spec = Waveform::dft(long_resp);
             Waveform::compseq_t long_spec = Aux::fwd_r2c(m_dft, long_resp);
             for (size_t i = 0; i != nlength; i++) {
                 spec.at(i) *= long_spec.at(i);
             }
-            // wf = Waveform::idft(spec);
             wf = Aux::inv_c2r(m_dft, spec);
             wf.resize(nsamples, 0);
         }
diff --git a/gen/src/Noise.cxx b/gen/src/Noise.cxx
index ee8350b97..f31cdd3eb 100644
--- a/gen/src/Noise.cxx
+++ b/gen/src/Noise.cxx
@@ -50,6 +50,4 @@ Waveform::compseq_t Gen::Noise::generate_spectrum(const std::vector<float>& spec
     }
 
     return noise_freq;
-    // Waveform::realseq_t noise_time = WireCell::Waveform::idft(noise_freq);
-    // return noise_time;
 }
diff --git a/gen/src/PlaneImpactResponse.cxx b/gen/src/PlaneImpactResponse.cxx
index d5e74eee3..3f15c4349 100644
--- a/gen/src/PlaneImpactResponse.cxx
+++ b/gen/src/PlaneImpactResponse.cxx
@@ -111,7 +111,6 @@ void Gen::PlaneImpactResponse::build_responses()
         }
         // note: we are ignoring waveform_start which will introduce
         // an arbitrary phase shift....
-        // auto spec = Waveform::dft(wave);
         auto spec = Aux::fwd_r2c(dft, wave);
         for (size_t ibin = 0; ibin < n_short_length; ++ibin) {
             short_spec[ibin] *= spec[ibin];
@@ -138,7 +137,6 @@ void Gen::PlaneImpactResponse::build_responses()
         }
         // note: we are ignoring waveform_start which will introduce
         // an arbitrary phase shift....
-        // auto spec = Waveform::dft(wave);
         auto spec = Aux::fwd_r2c(dft, wave);
         for (size_t ibin = 0; ibin < n_long_length; ++ibin) {
             long_spec[ibin] *= spec[ibin];
@@ -232,7 +230,6 @@ void Gen::PlaneImpactResponse::build_responses()
             // sum up over coarse ticks.
             wave[bin] += induced_charge;
         }
-        // WireCell::Waveform::compseq_t spec = Waveform::dft(wave);
         WireCell::Waveform::compseq_t spec = Aux::fwd_r2c(dft, wave);
 
         // Convolve with short responses
@@ -241,7 +238,6 @@ void Gen::PlaneImpactResponse::build_responses()
                 spec[find] *= short_spec[find];
             }
         }
-        // Waveform::realseq_t wf = Waveform::idft(spec);
         Waveform::realseq_t wf = Aux::inv_c2r(dft, spec);
 
         wf.resize(m_nbins, 0);
diff --git a/gen/src/TruthTraceID.cxx b/gen/src/TruthTraceID.cxx
index 512693f2f..209c6c7f9 100644
--- a/gen/src/TruthTraceID.cxx
+++ b/gen/src/TruthTraceID.cxx
@@ -200,8 +200,6 @@ void Gen::TruthTraceID::process(output_queue& frames)
                     }
                     bindiff.erase(0, min_impact);
 
-                    // Waveform::realseq_t wave(nsamples, 0.0);
-                    // wave = Waveform::idft(total_spectrum);
                     Waveform::realseq_t wave = Aux::inv_c2r(m_dft, total_spectrum);
                     auto mm = Waveform::edge(wave);
                     if (mm.first == (int) wave.size()) {
diff --git a/sig/src/Decon2DFilter.cxx b/sig/src/Decon2DFilter.cxx
index 5529446ff..73081d942 100644
--- a/sig/src/Decon2DFilter.cxx
+++ b/sig/src/Decon2DFilter.cxx
@@ -118,7 +118,6 @@ bool Sig::Decon2DFilter::operator()(const ITensorSet::pointer &in, ITensorSet::p
     }
 
     // do the second round of inverse FFT on wire
-    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
     Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
 
     Array::array_xxf r_data = tm_r_data.block(m_pad_nwires, 0, m_nwires, m_nticks);
diff --git a/sig/src/Decon2DResponse.cxx b/sig/src/Decon2DResponse.cxx
index 7fc52bd89..5a997d4c4 100644
--- a/sig/src/Decon2DResponse.cxx
+++ b/sig/src/Decon2DResponse.cxx
@@ -126,7 +126,6 @@ std::vector<Waveform::realseq_t> Sig::Decon2DResponse::init_overall_response(con
     Response::ColdElec ce(m_gain, m_shaping_time);
     auto ewave = ce.generate(tbins);
     Waveform::scale(ewave, m_inter_gain * m_ADC_mV * (-1));
-    // elec = Waveform::dft(ewave);
     elec = Aux::fwd_r2c(m_dft, ewave);
 
     std::complex<float> fine_period(fravg.period, 0);
@@ -150,7 +149,6 @@ std::vector<Waveform::realseq_t> Sig::Decon2DResponse::init_overall_response(con
     auto arr = Response::as_array(fravg.planes[iplane], fine_nwires, fine_nticks);
 
     // do FFT for response ...
-    // Array::array_xxc c_data = Array::dft_rc(arr, 0);
     Array::array_xxc c_data = arr.cast<IDFT::complex_t>();
     c_data = Aux::fwd(m_dft, c_data, 1);
 
@@ -163,7 +161,6 @@ std::vector<Waveform::realseq_t> Sig::Decon2DResponse::init_overall_response(con
         }
     }
 
-    // arr = Array::idft_cr(c_data, 0);
     arr = Aux::inv(m_dft, c_data, 1).real();
 
     // figure out how to do fine ... shift (good ...)
@@ -272,7 +269,6 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
     log->debug("r_data: {} {}", r_data.rows(), r_data.cols());
 
     // first round of FFT on time
-    // auto c_data = Array::dft_rc(r_data, 0);
     WireCell::Array::array_xxc c_data = r_data.cast<IDFT::complex_t>();
     c_data = Aux::fwd(m_dft, c_data, 1);
 
@@ -287,13 +283,11 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
         Response::ColdElec ce(m_gain, m_shaping_time);
 
         const auto ewave = ce.generate(tbins);
-        // const WireCell::Waveform::compseq_t elec = Waveform::dft(ewave);
         const WireCell::Waveform::compseq_t elec = Aux::fwd_r2c(m_dft, ewave);
 
         for (int irow = 0; irow != c_data.rows(); irow++) {
             Waveform::realseq_t tch_resp = m_cresp->channel_response(ch_arr[irow]);
             tch_resp.resize(m_fft_nticks, 0);
-            // const WireCell::Waveform::compseq_t ch_elec = Waveform::dft(tch_resp);
             const WireCell::Waveform::compseq_t ch_elec = Aux::fwd_r2c(m_dft, tch_resp);
 
             // FIXME figure this out
@@ -312,7 +306,6 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
     log->trace("TRACE {}", __LINE__);
 
     // second round of FFT on wire
-    // c_data = Array::dft_cc(c_data, 1);
     c_data = Aux::fwd(m_dft, c_data, 0);
 
     // response part ...
@@ -325,10 +318,7 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
     log->trace("TRACE {}", __LINE__);
 
     // do first round FFT on the resposne on time
-    //Array::array_xxc c_resp = Array::dft_rc(r_resp, 0);
     // do second round FFT on the response on wire
-    //c_resp = Array::dft_cc(c_resp, 1);
-
     Array::array_xxc c_resp = r_resp.cast<IDFT::complex_t>();
     c_resp = Aux::fwd(m_dft, c_resp);
 
@@ -355,9 +345,7 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
     log->trace("TRACE {}", __LINE__);
 
     // do the first round of inverse FFT on wire
-    // c_data = Array::idft_cc(c_data, 1);
     // do the second round of inverse FFT on time
-    // r_data = Array::idft_cr(c_data, 0);
     c_data = Aux::inv(m_dft, c_data);
     r_data = c_data.real();
 
@@ -383,7 +371,6 @@ bool Sig::Decon2DResponse::operator()(const ITensorSet::pointer &in, ITensorSet:
         r_data.block(0, 0, nrows, time_shift) = arr2;
         r_data.block(0, time_shift, nrows, ncols - time_shift) = arr1;
     }
-    // c_data = Array::dft_rc(r_data, 0);
     c_data = Aux::fwd(m_dft, r_data.cast<IDFT::complex_t>(), 1);
 
     log->trace("TRACE {}", __LINE__);
diff --git a/sigproc/src/L1SPFilter.cxx b/sigproc/src/L1SPFilter.cxx
index 89bd736af..0b0a42343 100644
--- a/sigproc/src/L1SPFilter.cxx
+++ b/sigproc/src/L1SPFilter.cxx
@@ -57,7 +57,6 @@ void L1SPFilter::init_resp()
         Response::ColdElec ce(m_gain, m_shaping);
         auto ewave = ce.generate(tbins);
         Waveform::scale(ewave, m_postgain * m_ADC_mV * (-1));  // ADC to electron ...
-        //elec = Waveform::dft(ewave);
         elec = Aux::fwd_r2c(m_dft, ewave); 
 
         std::complex<float> fine_period(fravg.period, 0);
@@ -66,9 +65,7 @@ void L1SPFilter::init_resp()
         WireCell::Waveform::realseq_t resp_V = fravg.planes[1].paths[0].current;
         WireCell::Waveform::realseq_t resp_W = fravg.planes[2].paths[0].current;
 
-        // auto spectrum_V = WireCell::Waveform::dft(resp_V);
         auto spectrum_V = Aux::fwd_r2c(m_dft, resp_V);
-        // auto spectrum_W = WireCell::Waveform::dft(resp_W);
         auto spectrum_W = Aux::fwd_r2c(m_dft, resp_W);
 
         WireCell::Waveform::scale(spectrum_V, elec);
@@ -78,9 +75,7 @@ void L1SPFilter::init_resp()
         WireCell::Waveform::scale(spectrum_W, fine_period);
 
         // Now this response is ADC for 1 electron .
-        // resp_V = WireCell::Waveform::idft(spectrum_V);
         resp_V = Aux::inv_c2r(m_dft, spectrum_V);
-        // resp_W = WireCell::Waveform::idft(spectrum_W);
         resp_W = Aux::inv_c2r(m_dft, spectrum_W);
 
         // convolute with V and Y average responses ...
diff --git a/sigproc/src/Microboone.cxx b/sigproc/src/Microboone.cxx
index 3d44db947..7fbf8ada8 100644
--- a/sigproc/src/Microboone.cxx
+++ b/sigproc/src/Microboone.cxx
@@ -138,7 +138,6 @@ bool Microboone::Subtract_WScaling(WireCell::IChannelFilter::channel_signals_t&
             }
 
             // do the deconvolution with a very loose low-frequency filter
-            // WireCell::Waveform::compseq_t signal_roi_freq = WireCell::Waveform::dft(signal_roi);
             WireCell::Waveform::compseq_t signal_roi_freq = Aux::fwd_r2c(dft, signal_roi);
             WireCell::Waveform::shrink(signal_roi_freq, respec);
             for (size_t i = 0; i != signal_roi_freq.size(); i++) {
@@ -153,7 +152,6 @@ bool Microboone::Subtract_WScaling(WireCell::IChannelFilter::channel_signals_t&
                 std::complex<float> factor = filter_time(freq) * filter_low_loose(freq);
                 signal_roi_freq.at(i) = signal_roi_freq.at(i) * factor;
             }
-            // WireCell::Waveform::realseq_t signal_roi_decon = WireCell::Waveform::idft(signal_roi_freq);
             WireCell::Waveform::realseq_t signal_roi_decon = Aux::inv_c2r(dft, signal_roi_freq);
 
             if (rms_threshold) {
@@ -350,7 +348,6 @@ std::vector<std::vector<int> > Microboone::SignalProtection(WireCell::Waveform::
     if (respec.size() > 0 && (respec.at(0).real() != 1 || respec.at(0).imag() != 0) && res_offset != 0) {
         // std::cout << nbin << std::endl;
 
-        // WireCell::Waveform::compseq_t medians_freq = WireCell::Waveform::dft(medians);
         WireCell::Waveform::compseq_t medians_freq = Aux::fwd_r2c(dft, medians);
         WireCell::Waveform::shrink(medians_freq, respec);
 
@@ -366,7 +363,6 @@ std::vector<std::vector<int> > Microboone::SignalProtection(WireCell::Waveform::
             std::complex<float> factor = filter_time(freq) * filter_low(freq, decon_lf_cutoff);
             medians_freq.at(i) = medians_freq.at(i) * factor;
         }
-        // WireCell::Waveform::realseq_t medians_decon = WireCell::Waveform::idft(medians_freq);
         WireCell::Waveform::realseq_t medians_decon = Aux::inv_c2r(dft, medians_freq);
 
         temp = Derivations::CalcRMS(medians_decon);
@@ -941,7 +937,6 @@ WireCell::Waveform::ChannelMaskMap Microboone::OneChannelNoise::apply(int ch, si
         }
     }
 
-    // auto spectrum = WireCell::Waveform::dft(signal);
     auto spectrum = Aux::fwd_r2c(m_dft, signal);
     // std::cerr << "OneChannelNoise: "<<ch<<" dft spectral sum="<<Waveform::sum(spectrum)<<"\n";
 
@@ -986,7 +981,6 @@ WireCell::Waveform::ChannelMaskMap Microboone::OneChannelNoise::apply(int ch, si
 
     // remove the DC component
     spectrum.front() = 0;
-    // signal = WireCell::Waveform::idft(spectrum);
     signal = Aux::inv_c2r(m_dft, spectrum);
 
     // std::cerr << "OneChannelNoise: "<<ch<<" after dft: sigsum="<<Waveform::sum(signal)<<"\n";
@@ -1315,7 +1309,6 @@ bool Microboone::OneChannelStatus::ID_lf_noisy(signal_t& sig) const
     //     temp_sig.at(i)=i;
     // }
     // do FFT
-    // Waveform::compseq_t sig_freq = Waveform::dft(temp_sig);
     Waveform::compseq_t sig_freq = Aux::fwd_r2c(m_dft, temp_sig);    
     for (int i = 0; i != m_nbins; i++) {
         content += abs(sig_freq.at(i + 1));
diff --git a/sigproc/src/OmniChannelNoiseDB.cxx b/sigproc/src/OmniChannelNoiseDB.cxx
index c2907e489..e17dfa33c 100644
--- a/sigproc/src/OmniChannelNoiseDB.cxx
+++ b/sigproc/src/OmniChannelNoiseDB.cxx
@@ -183,7 +183,6 @@ OmniChannelNoiseDB::shared_filter_t OmniChannelNoiseDB::parse_rcrc(Json::Value j
     // auto signal = rcres.generate(WireCell::Binning(m_nsamples, 0, m_nsamples*m_tick));
     auto signal = rcres.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
 
-    // Waveform::compseq_t spectrum = Waveform::dft(signal);
     Waveform::compseq_t spectrum = Aux::fwd_r2c(m_dft, signal);
 
     // get the square of it because there are two RC filters
@@ -259,9 +258,7 @@ OmniChannelNoiseDB::shared_filter_t OmniChannelNoiseDB::get_reconfig(double from
     auto to_sig = to_ce.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
     auto from_sig = from_ce.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
 
-    // auto to_filt = Waveform::dft(to_sig);
     auto to_filt = Aux::fwd_r2c(m_dft, to_sig);
-    // auto from_filt = Waveform::dft(from_sig);
     auto from_filt = Aux::fwd_r2c(m_dft, from_sig);
 
     // auto from_filt_sum = Waveform::sum(from_filt);
@@ -322,7 +319,6 @@ OmniChannelNoiseDB::shared_filter_t OmniChannelNoiseDB::parse_response(Json::Val
                 waveform[ind] += current[ind];
             }
         }
-        // auto spectrum = WireCell::Waveform::dft(waveform);
         auto spectrum = Aux::fwd_r2c(m_dft, waveform);
         auto ret = std::make_shared<filter_t>(spectrum);
         m_response_cache[wpid.ident()] = ret;
@@ -345,7 +341,6 @@ OmniChannelNoiseDB::shared_filter_t OmniChannelNoiseDB::parse_response(Json::Val
             waveform[ind] = jwave[ind].asFloat();
         }
 
-        // auto spectrum = WireCell::Waveform::dft(waveform);
         auto spectrum = Aux::fwd_r2c(m_dft, waveform);
         auto ret = std::make_shared<filter_t>(spectrum);
         m_waveform_cache[id] = ret;
diff --git a/sigproc/src/OmnibusSigProc.cxx b/sigproc/src/OmnibusSigProc.cxx
index 0eec9ad02..9e76e9d07 100644
--- a/sigproc/src/OmnibusSigProc.cxx
+++ b/sigproc/src/OmnibusSigProc.cxx
@@ -800,7 +800,6 @@ void OmnibusSigProc::init_overall_response(IFrame::pointer frame)
     // auto ewave = ce.generate(tbins);
     auto ewave = (*m_elecresponse).waveform_samples(tbins);
     Waveform::scale(ewave, m_inter_gain * m_ADC_mV * (-1));
-    // elec = Waveform::dft(ewave);
     elec = Aux::fwd_r2c(m_dft, ewave);
 
     std::complex<float> fine_period(fravg.period, 0);
@@ -832,7 +831,6 @@ void OmnibusSigProc::init_overall_response(IFrame::pointer frame)
         int ncols = 0;
 
         // do FFT for response ...
-        // Array::array_xxc c_data = Array::dft_rc(arr, 0);
         {
             Array::array_xxc c_data = arr.cast<IDFT::complex_t>();
             c_data = Aux::fwd(m_dft, c_data, 1);
@@ -846,7 +844,6 @@ void OmnibusSigProc::init_overall_response(IFrame::pointer frame)
                 }
             }
 
-            // arr = Array::idft_cr(c_data, 0);
             c_data = Aux::inv(m_dft, c_data, 1);
             arr = c_data.real();
         }
@@ -954,14 +951,12 @@ void OmnibusSigProc::decon_2D_init(int plane)
         WireCell::Binning tbins(m_fft_nticks, cr_bins.min(), cr_bins.min() + m_fft_nticks * m_period);
 
         auto ewave = (*m_elecresponse).waveform_samples(tbins);
-        // const WireCell::Waveform::compseq_t elec = Waveform::dft(ewave);
         const WireCell::Waveform::compseq_t elec = Aux::fwd_r2c(m_dft, ewave);
 
         for (auto och : m_channel_range[plane]) {
             // const auto& ch_resp = cr->channel_response(och.ident);
             Waveform::realseq_t tch_resp = cr->channel_response(och.ident);
             tch_resp.resize(m_fft_nticks, 0);
-            // const WireCell::Waveform::compseq_t ch_elec = Waveform::dft(tch_resp);
             const WireCell::Waveform::compseq_t ch_elec = Aux::fwd_r2c(m_dft, tch_resp);
 
             const int irow = och.wire + m_pad_nwires[plane];
@@ -978,7 +973,6 @@ void OmnibusSigProc::decon_2D_init(int plane)
     }
 
     // second round of FFT on wire
-    // m_c_data[plane] = Array::dft_cc(m_c_data[plane], 1);
     m_c_data[plane] = Aux::fwd(m_dft, m_c_data[plane], 0);
 
     // response part ...
@@ -990,9 +984,7 @@ void OmnibusSigProc::decon_2D_init(int plane)
     }
 
     // do first round FFT on the resposne on time
-    // Array::array_xxc c_resp = Array::dft_rc(r_resp, 0);
     // do second round FFT on the response on wire
-    // c_resp = Array::dft_cc(c_resp, 1);
     Array::array_xxc c_resp = r_resp.cast<IDFT::complex_t>();
     c_resp = Aux::fwd(m_dft, c_resp);
 
@@ -1018,9 +1010,7 @@ void OmnibusSigProc::decon_2D_init(int plane)
     }
 
     // do the first round of inverse FFT on wire
-    //m_c_data[plane] = Array::idft_cc(m_c_data[plane], 1);
     // do the second round of inverse FFT on time
-    //m_r_data[plane] = Array::idft_cr(m_c_data[plane], 0);
     m_r_data[plane] = Aux::inv(m_dft, m_c_data[plane]).real();
 
     // do the shift in wire
@@ -1045,7 +1035,6 @@ void OmnibusSigProc::decon_2D_init(int plane)
         m_r_data[plane].block(0, 0, nrows, time_shift) = arr2;
         m_r_data[plane].block(0, time_shift, nrows, ncols - time_shift) = arr1;
     }
-    // m_c_data[plane] = Array::dft_rc(m_r_data[plane], 0);
     m_c_data[plane] = Aux::fwd(m_dft, m_r_data[plane].cast<IDFT::complex_t>(), 1);
 
 }
@@ -1068,7 +1057,6 @@ void OmnibusSigProc::decon_2D_ROI_refine(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
     Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
 
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
@@ -1111,7 +1099,6 @@ void OmnibusSigProc::decon_2D_tightROI(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
     Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
 
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
@@ -1155,7 +1142,6 @@ void OmnibusSigProc::decon_2D_tighterROI(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
     Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
 
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
@@ -1234,7 +1220,6 @@ void OmnibusSigProc::decon_2D_looseROI(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
     Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
 
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
@@ -1281,7 +1266,6 @@ void OmnibusSigProc::decon_2D_looseROI_debug_mode(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
     Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
 
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
@@ -1344,7 +1328,6 @@ void OmnibusSigProc::decon_2D_hits(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
     Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
     if (plane == 2) {
@@ -1378,7 +1361,6 @@ void OmnibusSigProc::decon_2D_charge(int plane)
     }
 
     // do the second round of inverse FFT on wire
-    // Array::array_xxf tm_r_data = Array::idft_cr(c_data_afterfilter, 0);
     Array::array_xxf tm_r_data = Aux::inv(m_dft, c_data_afterfilter, 1).real();
     m_r_data[plane] = tm_r_data.block(m_pad_nwires[plane], 0, m_nwires[plane], m_nticks);
     if (plane == 2) {
diff --git a/sigproc/src/Protodune.cxx b/sigproc/src/Protodune.cxx
index 05cabbf9f..bb3593c18 100644
--- a/sigproc/src/Protodune.cxx
+++ b/sigproc/src/Protodune.cxx
@@ -409,7 +409,6 @@ bool Protodune::FftInterpSticky(const IDFT::pointer& dft,
     }
 
     // dft resampling for "even", see example in test_zero_padding.cxx
-    // auto tran_even = WireCell::Waveform::dft(signal_even);
     auto tran_even = Aux::fwd_r2c(dft, signal_even);
     tran_even.resize(nsublen * 2);
     if (nsublen % 2 == 0) {
@@ -419,13 +418,11 @@ bool Protodune::FftInterpSticky(const IDFT::pointer& dft,
         std::rotate(tran_even.begin() + (nsublen + 1) / 2, tran_even.begin() + nsublen, tran_even.end());
     }
     // inverse FFT
-    // auto signal_even_fc = WireCell::Waveform::idft(tran_even);
     auto signal_even_fc = Aux::inv_c2r(dft, tran_even);
     float scale = tran_even.size() / nsublen;
     WireCell::Waveform::scale(signal_even_fc, scale);
 
     // similar for "odd"
-    // auto tran_odd = WireCell::Waveform::dft(signal_odd);
     auto tran_odd = Aux::fwd_r2c(dft, signal_odd);
     tran_odd.resize(nsublen2 * 2);
     if (nsublen2 % 2 == 0) {
@@ -434,7 +431,6 @@ bool Protodune::FftInterpSticky(const IDFT::pointer& dft,
     else {
         std::rotate(tran_odd.begin() + (nsublen2 + 1) / 2, tran_odd.begin() + nsublen2, tran_odd.end());
     }
-    // auto signal_odd_fc = WireCell::Waveform::idft(tran_odd);
     auto signal_odd_fc = Aux::inv_c2r(dft, tran_odd);
     float scale2 = tran_odd.size() / nsublen2;
     WireCell::Waveform::scale(signal_odd_fc, scale2);
@@ -476,7 +472,6 @@ bool Protodune::FftShiftSticky(const IDFT::pointer& dft,
     }
 
     // dft shift for "even"
-    // auto tran_even = WireCell::Waveform::dft(signal_even);
     auto tran_even = Aux::fwd_r2c(dft, signal_even);
     double f0 = 1. / nsublen;
     const double PI = std::atan(1.0) * 4;
@@ -489,11 +484,9 @@ bool Protodune::FftShiftSticky(const IDFT::pointer& dft,
         tran_even.at(i) = z * std::exp(z1);
     }
     // inverse FFT
-    // auto signal_even_fc = WireCell::Waveform::idft(tran_even);
     auto signal_even_fc = Aux::inv_c2r(dft, tran_even);
 
     // similar to "odd"
-    // auto tran_odd = WireCell::Waveform::dft(signal_odd);
     auto tran_odd = Aux::fwd_r2c(dft, signal_odd);
     f0 = 1. / nsublen2;
     for (size_t i = 0; i < tran_odd.size(); i++) {
@@ -505,7 +498,6 @@ bool Protodune::FftShiftSticky(const IDFT::pointer& dft,
         tran_odd.at(i) = z * std::exp(z1);
     }
     //
-    // auto signal_odd_fc = WireCell::Waveform::idft(tran_odd);
     auto signal_odd_fc = Aux::inv_c2r(dft, tran_odd);
     
     // float scale = 1./tran_odd.size();
@@ -538,7 +530,6 @@ bool Protodune::FftScaling(const IDFT::pointer& dft,
                            WireCell::Waveform::realseq_t& signal, int nsamples)
 {
     const int nsiglen = signal.size();
-    // auto tran = WireCell::Waveform::dft(signal);
     auto tran = Aux::fwd_r2c(dft, signal);
     tran.resize(nsamples);
     if (nsiglen % 2 == 0) {  // ref test_zero_padding.cxx
@@ -548,7 +539,6 @@ bool Protodune::FftScaling(const IDFT::pointer& dft,
         std::rotate(tran.begin() + (nsiglen + 1) / 2, tran.begin() + nsiglen, tran.end());
     }
     // inverse FFT
-    // auto signal_fc = WireCell::Waveform::idft(tran);
     auto signal_fc = Aux::inv_c2r(dft, tran);
 
     WireCell::Waveform::scale(signal_fc, nsamples / nsiglen);
@@ -774,7 +764,6 @@ WireCell::Waveform::ChannelMaskMap Protodune::OneChannelNoise::apply(int ch, sig
     }
 
     // correct rc undershoot
-    // auto spectrum = WireCell::Waveform::dft(signal);
     auto spectrum = Aux::fwd_r2c(m_dft, signal);
     bool is_partial = m_check_partial(spectrum);  // Xin's "IS_RC()"
 
@@ -862,7 +851,6 @@ WireCell::Waveform::ChannelMaskMap Protodune::OneChannelNoise::apply(int ch, sig
 
     // remove the DC component
     spectrum.front() = 0;
-    // signal = WireCell::Waveform::idft(spectrum);
     signal = Aux::inv_c2r(m_dft, spectrum);
 
     // Now calculate the baseline ...
diff --git a/sigproc/src/SimpleChannelNoiseDB.cxx b/sigproc/src/SimpleChannelNoiseDB.cxx
index 8aaf68975..cf4b3cdea 100644
--- a/sigproc/src/SimpleChannelNoiseDB.cxx
+++ b/sigproc/src/SimpleChannelNoiseDB.cxx
@@ -255,7 +255,6 @@ void SimpleChannelNoiseDB::set_rcrc_constant(const std::vector<int>& channels, d
     //    auto signal = rcres.generate(WireCell::Binning(m_nsamples, 0, m_nsamples*m_tick));
     auto signal = rcres.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
 
-    // Waveform::compseq_t spectrum = Waveform::dft(signal);
     Waveform::compseq_t spectrum = Aux::fwd_r2c(m_dft, signal);
 
     // std::cout << rcrc << " " << m_tick << " " << m_nsamples << " " << signal.front() << " " << signal.at(1) << " " <<
@@ -311,10 +310,8 @@ void SimpleChannelNoiseDB::set_gains_shapings(const std::vector<int>& channels,
     auto to_sig = to_ce.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
     auto from_sig = from_ce.generate(WireCell::Waveform::Domain(0, m_nsamples * m_tick), m_nsamples);
 
-    // auto to_filt = Waveform::dft(to_sig);
     auto to_filt = Aux::fwd_r2c(m_dft, to_sig);
 
-    // auto from_filt = Waveform::dft(from_sig);
     auto from_filt = Aux::fwd_r2c(m_dft, from_sig);
 
     // auto from_filt_sum = Waveform::sum(from_filt);
diff --git a/util/inc/WireCellUtil/Array.h b/util/inc/WireCellUtil/Array.h
index 2a01dd368..1bcd879f5 100644
--- a/util/inc/WireCellUtil/Array.h
+++ b/util/inc/WireCellUtil/Array.h
@@ -54,69 +54,6 @@ namespace WireCell {
         /// A complex, 2D array
         typedef Eigen::ArrayXXcf array_xxc;
 
-        /** Perform full, 2D discrete Fourier transform on a real 2D
-            array.
-
-            The full 2D DFT first performs a 1D DFT (real->complex) on
-            each individual row and then a 1D DFT (complex->complex)
-            on each resulting column.
-
-            const_shared_array_xxf arr = ...;
-            const_shared_array_xxc spec = dft(*arr);
-
-            // ...
-
-            const_shared_array_xxf arr2 = idft(*spec);
-         */
-        // array_xxc dft(const array_xxf& arr);
-        // array_xxf idft(const array_xxc& arr);
-
-        /** Partial, 1D DFT and inverse DFT along one dimension of an
-         * array.  Each row is transformed if dim=0, each column if
-         * dim=1.  
-         *
-         * NOTE: this is backward from numpy.fft and IDFT convention!.
-         *
-         * The transfer is either real->complex (rc),
-         * complex->complex(cc) or complex->real(cr).
-         *
-         * The full 2D DFT should be used unless an intermediate
-         * filter is required as it will avoid producing some
-         * temporaries.
-         *
-         * Conceptually:
-         *
-         *    auto xxc = dft(xxf);
-         *
-         * is equivalent to
-         *
-         *    auto tmp = dft_rc(xxf, 0);
-         *    auto xxc = dft_cc(tmp, 1);
-         *
-         * and:
-         *
-         *     auto xxf = idft(xxc)
-         *
-         * is equivalent to:
-         *
-         *     auto tmp = idft_cc(xxc, 1);
-         *     auto xxf = idft_rc(tmp, 0);
-         */
-        // array_xxc dft_rc(const array_xxf& arr, int dim = 0);
-        // array_xxc dft_cc(const array_xxc& arr, int dim = 1);
-        // array_xxc idft_cc(const array_xxc& arr, int dim = 1);
-        // array_xxf idft_cr(const array_xxc& arr, int dim = 0);
-
-        /** Perform 2D deconvolution.
-
-            This will perform a 2D forward DFT, do an
-            element-by-element multiplication of that
-            periodicity/frequency space matrix by the filter and then
-            perform an 2D inverse DFT.
-
-         */
-        // array_xxf deconv(const array_xxf& arr, const array_xxc& filter);
-
         /** downsample a 2D array along one axis by k
          *  simple average of all numbers in a bin
          *  e.g: MxN -> Mxfloor(N/k)
diff --git a/util/inc/WireCellUtil/Waveform.h b/util/inc/WireCellUtil/Waveform.h
index 96fe3ad9c..25e4d691b 100644
--- a/util/inc/WireCellUtil/Waveform.h
+++ b/util/inc/WireCellUtil/Waveform.h
@@ -9,11 +9,6 @@
 #include <algorithm>
 #include <string>
 
-// FIXME: remove the hard-wired Eigen::FFT related in favor of dynamic
-// DFT with Aux/DftTools.h.
-// #include <Eigen/Core>
-// #include <unsupported/Eigen/FFT>
-
 namespace WireCell {
 
     namespace Waveform {
@@ -191,51 +186,9 @@ namespace WireCell {
         real_t percentile(realseq_t& wave, real_t percentage);
         real_t percentile_binned(realseq_t& wave, real_t percentage);
 
-        /// Discrete Fourier transform of real sequence.  Returns full
-        /// spectrum.  No normalization scaling applied
-        // compseq_t dft(realseq_t seq);
-
-        // Linear convolution, returns in1.size()+in2.size()-1.  If
-        // truncate is false then the returned sequence will be
-        // truncated to length that of the first input.  Otherwise the
-        // function is symmetric between the two inputs.
-        // realseq_t linear_convolve(Waveform::realseq_t in1, Waveform::realseq_t in2, bool truncate = true);
-
-        // Replace old response in wave with new response.  If
-        // truncate is false then the returned sequence will be the
-        // length required for linear convolution.  This is the sum of
-        // the sizes of all input less one and less the smallest.
-        // realseq_t replace_convolve(Waveform::realseq_t wave, Waveform::realseq_t newres, Waveform::realseq_t oldres,
-        //                            bool truncate = true);
-
-        /// Inverse, discrete Fourier transform.  Expects full
-        /// spectrum (twice Nyquist frequency).  Applies the
-        /// 1/Nsamples normalization.
-        // realseq_t idft(compseq_t spec);
-
         /// Return the smallest, most frequent value to appear in vector.
         short most_frequent(const std::vector<short>& vals);
 
-        // class FFT {
-        //    public:
-        //     FFT() {}
-        //     inline compseq_t dft(realseq_t wave)
-        //     {
-        //         auto v = Eigen::Map<Eigen::VectorXf>(wave.data(), wave.size());
-        //         Eigen::VectorXcf ret = trans.fwd(v);
-        //         return compseq_t(ret.data(), ret.data() + ret.size());
-        //     }
-        //     inline realseq_t idft(compseq_t spec)
-        //     {
-        //         auto v = Eigen::Map<Eigen::VectorXcf>(spec.data(), spec.size());
-        //         Eigen::VectorXf ret;
-        //         trans.inv(ret, v);
-        //         return realseq_t(ret.data(), ret.data() + ret.size());
-        //     }
-
-        //    private:
-        //     Eigen::FFT<Waveform::real_t> trans;
-        // };
 
     }  // namespace Waveform
 }  // namespace WireCell
diff --git a/util/src/Array.cxx b/util/src/Array.cxx
index c36560c72..ac4406758 100644
--- a/util/src/Array.cxx
+++ b/util/src/Array.cxx
@@ -1,221 +1,12 @@
 #include "WireCellUtil/Array.h"
 #include "WireCellUtil/Exceptions.h"
 
-// #include <unsupported/Eigen/FFT>
-
 #include <algorithm>
 #include <complex>
 
 using namespace WireCell;
 using namespace WireCell::Array;
 
-// Need to use different planner for different input/output
-// https://eigen.tuxfamily.org/dox/unsupported/ei__fftw__impl_8h_source.html
-
-// thread_local static Eigen::FFT<float> gEigenFFT_dft_1d;      // c2c fwd and inv
-// thread_local static Eigen::FFT<float> gEigenFFT_dft_r2c_1d;  // r2c fwd
-// thread_local static Eigen::FFT<float> gEigenFFT_dft_c2r_1d;  // c2r inv
-
-// http://stackoverflow.com/a/33636445
-
-// WireCell::Array::array_xxc WireCell::Array::dft(const WireCell::Array::array_xxf& arr)
-// {
-//     const int nrows = arr.rows();
-//     const int ncols = arr.cols();
-
-//     Eigen::MatrixXcf matc(nrows, ncols);
-
-//     for (int irow = 0; irow < nrows; ++irow) {
-//         Eigen::VectorXcf fspec(ncols);  // frequency spectrum
-//         // gEigenFFT wants vectors, also input arr is const
-//         Eigen::VectorXf tmp = arr.row(irow);
-//         gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
-//         matc.row(irow) = fspec;
-//     }
-
-//     for (int icol = 0; icol < ncols; ++icol) {
-//         Eigen::VectorXcf pspec(nrows);                // periodicity spectrum
-//         gEigenFFT_dft_1d.fwd(pspec, matc.col(icol));  // c2c
-//         matc.col(icol) = pspec;
-//     }
-
-//     return matc;
-// }
-
-// WireCell::Array::array_xxc WireCell::Array::dft_rc(const WireCell::Array::array_xxf& arr, int dim)
-// {
-//     const int nrows = arr.rows();
-//     const int ncols = arr.cols();
-
-//     Eigen::MatrixXcf matc(nrows, ncols);
-
-//     if (dim == 0) {
-//         for (int irow = 0; irow < nrows; ++irow) {
-//             Eigen::VectorXcf fspec(ncols);
-//             Eigen::VectorXf tmp = arr.row(irow);
-//             gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
-//             matc.row(irow) = fspec;
-//         }
-//     }
-//     else if (dim == 1) {
-//         for (int icol = 0; icol < ncols; ++icol) {
-//             Eigen::VectorXcf fspec(nrows);
-//             Eigen::VectorXf tmp = arr.col(icol);
-//             gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
-//             matc.col(icol) = fspec;
-//         }
-//     }
-//     return matc;
-// }
-
-// WireCell::Array::array_xxc WireCell::Array::dft_cc(const WireCell::Array::array_xxc& arr, int dim)
-// {
-//     const int nrows = arr.rows();
-//     const int ncols = arr.cols();
-
-//     Eigen::MatrixXcf matc(nrows, ncols);
-
-//     matc = arr.matrix();
-
-//     if (dim == 0) {
-//         for (int irow = 0; irow < nrows; ++irow) {
-//             Eigen::VectorXcf pspec(ncols);
-//             gEigenFFT_dft_1d.fwd(pspec, matc.row(irow));  // c2c
-//             matc.row(irow) = pspec;
-//         }
-//     }
-//     else {
-//         for (int icol = 0; icol < ncols; ++icol) {
-//             Eigen::VectorXcf pspec(nrows);
-//             gEigenFFT_dft_1d.fwd(pspec, matc.col(icol));  // c2c
-//             matc.col(icol) = pspec;
-//         }
-//     }
-//     return matc;
-// }
-
-// WireCell::Array::array_xxf WireCell::Array::idft(const WireCell::Array::array_xxc& arr)
-// {
-//     const int nrows = arr.rows();
-//     const int ncols = arr.cols();
-
-//     // gEigenFFT works on matrices, not arrays, also don't step on const input
-//     Eigen::MatrixXcf partial(nrows, ncols);
-//     partial = arr.matrix();
-
-//     for (int icol = 0; icol < ncols; ++icol) {
-//         Eigen::VectorXcf pspec(nrows);                   // wire spectrum
-//         gEigenFFT_dft_1d.inv(pspec, partial.col(icol));  // c2c
-//         partial.col(icol) = pspec;
-//     }
-
-//     // shared_array_xxf ret = std::make_shared<array_xxf> (nrows, ncols);
-//     array_xxf ret(nrows, ncols);
-
-//     for (int irow = 0; irow < nrows; ++irow) {
-//         Eigen::VectorXf wave(ncols);                        // back to real-valued time series
-//         gEigenFFT_dft_c2r_1d.inv(wave, partial.row(irow));  // c2r
-//         ret.row(irow) = wave;
-//     }
-
-//     return ret;
-// }
-
-// WireCell::Array::array_xxc WireCell::Array::idft_cc(const WireCell::Array::array_xxc& arr, int dim)
-// {
-//     const int nrows = arr.rows();
-//     const int ncols = arr.cols();
-
-//     // gEigenFFT works on matrices, not arrays, also don't step on const input
-//     Eigen::MatrixXcf ret(nrows, ncols);
-//     ret = arr.matrix();
-
-//     if (dim == 1) {
-//         for (int icol = 0; icol < ncols; ++icol) {
-//             Eigen::VectorXcf pspec(nrows);
-//             gEigenFFT_dft_1d.inv(pspec, ret.col(icol));  // c2c
-//             ret.col(icol) = pspec;
-//         }
-//     }
-//     else if (dim == 0) {
-//         for (int irow = 0; irow < nrows; ++irow) {
-//             Eigen::VectorXcf pspec(ncols);
-//             gEigenFFT_dft_1d.inv(pspec, ret.row(irow));  // c2c
-//             ret.row(irow) = pspec;
-//         }
-//     }
-//     return ret;
-// }
-
-// WireCell::Array::array_xxf WireCell::Array::idft_cr(const WireCell::Array::array_xxc& arr, int dim)
-// {
-//     const int nrows = arr.rows();
-//     const int ncols = arr.cols();
-
-//     // gEigenFFT works on matrices, not arrays, also don't step on const input
-//     Eigen::MatrixXcf partial(nrows, ncols);
-//     partial = arr.matrix();
-
-//     array_xxf ret(nrows, ncols);
-
-//     if (dim == 0) {
-//         for (int irow = 0; irow < nrows; ++irow) {
-//             Eigen::VectorXf wave(ncols);                        // back to real-valued time series
-//             gEigenFFT_dft_c2r_1d.inv(wave, partial.row(irow));  // c2r
-//             ret.row(irow) = wave;
-//         }
-//     }
-//     else if (dim == 1) {
-//         for (int icol = 0; icol < ncols; ++icol) {
-//             Eigen::VectorXf wave(nrows);
-//             gEigenFFT_dft_c2r_1d.inv(wave, partial.col(icol));  // c2r
-//             ret.col(icol) = wave;
-//         }
-//     }
-//     return ret;
-// }
-
-// // this is a cut-and-paste mashup of dft() and idft() in order to avoid temporaries.
-// WireCell::Array::array_xxf WireCell::Array::deconv(const WireCell::Array::array_xxf& arr,
-//                                                    const WireCell::Array::array_xxc& filter)
-// {
-//     const int nrows = arr.rows();
-//     const int ncols = arr.cols();
-
-//     Eigen::MatrixXcf matc(nrows, ncols);
-//     for (int irow = 0; irow < nrows; ++irow) {
-//         Eigen::VectorXcf fspec(ncols);  // frequency spectrum
-//         // gEigenFFT wants vectors, also input arr is const
-//         Eigen::VectorXf tmp = arr.row(irow);
-//         gEigenFFT_dft_r2c_1d.fwd(fspec, tmp);  // r2c
-//         matc.row(irow) = fspec;
-//     }
-
-//     for (int icol = 0; icol < ncols; ++icol) {
-//         Eigen::VectorXcf pspec(nrows);                // periodicity spectrum
-//         gEigenFFT_dft_1d.fwd(pspec, matc.col(icol));  // c2c
-//         matc.col(icol) = pspec;
-//     }
-
-//     // deconvolution via multiplication in frequency space
-//     Eigen::MatrixXcf filt = matc.array() * filter;
-
-//     for (int icol = 0; icol < ncols; ++icol) {
-//         Eigen::VectorXcf pspec(nrows);                // wire spectrum
-//         gEigenFFT_dft_1d.inv(pspec, filt.col(icol));  // c2c
-//         filt.col(icol) = pspec;
-//     }
-
-//     array_xxf ret(nrows, ncols);
-
-//     for (int irow = 0; irow < nrows; ++irow) {
-//         Eigen::VectorXf wave(ncols);                     // back to real-valued time series
-//         gEigenFFT_dft_c2r_1d.inv(wave, filt.row(irow));  // c2r
-//         ret.row(irow) = wave;
-//     }
-
-//     return ret;
-// }
 
 WireCell::Array::array_xxf WireCell::Array::downsample(const Array::array_xxf& in, const unsigned int k, const int dim)
 {
diff --git a/util/src/Waveform.cxx b/util/src/Waveform.cxx
index fcdee5e3e..e6483ef23 100644
--- a/util/src/Waveform.cxx
+++ b/util/src/Waveform.cxx
@@ -3,10 +3,6 @@
 
 #include <algorithm>
 
-// for FFT
-#include <Eigen/Core>
-#include <unsupported/Eigen/FFT>
-
 #include <complex>
 
 using namespace WireCell;
@@ -155,81 +151,6 @@ std::pair<int, int> WireCell::Waveform::edge(const realseq_t& wave)
     return std::make_pair(imin, imax);
 }
 
-// thread_local static Eigen::FFT<Waveform::real_t> gEigenFFT;
-
-// Waveform::compseq_t WireCell::Waveform::dft(realseq_t wave)
-// {
-//     auto v = Eigen::Map<Eigen::VectorXf>(wave.data(), wave.size());
-//     Eigen::VectorXcf ret = gEigenFFT.fwd(v);
-//     return compseq_t(ret.data(), ret.data() + ret.size());
-// }
-
-// Waveform::realseq_t WireCell::Waveform::idft(compseq_t spec)
-// {
-//     auto v = Eigen::Map<Eigen::VectorXcf>(spec.data(), spec.size());
-//     Eigen::VectorXf ret;
-//     gEigenFFT.inv(ret, v);
-//     return realseq_t(ret.data(), ret.data() + ret.size());
-// }
-
-// // Linear convolution, returns in1.size()+in2.size()-1.
-// Waveform::realseq_t WireCell::Waveform::linear_convolve(Waveform::realseq_t in1, Waveform::realseq_t in2, bool truncate)
-// {
-//     size_t n1_orig = in1.size(), n2_orig = in2.size();
-//     size_t n_out = n1_orig + n2_orig - 1;
-
-//     in1.resize(n_out, 0);
-//     in2.resize(n_out, 0);
-
-//     auto v1 = Eigen::Map<Eigen::VectorXf>(in1.data(), in1.size());
-//     auto v2 = Eigen::Map<Eigen::VectorXf>(in2.data(), in2.size());
-
-//     Eigen::FFT<Waveform::real_t> trans;
-
-//     Eigen::VectorXcf s1 = trans.fwd(v1);
-//     Eigen::VectorXcf s2 = trans.fwd(v2);
-//     Eigen::VectorXcf s12 = (s1.array() * s2.array()).matrix();
-//     Eigen::VectorXf vret;
-//     trans.inv(vret, s12);
-//     realseq_t ret(vret.data(), vret.data() + vret.size());
-//     if (truncate) {
-//         ret.resize(n1_orig);
-//     }
-//     return ret;
-// }
-
-// // Replace old response in wave with new response.
-// Waveform::realseq_t WireCell::Waveform::replace_convolve(Waveform::realseq_t wave, Waveform::realseq_t newres,
-//                                                          Waveform::realseq_t oldres, bool truncate)
-// {
-//     size_t sizes[3] = {wave.size(), newres.size(), oldres.size()};
-//     size_t n_out = sizes[0] + sizes[1] + sizes[2] - *std::min_element(sizes, sizes + 3) - 1;
-
-//     wave.resize(n_out, 0);
-//     newres.resize(n_out, 0);
-//     oldres.resize(n_out, 0);
-
-//     auto v1 = Eigen::Map<Eigen::VectorXf>(wave.data(), wave.size());
-//     auto v2 = Eigen::Map<Eigen::VectorXf>(newres.data(), newres.size());
-//     auto v3 = Eigen::Map<Eigen::VectorXf>(oldres.data(), oldres.size());
-
-//     Eigen::FFT<Waveform::real_t> trans;
-
-//     Eigen::VectorXcf s1 = trans.fwd(v1);
-//     Eigen::VectorXcf s2 = trans.fwd(v2);
-//     Eigen::VectorXcf s3 = trans.fwd(v3);
-
-//     Eigen::VectorXcf s123 = (s1.array() * s2.array() / s3.array()).matrix();
-
-//     Eigen::VectorXf vret;
-//     trans.inv(vret, s123);
-//     realseq_t ret(vret.data(), vret.data() + vret.size());
-//     if (truncate) {
-//         ret.resize(sizes[0]);
-//     }
-//     return ret;
-// }
-
 WireCell::Waveform::BinRangeList WireCell::Waveform::merge(const WireCell::Waveform::BinRangeList& brl)
 {
     WireCell::Waveform::BinRangeList tmp(brl.begin(), brl.end());

From 2c13e3cd546de2573ce3834f73ef423289477424 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Fri, 3 Dec 2021 12:13:55 -0500
Subject: [PATCH 44/46] Add construction of IDFT for tests

---
 root/test/anode_loader.h | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/root/test/anode_loader.h b/root/test/anode_loader.h
index 9b7d41351..cdf1d7b16 100644
--- a/root/test/anode_loader.h
+++ b/root/test/anode_loader.h
@@ -15,6 +15,7 @@
 #include "WireCellIface/IAnodePlane.h"
 #include "WireCellIface/IFieldResponse.h"
 #include "WireCellIface/IWireSchema.h"
+#include "WireCellIface/IDFT.h"
 
 #include <vector>
 #include <string>
@@ -59,6 +60,7 @@ std::vector<std::string> anode_loader(std::string detector)
         PluginManager& pm = PluginManager::instance();
         pm.add("WireCellSigProc");
         pm.add("WireCellGen");
+        pm.add("WireCellAux");
 
         const std::string fr_tn = "FieldResponse";
         const std::string ws_tn = "WireSchemaFile";
@@ -75,6 +77,11 @@ std::vector<std::string> anode_loader(std::string detector)
             cfg["filename"] = ws_fname;
             icfg->configure(cfg);
         }
+        {
+            // If FftwDFT grows to be an IConfigurable, this needs to
+            // change to suit.
+            Factory::lookup<IDFT>("FftwDFT"); 
+        }
 
         for (int ianode = 0; ianode < nanodes; ++ianode) {
             std::string tn = String::format("AnodePlane:%d", ianode);

From d8ddb6ee459de33552c29e359dc0341b66b2c049 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Wed, 8 Dec 2021 14:46:03 -0500
Subject: [PATCH 45/46] Remove include of removed header

My build was picking up a stale copy in the install dir
---
 root/test/test_interpolation.cxx | 1 -
 1 file changed, 1 deletion(-)

diff --git a/root/test/test_interpolation.cxx b/root/test/test_interpolation.cxx
index fad40692d..2a1e59edf 100644
--- a/root/test/test_interpolation.cxx
+++ b/root/test/test_interpolation.cxx
@@ -3,7 +3,6 @@
  *  Implementation in GaussianDiffusion for each charge depo
  */
 #include "WireCellGen/GaussianDiffusion.h"
-#include "WireCellGen/ImpactZipper.h"
 #include "WireCellGen/TrackDepos.h"
 #include "WireCellGen/BinnedDiffusion.h"
 #include "WireCellGen/TransportedDepo.h"

From 847fb83bc5c85d68eb5daf9981301e1d0e5c22b3 Mon Sep 17 00:00:00 2001
From: Brett Viren <brett.viren@gmail.com>
Date: Thu, 9 Dec 2021 11:34:49 -0500
Subject: [PATCH 46/46] Few fixes found by Haiwang in review

---
 cfg/pgrapher/common/sim/nodes.jsonnet | 2 +-
 cfg/pgrapher/common/tools.jsonnet     | 3 +--
 2 files changed, 2 insertions(+), 3 deletions(-)

diff --git a/cfg/pgrapher/common/sim/nodes.jsonnet b/cfg/pgrapher/common/sim/nodes.jsonnet
index db30192e6..15d1c641d 100644
--- a/cfg/pgrapher/common/sim/nodes.jsonnet
+++ b/cfg/pgrapher/common/sim/nodes.jsonnet
@@ -265,7 +265,7 @@ function(params, tools)
                 truncate:true, // result is extended by nsamples, tuncate clips that off
                 dft: wc.tn(tools.dft),
             }
-        }, nin=1, nout=1, uses[tools.dft]),
+        }, nin=1, nout=1, uses=[tools.dft]),
 
         local merge = g.pnode({
             type: "FrameMerger",
diff --git a/cfg/pgrapher/common/tools.jsonnet b/cfg/pgrapher/common/tools.jsonnet
index 734b93403..f47c19a8c 100644
--- a/cfg/pgrapher/common/tools.jsonnet
+++ b/cfg/pgrapher/common/tools.jsonnet
@@ -27,8 +27,7 @@ function(params)
     // The IDFT FFT implementation 
     dft : {
         type: "FftwDFT",
-    }
-
+    },
 
     // One FR per field file.
     fields : std.mapWithIndex(function (n, fname) {