From f9dc73ee518fef82ab8d122d2ca81748a3fdaf4b Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 14 Mar 2019 16:36:22 +1100
Subject: [PATCH 0001/1056] csv::options: full_xpath set to true by default

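---
Review notes (text between the three-dash line and the first diff is not part of the commit message):
- csv/impl/program_options.h, unchanged context: vm.count( "delimiter ") has a trailing space inside the key,
  while the option is registered as "delimiter,d"; as written that lookup cannot match the registered name.
  Not touched by this patch; worth a follow-up fix.
- csv/traits.h, unchanged context: a local std::string quote is built, but the visible v.apply( "quote", p.quote )
  passes p.quote instead. Possibly intentional; to be confirmed against the full file.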
 csv/applications/csv-blocks.cpp     |  1 -
 csv/applications/csv-calc.new.cpp   |  1 -
 csv/applications/csv-enumerate.cpp  |  2 --
 csv/applications/csv-select.cpp     |  1 -
 csv/applications/csv-sort.cpp       |  1 -
 csv/applications/csv-time-delay.cpp |  2 +-
 csv/applications/csv-time.cpp       |  1 -
 csv/applications/csv-units.cpp      |  1 -
 csv/applications/csv-update.cpp     |  4 ----
 csv/impl/program_options.h          |  2 --
 csv/options.cpp                     | 28 +++++++---------------------
 csv/options.h                       |  4 ++--
 csv/test/stream_test.cpp            |  1 -
 csv/traits.h                        |  2 --
 etc/bash_completion.d/comma         |  1 -
 15 files changed, 10 insertions(+), 42 deletions(-)

diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index 5e3c9b24a..94998dd44 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -413,7 +413,6 @@ int main( int ac, char** av )
         verbose = options.exists( "--verbose,-v" );
         strict = options.exists( "--strict" );
         csv = comma::csv::options( options );
-        csv.full_xpath = true;
         csv.quote.reset();
         comma::csv::options csv_out;
         if( csv.binary() ) { csv_out.format( comma::csv::format("ui") ); }
diff --git a/csv/applications/csv-calc.new.cpp b/csv/applications/csv-calc.new.cpp
index e9bf661d9..c064cc641 100644
--- a/csv/applications/csv-calc.new.cpp
+++ b/csv/applications/csv-calc.new.cpp
@@ -182,7 +182,6 @@ static std::pair< entry_t, comma::csv::options > make_input_( const comma::csv::
         else { vf.push_back( "" ); }
     }
     p.second.fields = comma::join( vf, ',' );
-    p.second.full_xpath = true;
     return p;
 }
 
diff --git a/csv/applications/csv-enumerate.cpp b/csv/applications/csv-enumerate.cpp
index a58cfc4f7..ff5d4955a 100644
--- a/csv/applications/csv-enumerate.cpp
+++ b/csv/applications/csv-enumerate.cpp
@@ -74,7 +74,6 @@ int main( int ac, char** av )
         bool has_non_empty_field = false;
         for( const auto& f: comma::split( csv.fields, ',' ) ) { if( !f.empty() ) { has_non_empty_field = true; break; } }
         if( !has_non_empty_field ) { std::cerr << "csv-enumerate: please specify at least one key in fields" << std::endl; return 1; }
-        csv.full_xpath = true;
         std::string first_line;
         comma::csv::format f;
         if( csv.binary() ) { f = csv.format(); }
@@ -131,7 +130,6 @@ int main( int ac, char** av )
         if( !output_map ) { return 0; }
         comma::csv::options output_csv;
         output_csv.delimiter = csv.delimiter;
-        output_csv.full_xpath = true;
         if( csv.binary() ) { output_csv.format( comma::csv::format::value< input_t >( default_input ) + ",2ui" ); }
         comma::csv::output_stream< map_t::value_type > ostream( std::cout, output_csv, std::make_pair( default_input, std::make_pair( 0, 0 ) ) );
         for( map_t::const_iterator it = map.begin(); it != map.end(); ++it ) { ostream.write( *it ); }
diff --git a/csv/applications/csv-select.cpp b/csv/applications/csv-select.cpp
index 0ccadd3a9..e0fb9c1ff 100644
--- a/csv/applications/csv-select.cpp
+++ b/csv/applications/csv-select.cpp
@@ -338,7 +338,6 @@ static void init_input( const comma::csv::format& format, const comma::command_l
         }
     }
     csv.fields = comma::join( fields, ',' );
-    csv.full_xpath = true;
 }
 
 int main( int ac, char** av )
diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index 18cfffbec..48d216abf 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -678,7 +678,6 @@ int main( int ac, char** av )
         options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--max,--sliding-window,--window,--unique" );
         verbose = options.exists( "--verbose,-v" );
         csv = comma::csv::options( options );
-        csv.full_xpath = true;
         return options.exists( "--first,--min,--max" ) ? handle_operations_with_ids( options ) : sort( options );
     }
     catch( std::exception& ex ) { std::cerr << "csv-sort: " << ex.what() << std::endl; }
diff --git a/csv/applications/csv-time-delay.cpp b/csv/applications/csv-time-delay.cpp
index 187838166..10e9b7910 100644
--- a/csv/applications/csv-time-delay.cpp
+++ b/csv/applications/csv-time-delay.cpp
@@ -78,7 +78,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av );
         if( options.exists( "--help" ) || options.exists( "-h" ) || ac == 1 ) { usage(); }
-        const std::vector< std::string >& v = options.unnamed( "--flush", "--binary,-b,--delimiter,-d,--fields,-f,--full-xpath,--precision,--quote" );
+        const std::vector< std::string >& v = options.unnamed( "--flush", "--binary,-b,--delimiter,-d,--fields,-f,--precision,--quote" );
         if( v.empty() ) { std::cerr << "csv-time-delay: expected time delay, got none" << std::endl; return 1; }
         double d = boost::lexical_cast< double >( v[0] );
         int sign = d < 0 ? -1 : 1;
diff --git a/csv/applications/csv-time.cpp b/csv/applications/csv-time.cpp
index 78308a2ba..7e5922825 100644
--- a/csv/applications/csv-time.cpp
+++ b/csv/applications/csv-time.cpp
@@ -451,7 +451,6 @@ static void init_input()
     }
 
     csv.fields = fields;
-    csv.full_xpath = true;
     input.values.resize( size );
 }
 
diff --git a/csv/applications/csv-units.cpp b/csv/applications/csv-units.cpp
index 8a74d546a..c2bf85f77 100644
--- a/csv/applications/csv-units.cpp
+++ b/csv/applications/csv-units.cpp
@@ -461,7 +461,6 @@ static void init_input()
         fields += init_input_field( v[i] );
     }
     csv.fields = fields;
-    csv.full_xpath = true;
     input.values.resize( input_fields.size() ); //input.values.resize( size );
 }
 
diff --git a/csv/applications/csv-update.cpp b/csv/applications/csv-update.cpp
index 98f0ff463..4778f02f2 100644
--- a/csv/applications/csv-update.cpp
+++ b/csv/applications/csv-update.cpp
@@ -256,7 +256,6 @@ static input_t::input_stream_t* make_filter_stream()
     if( filter_transport ) { return new input_t::input_stream_t( **filter_transport, csv, default_input ); }
     if( filter_line.empty() ) { return NULL; }
     comma::csv::options c;
-    c.full_xpath = true;
     c.fields = csv.fields;
     static std::istringstream iss( filter_line );
     return new input_t::input_stream_t( iss, c, default_input );
@@ -390,7 +389,6 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         verbose = options.exists( "--verbose,-v" );
         csv = comma::csv::options( options );
-        csv.full_xpath = true;
         csv.quote.reset();
         last_only = options.exists( "--last-only,--last" );
         last_block = options.exists( "--last-block" );
@@ -448,7 +446,6 @@ int main( int ac, char** av )
             std::string s = options.value< std::string >( "--empty" ) + std::string( f.count(), ',' );
             std::istringstream iss( s );
             comma::csv::options c;
-            c.full_xpath = true;
             c.fields = csv.fields;
             comma::csv::input_stream< input_t > isstream( iss, c, default_input );
             empty = ( isstream.read() )->value;
@@ -460,7 +457,6 @@ int main( int ac, char** av )
             std::string s = options.value< std::string >( "--remove,--reset,--unset,--erase" ) + std::string( f.count(), ',' );
             std::istringstream iss( s );
             comma::csv::options c;
-            c.full_xpath = true;
             c.fields = csv.fields;
             comma::csv::input_stream< input_t > isstream( iss, c, default_input );
             erase = ( isstream.read() )->value;
diff --git a/csv/impl/program_options.h b/csv/impl/program_options.h
index 7dd400ae4..9aa7bc424 100644
--- a/csv/impl/program_options.h
+++ b/csv/impl/program_options.h
@@ -55,7 +55,6 @@ inline boost::program_options::options_description program_options::description(
         ( "fields", boost::program_options::value< std::string >()->default_value( default_fields ), "csv fields" )
         ( "binary,b", boost::program_options::value< std::string >(), "csv binary format" )
         ( "delimiter,d", boost::program_options::value< char >()->default_value( ',' ), "csv delimiter" )
-        ( "full-xpath", "expect full xpaths as field names" )
         ( "precision", boost::program_options::value< unsigned int >()->default_value( 12 ), "floating point precision" )
         ( "quote", boost::program_options::value< std::string >()->default_value( "\"" ), "quote sign to quote strings (ascii only)" )
         ( "flush", "flush output stream after each record" );
@@ -69,7 +68,6 @@ inline csv::options program_options::get( const boost::program_options::variable
     if( vm.count( "delimiter ") ) { csv.delimiter = vm[ "delimiter" ].as< char >(); }
     if( vm.count( "precision" ) ) { csv.precision = vm[ "precision" ].as< unsigned int >(); }
     if( vm.count( "binary" ) ) { csv.format( vm[ "binary" ].as< std::string >() ); }
-    csv.full_xpath = vm.count( "full-xpath" ) > 0;
     csv.flush = vm.count( "flush" ) > 0;
     if( vm.count( "quote" ) )
     {
diff --git a/csv/options.cpp b/csv/options.cpp
index ce369090e..f6f494e8c 100644
--- a/csv/options.cpp
+++ b/csv/options.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #include <boost/regex.hpp>
@@ -50,17 +49,14 @@ bool options::binary() const { return static_cast< bool >( format_ ); }
 
 namespace impl {
 
-inline static void init( comma::csv::options& csv_options, const comma::command_line_options& options, const std::string& defaultFields )
+inline static void init( comma::csv::options& csv_options, const comma::command_line_options& options, const std::string& defaultFields, bool full_xpath )
 {
-    csv_options.full_xpath = options.exists( "--full-xpath" );
+    csv_options.full_xpath = full_xpath;
     csv_options.fields = options.value( "--fields,-f", defaultFields );
     if( options.exists( "--binary,-b" ) )
     {
         boost::optional< std::string > format = options.optional< std::string >( "--binary,-b" );
-        if( format )
-        {
-            csv_options.format( options.value< std::string >( "--binary,-b" ) );
-        }
+        if( format ) { csv_options.format( options.value< std::string >( "--binary,-b" ) ); }
     }
     csv_options.precision = options.value< unsigned int >( "--precision", 12 );
     csv_options.delimiter = options.exists( "--delimiter" ) ? options.value( "--delimiter", ',' ) : options.value( "-d", ',' );
@@ -79,18 +75,11 @@ inline static void init( comma::csv::options& csv_options, const comma::command_
 
 } // namespace impl {
 
-options::options() : full_xpath( false ), delimiter( ',' ), precision( 12 ), quote( '"' ), flush( false ) {}
+options::options() : full_xpath( true ), delimiter( ',' ), precision( 12 ), quote( '"' ), flush( false ) {} // full_xpath now defaults to true, i.e. field names are expected to be full xpaths
 
-options::options( int argc, char** argv, const std::string& defaultFields )
-{
-    impl::init( *this, comma::command_line_options( argc, argv ), defaultFields );
-}
+options::options( int argc, char** argv, const std::string& defaultFields, bool full_xpath ) { impl::init( *this, comma::command_line_options( argc, argv ), defaultFields, full_xpath ); } // full_xpath is taken from the caller (impl::init no longer looks for --full-xpath on the command line)
 
-options::options( const comma::command_line_options& options, const std::string& defaultFields, bool set_full_xpath )
-{
-    impl::init( *this, options, defaultFields );
-    if(set_full_xpath) { full_xpath = true; }
-}
+options::options( const comma::command_line_options& options, const std::string& defaultFields, bool full_xpath ) { impl::init( *this, options, defaultFields, full_xpath ); } // full_xpath is passed straight to impl::init, which assigns it to the member of the same name
 
 std::string options::usage( const std::string& default_fields, bool verbose )
 {
@@ -101,9 +90,6 @@ std::string options::usage( const std::string& default_fields, bool verbose )
         oss << "    --fields,-f <names>: comma-separated field names";
         if( !default_fields.empty() ) { oss << "; default: " << default_fields; }
         oss << std::endl;
-        oss << "    --full-xpath: expect full xpaths as field names; default: false" << std::endl;
-        oss << "                  default false was a wrong choice, but changing it" << std::endl;
-        oss << "                  to true now may break too many things" << std::endl;
         oss << "    --precision <precision>: floating point precision; default: 12" << std::endl;
         oss << "    --quote=[<quote_character>]: quote sign to quote strings (ascii only); default: '\"'" << std::endl;
         oss << "    --flush: if present, flush output stream after each record" << std::endl;
@@ -174,6 +160,6 @@ bool options::has_some_of_paths( const std::string& paths ) const
     return false;
 }
 
-std::string options::valueless_options() { return "--full-xpath,--flush"; }
+std::string options::valueless_options() { return "--flush"; } // --full-xpath removed: impl::init no longer reads it, so only --flush is listed here
 
 } } // namespace comma { namespace csv {
diff --git a/csv/options.h b/csv/options.h
index 01c561a2a..12bc7c863 100644
--- a/csv/options.h
+++ b/csv/options.h
@@ -45,10 +45,10 @@ class options
         options();
 
         /// constructor
-        options( int argc, char** argv, const std::string& defaultFields = "" );
+        options( int argc, char** argv, const std::string& defaultFields = "", bool full_xpath = true );
 
         /// constructor
-        options( const comma::command_line_options& options, const std::string& defaultFields = "", bool set_full_xpath = false );
+        options( const comma::command_line_options& options, const std::string& defaultFields = "", bool full_xpath = true );
 
         /// return usage to incorporate into application usage
         static std::string usage( const std::string& default_fields = "", bool verbose = true );
diff --git a/csv/test/stream_test.cpp b/csv/test/stream_test.cpp
index 2322d3cde..bef1731db 100644
--- a/csv/test/stream_test.cpp
+++ b/csv/test/stream_test.cpp
@@ -94,7 +94,6 @@ namespace comma { namespace csv { namespace stream_test {
 TEST( csv, container )
 {
 	comma::csv::options csv;
-     csv.full_xpath = true;
 	{
         std::string s( "2,3,,,6" );
         std::istringstream iss( s );
diff --git a/csv/traits.h b/csv/traits.h
index 0aeba617f..d8ed02bf2 100644
--- a/csv/traits.h
+++ b/csv/traits.h
@@ -45,7 +45,6 @@ template <> struct traits< comma::csv::options >
         v.apply( "filename", p.filename );
         v.apply( "delimiter", p.delimiter );
         v.apply( "fields", p.fields );
-        v.apply( "full-xpath", p.full_xpath );
         v.apply( "precision", p.precision );
         v.apply( "quote", p.quote ? std::string( 1, *p.quote ) : std::string() );
         v.apply( "flush", p.flush );
@@ -59,7 +58,6 @@ template <> struct traits< comma::csv::options >
         v.apply( "filename", p.filename );
         v.apply( "delimiter", p.delimiter );
         v.apply( "fields", p.fields );
-        v.apply( "full-xpath", p.full_xpath );
         v.apply( "precision", p.precision );
         std::string quote = p.quote ? std::string( 1, *p.quote ) : std::string();
         v.apply( "quote", p.quote );
diff --git a/etc/bash_completion.d/comma b/etc/bash_completion.d/comma
index 6dd9eec80..0911896ae 100644
--- a/etc/bash_completion.d/comma
+++ b/etc/bash_completion.d/comma
@@ -36,7 +36,6 @@ _comma_opts()
 --delimiter
 --fields
 --flush
---full-xpath
 --help
 --output-fields
 --precision

From 962cdad8b9319bebcca8a7adb9d561072e928637 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Mar 2019 18:28:49 +1100
Subject: [PATCH 0002/1056] comma-options-validate: a bug fixed

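---
Review notes (not part of the commit message):
- The unknown-option check in command_line_options::assert_valid now walks argv_ from index 1 instead of names_,
  and skips the argument following any option whose description has has_value set.
- NOTE(review): every argument that is not skipped must equal a described option name, so unnamed (positional)
  arguments would be reported as "unknown option" unless argv_ is filtered elsewhere; to be confirmed.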
 application/command_line_options.cpp | 22 +++++++++++++---------
 1 file changed, 13 insertions(+), 9 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 831ccef3e..f7b3e601d 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -30,19 +30,18 @@
 
 /// @author vsevolod vlaskine
 
-#include "../string/split.h"
-#include "../application/command_line_options.h"
-#include "../base/exception.h"
+#include <algorithm>
 #include <sstream>
 #include <set>
+#include <unordered_map>
 #include <boost/bind.hpp>
 #include <boost/config/warning_disable.hpp>
 #include <boost/optional.hpp>
 #include <boost/regex.hpp>
 #include <boost/spirit/include/qi.hpp>
-#include <boost/unordered_set.hpp>
-
-#include <algorithm>
+#include "../string/split.h"
+#include "../application/command_line_options.h"
+#include "../base/exception.h"
 
 namespace comma {
 
@@ -192,9 +191,14 @@ void command_line_options::assert_valid( const std::vector< description >& d, bo
 {
     for( unsigned int i = 0; i < d.size(); ++i ) { d[i].assert_valid( *this ); }
     if( !unknown_options_invalid ) { return; }
-    boost::unordered_set< std::string > s; // real quick and dirty, just to make it work
-    for( unsigned int i = 0; i < d.size(); ++i ) { for( unsigned int j = 0; j < d[i].names.size(); s.insert( d[i].names[j] ), ++j ); }
-    for( unsigned int i = 0; i < names_.size(); ++i ) { if( s.find( names_[i] ) == s.end() ) { COMMA_THROW( comma::exception, "unknown option " << names_[i] ); } }
+    std::unordered_map< std::string, bool > m; // real quick and dirty, just to make it work
+    for( unsigned int i = 0; i < d.size(); ++i ) { for( unsigned int j = 0; j < d[i].names.size(); ++j ) { m[ d[i].names[j] ] = d[i].has_value; } }
+    for( unsigned int i = 1; i < argv_.size(); ++i )
+    {
+        auto it = m.find( argv_[i] );
+        if( it == m.end() ) { COMMA_THROW( comma::exception, "unknown option " << argv_[i] ); }
+        if( it->second ) { ++i; }
+    }
 }
 
 namespace impl {

From b806621eed2e9521517ec8092c0542486f3b9880 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 18 Mar 2019 18:28:39 +1100
Subject: [PATCH 0003/1056] csv/stream: full_xpath: default set to true

---
 csv/stream.h | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/csv/stream.h b/csv/stream.h
index 815878ad1..c862c011b 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -64,7 +64,7 @@ class ascii_input_stream : public boost::noncopyable
 {
     public:
         /// constructor
-        ascii_input_stream( std::istream& is, const std::string& column_names = "", char delimiter = ',', bool full_path_as_name = false, const S& sample = S() );
+        ascii_input_stream( std::istream& is, const std::string& column_names = "", char delimiter = ',', bool full_path_as_name = true, const S& sample = S() );
 
         /// constructor from csv options
         ascii_input_stream( std::istream& is, const options& o, const S& sample = S() );
@@ -115,7 +115,7 @@ class ascii_output_stream : public boost::noncopyable
 {
     public:
         /// constructor
-        ascii_output_stream( std::ostream& os, const std::string& column_names = "", char delimiter = ',', bool full_path_as_name = false, const S& sample = S() );
+        ascii_output_stream( std::ostream& os, const std::string& column_names = "", char delimiter = ',', bool full_path_as_name = true, const S& sample = S() );
 
         /// constructor from csv options
         ascii_output_stream( std::ostream& os, const options& o, const S& sample = S() );
@@ -166,7 +166,7 @@ class binary_input_stream : public boost::noncopyable
 {
     public:
         /// constructor
-        binary_input_stream( std::istream& is, const std::string& format = "", const std::string& column_names = "", bool full_path_as_name = false, const S& sample = S() );
+        binary_input_stream( std::istream& is, const std::string& format = "", const std::string& column_names = "", bool full_path_as_name = true, const S& sample = S() );
 
         /// constructor from options
         binary_input_stream( std::istream& is, const options& o, const S& sample = S() );
@@ -215,7 +215,7 @@ class binary_output_stream : public boost::noncopyable
 {
     public:
         /// constructor
-        binary_output_stream( std::ostream& os, const std::string& format = "", const std::string& column_names = "", bool full_path_as_name = false, bool flush = false, const S& sample = S() );
+        binary_output_stream( std::ostream& os, const std::string& format = "", const std::string& column_names = "", bool full_path_as_name = true, bool flush = false, const S& sample = S() );
 
         /// constructor from options
         binary_output_stream( std::ostream& os, const options& o, const S& sample = S() );
@@ -320,7 +320,7 @@ class output_stream : public boost::noncopyable
         /// construct from csv options
         output_stream( std::ostream& os, const csv::options& o, const S& sample = S() );
 
-        output_stream( std::ostream& os, bool binary, bool full_xpath = false, bool flush = false, const S& sample = S() );
+        output_stream( std::ostream& os, bool binary, bool full_xpath = true, bool flush = false, const S& sample = S() );
 
         /// write
         void write( const S& s ) { if( ascii_ ) { ascii_->write( s ); } else { binary_->write( s ); } }

From 4290987de768582469938df16d4d917223c74d3e Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 19 Mar 2019 18:46:45 +1100
Subject: [PATCH 0004/1056] csv-play: full xpath flag set to false

---
 csv/applications/csv-play.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 3d9eb2a69..62d084c11 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -254,10 +254,11 @@ int main( int argc, char** argv )
         bool flush =  !options.exists( "--no-flush" );
         std::vector< std::string > configstrings = options.unnamed("--interactive,-i,--paused,--paused-at-start,--quiet,--flush,--no-flush","--slow,--slowdown,--speed,--resolution,--binary,--fields,--clients,--from,--to");
         if( configstrings.empty() ) { configstrings.push_back( "-;-" ); }
-        comma::csv::options csvoptions( argc, argv );
+        comma::csv::options csv( argc, argv );
+        csv.full_xpath = false;
         comma::name_value::parser name_value("filename,output", ';', '=', false );
         std::vector< comma::Multiplay::SourceConfig > sourceConfigs( configstrings.size() );
-        comma::Multiplay::SourceConfig defaultConfig( "-", options.value( "--clients", 0 ), csvoptions );
+        comma::Multiplay::SourceConfig defaultConfig( "-", options.value( "--clients", 0 ), csv );
         for( unsigned int i = 0U; i < configstrings.size(); ++i ) { sourceConfigs[i] = name_value.get< comma::Multiplay::SourceConfig >( configstrings[i], defaultConfig ); }
         boost::posix_time::ptime fromtime;
         if( !from.empty() ) { fromtime = boost::posix_time::from_iso_string( from ); }

From 1ede632bbcff9f56d5468d58af7912912e619747 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 27 Mar 2019 19:00:16 +1100
Subject: [PATCH 0005/1056] csv::options::full_xpath: dave jennings' stage 1:
 set full_xpath to false explicitly wherever appropriate

---
 csv/applications/csv-bin-cut.cpp    | 1 +
 csv/applications/csv-blocks.cpp     | 1 +
 csv/applications/csv-calc.cpp       | 1 +
 csv/applications/csv-interval.cpp   | 1 +
 csv/applications/csv-join.cpp       | 2 ++
 csv/applications/csv-repeat.cpp     | 1 +
 csv/applications/csv-shape.cpp      | 1 +
 csv/applications/csv-shuffle.cpp    | 1 +
 csv/applications/csv-thin.cpp       | 1 +
 csv/applications/csv-time-delay.cpp | 1 +
 csv/applications/csv-time.cpp       | 1 +
 csv/applications/csv-to-sql.cpp     | 1 +
 csv/applications/play/multiplay.h   | 2 +-
 csv/impl/fieldwise.cpp              | 1 +
 csv/test/format_test.cpp            | 1 +
 csv/test/options_test.cpp           | 2 ++
 16 files changed, 18 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-bin-cut.cpp b/csv/applications/csv-bin-cut.cpp
index ce87a1067..ae1309d96 100644
--- a/csv/applications/csv-bin-cut.cpp
+++ b/csv/applications/csv-bin-cut.cpp
@@ -361,6 +361,7 @@ int main( int ac, char** av )
     {
         command_line_options options( ac, av, usage );
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         std::vector< std::string > files = options.unnamed( "--help,-h,--verbose,-v,--flush,--read-all,--force-read", "--fields,-f,--output-fields,--output,-o,--binary,-b,--skip,--count" );
         if( !csv.binary() )
         {
diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index 94998dd44..fd89c8b58 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -415,6 +415,7 @@ int main( int ac, char** av )
         csv = comma::csv::options( options );
         csv.quote.reset();
         comma::csv::options csv_out;
+        csv_out.full_xpath = false;
         if( csv.binary() ) { csv_out.format( comma::csv::format("ui") ); }
         std::vector< std::string > unnamed = options.unnamed( "--help,-h,--reverse,--verbose,-v", "-.*" );
         if( unnamed.empty() ) { std::cerr << name() << "please specify operation" << std::endl; return 1; }
diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 1670f4ac2..5a5b8af5d 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -1231,6 +1231,7 @@ int main( int ac, char** av )
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
         std::vector< std::string > unnamed = options.unnamed( "", "--binary,-b,--delimiter,-d,--format,--fields,-f,--output-fields" );
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         #ifdef WIN32
         if( csv.binary() ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
diff --git a/csv/applications/csv-interval.cpp b/csv/applications/csv-interval.cpp
index 5fa81d6a2..338eaee1b 100644
--- a/csv/applications/csv-interval.cpp
+++ b/csv/applications/csv-interval.cpp
@@ -476,6 +476,7 @@ int main( int ac, char** av )
         if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
         if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         if( csv.fields.empty() ) { csv.fields = comma::join( comma::csv::names< interval_t< double > >(), ',' ); }
         if( !csv.has_field( "from,to" ) ) { COMMA_THROW( comma::exception, "expected from and to fields" ); }
         options.assert_mutually_exclusive( "--binary,--format" );
diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index 161a7df33..f3b6456b5 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -295,6 +295,7 @@ template < typename T > static std::string keys_as_string( const input< T >& i )
 {
     std::ostringstream oss;
     comma::csv::options csv;
+    csv.full_xpath = false;
     csv.fields = "keys";
     comma::csv::ascii_output_stream< input< T > > os( oss, csv, i );
     os.write( i );
@@ -430,6 +431,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
                 if( !strict ) { ++discarded; continue; }
                 std::string s;
                 comma::csv::options c;
+                c.full_xpath = false;
                 c.fields = "keys";
                 std::cerr << "csv-join: match not found for key(s): " << comma::csv::ascii< input< K > >( c, default_input ).put( *p, s ) << ", block: " << block << std::endl;
                 return 1;
diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index a6fe24e6d..460133a7e 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -154,6 +154,7 @@ int main( int ac, char** av )
         comma::io::istream is( "-", comma::io::mode::binary );
         boost::scoped_ptr< comma::csv::output_stream< output_t > > ostream;
         comma::csv::options output_csv;
+        output_csv.full_xpath = false;
         if( options.exists( "--append-fields,--append,-a" ) )
         {
             output_csv.fields = options.value< std::string >( "--append-fields,--append,-a", "" );
diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index 024b6456e..5218d03af 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -249,6 +249,7 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         std::vector< std::string > unnamed = options.unnamed( "--size,-n,--sliding-window,-w,--step,--verbose,-v", "-.*" );
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         if (csv.fields.empty()) { csv.fields="a"; }
         is_binary = csv.binary();
         if( unnamed.empty() ) { std::cerr << comma::verbose.app_name() << ": please specify operations" << std::endl; exit( 1 ); }
diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 556514099..aecceed64 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -93,6 +93,7 @@ int main( int ac, char** av )
         bool verbose = options.exists( "--verbose,-v" );
         if( options.exists( "--help,-h" ) ) { usage( verbose ); }
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         std::string f = options.value< std::string >( "--input-fields", "" );
         if( !f.empty() ) { csv.fields = f; }
         std::vector< std::string > input_fields = comma::split( csv.fields, ',' );
diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index 3ee53466f..ac6dfa137 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -189,6 +189,7 @@ int main( int ac, char** av )
         {
             if( !period ) { COMMA_THROW( comma::exception, "--fields requires --period option" ); }
             comma::csv::options csv( options );
+            csv.full_xpath = false;
             comma::csv::input_stream< timestamped > istream( std::cin, csv );
             while( std::cin.good() && !std::cin.eof() )
             {
diff --git a/csv/applications/csv-time-delay.cpp b/csv/applications/csv-time-delay.cpp
index 10e9b7910..6f80d0f30 100644
--- a/csv/applications/csv-time-delay.cpp
+++ b/csv/applications/csv-time-delay.cpp
@@ -90,6 +90,7 @@ int main( int ac, char** av )
         microseconds *= sign;
         boost::posix_time::time_duration delay = boost::posix_time::minutes( minutes ) + boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( microseconds );
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         comma::csv::input_stream< Point > istream( std::cin, csv );
         comma::csv::output_stream< Point > ostream( std::cout, csv );
         while( std::cin.good() && !std::cin.eof() )
diff --git a/csv/applications/csv-time.cpp b/csv/applications/csv-time.cpp
index 7e5922825..887db2cfb 100644
--- a/csv/applications/csv-time.cpp
+++ b/csv/applications/csv-time.cpp
@@ -476,6 +476,7 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         accept_empty = options.exists( "--empty-as-not-a-date-time,--accept-empty,-e" );
         csv = comma::csv::options( options );
+        csv.full_xpath = false;
         csv.precision = 16;
         if( csv.fields.empty() ) { csv.fields="a"; }
         init_input();
diff --git a/csv/applications/csv-to-sql.cpp b/csv/applications/csv-to-sql.cpp
index d7e8f8b59..4dc5df12b 100644
--- a/csv/applications/csv-to-sql.cpp
+++ b/csv/applications/csv-to-sql.cpp
@@ -148,6 +148,7 @@ int main( int ac, char** av )
         if( options.exists( "--help,-h" ) ) { usage( true ); }
 
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         if ( csv.binary() ) { std::cerr << app_name << ": binary not handled" << std::endl; return 1; }
 
         std::string null_value = default_null_value;
diff --git a/csv/applications/play/multiplay.h b/csv/applications/play/multiplay.h
index 6486854f1..c10c35d0f 100644
--- a/csv/applications/play/multiplay.h
+++ b/csv/applications/play/multiplay.h
@@ -63,7 +63,7 @@ class Multiplay
                 outputFileName( output ), minNumberOfClients( 0 ), options( csv ) {}
             SourceConfig( const std::string& output, std::size_t n, const csv::options& csv ) :
                 outputFileName( output ), minNumberOfClients( n ), options( csv ) {}
-            SourceConfig() {};
+            SourceConfig() { options.full_xpath = false; };
         };
 
         Multiplay( const std::vector< SourceConfig >& configs
diff --git a/csv/impl/fieldwise.cpp b/csv/impl/fieldwise.cpp
index 53f16dde9..724efa32a 100644
--- a/csv/impl/fieldwise.cpp
+++ b/csv/impl/fieldwise.cpp
@@ -42,6 +42,7 @@ fieldwise::fieldwise( const std::string& fields, char delimiter )
     , binary_( this )
 {
     csv::options o;
+    o.full_xpath = false;
     o.fields = fields;
     o.delimiter = delimiter;
     init_( o, split( fields, ',' ) );
diff --git a/csv/test/format_test.cpp b/csv/test/format_test.cpp
index 97e3929ea..28ea7f599 100644
--- a/csv/test/format_test.cpp
+++ b/csv/test/format_test.cpp
@@ -349,6 +349,7 @@ TEST( csv, unstructured )
     EXPECT_EQ( "l,l,l,l", comma::csv::impl::unstructured::guess_format( "1,2,3,4" ).string() );
     EXPECT_EQ( "l,d,t,s[1024]", comma::csv::impl::unstructured::guess_format( "1,2.1,20121212T000000,blah" ).string() );
     comma::csv::options csv;
+    csv.full_xpath = false;
     csv.fields = "a,,,b,,,c";
     csv.delimiter = ',';
     EXPECT_EQ( "l,s[1024],s[1024],s[1024],s[1024],s[1024],t", comma::csv::impl::unstructured::guess_format( "1,,,blah,,,20121212T000000" ).string() );
diff --git a/csv/test/options_test.cpp b/csv/test/options_test.cpp
index faf3f53ae..8e13dd614 100644
--- a/csv/test/options_test.cpp
+++ b/csv/test/options_test.cpp
@@ -36,6 +36,7 @@ TEST( options, has_paths )
 {
     {
         comma::csv::options csv;
+        csv.full_xpath = false;
         csv.fields = "a,b/c,d/e/f,p[0],q[0]/x,s/t/y[0],s/t/y[1]/z";
         EXPECT_TRUE( csv.has_paths( "a" ) );
         EXPECT_TRUE( csv.has_paths( "b" ) );
@@ -66,6 +67,7 @@ TEST( options, has_paths )
     }
     {
         comma::csv::options csv;
+        csv.full_xpath = false;
         csv.fields = "a,b/c,d/e/f,p[0],q[0]/x,s/t/y[0],s/t/y[1]/z";
         EXPECT_TRUE( csv.has_some_of_paths( "a" ) );
         EXPECT_TRUE( csv.has_some_of_paths( "a,blah" ) );

From 65b8a05c1d884c2e6049fd14eed185fd097b0fd1 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 29 Mar 2019 17:13:33 +1100
Subject: [PATCH 0006/1056] csv-thin: trivial brush-up

---
 csv/applications/csv-thin.cpp | 52 ++++++++++-------------------------
 1 file changed, 15 insertions(+), 37 deletions(-)

diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index ac6dfa137..61139202e 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -53,7 +53,7 @@
 
 using namespace comma;
 
-static void usage(bool detail=false)
+static void usage( bool verbose = false )
 {
     std::cerr << std::endl;
     std::cerr << "Read input data and thin them down by the given percentage;" << std::endl;
@@ -68,22 +68,13 @@ static void usage(bool detail=false)
     std::cerr << "                That is, if <rate> is 0.33, output every third packet." << std::endl;
     std::cerr << "                Default is to output each packet with a probability of <rate>." << std::endl;
     std::cerr << "    --fields=<fields>: use timestamp in fields to determine time for --period" << std::endl;
-    std::cerr << "    --fps,--frames-per-second=<d>: deprecated and removed" << std::endl;
     std::cerr << "    --period=<n>: output once every <n> seconds, ignores <rate>" << std::endl;
     std::cerr << "    --size,-s=<size>: data is packets of fixed size, otherwise data is expected" << std::endl;
     std::cerr << "                      line-wise. Alternatively use --binary" << std::endl;
     std::cerr << std::endl;
-    if( detail )
-    {
-        std::cerr << "csv options:" << std::endl;
-        std::cerr<< comma::csv::options::usage() << std::endl;
-        std::cerr << std::endl;
-    }
-    else
-    {
-        std::cerr << "use -v or --verbose to see more detail" << std::endl;
-        std::cerr << std::endl;
-    }
+    std::cerr << "csv options:" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << std::endl;
     std::cerr << "examples:" << std::endl;
     std::cerr << "    output 70% of data:          cat full.csv | csv-thin 0.7" << std::endl;
     std::cerr << "    output once every 2 seconds: cat full.csv | csv-thin --period 2" << std::endl;
@@ -122,12 +113,9 @@ static bool ignore()
     {
         static boost::posix_time::ptime next_time = boost::posix_time::microsec_clock::universal_time();
         boost::posix_time::ptime now = boost::posix_time::microsec_clock::universal_time();
-        if( now > next_time )
-        {
-            next_time += *period;
-            return false;
-        }
-        return true;
+        if( now <= next_time ) { return true; }
+        next_time += *period;
+        return false;
     }
     if( deterministic )
     {
@@ -161,15 +149,12 @@ static bool ignore()
     return do_ignore && random() > rate;
 }
 
-static bool ignore_with_timestamp( boost::posix_time::ptime timestamp )
+static bool ignore_by_timestamp( boost::posix_time::ptime timestamp )
 {
     static boost::posix_time::ptime next_time = timestamp;
-    if( timestamp > next_time )
-    {
-        next_time += *period;
-        return false;
-    }
-    return true;
+    if( timestamp <= next_time ) { return true; }
+    next_time += *period;
+    return false;
 }
 
 int main( int ac, char** av )
@@ -180,7 +165,6 @@ int main( int ac, char** av )
         bool binary = options.exists( "--size,-s,--binary,-b" );
         deterministic = options.exists( "--deterministic,-d" );
         if( options.exists( "--period" )) { period = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--period" ) * 1000000 )); }
-        if(options.exists("--fps,--frames-per-second")) { COMMA_THROW( comma::exception, "ERROR: --fps option is deprecated and removed! Please talk to software team if you are using it"); }
         #ifdef WIN32
         if( binary ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
@@ -188,24 +172,18 @@ int main( int ac, char** av )
         if( options.exists( "--fields" ))
         {
             if( !period ) { COMMA_THROW( comma::exception, "--fields requires --period option" ); }
-            comma::csv::options csv( options );
-            csv.full_xpath = false;
-            comma::csv::input_stream< timestamped > istream( std::cin, csv );
+            comma::csv::input_stream< timestamped > istream( std::cin, comma::csv::options( options ) );
             while( std::cin.good() && !std::cin.eof() )
             {
                 const timestamped* p = istream.read();
                 if( !p ) { break; }
-                if( !ignore_with_timestamp( p->timestamp ))
-                {
-                    if( istream.is_binary()) { std::cout.write( istream.binary().last(), istream.binary().size() ); }
-                    else { std::cout << comma::join( istream.ascii().last(), istream.ascii().ascii().delimiter() )<< std::endl; }
-                }
+                if( ignore_by_timestamp( p->timestamp ) ) { continue; }
+                if( istream.is_binary()) { std::cout.write( istream.binary().last(), istream.binary().size() ); }
+                else { std::cout << comma::join( istream.ascii().last(), istream.ascii().ascii().delimiter() )<< std::endl; }
             }
             return 0;
         }
-        
         std::vector< std::string > v;
-
         if( !period )
         {
             v = options.unnamed( "--deterministic,-d", "-.*" );

From 5d20df9fb190f2f8425758f6ceeed87201626e87 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 31 Mar 2019 13:17:13 +1100
Subject: [PATCH 0007/1056] updated

---
 name_value/applications/name-value-to-csv.cpp | 1 -
 python/comma/csv/applications/csv_eval.py     | 1 -
 2 files changed, 2 deletions(-)

diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index b9d678e65..92c38ed19 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -1,6 +1,5 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// Copyright (c) 2019 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index efd3ceb88..c634e2cb2 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -1,6 +1,5 @@
 # This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# Copyright (c) 2018 Vsevolod Vlaskine
 # All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without

From b1d1104ed6789369543313f4c61f9953f1cecd1d Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 Apr 2019 12:36:18 +1100
Subject: [PATCH 0008/1056] string::split(): empty_if_empty_input parameter
 added; csv-split numbers: --fields implemented

---
 csv/applications/csv-fields.cpp |  7 ++++++-
 csv/test/csv-fields/expected    | 10 ++++++++++
 csv/test/csv-fields/input       |  5 +++++
 string/split.cpp                | 12 +++++-------
 string/split.h                  | 15 ++++++++-------
 5 files changed, 34 insertions(+), 15 deletions(-)

diff --git a/csv/applications/csv-fields.cpp b/csv/applications/csv-fields.cpp
index 6cea12a13..2e4442673 100644
--- a/csv/applications/csv-fields.cpp
+++ b/csv/applications/csv-fields.cpp
@@ -53,6 +53,7 @@ static void usage( bool )
     std::cerr << "    numbers (default): convert comma-separated field names to field numbers" << std::endl;
     std::cerr << "                       e.g. for combining with cut or csv-bin-cut" << std::endl;
     std::cerr << "        --count,--size: output the total number of fields" << std::endl;
+    std::cerr << "        --fields=[<fields>]: number only fields with given names, same as csv-fields clear --except ... | csv-fields numbers" << std::endl;
     std::cerr << "        --fill: number even empty fields, e.g. try: echo ,, | csv-fields numbers --fill" << std::endl;
     std::cerr << "        --from=<value>: start field numbering from <value>; default=1" << std::endl;
     std::cerr << "                        to keep it consistent with linux cut utility" << std::endl;
@@ -177,7 +178,10 @@ int main( int ac, char** av )
         {
             int from = options.value( "--from", 1 );
             bool fill = options.exists( "--fill" );
-            std::string prefix = options.value< std::string >( "--prefix", "" );
+            options.assert_mutually_exclusive( "--fill,--fields" );
+            const auto& v = comma::split( options.value< std::string >( "--fields", "" ), ',', true );
+            std::set< std::string > fields( v.begin(), v.end() );
+            std::string prefix = options.value< std::string >( "--prefix", "" );            
             while( std::cin.good() )
             {
                 std::string line;
@@ -189,6 +193,7 @@ int main( int ac, char** av )
                 for( unsigned int i = 0; i < v.size(); ++i )
                 {
                     if( v[i].empty() && !fill ) { continue; }
+                    if( !fields.empty() && fields.find( v[i] ) == fields.end() ) { continue; }
                     std::cout << comma << prefix << ( i + from );
                     comma = ',';
                 }
diff --git a/csv/test/csv-fields/expected b/csv/test/csv-fields/expected
index 43a1a5ac8..f00b0889c 100644
--- a/csv/test/csv-fields/expected
+++ b/csv/test/csv-fields/expected
@@ -18,6 +18,16 @@ numbers/fill[2]/output="f1,f2,f3,f4"
 numbers/fill[2]/status=0
 numbers/fill[3]/output="f1,f2,f3,f4"
 numbers/fill[3]/status=0
+numbers/fields[0]/output=""
+numbers/fields[0]/status=0
+numbers/fields[1]/output="1"
+numbers/fields[1]/status=0
+numbers/fields[2]/output="2"
+numbers/fields[2]/status=0
+numbers/fields[3]/output="2"
+numbers/fields[3]/status=0
+numbers/fields[4]/output="2,3"
+numbers/fields[4]/status=0
 
 clear/keep[0]/output=",,,"
 clear/keep[0]/status=0
diff --git a/csv/test/csv-fields/input b/csv/test/csv-fields/input
index c4a92cbd8..f7b0a309f 100644
--- a/csv/test/csv-fields/input
+++ b/csv/test/csv-fields/input
@@ -8,6 +8,11 @@ numbers/fill[0]="echo ,,, | csv-fields numbers --fill"
 numbers/fill[1]="echo a,,,b | csv-fields numbers --fill"
 numbers/fill[2]="echo ,,, | csv-fields numbers --fill --prefix f"
 numbers/fill[3]="echo a,,,b | csv-fields numbers --fill --prefix f"
+numbers/fields[0]="echo ,,, | csv-fields numbers --fields=a"
+numbers/fields[1]="echo a,,, | csv-fields numbers --fields=a"
+numbers/fields[2]="echo ,a,, | csv-fields numbers --fields=a"
+numbers/fields[3]="echo ,a,b, | csv-fields numbers --fields=a"
+numbers/fields[4]="echo ,a,b, | csv-fields numbers --fields=a,b"
 
 clear/keep[0]="echo a,b,c,d | csv-fields clear --keep ,,,"
 clear/keep[1]="echo a,b,c,d | csv-fields clear --keep a"
diff --git a/string/split.cpp b/string/split.cpp
index ed00ae1ee..fd09fe931 100644
--- a/string/split.cpp
+++ b/string/split.cpp
@@ -45,26 +45,24 @@ bool string::is_one_of( char c, const char * characters )
     return false;
 }
 
-std::vector< std::string > split( const std::string & s, const char * separators )
+std::vector< std::string > split( const std::string & s, const char * separators, bool empty_if_empty_input )
 {
     std::vector< std::string > v;
+    if( empty_if_empty_input && s.empty() ) { return v; }
     const char* begin( &s[0] );
     const char* end( begin + s.length() );
     v.push_back( std::string() );
     for( const char* p = begin; p < end; ++p )
     {
-        if( string::is_one_of( *p, separators ) )
-            v.push_back( std::string() );
-        else
-            v.back() += *p;
+        if( string::is_one_of( *p, separators ) ) { v.push_back( std::string() ); } else { v.back() += *p; }
     }
     return v;
 }
 
-std::vector< std::string > split( const std::string & s, char separator )
+std::vector< std::string > split( const std::string & s, char separator, bool empty_if_empty_input )
 {
     const char separators[] = { separator, 0 };
-    return split( s, separators );
+    return split( s, separators, empty_if_empty_input );
 }
 
 std::vector< std::string > split_escaped( const std::string & s, const char * separators, const char * quotes, char escape )
diff --git a/string/split.h b/string/split.h
index bdfe94722..ec8f176e3 100644
--- a/string/split.h
+++ b/string/split.h
@@ -39,15 +39,16 @@
 namespace comma {
 
 namespace string {
-    // Used for escaping / unescaping to maybe find a character in a list of specials
-    bool is_one_of( char c, const char * characters );
-}
+    
+bool is_one_of( char c, const char* characters );
+
+} // namespace string {
 
 /// split string into tokens (a quick implementation); always contains at least one element
-std::vector< std::string > split( const std::string& s, const char* separators = " " );
+std::vector< std::string > split( const std::string& s, const char* separators = " ", bool empty_if_empty_input = false );
 
 /// split string into tokens (a quick implementation); always contains at least one element
-std::vector< std::string > split( const std::string& s, char separator );
+std::vector< std::string > split( const std::string& s, char separator, bool empty_if_empty_input = false );
 
 /// Split string into tokens; always contains at least one element;
 /// skips backslash escaped separator, handle non-nested quotes;
@@ -64,10 +65,10 @@ std::vector< std::string > split( const std::string& s, char separator );
 /// quote must be paired with an end quote, or an exception is thrown.
 /// Quotes don't nest and can not be mixed; e.g. a ' will not close a " quoted string.
 /// However "'" and '"' are perfectly legal strings of ' and "
-std::vector< std::string > split_escaped( const std::string & s, const char * separators = " ", const char * quotes = "\"\'", char escape = '\\' );
+std::vector< std::string > split_escaped( const std::string& s, const char * separators = " ", const char * quotes = "\"\'", char escape = '\\' );
 /// split string into tokens; always contains at least one element;
 /// skips backslash escaped seperator, handle boolean quotes 
-std::vector< std::string > split_escaped( const std::string & s, char separator, const char * quotes = "\"\'", char escape = '\\' );
+std::vector< std::string > split_escaped( const std::string& s, char separator, const char * quotes = "\"\'", char escape = '\\' );
 
 } // namespace comma {
 

From 85fd860827f39466e889bea3523587d1586ddfda Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 Apr 2019 12:37:51 +1100
Subject: [PATCH 0009/1056] csv-fields: test case added

---
 csv/test/csv-fields/expected | 2 ++
 csv/test/csv-fields/input    | 1 +
 2 files changed, 3 insertions(+)

diff --git a/csv/test/csv-fields/expected b/csv/test/csv-fields/expected
index f00b0889c..2dddba1ee 100644
--- a/csv/test/csv-fields/expected
+++ b/csv/test/csv-fields/expected
@@ -28,6 +28,8 @@ numbers/fields[3]/output="2"
 numbers/fields[3]/status=0
 numbers/fields[4]/output="2,3"
 numbers/fields[4]/status=0
+numbers/fields[5]/output="2,3,4"
+numbers/fields[5]/status=0
 
 clear/keep[0]/output=",,,"
 clear/keep[0]/status=0
diff --git a/csv/test/csv-fields/input b/csv/test/csv-fields/input
index f7b0a309f..9bb3ea7ca 100644
--- a/csv/test/csv-fields/input
+++ b/csv/test/csv-fields/input
@@ -13,6 +13,7 @@ numbers/fields[1]="echo a,,, | csv-fields numbers --fields=a"
 numbers/fields[2]="echo ,a,, | csv-fields numbers --fields=a"
 numbers/fields[3]="echo ,a,b, | csv-fields numbers --fields=a"
 numbers/fields[4]="echo ,a,b, | csv-fields numbers --fields=a,b"
+numbers/fields[5]="echo ,a,a,a | csv-fields numbers --fields=a"
 
 clear/keep[0]="echo a,b,c,d | csv-fields clear --keep ,,,"
 clear/keep[1]="echo a,b,c,d | csv-fields clear --keep a"

From fd96e42bb547299f11d773559e49dc35cc04f459 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 5 Apr 2019 20:26:11 +1100
Subject: [PATCH 0010/1056] packed: implementing generic big/little endian
 values to introduce 3-byte big-endian

---
 packed/big_endian.h    |  65 +-------------
 packed/detail/endian.h | 188 +++++++++++++++++++++++++++++++++++++++++
 packed/little_endian.h |  85 +++----------------
 3 files changed, 202 insertions(+), 136 deletions(-)
 create mode 100644 packed/detail/endian.h

diff --git a/packed/big_endian.h b/packed/big_endian.h
index 017a6f215..a8b662250 100644
--- a/packed/big_endian.h
+++ b/packed/big_endian.h
@@ -39,75 +39,12 @@
 #include "../base/exception.h"
 #include "../base/types.h"
 #include "../packed/field.h"
+#include "detail/endian.h"
 
 namespace comma { namespace packed {
 
 namespace detail {
 
-template < typename T > struct net_traits {};
-
-template <> struct net_traits< comma::uint16 >
-{
-    static comma::uint16 hton( comma::uint16 v ) { return htons( v ); }
-    static comma::uint16 ntoh( comma::uint16 v ) { return ntohs( v ); }
-};
-
-template <> struct net_traits< comma::int16 >
-{
-    static comma::int16 hton( comma::int16 v ) { return htons( v ); }
-    static comma::int16 ntoh( comma::int16 v ) { return ntohs( v ); }
-};
-
-template <> struct net_traits< comma::uint32 >
-{
-    static comma::uint32 hton( comma::uint32 v ) { return htonl( v ); }
-    static comma::uint32 ntoh( comma::uint32 v ) { return ntohl( v ); }
-};
-
-template <> struct net_traits< comma::int32 >
-{
-    static comma::int32 hton( comma::int32 v ) { return htonl( v ); }
-    static comma::int32 ntoh( comma::int32 v ) { return ntohl( v ); }
-};
-
-BOOST_STATIC_ASSERT( sizeof( float ) == 4 );
-BOOST_STATIC_ASSERT( sizeof( double ) == 8 );
-
-template < typename type, typename uint_of_same_size >
-inline type pack_float( type value )
-{
-    char storage[sizeof(type)];
-    uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
-    for( unsigned int i = 0; i < sizeof( type ); ++i, *p >>= 8 ) { storage[sizeof(type)-i-1] = *p & 0xff; } 
-    const type* result = reinterpret_cast< const type* >( &storage );
-    return *result;
-}
-
-template< typename type, typename uint_of_same_size >
-inline type unpack_float( type value ) 
-{
-    const char* storage = reinterpret_cast< const char* >( &value ); 
-    uint_of_same_size v = 0;
-    unsigned int shift = 0;
-    for( unsigned int i = 0; i < sizeof( type ); ++i, shift += 8 ) { v += static_cast< uint_of_same_size >( ( unsigned char )( storage[sizeof(type)-i-1] ) ) << shift; }
-    const type* result = reinterpret_cast< const type* >( &v );
-    return *result;
-}
-
-template <> struct net_traits< float >
-{
-    typedef comma::uint32 uint_of_same_size;
-    static float hton( float value ) { return pack_float< float, uint_of_same_size >( value ); }
-    static float ntoh( float value ) { return unpack_float< float, uint_of_same_size >( value ); }
-};
-
-template <> struct net_traits< double >
-{
-    typedef comma::uint64 uint_of_same_size;
-    static double hton( double value ) { return pack_float< double, uint_of_same_size >( value ); }
-    static double ntoh( double value ) { return unpack_float< double, uint_of_same_size >( value ); }
-};
-
 template < typename T >
 class big_endian : public packed::field< big_endian< T >, T, sizeof( T ) >
 {
diff --git a/packed/detail/endian.h b/packed/detail/endian.h
new file mode 100644
index 000000000..c54a3be7f
--- /dev/null
+++ b/packed/detail/endian.h
@@ -0,0 +1,188 @@
+// This file is provided in addition to snark and is not an integral
+// part of snark library.
+// Copyright (c) 2018 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+// snark is a generic and flexible library for robotics research
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <algorithm>
+#include <boost/static_assert.hpp>
+#include "../../base/exception.h"
+#include "../../base/types.h"
+#include "../field.h"
+
+namespace comma { namespace packed { namespace detail {
+
+BOOST_STATIC_ASSERT( sizeof( float ) == 4 );
+BOOST_STATIC_ASSERT( sizeof( double ) == 8 );
+
+//inline static bool host_is_little_endian_() { comma::uint32 i = 1; return reinterpret_cast< char* >( &i )[0] == 1; }
+
+//static bool host_is_little_endian = detail::host_is_little_endian_(); // super quick and dirty
+
+template < typename T > struct net_traits {};
+
+template <> struct net_traits< comma::uint16 >
+{
+    static comma::uint16 hton( comma::uint16 v ) { return htons( v ); }
+    static comma::uint16 ntoh( comma::uint16 v ) { return ntohs( v ); }
+};
+
+template <> struct net_traits< comma::int16 >
+{
+    static comma::int16 hton( comma::int16 v ) { return htons( v ); }
+    static comma::int16 ntoh( comma::int16 v ) { return ntohs( v ); }
+};
+
+template <> struct net_traits< comma::uint32 >
+{
+    static comma::uint32 hton( comma::uint32 v ) { return htonl( v ); }
+    static comma::uint32 ntoh( comma::uint32 v ) { return ntohl( v ); }
+};
+
+template <> struct net_traits< comma::int32 >
+{
+    static comma::int32 hton( comma::int32 v ) { return htonl( v ); }
+    static comma::int32 ntoh( comma::int32 v ) { return ntohl( v ); }
+};
+
+template < typename type, typename uint_of_same_size >
+inline type pack_float( type value )
+{
+    char storage[sizeof(type)];
+    uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
+    for( unsigned int i = 0; i < sizeof( type ); ++i, *p >>= 8 ) { storage[sizeof(type)-i-1] = *p & 0xff; } 
+    const type* result = reinterpret_cast< const type* >( &storage );
+    return *result;
+}
+
+template< typename type, typename uint_of_same_size >
+inline type unpack_float( type value ) 
+{
+    const char* storage = reinterpret_cast< const char* >( &value ); 
+    uint_of_same_size v = 0;
+    unsigned int shift = 0;
+    for( unsigned int i = 0; i < sizeof( type ); ++i, shift += 8 ) { v += static_cast< uint_of_same_size >( ( unsigned char )( storage[sizeof(type)-i-1] ) ) << shift; }
+    const type* result = reinterpret_cast< const type* >( &v );
+    return *result;
+}
+
+template <> struct net_traits< float >
+{
+    typedef comma::uint32 uint_of_same_size;
+    static float hton( float value ) { return pack_float< float, uint_of_same_size >( value ); }
+    static float ntoh( float value ) { return unpack_float< float, uint_of_same_size >( value ); }
+};
+
+template <> struct net_traits< double >
+{
+    typedef comma::uint64 uint_of_same_size;
+    static double hton( double value ) { return pack_float< double, uint_of_same_size >( value ); }
+    static double ntoh( double value ) { return unpack_float< double, uint_of_same_size >( value ); }
+};
+    
+template < bool Little, unsigned int Size, bool Signed, bool Floating = false > struct endian_traits { typedef typename comma::integer< Size, Signed >::type type; typedef typename comma::integer< Size, false >::type uint_of_same_size; };
+template < bool Little > struct endian_traits< Little, 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
+template < bool Little > struct endian_traits< Little, 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
+template < bool Little > struct endian_traits< Little, 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
+template < bool Little > struct endian_traits< Little, 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
+
+enum { little = 0, big = 1 };
+
+template < bool Little, unsigned int Size, bool Signed, bool Floating = false >
+struct endian : public packed::field< endian< Little, Size, Signed, Floating >, typename endian_traits< Little, Size, Signed, Floating >::type, Size >
+{
+    static const unsigned int size = Size;
+
+    typedef typename endian_traits< Little, Size, Signed, Floating >::type type;
+    
+    BOOST_STATIC_ASSERT( size <= sizeof( type ) );
+
+    typedef packed::field< endian< Little, Size, Signed, Floating >, typename endian_traits< Little, Size, Signed, Floating >::type, Size > base_type;
+
+    static type default_value() { return 0; }
+
+    typedef typename endian_traits< Little, size, Signed, Floating >::uint_of_same_size uint_of_same_size;
+    
+    static void pack( char* storage, type value )
+    {
+        uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
+        for( unsigned int i = 0; i < size; ++i, *p >>= 8 ) { storage[i] = *p & 0xff; }
+    }
+
+    static type unpack( const char* storage ) // for floats it is a real hack, since there is no standard
+    {
+        uint_of_same_size v = 0;
+        unsigned int shift = 0;
+        unsigned int i = 0;
+        for( ; i < size; ++i, shift += 8 )
+        {
+            v += static_cast< uint_of_same_size >( ( unsigned char )( storage[i] ) ) << shift;
+        }
+        if( !Floating && Signed && ( storage[ size - 1 ] & 0x80 ) )
+        {            
+            for( ; i < sizeof( type ); ++i, shift += 8 ) { v +=  static_cast< uint_of_same_size >( 0xff ) << shift; } 
+        }
+        const type* result = reinterpret_cast< const type* >( &v );
+        return *result;
+    }
+
+    const endian& operator=( const endian& rhs ) { return base_type::operator=( rhs ); }
+
+    const endian& operator=( const type& rhs ) { return base_type::operator=( rhs ); }
+};
+
+} } } // namespace comma { namespace packed { namespace detail {
diff --git a/packed/little_endian.h b/packed/little_endian.h
index 5d419f095..28694a5b5 100644
--- a/packed/little_endian.h
+++ b/packed/little_endian.h
@@ -27,102 +27,43 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author Matthew Herrmann 2007
-/// @author Vsevolod Vlaskine 2010-2011
+/// @author vsevolod vlaskine
 
-#ifndef COMMA_PACKED_LITTLEENDIAN_H_
-#define COMMA_PACKED_LITTLEENDIAN_H_
+#pragma once
 
 #include <boost/static_assert.hpp>
 #include "../base/exception.h"
 #include "../base/types.h"
 #include "field.h"
+#include "detail/endian.h"
 
 namespace comma { namespace packed {
 
-namespace detail {
-
-BOOST_STATIC_ASSERT( sizeof( float ) == 4 );
-BOOST_STATIC_ASSERT( sizeof( double ) == 8 );
-    
-template < unsigned int Size, bool Signed, bool Floating = false > struct little_endian_traits { typedef typename comma::integer< Size, Signed >::type type; typedef typename comma::integer< Size, false >::type uint_of_same_size; };
-template <> struct little_endian_traits< 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
-template <> struct little_endian_traits< 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
-template <> struct little_endian_traits< 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
-template <> struct little_endian_traits< 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
-
-template < unsigned int Size, bool Signed, bool Floating = false >
-struct little_endian : public packed::field< little_endian< Size, Signed, Floating >, typename little_endian_traits< Size, Signed, Floating >::type, Size >
-{
-    static const unsigned int size = Size;
-
-    typedef typename little_endian_traits< Size, Signed, Floating >::type type;
-    
-    BOOST_STATIC_ASSERT( size <= sizeof( type ) );
-
-    typedef packed::field< little_endian< Size, Signed, Floating >, typename little_endian_traits< Size, Signed, Floating >::type, Size > base_type;
-
-    static type default_value() { return 0; }
-
-    typedef typename little_endian_traits< size, Signed, Floating >::uint_of_same_size uint_of_same_size;
-    
-    static void pack( char* storage, type value )
-    {
-        uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
-        for( unsigned int i = 0; i < size; ++i, *p >>= 8 ) { storage[i] = *p & 0xff; }
-    }
-
-    static type unpack( const char* storage ) // for floats it is a real hack, since there is no standard
-    {
-        uint_of_same_size v = 0;
-        unsigned int shift = 0;
-        unsigned int i = 0;
-        for( ; i < size; ++i, shift += 8 )
-        {
-            v += static_cast< uint_of_same_size >( ( unsigned char )( storage[i] ) ) << shift;
-        }
-        if( !Floating && Signed && ( storage[ size - 1 ] & 0x80 ) )
-        {            
-            for( ; i < sizeof( type ); ++i, shift += 8 ) { v +=  static_cast< uint_of_same_size >( 0xff ) << shift; } 
-        }
-        const type* result = reinterpret_cast< const type* >( &v );
-        return *result;
-    }
-
-    const little_endian& operator=( const little_endian& rhs ) { return base_type::operator=( rhs ); }
-
-    const little_endian& operator=( const type& rhs ) { return base_type::operator=( rhs ); }
-};
-
-} // namespace detail {
-
 /// packed little endian 16-bit integers
-typedef detail::little_endian< 2, true > little_endian16;
-typedef detail::little_endian< 2, false > little_endian_uint16;
+typedef detail::endian< detail::little, 2, true > little_endian16;
+typedef detail::endian< detail::little, 2, false > little_endian_uint16;
 typedef little_endian16 int16;
 typedef little_endian_uint16 uint16;
 /// packed little endian 24-bit integers (strangely, there are protocols using it)
-typedef detail::little_endian< 3, true > little_endian24;
-typedef detail::little_endian< 3, false > little_endian_uint24;
+typedef detail::endian< detail::little, 3, true > little_endian24;
+typedef detail::endian< detail::little, 3, false > little_endian_uint24;
 typedef little_endian24 int24;
 typedef little_endian_uint24 uint24;
 /// packed little endian 32-bit integers
-typedef detail::little_endian< 4, true > little_endian32;
-typedef detail::little_endian< 4, false > little_endian_uint32;
+typedef detail::endian< detail::little, 4, true > little_endian32;
+typedef detail::endian< detail::little, 4, false > little_endian_uint32;
 typedef little_endian32 int32;
 typedef little_endian_uint32 uint32;
 /// packed little endian 32-bit integers
-typedef detail::little_endian< 8, true > little_endian64;
-typedef detail::little_endian< 8, false > little_endian_uint64;
+typedef detail::endian< detail::little, 8, true > little_endian64;
+typedef detail::endian< detail::little, 8, false > little_endian_uint64;
 typedef little_endian64 int64;
 typedef little_endian_uint64 uint64;
 /// packed floating point number (does it even make sense?)
-typedef detail::little_endian< 4, true, true > little_endian_float32;
-typedef detail::little_endian< 8, true, true > little_endian_float64;
+typedef detail::endian< detail::little, 4, true, true > little_endian_float32;
+typedef detail::endian< detail::little, 8, true, true > little_endian_float64;
 typedef little_endian_float32 float32;
 typedef little_endian_float64 float64;
 
 } } // namespace comma { namespace packed {
-
-#endif // #ifndef COMMA_PACKED_LITTLEENDIAN_H_

From 31dea043b906e4fb0834953e9a541115266a5f89 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 5 Apr 2019 21:27:13 +1100
Subject: [PATCH 0011/1056] packed: implementing generic big/little endian
 values to introduce 3-byte big-endian...

---
 packed/big_endian.h    |  57 ++-----------
 packed/detail/endian.h | 177 +++++++++++++++++++++++++++--------------
 packed/little_endian.h |   4 -
 3 files changed, 125 insertions(+), 113 deletions(-)

diff --git a/packed/big_endian.h b/packed/big_endian.h
index a8b662250..bc20eef82 100644
--- a/packed/big_endian.h
+++ b/packed/big_endian.h
@@ -31,74 +31,31 @@
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_BIG_ENDIAN_H_
-#define COMMA_PACKED_BIG_ENDIAN_H_
+#pragma once
 
-#include <algorithm>
-#include <boost/static_assert.hpp>
-#include "../base/exception.h"
-#include "../base/types.h"
-#include "../packed/field.h"
 #include "detail/endian.h"
 
 namespace comma { namespace packed {
 
-namespace detail {
-
-template < typename T >
-class big_endian : public packed::field< big_endian< T >, T, sizeof( T ) >
-{
-    public:
-        enum { size = sizeof( T ) };
-
-        typedef T type;
-
-        typedef packed::field< big_endian< T >, T, size > base_type;
-
-        static type default_value() { return 0; }
-
-        static void pack( char* storage, type value )
-        {
-            type v( net_traits< type >::hton( value ) );
-            ::memcpy( storage, ( void* )&v, size );
-        }
-
-        static type unpack( const char* storage )
-        {
-            type value;
-            ::memcpy( ( void* )&value, storage, size );
-            return net_traits< type >::ntoh( value );
-        }
-
-        const big_endian& operator=( const big_endian& rhs ) { return base_type::operator=( rhs ); }
-
-        const big_endian& operator=( type rhs ) { return base_type::operator=( rhs ); }
-};
-
-} // namespace detail {
-
 /// big endian 16-bit integers
-typedef detail::big_endian< comma::uint16 > big_endian_uint16;
-typedef detail::big_endian< comma::int16 > big_endian_int16;
+typedef detail::endian< detail::big, 2, false > big_endian_uint16;
+typedef detail::endian< detail::big, 2, true > big_endian_int16;
 /// aliases for big endian 16-bit integers
 typedef big_endian_uint16 net_uint16;
 typedef big_endian_int16 net_int16;
 /// big endian 32-bit integers
-typedef detail::big_endian< comma::uint32 > big_endian_uint32;
-typedef detail::big_endian< comma::int32 > big_endian_int32;
+typedef detail::endian< detail::big, 4, false > big_endian_uint32;
+typedef detail::endian< detail::big, 4, true > big_endian_int32;
 /// aliases for big endian 32-bit integers
 typedef big_endian_uint32 net_uint32;
 typedef big_endian_int32 net_int32;
 /// big endian float and double
-typedef detail::big_endian< float > big_endian_float32;
-typedef detail::big_endian< double > big_endian_float64;
+typedef detail::endian< detail::big, 4, true, true > big_endian_float32;
+typedef detail::endian< detail::big, 8, true, true > big_endian_float64;
 typedef big_endian_float64 big_endian_double;
 /// aliases for big endian float and double
 typedef big_endian_float32 net_float32;
 typedef big_endian_float64 net_float64;
 typedef net_float64 net_double;
 
-
 } } // namespace comma { namespace packed {
-
-#endif // #ifndef COMMA_PACKED_BIG_ENDIAN_H_
diff --git a/packed/detail/endian.h b/packed/detail/endian.h
index c54a3be7f..4120e92b6 100644
--- a/packed/detail/endian.h
+++ b/packed/detail/endian.h
@@ -58,6 +58,7 @@
 
 #pragma once
 
+#include <endian.h>
 #include <algorithm>
 #include <boost/static_assert.hpp>
 #include "../../base/exception.h"
@@ -69,115 +70,173 @@ namespace comma { namespace packed { namespace detail {
 BOOST_STATIC_ASSERT( sizeof( float ) == 4 );
 BOOST_STATIC_ASSERT( sizeof( double ) == 8 );
 
-//inline static bool host_is_little_endian_() { comma::uint32 i = 1; return reinterpret_cast< char* >( &i )[0] == 1; }
-
-//static bool host_is_little_endian = detail::host_is_little_endian_(); // super quick and dirty
-
 template < typename T > struct net_traits {};
 
 template <> struct net_traits< comma::uint16 >
 {
-    static comma::uint16 hton( comma::uint16 v ) { return htons( v ); }
-    static comma::uint16 ntoh( comma::uint16 v ) { return ntohs( v ); }
+    typedef comma::uint16 uint_of_same_size;
+    static comma::uint16 htobe( comma::uint16 v ) { return htobe16( v ); }
+    static comma::uint16 betoh( comma::uint16 v ) { return be16toh( v ); }
+    static comma::uint16 htole( comma::uint16 v ) { return htole16( v ); }
+    static comma::uint16 letoh( comma::uint16 v ) { return le16toh( v ); }
 };
 
 template <> struct net_traits< comma::int16 >
 {
-    static comma::int16 hton( comma::int16 v ) { return htons( v ); }
-    static comma::int16 ntoh( comma::int16 v ) { return ntohs( v ); }
+    typedef comma::uint16 uint_of_same_size;
+    static comma::int16 htobe( comma::int16 v ) { return htobe16( v ); }
+    static comma::int16 betoh( comma::int16 v ) { return be16toh( v ); }
+    static comma::int16 htole( comma::int16 v ) { return htole16( v ); }
+    static comma::int16 letoh( comma::int16 v ) { return le16toh( v ); }
 };
 
 template <> struct net_traits< comma::uint32 >
 {
-    static comma::uint32 hton( comma::uint32 v ) { return htonl( v ); }
-    static comma::uint32 ntoh( comma::uint32 v ) { return ntohl( v ); }
+    typedef comma::uint32 uint_of_same_size;
+    static comma::uint32 htobe( comma::uint32 v ) { return htobe32( v ); }
+    static comma::uint32 betoh( comma::uint32 v ) { return be32toh( v ); }
+    static comma::uint32 htole( comma::uint32 v ) { return htole32( v ); }
+    static comma::uint32 letoh( comma::uint32 v ) { return le32toh( v ); }
 };
 
 template <> struct net_traits< comma::int32 >
 {
-    static comma::int32 hton( comma::int32 v ) { return htonl( v ); }
-    static comma::int32 ntoh( comma::int32 v ) { return ntohl( v ); }
+    typedef comma::uint32 uint_of_same_size;
+    static comma::int32 htobe( comma::int32 v ) { return htobe32( v ); }
+    static comma::int32 betoh( comma::int32 v ) { return be32toh( v ); }
+    static comma::int32 htole( comma::int32 v ) { return htole32( v ); }
+    static comma::int32 letoh( comma::int32 v ) { return le32toh( v ); }
 };
 
-template < typename type, typename uint_of_same_size >
-inline type pack_float( type value )
+template <> struct net_traits< comma::uint64 >
 {
-    char storage[sizeof(type)];
-    uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
-    for( unsigned int i = 0; i < sizeof( type ); ++i, *p >>= 8 ) { storage[sizeof(type)-i-1] = *p & 0xff; } 
-    const type* result = reinterpret_cast< const type* >( &storage );
-    return *result;
-}
-
-template< typename type, typename uint_of_same_size >
-inline type unpack_float( type value ) 
+    typedef comma::uint64 uint_of_same_size;
+    static comma::uint64 htobe( comma::uint64 v ) { return htobe64( v ); }
+    static comma::uint64 betoh( comma::uint64 v ) { return be64toh( v ); }
+    static comma::uint64 htole( comma::uint64 v ) { return htole64( v ); }
+    static comma::uint64 letoh( comma::uint64 v ) { return le64toh( v ); }
+};
+
+template <> struct net_traits< comma::int64 >
 {
-    const char* storage = reinterpret_cast< const char* >( &value ); 
-    uint_of_same_size v = 0;
-    unsigned int shift = 0;
-    for( unsigned int i = 0; i < sizeof( type ); ++i, shift += 8 ) { v += static_cast< uint_of_same_size >( ( unsigned char )( storage[sizeof(type)-i-1] ) ) << shift; }
-    const type* result = reinterpret_cast< const type* >( &v );
-    return *result;
-}
+    typedef comma::uint64 uint_of_same_size;
+    static comma::int64 htobe( comma::int64 v ) { return htobe64( v ); }
+    static comma::int64 betoh( comma::int64 v ) { return be64toh( v ); }
+    static comma::int64 htole( comma::int64 v ) { return htole64( v ); }
+    static comma::int64 letoh( comma::int64 v ) { return le64toh( v ); }
+};
 
 template <> struct net_traits< float >
 {
     typedef comma::uint32 uint_of_same_size;
-    static float hton( float value ) { return pack_float< float, uint_of_same_size >( value ); }
-    static float ntoh( float value ) { return unpack_float< float, uint_of_same_size >( value ); }
+    static float htobe( float value )
+    {
+        uint_of_same_size v = net_traits< uint_of_same_size >::htobe( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
+        return *( reinterpret_cast< float* >( &v ) );
+    }
+    static float betoh( float value )
+    { 
+        uint_of_same_size v = net_traits< uint_of_same_size >::betoh( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
+        return *( reinterpret_cast< float* >( &v ) );
+    }
+    static float htole( float value )
+    { 
+        uint_of_same_size v = net_traits< uint_of_same_size >::htole( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
+        return *( reinterpret_cast< float* >( &v ) );
+    }
+    static float letoh( float value )
+    { 
+        uint_of_same_size v = net_traits< uint_of_same_size >::letoh( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
+        return *( reinterpret_cast< float* >( &v ) );
+    }
 };
 
 template <> struct net_traits< double >
 {
     typedef comma::uint64 uint_of_same_size;
-    static double hton( double value ) { return pack_float< double, uint_of_same_size >( value ); }
-    static double ntoh( double value ) { return unpack_float< double, uint_of_same_size >( value ); }
+    static double htobe( double value )
+    {
+        uint_of_same_size v = net_traits< uint_of_same_size >::htobe( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
+        return *( reinterpret_cast< double* >( &v ) );
+    }
+    static double betoh( double value )
+    { 
+        uint_of_same_size v = net_traits< uint_of_same_size >::betoh( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
+        return *( reinterpret_cast< double* >( &v ) );
+    }
+    static double htole( double value )
+    { 
+        uint_of_same_size v = net_traits< uint_of_same_size >::htole( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
+        return *( reinterpret_cast< double* >( &v ) );
+    }
+    static double letoh( double value )
+    { 
+        uint_of_same_size v = net_traits< uint_of_same_size >::letoh( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
+        return *( reinterpret_cast< double* >( &v ) );
+    }
 };
-    
-template < bool Little, unsigned int Size, bool Signed, bool Floating = false > struct endian_traits { typedef typename comma::integer< Size, Signed >::type type; typedef typename comma::integer< Size, false >::type uint_of_same_size; };
-template < bool Little > struct endian_traits< Little, 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
-template < bool Little > struct endian_traits< Little, 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
-template < bool Little > struct endian_traits< Little, 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
-template < bool Little > struct endian_traits< Little, 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
-
-enum { little = 0, big = 1 };
 
-template < bool Little, unsigned int Size, bool Signed, bool Floating = false >
-struct endian : public packed::field< endian< Little, Size, Signed, Floating >, typename endian_traits< Little, Size, Signed, Floating >::type, Size >
+enum endiannes { little = 0, big = 1 };
+    
+template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating = false > struct endian_traits { typedef typename comma::integer< Size, Signed >::type type; typedef typename comma::integer< Size, false >::type uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
+
+template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating = false >
+struct endian : public packed::field< endian< Endianness, Size, Signed, Floating >, typename endian_traits< Endianness, Size, Signed, Floating >::type, Size >
 {
     static const unsigned int size = Size;
 
-    typedef typename endian_traits< Little, Size, Signed, Floating >::type type;
+    typedef typename endian_traits< Endianness, Size, Signed, Floating >::type type;
     
     BOOST_STATIC_ASSERT( size <= sizeof( type ) );
 
-    typedef packed::field< endian< Little, Size, Signed, Floating >, typename endian_traits< Little, Size, Signed, Floating >::type, Size > base_type;
+    typedef packed::field< endian< Endianness, Size, Signed, Floating >, typename endian_traits< Endianness, Size, Signed, Floating >::type, Size > base_type;
 
     static type default_value() { return 0; }
 
-    typedef typename endian_traits< Little, size, Signed, Floating >::uint_of_same_size uint_of_same_size;
+    typedef typename endian_traits< Endianness, size, Signed, Floating >::uint_of_same_size uint_of_same_size;
     
     static void pack( char* storage, type value )
     {
-        uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
-        for( unsigned int i = 0; i < size; ++i, *p >>= 8 ) { storage[i] = *p & 0xff; }
+        if( Endianness == packed::detail::little ) // no point for further generics; should be optimized by compiler anyway
+        {
+            uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
+            for( unsigned int i = 0; i < size; ++i, *p >>= 8 ) { storage[i] = *p & 0xff; }
+        }
+        else
+        {
+            type v( net_traits< type >::htobe( value ) );
+            ::memcpy( storage, ( void* )&v, size );
+        }
     }
 
     static type unpack( const char* storage ) // for floats it is a real hack, since there is no standard
     {
-        uint_of_same_size v = 0;
-        unsigned int shift = 0;
-        unsigned int i = 0;
-        for( ; i < size; ++i, shift += 8 )
+        if( Endianness == packed::detail::little ) // no point for further generics; should be optimized by compiler anyway
         {
-            v += static_cast< uint_of_same_size >( ( unsigned char )( storage[i] ) ) << shift;
+            uint_of_same_size v = 0;
+            unsigned int shift = 0;
+            unsigned int i = 0;
+            for( ; i < size; ++i, shift += 8 )
+            {
+                v += static_cast< uint_of_same_size >( ( unsigned char )( storage[i] ) ) << shift;
+            }
+            if( !Floating && Signed && ( storage[ size - 1 ] & 0x80 ) )
+            {            
+                for( ; i < sizeof( type ); ++i, shift += 8 ) { v +=  static_cast< uint_of_same_size >( 0xff ) << shift; } 
+            }
+            const type* result = reinterpret_cast< const type* >( &v );
+            return *result;
         }
-        if( !Floating && Signed && ( storage[ size - 1 ] & 0x80 ) )
-        {            
-            for( ; i < sizeof( type ); ++i, shift += 8 ) { v +=  static_cast< uint_of_same_size >( 0xff ) << shift; } 
+        else
+        {
+            type value;
+            ::memcpy( ( void* )&value, storage, size );
+            return net_traits< type >::betoh( value );
         }
-        const type* result = reinterpret_cast< const type* >( &v );
-        return *result;
     }
 
     const endian& operator=( const endian& rhs ) { return base_type::operator=( rhs ); }
diff --git a/packed/little_endian.h b/packed/little_endian.h
index 28694a5b5..b2b9a823d 100644
--- a/packed/little_endian.h
+++ b/packed/little_endian.h
@@ -32,10 +32,6 @@
 
 #pragma once
 
-#include <boost/static_assert.hpp>
-#include "../base/exception.h"
-#include "../base/types.h"
-#include "field.h"
 #include "detail/endian.h"
 
 namespace comma { namespace packed {

From 5b03746b6f180304ee27a8b689c914d497f23dfe Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 5 Apr 2019 21:29:23 +1100
Subject: [PATCH 0012/1056] packed: cmake fixed

---
 packed/CMakeLists.txt | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/packed/CMakeLists.txt b/packed/CMakeLists.txt
index 4475ab364..648c65102 100644
--- a/packed/CMakeLists.txt
+++ b/packed/CMakeLists.txt
@@ -3,11 +3,13 @@ SET( TARGET_NAME comma_${PROJECT} )
 
 FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp )
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h )
-SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
-ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} )
+FILE( GLOB detail_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/detail/*.h )
+SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} ${detail_includes} )
+ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} ${detail_includes} )
 # target_link_libraries( ${TARGET_NAME} comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+INSTALL( FILES ${detail_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/detail )
 
 IF( comma_BUILD_TESTS )
     ADD_SUBDIRECTORY( test )

From a26109369fa48b6a59442b09d2a2c2f25790ad3b Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 5 Apr 2019 21:51:11 +1100
Subject: [PATCH 0013/1056] packed: implementing generic big/little endian
 values to introduce 3-byte big-endian...

---
 packed/detail/endian.h | 109 ++++++-----------------------------------
 1 file changed, 15 insertions(+), 94 deletions(-)

diff --git a/packed/detail/endian.h b/packed/detail/endian.h
index 4120e92b6..53250411e 100644
--- a/packed/detail/endian.h
+++ b/packed/detail/endian.h
@@ -70,120 +70,40 @@ namespace comma { namespace packed { namespace detail {
 BOOST_STATIC_ASSERT( sizeof( float ) == 4 );
 BOOST_STATIC_ASSERT( sizeof( double ) == 8 );
 
+enum endiannes { little = 0, big = 1 };
+    
+template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating = false > struct endian_traits { typedef typename comma::integer< Size, Signed >::type type; typedef typename comma::integer< Size, false >::type uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
+
 template < typename T > struct net_traits {};
 
 template <> struct net_traits< comma::uint16 >
 {
-    typedef comma::uint16 uint_of_same_size;
     static comma::uint16 htobe( comma::uint16 v ) { return htobe16( v ); }
     static comma::uint16 betoh( comma::uint16 v ) { return be16toh( v ); }
     static comma::uint16 htole( comma::uint16 v ) { return htole16( v ); }
     static comma::uint16 letoh( comma::uint16 v ) { return le16toh( v ); }
 };
 
-template <> struct net_traits< comma::int16 >
-{
-    typedef comma::uint16 uint_of_same_size;
-    static comma::int16 htobe( comma::int16 v ) { return htobe16( v ); }
-    static comma::int16 betoh( comma::int16 v ) { return be16toh( v ); }
-    static comma::int16 htole( comma::int16 v ) { return htole16( v ); }
-    static comma::int16 letoh( comma::int16 v ) { return le16toh( v ); }
-};
-
 template <> struct net_traits< comma::uint32 >
 {
-    typedef comma::uint32 uint_of_same_size;
     static comma::uint32 htobe( comma::uint32 v ) { return htobe32( v ); }
     static comma::uint32 betoh( comma::uint32 v ) { return be32toh( v ); }
     static comma::uint32 htole( comma::uint32 v ) { return htole32( v ); }
     static comma::uint32 letoh( comma::uint32 v ) { return le32toh( v ); }
 };
 
-template <> struct net_traits< comma::int32 >
-{
-    typedef comma::uint32 uint_of_same_size;
-    static comma::int32 htobe( comma::int32 v ) { return htobe32( v ); }
-    static comma::int32 betoh( comma::int32 v ) { return be32toh( v ); }
-    static comma::int32 htole( comma::int32 v ) { return htole32( v ); }
-    static comma::int32 letoh( comma::int32 v ) { return le32toh( v ); }
-};
-
 template <> struct net_traits< comma::uint64 >
 {
-    typedef comma::uint64 uint_of_same_size;
     static comma::uint64 htobe( comma::uint64 v ) { return htobe64( v ); }
     static comma::uint64 betoh( comma::uint64 v ) { return be64toh( v ); }
     static comma::uint64 htole( comma::uint64 v ) { return htole64( v ); }
     static comma::uint64 letoh( comma::uint64 v ) { return le64toh( v ); }
 };
 
-template <> struct net_traits< comma::int64 >
-{
-    typedef comma::uint64 uint_of_same_size;
-    static comma::int64 htobe( comma::int64 v ) { return htobe64( v ); }
-    static comma::int64 betoh( comma::int64 v ) { return be64toh( v ); }
-    static comma::int64 htole( comma::int64 v ) { return htole64( v ); }
-    static comma::int64 letoh( comma::int64 v ) { return le64toh( v ); }
-};
-
-template <> struct net_traits< float >
-{
-    typedef comma::uint32 uint_of_same_size;
-    static float htobe( float value )
-    {
-        uint_of_same_size v = net_traits< uint_of_same_size >::htobe( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
-        return *( reinterpret_cast< float* >( &v ) );
-    }
-    static float betoh( float value )
-    { 
-        uint_of_same_size v = net_traits< uint_of_same_size >::betoh( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
-        return *( reinterpret_cast< float* >( &v ) );
-    }
-    static float htole( float value )
-    { 
-        uint_of_same_size v = net_traits< uint_of_same_size >::htole( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
-        return *( reinterpret_cast< float* >( &v ) );
-    }
-    static float letoh( float value )
-    { 
-        uint_of_same_size v = net_traits< uint_of_same_size >::letoh( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
-        return *( reinterpret_cast< float* >( &v ) );
-    }
-};
-
-template <> struct net_traits< double >
-{
-    typedef comma::uint64 uint_of_same_size;
-    static double htobe( double value )
-    {
-        uint_of_same_size v = net_traits< uint_of_same_size >::htobe( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
-        return *( reinterpret_cast< double* >( &v ) );
-    }
-    static double betoh( double value )
-    { 
-        uint_of_same_size v = net_traits< uint_of_same_size >::betoh( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
-        return *( reinterpret_cast< double* >( &v ) );
-    }
-    static double htole( double value )
-    { 
-        uint_of_same_size v = net_traits< uint_of_same_size >::htole( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
-        return *( reinterpret_cast< double* >( &v ) );
-    }
-    static double letoh( double value )
-    { 
-        uint_of_same_size v = net_traits< uint_of_same_size >::letoh( *( reinterpret_cast< uint_of_same_size* >( &value ) ) );
-        return *( reinterpret_cast< double* >( &v ) );
-    }
-};
-
-enum endiannes { little = 0, big = 1 };
-    
-template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating = false > struct endian_traits { typedef typename comma::integer< Size, Signed >::type type; typedef typename comma::integer< Size, false >::type uint_of_same_size; };
-template < endiannes Endianness > struct endian_traits< Endianness, 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
-template < endiannes Endianness > struct endian_traits< Endianness, 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
-template < endiannes Endianness > struct endian_traits< Endianness, 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
-template < endiannes Endianness > struct endian_traits< Endianness, 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
-
 template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating = false >
 struct endian : public packed::field< endian< Endianness, Size, Signed, Floating >, typename endian_traits< Endianness, Size, Signed, Floating >::type, Size >
 {
@@ -201,6 +121,7 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
     
     static void pack( char* storage, type value )
     {
+        uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
         if( Endianness == packed::detail::little ) // no point for further generics; should be optimized by compiler anyway
         {
             uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
@@ -208,16 +129,16 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
         }
         else
         {
-            type v( net_traits< type >::htobe( value ) );
-            ::memcpy( storage, ( void* )&v, size );
+            uint_of_same_size i = net_traits< uint_of_same_size >::htobe( *p );
+            ::memcpy( storage, ( void* )&i, size );
         }
     }
 
     static type unpack( const char* storage ) // for floats it is a real hack, since there is no standard
     {
+        uint_of_same_size v = 0;
         if( Endianness == packed::detail::little ) // no point for further generics; should be optimized by compiler anyway
         {
-            uint_of_same_size v = 0;
             unsigned int shift = 0;
             unsigned int i = 0;
             for( ; i < size; ++i, shift += 8 )
@@ -233,9 +154,9 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
         }
         else
         {
-            type value;
-            ::memcpy( ( void* )&value, storage, size );
-            return net_traits< type >::betoh( value );
+            ::memcpy( ( void* )&v, storage, size );
+            v = net_traits< uint_of_same_size >::betoh( v );
+            return *( reinterpret_cast< type* >( &v ) );
         }
     }
 

From e77037cc82ddce34a56c75f86d9d215e48297f1e Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 5 Apr 2019 23:38:38 +1100
Subject: [PATCH 0014/1056] packed/traits.h removed

---
 packed/traits.h | 49 -------------------------------------------------
 1 file changed, 49 deletions(-)
 delete mode 100644 packed/traits.h

diff --git a/packed/traits.h b/packed/traits.h
deleted file mode 100644
index e16a5e22e..000000000
--- a/packed/traits.h
+++ /dev/null
@@ -1,49 +0,0 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-#pragma once
-
-#include "big_endian.h"
-#include <boost/array.hpp>
-#include "../visiting/traits.h"
-
-namespace comma { namespace visiting {
-
-template < typename T, std::size_t N > struct traits< boost::array<comma::packed::detail::big_endian<T>, N> >
-{
-    template< typename K, typename V > static void visit( const K& k, const boost::array<comma::packed::detail::big_endian<T>, N>& t, V& v )
-    {
-        for( std::size_t i = 0; i < t.size(); i++ ) { v.apply( i, t[i]() ); }
-    }
-};
-
-
-} } //namespace comma { namespace visiting {
-
-

From a0c4b66b333d4ca060c1d1b66cd8a2ce9462030c Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 6 Apr 2019 13:34:06 +1100
Subject: [PATCH 0015/1056] packed: endian stuff further refactored in
 preparation to handle signed 24-bit big endian numbers

---
 packed/detail/endian.h | 61 ++++++++++++++++++++++--------------------
 1 file changed, 32 insertions(+), 29 deletions(-)

diff --git a/packed/detail/endian.h b/packed/detail/endian.h
index 53250411e..6fb850558 100644
--- a/packed/detail/endian.h
+++ b/packed/detail/endian.h
@@ -78,7 +78,7 @@ template < endiannes Endianness > struct endian_traits< Endianness, 3, false > {
 template < endiannes Endianness > struct endian_traits< Endianness, 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
 template < endiannes Endianness > struct endian_traits< Endianness, 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
 
-template < typename T > struct net_traits {};
+template < typename T > struct net_traits;
 
 template <> struct net_traits< comma::uint16 >
 {
@@ -104,6 +104,23 @@ template <> struct net_traits< comma::uint64 >
     static comma::uint64 letoh( comma::uint64 v ) { return le64toh( v ); }
 };
 
+template < endiannes Endianness > struct convert;
+
+template <> struct convert< packed::detail::little >
+{
+    template < typename T > static T from_host( T t ) { return net_traits< T >::htole( t ); }
+    template < typename T > static T to_host( T t ) { return net_traits< T >::letoh( t ); }
+};
+
+template <> struct convert< packed::detail::big >
+{
+    template < typename T > static T from_host( T t ) { return net_traits< T >::htobe( t ); }
+    template < typename T > static T to_host( T t ) { return net_traits< T >::betoh( t ); }
+};
+
+template < unsigned int Size > struct ff { enum { value = ( static_cast< unsigned long long >( ff< Size - 1 >::value ) << 8 ) + 0xff }; }; // Size bytes of 0xff; parenthesised because + binds tighter than <<, widened so that masks of 4+ bytes do not overflow int
+template <> struct ff< 1 > { enum { value = 0xff }; }; // recursion terminator: a single 0xff byte
+
 template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating = false >
 struct endian : public packed::field< endian< Endianness, Size, Signed, Floating >, typename endian_traits< Endianness, Size, Signed, Floating >::type, Size >
 {
@@ -112,6 +129,8 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
     typedef typename endian_traits< Endianness, Size, Signed, Floating >::type type;
     
     BOOST_STATIC_ASSERT( size <= sizeof( type ) );
+    
+    BOOST_STATIC_ASSERT( Signed || !Floating ); // unsigned floats don't make sense
 
     typedef packed::field< endian< Endianness, Size, Signed, Floating >, typename endian_traits< Endianness, Size, Signed, Floating >::type, Size > base_type;
 
@@ -122,42 +141,26 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
     static void pack( char* storage, type value )
     {
         uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
-        if( Endianness == packed::detail::little ) // no point for further generics; should be optimized by compiler anyway
+        *p = convert< Endianness >::from_host( *p );
+        if( sizeof( uint_of_same_size ) == size ) // no point for further generics; should be optimized by compiler anyway
         {
-            uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
-            for( unsigned int i = 0; i < size; ++i, *p >>= 8 ) { storage[i] = *p & 0xff; }
+            ::memcpy( storage, ( void* )p, size );
         }
         else
         {
-            uint_of_same_size i = net_traits< uint_of_same_size >::htobe( *p );
-            ::memcpy( storage, ( void* )&i, size );
+            // todo! 24-bit big endian!!!
+            // todo: test signed big endian
+            
+            for( unsigned int i = 0; i < size; ++i, *p >>= 8 ) { storage[i] = *p & 0xff; }
         }
     }
-
+    
     static type unpack( const char* storage ) // for floats it is a real hack, since there is no standard
     {
-        uint_of_same_size v = 0;
-        if( Endianness == packed::detail::little ) // no point for further generics; should be optimized by compiler anyway
-        {
-            unsigned int shift = 0;
-            unsigned int i = 0;
-            for( ; i < size; ++i, shift += 8 )
-            {
-                v += static_cast< uint_of_same_size >( ( unsigned char )( storage[i] ) ) << shift;
-            }
-            if( !Floating && Signed && ( storage[ size - 1 ] & 0x80 ) )
-            {            
-                for( ; i < sizeof( type ); ++i, shift += 8 ) { v +=  static_cast< uint_of_same_size >( 0xff ) << shift; } 
-            }
-            const type* result = reinterpret_cast< const type* >( &v );
-            return *result;
-        }
-        else
-        {
-            ::memcpy( ( void* )&v, storage, size );
-            v = net_traits< uint_of_same_size >::betoh( v );
-            return *( reinterpret_cast< type* >( &v ) );
-        }
+        uint_of_same_size i = ( !Floating && Signed && ( storage[ Endianness == little ? size - 1 : 0 ] & 0x80 ) ) ? -1 : 0; // start from all ones if the sign bit of the most significant packed byte is set, so bytes not covered by storage sign-extend
+        ::memcpy( reinterpret_cast< char* >( &i ) + ( Endianness == little ? 0 : sizeof( uint_of_same_size ) - size ), storage, size ); // char*, not void*: arithmetic on void* is a GNU extension, ill-formed in ISO C++; big endian fills the trailing bytes of i
+        i = convert< Endianness >::to_host( i ); // convert from the packed byte order to host byte order
+        return *( reinterpret_cast< type* >( &i ) ); // reinterpret the bits as the value type (integer or float)
     }
 
     const endian& operator=( const endian& rhs ) { return base_type::operator=( rhs ); }

From 155e0f1f1431e62d4b05e2d87108aff9ce2acef5 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 6 Apr 2019 19:44:57 +1100
Subject: [PATCH 0016/1056] packed: 24-bit big endian implemented; basic unit
 test added

---
 packed/big_endian.h         |  28 ++++++--
 packed/detail/endian.h      |  12 +---
 packed/little_endian.h      |  21 ++++--
 packed/test/packed_test.cpp | 127 ++++++++++++++++++------------------
 4 files changed, 103 insertions(+), 85 deletions(-)

diff --git a/packed/big_endian.h b/packed/big_endian.h
index bc20eef82..230eafb04 100644
--- a/packed/big_endian.h
+++ b/packed/big_endian.h
@@ -37,25 +37,41 @@
 
 namespace comma { namespace packed {
 
-/// big endian 16-bit integers
 typedef detail::endian< detail::big, 2, false > big_endian_uint16;
 typedef detail::endian< detail::big, 2, true > big_endian_int16;
-/// aliases for big endian 16-bit integers
 typedef big_endian_uint16 net_uint16;
 typedef big_endian_int16 net_int16;
-/// big endian 32-bit integers
+typedef detail::endian< detail::big, 3, false > big_endian_uint24;
+typedef detail::endian< detail::big, 3, true > big_endian_int24;
+typedef big_endian_uint24 net_uint24;
+typedef big_endian_int24 net_int24;
 typedef detail::endian< detail::big, 4, false > big_endian_uint32;
 typedef detail::endian< detail::big, 4, true > big_endian_int32;
-/// aliases for big endian 32-bit integers
 typedef big_endian_uint32 net_uint32;
 typedef big_endian_int32 net_int32;
-/// big endian float and double
 typedef detail::endian< detail::big, 4, true, true > big_endian_float32;
 typedef detail::endian< detail::big, 8, true, true > big_endian_float64;
+typedef big_endian_float32 big_endian_float;
 typedef big_endian_float64 big_endian_double;
-/// aliases for big endian float and double
 typedef big_endian_float32 net_float32;
 typedef big_endian_float64 net_float64;
+typedef net_float32 net_float;
 typedef net_float64 net_double;
 
+// all types above deprecated; use namespacing below
+namespace big_endian { // i love namespacing
+
+typedef detail::endian< detail::big, 2, false > uint16;
+typedef detail::endian< detail::big, 2, true > int16;
+typedef detail::endian< detail::big, 3, false > uint24;
+typedef detail::endian< detail::big, 3, true > int24;
+typedef detail::endian< detail::big, 4, false > uint32;
+typedef detail::endian< detail::big, 4, true > int32;
+typedef detail::endian< detail::big, 8, false > uint64;
+typedef detail::endian< detail::big, 8, true > int64;
+typedef detail::endian< detail::big, 4, true, true > float32;
+typedef detail::endian< detail::big, 8, true, true > float64;
+
+} // namespace big_endian {
+
 } } // namespace comma { namespace packed {
diff --git a/packed/detail/endian.h b/packed/detail/endian.h
index 6fb850558..80b1b9b75 100644
--- a/packed/detail/endian.h
+++ b/packed/detail/endian.h
@@ -142,17 +142,7 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
     {
         uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
         *p = convert< Endianness >::from_host( *p );
-        if( sizeof( uint_of_same_size ) == size ) // no point for further generics; should be optimized by compiler anyway
-        {
-            ::memcpy( storage, ( void* )p, size );
-        }
-        else
-        {
-            // todo! 24-bit big endian!!!
-            // todo: test signed big endian
-            
-            for( unsigned int i = 0; i < size; ++i, *p >>= 8 ) { storage[i] = *p & 0xff; }
-        }
+        ::memcpy( storage, reinterpret_cast< const char* >( p ) + ( Endianness == little ? 0 : sizeof( uint_of_same_size ) - size ), size ); // char*, not void*: arithmetic on void* is a GNU extension; for big endian copy the trailing size bytes of the converted value
     }
     
     static type unpack( const char* storage ) // for floats it is a real hack, since there is no standard
diff --git a/packed/little_endian.h b/packed/little_endian.h
index b2b9a823d..7f8b16d70 100644
--- a/packed/little_endian.h
+++ b/packed/little_endian.h
@@ -36,30 +36,41 @@
 
 namespace comma { namespace packed {
 
-/// packed little endian 16-bit integers
 typedef detail::endian< detail::little, 2, true > little_endian16;
 typedef detail::endian< detail::little, 2, false > little_endian_uint16;
 typedef little_endian16 int16;
 typedef little_endian_uint16 uint16;
-/// packed little endian 24-bit integers (strangely, there are protocols using it)
 typedef detail::endian< detail::little, 3, true > little_endian24;
 typedef detail::endian< detail::little, 3, false > little_endian_uint24;
 typedef little_endian24 int24;
 typedef little_endian_uint24 uint24;
-/// packed little endian 32-bit integers
 typedef detail::endian< detail::little, 4, true > little_endian32;
 typedef detail::endian< detail::little, 4, false > little_endian_uint32;
 typedef little_endian32 int32;
 typedef little_endian_uint32 uint32;
-/// packed little endian 32-bit integers
 typedef detail::endian< detail::little, 8, true > little_endian64;
 typedef detail::endian< detail::little, 8, false > little_endian_uint64;
 typedef little_endian64 int64;
 typedef little_endian_uint64 uint64;
-/// packed floating point number (does it even make sense?)
 typedef detail::endian< detail::little, 4, true, true > little_endian_float32;
 typedef detail::endian< detail::little, 8, true, true > little_endian_float64;
 typedef little_endian_float32 float32;
 typedef little_endian_float64 float64;
 
+// all types above deprecated; use namespacing below
+namespace little_endian { // i love namespacing
+
+typedef detail::endian< detail::little, 2, false > uint16;
+typedef detail::endian< detail::little, 2, true > int16;
+typedef detail::endian< detail::little, 3, false > uint24;
+typedef detail::endian< detail::little, 3, true > int24;
+typedef detail::endian< detail::little, 4, false > uint32;
+typedef detail::endian< detail::little, 4, true > int32;
+typedef detail::endian< detail::little, 8, false > uint64;
+typedef detail::endian< detail::little, 8, true > int64;
+typedef detail::endian< detail::little, 4, true, true > float32;
+typedef detail::endian< detail::little, 8, true, true > float64;
+
+} // namespace little_endian {
+
 } } // namespace comma { namespace packed {
diff --git a/packed/test/packed_test.cpp b/packed/test/packed_test.cpp
index e7b891b9d..5ee680ff6 100644
--- a/packed/test/packed_test.cpp
+++ b/packed/test/packed_test.cpp
@@ -47,8 +47,8 @@ struct test_packed_struct_t : public comma::packed::packed_struct< test_packed_s
 {
     comma::packed::string< 4 > hello;
     comma::packed::string< 5 > world;
-    comma::packed::net_uint16 int16;
-    comma::packed::net_uint32 int32;
+    comma::packed::big_endian::uint16 int16;
+    comma::packed::big_endian::uint32 int32;
     comma::packed::byte byte;
 };
 
@@ -75,8 +75,7 @@ TEST( packed_struct, test_packed_struct )
     EXPECT_EQ( s.byte(), 3 );
 }
 
-template < typename T >
-void test_packed_int( comma::int64 value )
+template < typename T > static void test_packed_int( comma::int64 value )
 {
     T t;
     EXPECT_EQ( true, t == 0 );
@@ -85,8 +84,7 @@ void test_packed_int( comma::int64 value )
     EXPECT_EQ( value, t() );
 }
 
-template < typename T >
-void test_packed_uint( comma::uint64 value )
+template < typename T > static void test_packed_uint( comma::uint64 value )
 {
     T t;
     EXPECT_EQ( true, t == 0 );
@@ -95,42 +93,45 @@ void test_packed_uint( comma::uint64 value )
     EXPECT_EQ( value, t() );
 }
 
-
 TEST( test_packed_struct_test, test_little_endian )
 {
-    test_packed_uint< comma::packed::uint16 >( 1231 );
-    test_packed_uint< comma::packed::uint16 >( 65535 );
-    test_packed_uint< comma::packed::uint24 >( 1232 );
-    test_packed_uint< comma::packed::uint24 >( 16777215 );
-    test_packed_uint< comma::packed::uint32 >( 1233 );
-    test_packed_uint< comma::packed::uint32 >( 4294967295 );
-    test_packed_uint< comma::packed::uint64 >( 4321 );
-    test_packed_uint< comma::packed::uint64 >( comma::uint64( std::numeric_limits< comma::uint64 >::max() ) );
-    test_packed_uint< comma::packed::uint64 >( comma::uint64( 0x1BCDEF1213141500ULL ) );
-
-    test_packed_int< comma::packed::int16 >( 1234 );
-    test_packed_int< comma::packed::int24 >( 1235 );
-    test_packed_int< comma::packed::int24 >( 8388607 );
-    test_packed_int< comma::packed::int32 >( 8388607 );
-    test_packed_int< comma::packed::int32 >( 1236 );
-    test_packed_int< comma::packed::int16 >( -1231 );
-    test_packed_int< comma::packed::int24 >( -1232 );
-    test_packed_int< comma::packed::int24 >( -8388608 );
-    test_packed_int< comma::packed::int32 >( -1233 );
-    test_packed_int< comma::packed::int64 >( -4321 );
-    test_packed_int< comma::packed::int64 >( comma::int64( std::numeric_limits< comma::int64 >::min() ) );
+    test_packed_uint< comma::packed::little_endian::uint16 >( 1231 );
+    test_packed_uint< comma::packed::little_endian::uint16 >( 65535 );
+    test_packed_uint< comma::packed::little_endian::uint24 >( 1232 );
+    test_packed_uint< comma::packed::little_endian::uint24 >( 16777215 );
+    test_packed_uint< comma::packed::little_endian::uint32 >( 1233 );
+    test_packed_uint< comma::packed::little_endian::uint32 >( 4294967295 );
+    test_packed_uint< comma::packed::little_endian::uint64 >( 4321 );
+    test_packed_uint< comma::packed::little_endian::uint64 >( comma::uint64( std::numeric_limits< comma::uint64 >::max() ) );
+    test_packed_uint< comma::packed::little_endian::uint64 >( comma::uint64( 0x1BCDEF1213141500ULL ) );
+
+    test_packed_int< comma::packed::little_endian::int16 >( 1234 );
+    test_packed_int< comma::packed::little_endian::int24 >( 1235 );
+    test_packed_int< comma::packed::little_endian::int24 >( 8388607 );
+    test_packed_int< comma::packed::little_endian::int32 >( 8388607 );
+    test_packed_int< comma::packed::little_endian::int32 >( 1236 );
+    test_packed_int< comma::packed::little_endian::int16 >( -1231 );
+    test_packed_int< comma::packed::little_endian::int24 >( -1232 );
+    test_packed_int< comma::packed::little_endian::int24 >( -8388608 );
+    test_packed_int< comma::packed::little_endian::int32 >( -1233 );
+    test_packed_int< comma::packed::little_endian::int64 >( -4321 );
+    test_packed_int< comma::packed::little_endian::int64 >( comma::int64( std::numeric_limits< comma::int64 >::min() ) );
 }
 
 TEST( test_packed_struct_test, test_big_endian )
 {
-    test_packed_int< comma::packed::net_uint16 >( 1234 );
-    test_packed_int< comma::packed::net_uint16 >( 65535 );
-    test_packed_int< comma::packed::net_uint32 >( 1234 );
-    test_packed_int< comma::packed::net_uint32 >( 4294967295 );
-    test_packed_int< comma::packed::net_int16 >( 1234 );
-    test_packed_int< comma::packed::net_int32 >( 1234 );
-    test_packed_int< comma::packed::net_int16 >( -1234 );
-    test_packed_int< comma::packed::net_int32 >( -1234 );
+    test_packed_int< comma::packed::big_endian::uint16 >( 1234 );
+    test_packed_int< comma::packed::big_endian::uint16 >( 65535 );
+    test_packed_uint< comma::packed::big_endian::uint24 >( 1232 );
+    test_packed_uint< comma::packed::big_endian::uint24 >( 16777215 );
+    test_packed_int< comma::packed::big_endian::uint32 >( 1234 );
+    test_packed_int< comma::packed::big_endian::uint32 >( 4294967295 );
+    test_packed_int< comma::packed::big_endian::int16 >( 1234 );
+    test_packed_int< comma::packed::big_endian::int32 >( 1234 );
+    test_packed_int< comma::packed::big_endian::int16 >( -1234 );
+    test_packed_int< comma::packed::big_endian::int32 >( -1234 );
+    test_packed_int< comma::packed::big_endian::int24 >( -1232 );
+    test_packed_int< comma::packed::big_endian::int24 >( -8388608 );
 }
 
 template< typename T >
@@ -151,7 +152,7 @@ static void test_int64_byte_order( comma::int64 value, char byte0, char byte1, c
 TEST( test_packed_struct_test, test_int64_byte_order )
 {
     comma::int64 i = 0xFBCDEF1213141500LL;
-    test_int64_byte_order< comma::packed::uint64 >( i, 0x00, 0x15, 0x14, 0x13, 0x12, 0xEF, 0xCD, 0xFB );
+    test_int64_byte_order< comma::packed::little_endian::uint64 >( i, 0x00, 0x15, 0x14, 0x13, 0x12, 0xEF, 0xCD, 0xFB );
 }
 
 template< typename T >
@@ -172,12 +173,12 @@ static void test_uint64_byte_order( comma::uint64 value, char byte0, char byte1,
 TEST( test_packed_struct_test, test_uint64_byte_order )
 {
     comma::uint64 i = 0xABCDEF1213141500ULL;
-    test_uint64_byte_order< comma::packed::uint64 >( i, 0x00, 0x15, 0x14, 0x13, 0x12, 0xEF, 0xCD, 0xAB );
+    test_uint64_byte_order< comma::packed::little_endian::uint64 >( i, 0x00, 0x15, 0x14, 0x13, 0x12, 0xEF, 0xCD, 0xAB );
 }
 
 static void test_int24_byte_order( int value, char byte0, char byte1, char byte2 )
 {
-    comma::packed::int24 a;
+    comma::packed::little_endian::int24 a;
     a = value;
     EXPECT_EQ( ( 0xff & a.data()[0] ), ( 0xff & byte0 ) );
     EXPECT_EQ( ( 0xff & a.data()[1] ), ( 0xff & byte1 ) );
@@ -201,10 +202,10 @@ TEST( test_packed_struct_test, test_int24_byte_order )
 
 struct test_packed_struct_floats_t : public comma::packed::packed_struct< test_packed_struct_floats_t, 24 >
 {
-    comma::packed::float32 f32;
-    comma::packed::float64 f64;
-    comma::packed::net_float32 nf32;
-    comma::packed::net_float64 nf64;
+    comma::packed::little_endian::float32 f32;
+    comma::packed::little_endian::float64 f64;
+    comma::packed::big_endian::float32 nf32;
+    comma::packed::big_endian::float64 nf64;
 };
 
 TEST( packed_struct, test_packed_struct_floats )
@@ -218,7 +219,7 @@ TEST( packed_struct, test_packed_struct_floats )
     EXPECT_DOUBLE_EQ( 1.23456789, s.f64() );
 }
 
-TEST( packed_struct, test_packed_struct_net_floats )
+TEST( packed_struct, test_packed_struct_big_endian_floats )
 {
     test_packed_struct_floats_t s;
     EXPECT_FLOAT_EQ( true, s.nf32 == 0 );
@@ -231,25 +232,25 @@ TEST( packed_struct, test_packed_struct_net_floats )
 
 TEST( test_packed_struct_test, test_little_endian_floats )
 {
-    comma::packed::float32 a;
+    comma::packed::little_endian::float32 a;
     EXPECT_FLOAT_EQ( 0, a() );
     a = 1.2345;
     EXPECT_FLOAT_EQ( 1.2345, a() );
 
-    comma::packed::float64 b;
+    comma::packed::little_endian::float64 b;
     EXPECT_DOUBLE_EQ( 0, b() );
     b = 1.23456789;
     EXPECT_DOUBLE_EQ( 1.23456789, b() );
 }
 
-TEST( test_packed_struct_test, test_net_floats )
+TEST( test_packed_struct_test, test_big_endian_floats )
 {
-    comma::packed::net_float32 a;
+    comma::packed::big_endian::float32 a;
     EXPECT_FLOAT_EQ( 0, a() );
     a = 1.2345;
     EXPECT_FLOAT_EQ( 1.2345, a() );
 
-    comma::packed::net_float64 b;
+    comma::packed::big_endian::float64 b;
     EXPECT_DOUBLE_EQ( 0, b() );
     b = 1.23456789;
     EXPECT_DOUBLE_EQ( 1.23456789, b() );
@@ -268,14 +269,14 @@ static void test_float32_byte_order( float value, char byte0, char byte1, char b
 
 TEST( test_packed_struct_test, test_float32_byte_order )
 {
-    test_float32_byte_order< comma::packed::float32 >( 5.2, 0x66, 0x66, 0xA6, 0x40 );
-    test_float32_byte_order< comma::packed::float32 >( -5.2, 0x66, 0x66, 0xA6, 0xC0 );
+    test_float32_byte_order< comma::packed::little_endian::float32 >( 5.2, 0x66, 0x66, 0xA6, 0x40 );
+    test_float32_byte_order< comma::packed::little_endian::float32 >( -5.2, 0x66, 0x66, 0xA6, 0xC0 );
 }
 
-TEST( test_packed_struct_test, test_net_float32_byte_order )
+TEST( test_packed_struct_test, test_big_endian_float32_byte_order )
 {
-    test_float32_byte_order< comma::packed::net_float32 >( 5.2, 0x40, 0xA6, 0x66, 0x66 );
-    test_float32_byte_order< comma::packed::net_float32 >( -5.2, 0xC0, 0xA6, 0x66, 0x66 );
+    test_float32_byte_order< comma::packed::big_endian::float32 >( 5.2, 0x40, 0xA6, 0x66, 0x66 );
+    test_float32_byte_order< comma::packed::big_endian::float32 >( -5.2, 0xC0, 0xA6, 0x66, 0x66 );
 }
 
 template< typename T >
@@ -295,18 +296,18 @@ static void test_float64_byte_order( double value, char byte0, char byte1, char
 
 TEST( test_packed_struct_test, test_float64_byte_order )
 {
-    test_float64_byte_order< comma::packed::float64 >( 5.2, 0xCD, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0x14, 0x40 );
-    test_float64_byte_order< comma::packed::float64 >( -5.2, 0xCD, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0x14, 0xC0 );
-    test_float64_byte_order< comma::packed::float64 >( -1.2e-123, 0x4E, 0x57, 0x04, 0xD1, 0x71, 0x62, 0x69, 0xA6 );
-    test_float64_byte_order< comma::packed::float64 >( -1.2e+123, 0x21, 0xBD, 0xC3, 0x60, 0x60, 0x0B, 0x7D, 0xD9 );
+    test_float64_byte_order< comma::packed::little_endian::float64 >( 5.2, 0xCD, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0x14, 0x40 );
+    test_float64_byte_order< comma::packed::little_endian::float64 >( -5.2, 0xCD, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0x14, 0xC0 );
+    test_float64_byte_order< comma::packed::little_endian::float64 >( -1.2e-123, 0x4E, 0x57, 0x04, 0xD1, 0x71, 0x62, 0x69, 0xA6 );
+    test_float64_byte_order< comma::packed::little_endian::float64 >( -1.2e+123, 0x21, 0xBD, 0xC3, 0x60, 0x60, 0x0B, 0x7D, 0xD9 );
 }
 
-TEST( test_packed_struct_test, test_net_float64_byte_order )
+TEST( test_packed_struct_test, test_big_endian_float64_byte_order )
 {
-    test_float64_byte_order< comma::packed::net_float64 >( 5.2, 0x40, 0x14, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0xCD );
-    test_float64_byte_order< comma::packed::net_float64 >( -5.2, 0xC0, 0x14, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0xCD );
-    test_float64_byte_order< comma::packed::net_float64 >( -1.2e-123, 0xA6, 0x69, 0x62, 0x71, 0xD1, 0x04, 0x57, 0x4E );
-    test_float64_byte_order< comma::packed::net_float64 >( -1.2e+123, 0xD9, 0x7D, 0x0B, 0x60, 0x60, 0xC3, 0xBD, 0x21 );
+    test_float64_byte_order< comma::packed::big_endian::float64 >( 5.2, 0x40, 0x14, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0xCD );
+    test_float64_byte_order< comma::packed::big_endian::float64 >( -5.2, 0xC0, 0x14, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0xCD );
+    test_float64_byte_order< comma::packed::big_endian::float64 >( -1.2e-123, 0xA6, 0x69, 0x62, 0x71, 0xD1, 0x04, 0x57, 0x4E );
+    test_float64_byte_order< comma::packed::big_endian::float64 >( -1.2e+123, 0xD9, 0x7D, 0x0B, 0x60, 0x60, 0xC3, 0xBD, 0x21 );
 }
 
 static boost::array< std::string, 16 > hex_digits_u = { { "0", "1", "2", "3", "4", "5", "6", "7", "8", "9", "A", "B", "C", "D", "E", "F" } };

From 2271eb6999bba59646f561f69de50a81a2d2d8f0 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Apr 2019 16:17:43 +1000
Subject: [PATCH 0017/1056] csv-fields: make-fixed: --values convenience
 option added

---
 csv/applications/csv-fields.cpp |  9 ++++++++-
 csv/test/csv-fields/expected    | 10 ++++++++++
 csv/test/csv-fields/input       |  7 +++++--
 3 files changed, 23 insertions(+), 3 deletions(-)

diff --git a/csv/applications/csv-fields.cpp b/csv/applications/csv-fields.cpp
index 2e4442673..3886f591e 100644
--- a/csv/applications/csv-fields.cpp
+++ b/csv/applications/csv-fields.cpp
@@ -95,6 +95,7 @@ static void usage( bool )
     std::cerr << std::endl;
     std::cerr << "    make-fixed: normalise input to a fixed number of fields" << std::endl;
     std::cerr << "        --count,--size=<n>: number of output fields" << std::endl;
+    std::cerr << "        --values=[<values>]: if present, fill missing fields with given values" << std::endl;
     std::cerr << "        --force: chop input to <n> fields if larger" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
@@ -156,6 +157,11 @@ static void usage( bool )
     std::cerr << "        a,b,c,d,," << std::endl;
     std::cerr << "        x,y,z,,," << std::endl;
     std::cerr << std::endl;
+    std::cerr << "    make-fixed" << std::endl;
+    std::cerr << "        { echo a,b; echo x,y,z; } | csv-fields make-fixed --count=6 --values=A,B,C,D,E,F" << std::endl;
+    std::cerr << "        a,b,C,D,E,F" << std::endl;
+    std::cerr << "        x,y,z,D,E,F" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "        { echo a,b,c,d; echo x,y,z; } | csv-fields make-fixed --count=3 --force" << std::endl;
     std::cerr << "        a,b,c" << std::endl;
     std::cerr << "        x,y,z" << std::endl;
@@ -421,6 +427,7 @@ int main( int ac, char** av )
         {
             const unsigned int count = options.value< unsigned int >( "--count,--size" );
             bool force = options.exists( "--force" );
+            const std::vector< std::string >& values = comma::split( options.value< std::string >( "--values", "" ), ',', true );
             while( std::cin.good() )
             {
                 std::string line;
@@ -430,7 +437,7 @@ int main( int ac, char** av )
                 if( v.size() <= count )
                 {
                     std::cout << line;
-                    for( unsigned int i = v.size(); i < count; i++ ) { std::cout << delimiter; }
+                    for( unsigned int i = v.size(); i < count; i++ ) { std::cout << delimiter << ( i < values.size() ? values[i] : std::string() ); }
                 }
                 else
                 {
diff --git a/csv/test/csv-fields/expected b/csv/test/csv-fields/expected
index 2dddba1ee..1aafcbd77 100644
--- a/csv/test/csv-fields/expected
+++ b/csv/test/csv-fields/expected
@@ -205,3 +205,13 @@ make_fixed[2]/output="a,b,c"
 make_fixed[2]/status=0
 make_fixed[3]/output="a:b:c:d::"
 make_fixed[3]/status=0
+make_fixed[4]/output="a,b,c,4,5,6"
+make_fixed[4]/status=0
+make_fixed[5]/output="a,b,c,4,5,"
+make_fixed[5]/status=0
+make_fixed[6]/output="a,b,c,,,"
+make_fixed[6]/status=0
+make_fixed[7]/output="a,b,c,,,"
+make_fixed[7]/status=0
+make_fixed[8]/output="a,b,,4,5,6"
+make_fixed[8]/status=0
diff --git a/csv/test/csv-fields/input b/csv/test/csv-fields/input
index 9bb3ea7ca..27131ca22 100644
--- a/csv/test/csv-fields/input
+++ b/csv/test/csv-fields/input
@@ -109,5 +109,8 @@ make_fixed[0]="echo a,b,c,d | csv-fields make-fixed --count=6"
 make_fixed[1]="echo a,b,c,d | csv-fields make-fixed --count=3"
 make_fixed[2]="echo a,b,c,d | csv-fields make-fixed --count=3 --force"
 make_fixed[3]="echo a:b:c:d | csv-fields make-fixed --count=6 --delimiter=:"
-
-
+make_fixed[4]="echo a,b,c | csv-fields make-fixed --count=6 --values 1,2,3,4,5,6"
+make_fixed[5]="echo a,b,c | csv-fields make-fixed --count=6 --values 1,2,3,4,5"
+make_fixed[6]="echo a,b,c | csv-fields make-fixed --count=6 --values 1,2,3"
+make_fixed[7]="echo a,b,c | csv-fields make-fixed --count=6 --values 1"
+make_fixed[8]="echo a,b, | csv-fields make-fixed --count=6 --values 1,2,3,4,5,6"

From b06079d9d1b483855ea11b4b6d4e42aeb36a4e96 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Apr 2019 17:28:33 +1000
Subject: [PATCH 0018/1056] csv-fields: make-fixed: if --values given, --count
 is optional

---
 csv/applications/csv-fields.cpp | 8 +++++---
 csv/test/csv-fields/expected    | 2 ++
 csv/test/csv-fields/input       | 1 +
 3 files changed, 8 insertions(+), 3 deletions(-)

diff --git a/csv/applications/csv-fields.cpp b/csv/applications/csv-fields.cpp
index 3886f591e..e56d89efb 100644
--- a/csv/applications/csv-fields.cpp
+++ b/csv/applications/csv-fields.cpp
@@ -95,7 +95,8 @@ static void usage( bool )
     std::cerr << std::endl;
     std::cerr << "    make-fixed: normalise input to a fixed number of fields" << std::endl;
     std::cerr << "        --count,--size=<n>: number of output fields" << std::endl;
-    std::cerr << "        --values=[<values>]: if present, fill missing fields with given values" << std::endl;
+    std::cerr << "        --values=[<values>]: fill missing fields with given values" << std::endl;
+    std::cerr << "                             if --count not specified, use number of <values> as desired number of fields" << std::endl;
     std::cerr << "        --force: chop input to <n> fields if larger" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
@@ -425,9 +426,10 @@ int main( int ac, char** av )
         }
         if( operation == "make-fixed" )
         {
-            const unsigned int count = options.value< unsigned int >( "--count,--size" );
-            bool force = options.exists( "--force" );
             const std::vector< std::string >& values = comma::split( options.value< std::string >( "--values", "" ), ',', true );
+            const unsigned int count = options.value< unsigned int >( "--count,--size", values.size() );
+            if( count == 0 ) { std::cerr << "csv-fields: make-fixed: please specify either --count or --values" << std::endl; return 1; } // no target field count: report and exit rather than fall through into the processing loop
+            bool force = options.exists( "--force" );
             while( std::cin.good() )
             {
                 std::string line;
diff --git a/csv/test/csv-fields/expected b/csv/test/csv-fields/expected
index 1aafcbd77..443885c0a 100644
--- a/csv/test/csv-fields/expected
+++ b/csv/test/csv-fields/expected
@@ -215,3 +215,5 @@ make_fixed[7]/output="a,b,c,,,"
 make_fixed[7]/status=0
 make_fixed[8]/output="a,b,,4,5,6"
 make_fixed[8]/status=0
+make_fixed[9]/output="a,b,c,4,5,6"
+make_fixed[9]/status=0
diff --git a/csv/test/csv-fields/input b/csv/test/csv-fields/input
index 27131ca22..7a8a3db2c 100644
--- a/csv/test/csv-fields/input
+++ b/csv/test/csv-fields/input
@@ -114,3 +114,4 @@ make_fixed[5]="echo a,b,c | csv-fields make-fixed --count=6 --values 1,2,3,4,5"
 make_fixed[6]="echo a,b,c | csv-fields make-fixed --count=6 --values 1,2,3"
 make_fixed[7]="echo a,b,c | csv-fields make-fixed --count=6 --values 1"
 make_fixed[8]="echo a,b, | csv-fields make-fixed --count=6 --values 1,2,3,4,5,6"
+make_fixed[9]="echo a,b,c | csv-fields make-fixed --values 1,2,3,4,5,6"

From 7cdfbbd28ff8abea41236007cf0f9e7bdef15be6 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 16 Apr 2019 19:35:34 +1000
Subject: [PATCH 0019/1056] csv-blocks: make-blocks: --min-gap-between-blocks:
 implementing...

---
 csv/applications/csv-blocks.cpp | 49 ++++++++++++++++++++++++++-------
 1 file changed, 39 insertions(+), 10 deletions(-)

diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index fd89c8b58..e65989747 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -255,7 +255,16 @@ static bool empty_( const std::string& s ) // quick and dirty
     return true;
 }
 
-template < typename T > static void set_fields( const comma::command_line_options& options, std::string& first_line, T& default_input )
+static double diff( const input_t& from, const input_t& to ) // quick and dirty
+{
+    if( from.key.longs.size() == 1 ) { return std::abs( double( from.key.longs[0] ) - to.key.longs[0] ); }
+    if( from.key.doubles.size() == 1 ) { return std::abs( from.key.doubles[0] - to.key.doubles[0] ); }
+    if( from.key.time.size() == 1 ) { return std::abs( double( ( from.key.time[0] - to.key.time[0] ).total_microseconds() ) / 1000000 ); }
+    if( from.key.strings.size() == 1 ) { COMMA_THROW( comma::exception, "difference for strings: not implemented" ); }
+    COMMA_THROW( comma::exception, "never here" );
+}
+
+template < typename T > static bool set_fields( const comma::command_line_options& options, std::string& first_line, T& default_input )
 {
     std::vector< std::string > v = comma::split( csv.fields, ',' );
     comma::csv::format f;
@@ -270,8 +279,29 @@ template < typename T > static void set_fields( const comma::command_line_option
     }
     // This is to load the keys into input_t structure
     unsigned int size = f.count();
-    for( std::size_t i = 0; i < size; ++i ) { if( i < v.size() ) { if( v[i] == "id" ) { v[i] = "key/" + default_input.key.append( f.offset( i ).type ); continue; } } }
+    bool has_id = false;
+    bool has_scalar = false;
+    for( std::size_t i = 0; i < size; ++i )
+    { 
+        if( i < v.size() )
+        { 
+            if( v[i] == "id" )
+            {
+                has_id = true;
+                v[i] = "key/" + default_input.key.append( f.offset( i ).type );
+            }
+            else if( v[i] == "scalar" )
+            {
+                if( has_scalar ) { COMMA_THROW( comma::exception, "expected not more than one scalar in --fields; got: \"" << csv.fields << "\"" ); }
+                has_scalar = true;
+                v[i] = "key/" + default_input.key.append( f.offset( i ).type );
+            }
+        }
+    }
+    if( !has_id && !has_scalar ) { COMMA_THROW( comma::exception, "please specify at least one id or scalar in --fields; got: \"" << csv.fields << "\"" ); }
+    if( has_id && has_scalar ) { COMMA_THROW( comma::exception, "expected either id or scalar in --fields; got both in: \"" << csv.fields << "\"" ); }
     csv.fields = comma::join( v, ',' );
+    return has_id;
 }
 
 #ifndef WIN32
@@ -472,21 +502,20 @@ int main( int ac, char** av )
         if( operation == "group" || operation == "make-blocks" )
         {
             current_block = options.value< comma::uint32 >( "--starting-block,--from", 0 ); // default is 0
-            
             std::string first_line;
             input_t default_input;
-            set_fields( options, first_line, default_input );
-            if( verbose ) { std::cerr << name() << "csv fields: " << csv.fields << std::endl; }
-            if ( default_input.key.empty() ) { std::cerr << name() << "please specify at least one id field" << std::endl; return 1; }
-            
+            bool has_id = set_fields( options, first_line, default_input );
+            if( !has_id ) { std::cerr << "csv-blocks: scalar field support: todo" << std::endl; }
+            if( verbose ) { std::cerr << name() << "csv fields: " << csv.fields << "; making blocks by " << ( has_id ? "id" : "scalar" ) << std::endl; }
+            double gap;
+            if( !has_id ) { gap = options.value< double >( "--min-gap-between-blocks,--min-gap,--gap" ); }
             comma::csv::input_stream< input_t > istream( std::cin, csv, default_input );
             comma::csv::output_stream< appended_column > ostream( std::cout, csv_out );
             comma::csv::tied< input_t, appended_column > tied( istream, ostream );
-            
             if( !first_line.empty() ) 
             { 
                 input_t p = comma::csv::ascii< input_t >( csv, default_input ).get( first_line ); 
-                if( !(keys == p.key) ) { ++current_block; }
+                if( !( keys == p.key ) ) { ++current_block; }
                 keys = p.key;
                 // This is needed because the record wasnt read in by istream
                 // Write it out
@@ -499,7 +528,7 @@ int main( int ac, char** av )
             {
                 const input_t* p = istream.read();
                 if( !p ) { break; }
-                if( !(keys == p->key) ) { ++current_block; }
+                if( !( keys == p->key ) ) { ++current_block; }
                 keys = p->key;
                 tied.append( appended_column( current_block ) );
                 if( csv.flush ) { std::cout.flush(); }

From ac92ca59977a186f13b1346dbe25c2ae16fff279 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 16 Apr 2019 23:19:44 +1000
Subject: [PATCH 0020/1056] csv-blocks: make-blocks: scalar field support
 implemented

---
 csv/applications/csv-blocks.cpp | 74 +++++++++++++++++++++++----------
 1 file changed, 51 insertions(+), 23 deletions(-)

diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index e65989747..1b5773bf9 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -27,7 +27,7 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-/// @author dewey nguyen
+/// @authors dewey nguyen, vsevolod vlaskine
 
 #include <stdio.h>
 #include <stdlib.h>
@@ -218,7 +218,6 @@ static comma::csv::options csv;
 static bool reverse_index = false;
 // All the data for this block
 static std::deque< std::string > block_records;
-static comma::csv::impl::unstructured keys;
 static comma::uint32 current_block = 1;
 static comma::int32 increment_step = 1;
 
@@ -264,7 +263,9 @@ static double diff( const input_t& from, const input_t& to ) // quick and dirty
     COMMA_THROW( comma::exception, "never here" );
 }
 
-template < typename T > static bool set_fields( const comma::command_line_options& options, std::string& first_line, T& default_input )
+struct how_t { enum values { none, by_id, by_scalar }; };
+
+template < typename T > static how_t::values set_fields( const comma::command_line_options& options, std::string& first_line, T& default_input )
 {
     std::vector< std::string > v = comma::split( csv.fields, ',' );
     comma::csv::format f;
@@ -279,29 +280,29 @@ template < typename T > static bool set_fields( const comma::command_line_option
     }
     // This is to load the keys into input_t structure
     unsigned int size = f.count();
-    bool has_id = false;
-    bool has_scalar = false;
+    how_t::values how = how_t::none;
     for( std::size_t i = 0; i < size; ++i )
     { 
         if( i < v.size() )
         { 
             if( v[i] == "id" )
             {
-                has_id = true;
+                if( how == how_t::by_scalar ) { COMMA_THROW( comma::exception, "expected either id or scalar in --fields; got both in: \"" << csv.fields << "\"" ); }
+                how = how_t::by_id;
                 v[i] = "key/" + default_input.key.append( f.offset( i ).type );
             }
             else if( v[i] == "scalar" )
             {
-                if( has_scalar ) { COMMA_THROW( comma::exception, "expected not more than one scalar in --fields; got: \"" << csv.fields << "\"" ); }
-                has_scalar = true;
+                if( how == how_t::by_id ) { COMMA_THROW( comma::exception, "expected either id or scalar in --fields; got both in: \"" << csv.fields << "\"" ); }
+                if( how == how_t::by_scalar ) { COMMA_THROW( comma::exception, "expected not more than one scalar in --fields; got: \"" << csv.fields << "\"" ); }
+                how = how_t::by_scalar;
                 v[i] = "key/" + default_input.key.append( f.offset( i ).type );
             }
         }
     }
-    if( !has_id && !has_scalar ) { COMMA_THROW( comma::exception, "please specify at least one id or scalar in --fields; got: \"" << csv.fields << "\"" ); }
-    if( has_id && has_scalar ) { COMMA_THROW( comma::exception, "expected either id or scalar in --fields; got both in: \"" << csv.fields << "\"" ); }
+    if( how == how_t::none ) { COMMA_THROW( comma::exception, "please specify at least one id or scalar in --fields; got: \"" << csv.fields << "\"" ); }
     csv.fields = comma::join( v, ',' );
-    return has_id;
+    return how;
 }
 
 #ifndef WIN32
@@ -501,24 +502,52 @@ int main( int ac, char** av )
         }
         if( operation == "group" || operation == "make-blocks" )
         {
-            current_block = options.value< comma::uint32 >( "--starting-block,--from", 0 ); // default is 0
+            current_block = options.value< comma::uint32 >( "--starting-block,--from", 0 );
             std::string first_line;
             input_t default_input;
-            bool has_id = set_fields( options, first_line, default_input );
-            if( !has_id ) { std::cerr << "csv-blocks: scalar field support: todo" << std::endl; }
-            if( verbose ) { std::cerr << name() << "csv fields: " << csv.fields << "; making blocks by " << ( has_id ? "id" : "scalar" ) << std::endl; }
-            double gap;
-            if( !has_id ) { gap = options.value< double >( "--min-gap-between-blocks,--min-gap,--gap" ); }
+            auto how = set_fields( options, first_line, default_input );
+            if( verbose ) { std::cerr << name() << "csv fields: " << csv.fields << "; making blocks by " << ( how == how_t::by_id ? "id" : "scalar" ) << std::endl; }
+            boost::optional< double > gap;
+            boost::optional< double > span;
+            if( how == how_t::by_scalar )
+            { 
+                options.assert_mutually_exclusive( "--min-gap-between-blocks,--min-gap,--gap", "--block-span,--span" );
+                gap = options.optional< double >( "--min-gap-between-blocks,--min-gap,--gap" );
+                span = options.optional< double >( "--block-span,--span" );
+            }
             comma::csv::input_stream< input_t > istream( std::cin, csv, default_input );
             comma::csv::output_stream< appended_column > ostream( std::cout, csv_out );
             comma::csv::tied< input_t, appended_column > tied( istream, ostream );
+            auto update_block = [&]( const input_t& p )
+            {
+                static boost::optional< input_t > last;
+                switch( how )
+                {
+                    case how_t::by_id:
+                        if( last && !( last->key == p.key ) ) { ++current_block; }
+                        last = p;
+                        break;
+                    case how_t::by_scalar:
+                        if( gap )
+                        {
+                            if( last && diff( *last, p ) >= *gap ) { ++current_block; }
+                            last = p;
+                        }
+                        else if( span )
+                        {
+                            if( !last ) { last = p; }
+                            else if( diff( *last, p ) >= *span ) { ++current_block; last = p; }
+                        }
+                        break;
+                    case how_t::none: // never here
+                        break;
+                }
+                    
+            };
             if( !first_line.empty() ) 
             { 
                 input_t p = comma::csv::ascii< input_t >( csv, default_input ).get( first_line ); 
-                if( !( keys == p.key ) ) { ++current_block; }
-                keys = p.key;
-                // This is needed because the record wasnt read in by istream
-                // Write it out
+                update_block( p );
                 if( istream.is_binary() ) { std::cout.write( (char*)&p, istream.binary().size() ); }
                 else { std::cout << first_line << istream.ascii().ascii().delimiter(); }
                 ostream.write( appended_column( current_block ) );
@@ -528,8 +557,7 @@ int main( int ac, char** av )
             {
                 const input_t* p = istream.read();
                 if( !p ) { break; }
-                if( !( keys == p->key ) ) { ++current_block; }
-                keys = p->key;
+                update_block( *p );
                 tied.append( appended_column( current_block ) );
                 if( csv.flush ) { std::cout.flush(); }
             }            

From 811a3c1dc7cb33fc3e84ea2b17fb3e1803a38154 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 16 Apr 2019 23:32:51 +1000
Subject: [PATCH 0021/1056] csv-blocks: --help updated; group by scalar: unit
 test: todo...

---
 csv/applications/csv-blocks.cpp | 26 +++++++++++++++++++-------
 1 file changed, 19 insertions(+), 7 deletions(-)

diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index 1b5773bf9..feda4ce44 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -139,8 +139,14 @@ static void usage( bool more )
     std::cerr << "        attention: output does not preserve input order, since there is no reasonable tradeof there" << std::endl;
     std::cerr << "                   use csv-sort for post-processing, if required" << std::endl;
     std::cerr << "    group|make-blocks" << std::endl;
-    std::cerr << "        cat something.csv | csv-blocks group --fields=,id, " << std::endl;
+    std::cerr << "        usage: cat something.csv | csv-blocks group --fields=,id, " << std::endl;
     std::cerr << "            appends group's block field based on specified id key or keys" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --fields=<fields>" << std::endl;
+    std::cerr << "                id: any number of id fields to group by" << std::endl;
+    std::cerr << "                scalar: group by scalar, which can be integer, floating point number, or time" << std::endl;
+    std::cerr << "            --block-gap,--gap=<value>; minimum gap in values between blocks, double (for time: seconds as double), see examples" << std::endl;
+    std::cerr << "            --block-span,--span=<value>; maximum block span, double (for time: seconds as double), see examples" << std::endl;
     std::cerr << "    head" << std::endl;
     std::cerr << "        reads records from first block to stdout, if --num-of-blocks=<num> specified, read more than one blocks" << std::endl;
     std::cerr << "        requires the index from 'index' mode in the inputs" << std::endl;
@@ -181,10 +187,16 @@ static void usage( bool more )
     std::cerr << "    ( echo \"a,1,2,3\"; echo \"a,4,2,3\"; echo \"b,5,5,6\"; echo \"c,7,5,6\"; echo \"c,7,8,9\"; echo \"c,7,8,9\" ) >$block_csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    group|make-blocks" << std::endl;
-    std::cerr << "        cat $block_csv | csv-blocks group --fields=id" << std::endl;
-    std::cerr << "            unique ascending block number are assigned based on one id field" << std::endl;
-    std::cerr << "        cat $block_csv | csv-blocks group --fields=id,,id" << std::endl;
-    std::cerr << "            unique ascending block number are assigned based on two id fields" << std::endl;
+    std::cerr << "        unique ascending block number are assigned based on one id field" << std::endl;
+    std::cerr << "            cat $block_csv | csv-blocks group --fields=id" << std::endl;
+    std::cerr << "        unique ascending block number are assigned based on two id fields" << std::endl;
+    std::cerr << "            cat $block_csv | csv-blocks group --fields=id,,id" << std::endl;
+    std::cerr << "        group by scalar span - try it" << std::endl;
+    std::cerr << "            seq 20 | csv-blocks group --fields=scalar --span 5" << std::endl;
+    std::cerr << "            seq 1 3 20 | csv-blocks group --fields scalar --span 4" << std::endl;
+    std::cerr << "        group by scalar gap - try it" << std::endl;
+    std::cerr << "            seq 20 | csv-blocks group --fields=scalar --gap 1" << std::endl;
+    std::cerr << "            seq 20 | csv-blocks group --fields=scalar --gap 2" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    index" << std::endl;
     std::cerr << "        cat $block_csv | csv-blocks group --fields=id | csv-blocks index --fields=,,,,block" << std::endl;
@@ -511,8 +523,8 @@ int main( int ac, char** av )
             boost::optional< double > span;
             if( how == how_t::by_scalar )
             { 
-                options.assert_mutually_exclusive( "--min-gap-between-blocks,--min-gap,--gap", "--block-span,--span" );
-                gap = options.optional< double >( "--min-gap-between-blocks,--min-gap,--gap" );
+                options.assert_mutually_exclusive( "--block-gap,--gap", "--block-span,--span" );
+                gap = options.optional< double >( "--block-gap,--gap" );
                 span = options.optional< double >( "--block-span,--span" );
             }
             comma::csv::input_stream< input_t > istream( std::cin, csv, default_input );

From 4e3384532ac86dcfc7462b27c35fc6e769d5ee0d Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 17 Apr 2019 17:31:23 +1000
Subject: [PATCH 0022/1056] csv-blocks: group: --gap and --span can be used
 together now; basic unit test added

---
 csv/applications/csv-blocks.cpp | 19 +++++--------------
 1 file changed, 5 insertions(+), 14 deletions(-)

diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index feda4ce44..42d09a96d 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -523,7 +523,6 @@ int main( int ac, char** av )
             boost::optional< double > span;
             if( how == how_t::by_scalar )
             { 
-                options.assert_mutually_exclusive( "--block-gap,--gap", "--block-span,--span" );
                 gap = options.optional< double >( "--block-gap,--gap" );
                 span = options.optional< double >( "--block-span,--span" );
             }
@@ -532,28 +531,20 @@ int main( int ac, char** av )
             comma::csv::tied< input_t, appended_column > tied( istream, ostream );
             auto update_block = [&]( const input_t& p )
             {
-                static boost::optional< input_t > last;
+                static input_t first = p;
+                static input_t last = p;
                 switch( how )
                 {
                     case how_t::by_id:
-                        if( last && !( last->key == p.key ) ) { ++current_block; }
-                        last = p;
+                        if( !( last.key == p.key ) ) { ++current_block; }
                         break;
                     case how_t::by_scalar:
-                        if( gap )
-                        {
-                            if( last && diff( *last, p ) >= *gap ) { ++current_block; }
-                            last = p;
-                        }
-                        else if( span )
-                        {
-                            if( !last ) { last = p; }
-                            else if( diff( *last, p ) >= *span ) { ++current_block; last = p; }
-                        }
+                        if( ( gap && diff( last, p ) >= *gap ) || ( span && diff( first, p ) >= *span ) ) { ++current_block; first = p; }
                         break;
                     case how_t::none: // never here
                         break;
                 }
+                last = p;
                     
             };
             if( !first_line.empty() ) 

From 8a284f43c183c14f7932dc0686e39a1259fa769c Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 17 Apr 2019 17:31:39 +1000
Subject: [PATCH 0023/1056] csv-blocks: group: --gap and --span can be used
 together now; basic unit test added

---
 csv/test/csv-blocks/group/expected | 70 ++++++++++++++++++++++++++++++
 csv/test/csv-blocks/group/input    | 15 +++++++
 2 files changed, 85 insertions(+)
 create mode 100644 csv/test/csv-blocks/group/expected
 create mode 100644 csv/test/csv-blocks/group/input

diff --git a/csv/test/csv-blocks/group/expected b/csv/test/csv-blocks/group/expected
new file mode 100644
index 000000000..5c144db16
--- /dev/null
+++ b/csv/test/csv-blocks/group/expected
@@ -0,0 +1,70 @@
+group/scalar/gap[0]/output/line[0]="1.1,0"
+group/scalar/gap[0]/output/line[1]="2,1"
+group/scalar/gap[0]/output/line[2]="5,2"
+group/scalar/gap[0]/output/line[3]="5.9,3"
+group/scalar/gap[0]/status=0
+group/scalar/gap[1]/output/line[0]="1.1,0"
+group/scalar/gap[1]/output/line[1]="2,0"
+group/scalar/gap[1]/output/line[2]="5,1"
+group/scalar/gap[1]/output/line[3]="5.9,1"
+group/scalar/gap[1]/status=0
+group/scalar/gap[2]/output/line[0]="1.1,0"
+group/scalar/gap[2]/output/line[1]="2,0"
+group/scalar/gap[2]/output/line[2]="5,0"
+group/scalar/gap[2]/output/line[3]="5.9,0"
+group/scalar/gap[2]/status=0
+group/scalar/gap[3]/output/line[0]="19700101T000001.100000,0"
+group/scalar/gap[3]/output/line[1]="19700101T000002,1"
+group/scalar/gap[3]/output/line[2]="19700101T000005,2"
+group/scalar/gap[3]/output/line[3]="19700101T000005.900000,3"
+group/scalar/gap[3]/status=0
+group/scalar/gap[4]/output/line[0]="19700101T000001.100000,0"
+group/scalar/gap[4]/output/line[1]="19700101T000002,0"
+group/scalar/gap[4]/output/line[2]="19700101T000005,1"
+group/scalar/gap[4]/output/line[3]="19700101T000005.900000,1"
+group/scalar/gap[4]/status=0
+group/scalar/gap[5]/output/line[0]="19700101T000001.100000,0"
+group/scalar/gap[5]/output/line[1]="19700101T000002,0"
+group/scalar/gap[5]/output/line[2]="19700101T000005,0"
+group/scalar/gap[5]/output/line[3]="19700101T000005.900000,0"
+group/scalar/gap[5]/status=0
+
+group/scalar/span[0]/output/line[0]="1.1,0"
+group/scalar/span[0]/output/line[1]="2,1"
+group/scalar/span[0]/output/line[2]="5,2"
+group/scalar/span[0]/output/line[3]="5.9,3"
+group/scalar/span[0]/status=0
+group/scalar/span[1]/output/line[0]="1.1,0"
+group/scalar/span[1]/output/line[1]="2,0"
+group/scalar/span[1]/output/line[2]="5,1"
+group/scalar/span[1]/output/line[3]="5.9,1"
+group/scalar/span[1]/status=0
+group/scalar/span[2]/output/line[0]="1.1,0"
+group/scalar/span[2]/output/line[1]="2,0"
+group/scalar/span[2]/output/line[2]="5,0"
+group/scalar/span[2]/output/line[3]="5.9,1"
+group/scalar/span[2]/status=0
+group/scalar/span[3]/output/line[0]="19700101T000001.100000,0"
+group/scalar/span[3]/output/line[1]="19700101T000002,1"
+group/scalar/span[3]/output/line[2]="19700101T000005,2"
+group/scalar/span[3]/output/line[3]="19700101T000005.900000,3"
+group/scalar/span[3]/status=0
+group/scalar/span[4]/output/line[0]="19700101T000001.100000,0"
+group/scalar/span[4]/output/line[1]="19700101T000002,0"
+group/scalar/span[4]/output/line[2]="19700101T000005,1"
+group/scalar/span[4]/output/line[3]="19700101T000005.900000,1"
+group/scalar/span[4]/status=0
+group/scalar/span[5]/output/line[0]="19700101T000001.100000,0"
+group/scalar/span[5]/output/line[1]="19700101T000002,0"
+group/scalar/span[5]/output/line[2]="19700101T000005,0"
+group/scalar/span[5]/output/line[3]="19700101T000005.900000,0"
+group/scalar/span[5]/status=0
+
+group/scalar/gap_and_span[0]/output/line[0]="1,0"
+group/scalar/gap_and_span[0]/output/line[1]="2,0"
+group/scalar/gap_and_span[0]/output/line[2]="5,1"
+group/scalar/gap_and_span[0]/output/line[3]="6,1"
+group/scalar/gap_and_span[0]/output/line[4]="7,1"
+group/scalar/gap_and_span[0]/output/line[5]="8,1"
+group/scalar/gap_and_span[0]/output/line[6]="9,2"
+group/scalar/gap_and_span[0]/status=0
diff --git a/csv/test/csv-blocks/group/input b/csv/test/csv-blocks/group/input
new file mode 100644
index 000000000..f4bf3e794
--- /dev/null
+++ b/csv/test/csv-blocks/group/input
@@ -0,0 +1,15 @@
+group/scalar/gap[0]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --gap 0.5"
+group/scalar/gap[1]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --gap 1"
+group/scalar/gap[2]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --gap 5"
+group/scalar/gap[3]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --gap 0.5"
+group/scalar/gap[4]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --gap 1"
+group/scalar/gap[5]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --gap 5"
+
+group/scalar/span[0]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --span 0.5"
+group/scalar/span[1]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --span 1"
+group/scalar/span[2]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --span 4"
+group/scalar/span[3]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --span 0.5"
+group/scalar/span[4]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --span 1"
+group/scalar/span[5]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --span 5"
+
+group/scalar/gap_and_span[0]="( echo 1; echo 2; echo 5; echo 6; echo 7; echo 8; echo 9 ) | csv-blocks group --fields scalar --gap 2 --span 4"

From 2753b880b6e6c4a2ce0bec1ee3ae628824638d12 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 Apr 2019 12:41:01 +1000
Subject: [PATCH 0024/1056] csv-time-join: minor refactoring

---
 csv/applications/csv-time-join.cpp | 126 ++++++++---------------------
 1 file changed, 33 insertions(+), 93 deletions(-)

diff --git a/csv/applications/csv-time-join.cpp b/csv/applications/csv-time-join.cpp
index 80e3ef85b..d22c054eb 100644
--- a/csv/applications/csv-time-join.cpp
+++ b/csv/applications/csv-time-join.cpp
@@ -151,15 +151,8 @@ namespace comma { namespace visiting {
 
 template <> struct traits< Point >
 {
-    template < typename K, typename V > static void visit( const K&, const Point& p, V& v )
-    { 
-        v.apply( "t", p.timestamp );
-    }
-    
-    template < typename K, typename V > static void visit( const K&, Point& p, V& v )
-    {
-        v.apply( "t", p.timestamp );
-    }
+    template < typename K, typename V > static void visit( const K&, const Point& p, V& v ) { v.apply( "t", p.timestamp ); }
+    template < typename K, typename V > static void visit( const K&, Point& p, V& v ) { v.apply( "t", p.timestamp ); }
 };
     
 } } // namespace comma { namespace visiting {
@@ -168,17 +161,12 @@ enum class how { by_lower, by_upper, nearest, realtime };
 how method = how::by_lower;
 bool timestamp_only;
 bool select_only;
-
 comma::csv::options stdin_csv;
 comma::csv::options bounding_csv;
 boost::optional< boost::posix_time::time_duration > bound;
-
 typedef std::pair< boost::posix_time::ptime, std::string > timestring_t;
 
-boost::posix_time::ptime get_time( const Point& p )
-{
-    return p.timestamp ? *p.timestamp : boost::posix_time::microsec_clock::universal_time();
-}
+boost::posix_time::ptime get_time( const Point& p ) { return p.timestamp ? *p.timestamp : boost::posix_time::microsec_clock::universal_time(); }
 
 static void output_bounding( std::ostream& os, const timestring_t& bounding, bool stdin_first )
 {
@@ -209,16 +197,13 @@ static void output_bounding( std::ostream& os, const timestring_t& bounding, boo
 
 static void output_input( std::ostream& os, const timestring_t& input )
 {
-    if( stdin_csv.binary() ) { os.write( &input.second[0], stdin_csv.format().size() ); }
-    else { os << input.second; }
+    if( stdin_csv.binary() ) { os.write( &input.second[0], stdin_csv.format().size() ); } else { os << input.second; }
 }
 
 static void output( const timestring_t& input, const timestring_t& bounding, bool stdin_first )
 {
     if( bounding.first.is_infinity() ) { return; }
-
     if( bound && ( input.first - bounding.first > bound || bounding.first - input.first > bound )) { return; }
-
     if( stdin_first )
     {
         output_input( std::cout, input );
@@ -229,7 +214,6 @@ static void output( const timestring_t& input, const timestring_t& bounding, boo
         output_bounding( std::cout, bounding, stdin_first );
         output_input( std::cout, input );
     }
-
     if( !stdin_csv.binary() ) { std::cout << '\n'; }
     std::cout.flush();
 }
@@ -240,7 +224,6 @@ int main( int ac, char** av )
     {
         comma::signal_flag is_shutdown(comma::signal_flag::hard);
         comma::command_line_options options( ac, av, usage );
-
         if( options.exists( "--bash-completion" )) bash_completion( ac, av );
         options.assert_mutually_exclusive( "--by-lower,--by-upper,--nearest,--realtime" );
         if( options.exists( "--by-upper" )) { method = how::by_upper; }
@@ -253,7 +236,6 @@ int main( int ac, char** av )
         boost::optional< unsigned int > buffer_size = options.optional< unsigned int >( "--buffer" );
         if( options.exists( "--bound" ) ) { bound = boost::posix_time::microseconds( static_cast<unsigned int>(options.value< double >( "--bound" ) * 1000000 )); }
         stdin_csv = comma::csv::options( options, "t" );
-
         std::vector< std::string > unnamed = options.unnamed(
             "--by-lower,--by-upper,--nearest,--realtime,--select,--do-not-append,--timestamp-only,--time-only,--discard-bounding",
             "--binary,-b,--delimiter,-d,--fields,-f,--bound,--buffer,--verbose,-v" );
@@ -285,8 +267,7 @@ int main( int ac, char** av )
         if( stdin_csv.binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif // #ifdef WIN32
 
-        comma::io::istream bounding_istream( comma::split( properties, ';' )[0]
-                                           , bounding_csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii );
+        comma::io::istream bounding_istream( comma::split( properties, ';' )[0], bounding_csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii );
         comma::csv::input_stream< Point > bounding_stream( *bounding_istream, bounding_csv );
 
         #ifndef WIN32
@@ -298,23 +279,18 @@ int main( int ac, char** av )
         #endif // #ifndef WIN32
 
         const Point* p = NULL;
-
         if( method == how::realtime )
         {
-            #ifndef WIN32
+            #ifdef WIN32
+            COMMA_THROW( comma::exception, "--realtime mode not supported in WIN32" );
+            #else
             bool end_of_input = false;
             bool end_of_bounds = false;
-            
-            boost::optional<timestring_t> joined_line;
-            
-            while (!is_shutdown && !end_of_input)
+            boost::optional< timestring_t > joined_line;
+            while( !is_shutdown && !end_of_input )
             {
-                if ( !bounding_stream.ready() && !stdin_stream.ready() )
-                {
-                    select.wait(boost::posix_time::milliseconds(1));
-                }
-                
-                if ( !is_shutdown && !end_of_input && ( stdin_stream.ready() || ( select.check() && select.read().ready( comma::io::stdin_fd ) ) ) )
+                if( !bounding_stream.ready() && !stdin_stream.ready() ) { select.wait(boost::posix_time::milliseconds(1)); }
+                if( !is_shutdown && !end_of_input && ( stdin_stream.ready() || ( select.check() && select.read().ready( comma::io::stdin_fd ) ) ) )
                 {
                     p = stdin_stream.read();
                     if( p )
@@ -328,9 +304,7 @@ int main( int ac, char** av )
                         end_of_input = true;
                     }
                 }
-                
-                if ( !is_shutdown && !end_of_bounds &&
-                   ( bounding_stream.ready() || ( select.check() && select.read().ready( bounding_istream.fd() ))))
+                if( !is_shutdown && !end_of_bounds && ( bounding_stream.ready() || ( select.check() && select.read().ready( bounding_istream.fd() ) ) ) )
                 {
                     p = bounding_stream.read();
                     if( p )
@@ -344,22 +318,17 @@ int main( int ac, char** av )
                     }
                 }
             }
-            if (is_shutdown) { comma::verbose << "got a signal" << std::endl; return 0; }
-            #else
-            COMMA_THROW(comma::exception, "--realtime mode not supported in WIN32");
-            #endif
+            if( is_shutdown ) { comma::verbose << "got a signal" << std::endl; return 0; }
+            #endif // #ifdef WIN32
         }
         else
         {
-            std::deque<timestring_t> bounding_queue;
+            std::deque< timestring_t > bounding_queue;
             bool next = true;
             bool bounding_data_available;
             bool upper_bound_added = false;
-
-            // add a fake entry for an lower bound to allow stdin before first bound to match
-            bounding_queue.push_back( std::make_pair( boost::posix_time::neg_infin, "" ));
-
-            while( ( stdin_stream.ready() || ( std::cin.good() && !std::cin.eof() ) ) )
+            bounding_queue.push_back( std::make_pair( boost::posix_time::neg_infin, "" ) ); // add a fake entry for a lower bound to allow stdin before first bound to match
+            while( stdin_stream.ready() || ( std::cin.good() && !std::cin.eof() ) )
             {
                 if( !std::cin.good() ) { select.read().remove( 0 ); }
                 if( !bounding_istream->good() ) { select.read().remove( bounding_istream.fd() ); }
@@ -371,52 +340,35 @@ int main( int ac, char** av )
                 //check so we do not block
                 bool bounding_stream_ready = bounding_stream.ready();
                 bool stdin_stream_ready = stdin_stream.ready();
-
                 if( next )
                 {
                     if( !bounding_stream_ready || !stdin_stream_ready )
                     {
-                        if( !bounding_stream_ready && !stdin_stream_ready )
-                        {
-                            select.wait( boost::posix_time::milliseconds(10) );
-                        }
-                        else
-                        {
-                            select.check();
-                        }
+                        if( !bounding_stream_ready && !stdin_stream_ready ) { select.wait( boost::posix_time::milliseconds( 10 ) ); }
+                        else { select.check(); }
                         if( select.read().ready( bounding_istream.fd() )) { bounding_stream_ready = true; }
-                        if( select.read().ready(0) ) { stdin_stream_ready=true; }
+                        if( select.read().ready(0) ) { stdin_stream_ready = true; }
                     }
                 }
                 else
                 {
                     if( !bounding_stream_ready )
                     {
-                        bounding_stream_select.wait( boost::posix_time::milliseconds(10) );
+                        bounding_stream_select.wait( boost::posix_time::milliseconds( 10 ) );
                         if( bounding_stream_select.read().ready( bounding_istream.fd() )) { bounding_stream_ready=true; }
                     }
                 }
                 #endif //#ifdef WIN32
-
                 //keep storing available bounding data
                 if( bounding_stream_ready )
                 {
                     if( !buffer_size || bounding_queue.size() < *buffer_size || discard_bounding )
                     {
                         const Point* q = bounding_stream.read();
-                        if( q )
-                        {
-                            bounding_queue.push_back( std::make_pair( get_time( *q ), bounding_stream.last() ));
-                        }
-                        else
-                        {
-                            bounding_data_available=false;
-                        }
-                    }
-                    if( buffer_size && bounding_queue.size() > *buffer_size && discard_bounding )
-                    {
-                        bounding_queue.pop_front();
+                        if( q ) { bounding_queue.push_back( std::make_pair( get_time( *q ), bounding_stream.last() )); }
+                        else { bounding_data_available = false; }
                     }
+                    if( buffer_size && bounding_queue.size() > *buffer_size && discard_bounding ) { bounding_queue.pop_front(); }
                 }
                 if( !upper_bound_added && bounding_istream->eof() )
                 {
@@ -424,53 +376,41 @@ int main( int ac, char** av )
                     bounding_queue.push_back( std::make_pair( boost::posix_time::pos_infin, "" ));
                     upper_bound_added = true;
                 }
-
                 //if we are done with the last bounded point get next
                 if( next )
                 {
-                    if(!stdin_stream_ready) { continue; }
+                    if( !stdin_stream_ready ) { continue; }
                     p = stdin_stream.read();
                     if( !p ) { break; }
                 }
-
-                boost::posix_time::ptime t = get_time(*p);
-              
+                boost::posix_time::ptime t = get_time( *p );
                 //get bound
-                while(bounding_queue.size()>=2)
-                {
-                    if( t < bounding_queue[1].first ) { break; }
-                    bounding_queue.pop_front();
-                }
-
-                if(bounding_queue.size()<2)
+                for( ; bounding_queue.size() >= 2 && t >= bounding_queue[1].first; bounding_queue.pop_front() );
+                if( bounding_queue.size() < 2 )
                 {
                     //bound not found
                     //do we have more data?
-                    if(!bounding_data_available) { break; }
-                    next=false;
+                    if( !bounding_data_available ) { break; }
+                    next = false;
                     continue;
                 }
-
                 //bound available
-
                 if( method == how::by_lower && t < bounding_queue.front().first )
                 {
                     next = true;
                     continue;
                 }
-
                 bool is_first = ( method == how::by_lower )
                     || ( method == how::nearest && ( t - bounding_queue[0].first ) < ( bounding_queue[1].first - t ));
-
                 const timestring_t& chosen_bound = is_first ? bounding_queue[0] : bounding_queue[1];;
                 timestring_t input_line = std::make_pair( t, stdin_stream.last() );
-
                 output( input_line, chosen_bound, stdin_first );
-                next=true;
+                next = true;
             }
         }
         return 0;     
     }
     catch( std::exception& ex ) { std::cerr << "csv-time-join: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-time-join: unknown exception" << std::endl; }
+    return 1;
 }

From ef5cad882173fa8bc45dd72964843bd690c88d2c Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 29 Apr 2019 14:20:59 +1000
Subject: [PATCH 0025/1056] csv-thin: --invert, --seed implemented; unit test
 added

---
 csv/applications/csv-thin.cpp | 242 ++++------------------------------
 csv/test/csv-thin/expected    |   4 +
 csv/test/csv-thin/input       |   2 +
 3 files changed, 34 insertions(+), 214 deletions(-)
 create mode 100644 csv/test/csv-thin/expected
 create mode 100644 csv/test/csv-thin/input

diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index 61139202e..310da562a 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -56,26 +56,28 @@ using namespace comma;
 static void usage( bool verbose = false )
 {
     std::cerr << std::endl;
-    std::cerr << "Read input data and thin them down by the given percentage;" << std::endl;
+    std::cerr << "read input data and thin them down by the given percentage;" << std::endl;
     std::cerr << "buffer handling optimized for a high-output producer" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "Usage: cat full.csv | csv-thin [<rate>] [<options>] > thinned.csv" << std::endl;
+    std::cerr << "usage: cat full.csv | csv-thin [<rate>] [<options>] > thinned.csv" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "options:" << std::endl;
-    std::cerr << "    --binary,-b=<format>: data is packets of fixed size given by <format>." << std::endl;
-    std::cerr << "                          Alternatively use --size" << std::endl;
-    std::cerr << "    --deterministic,-d: input is downsampled by a factor of int( 1 / <rate> )." << std::endl;
-    std::cerr << "                That is, if <rate> is 0.33, output every third packet." << std::endl;
-    std::cerr << "                Default is to output each packet with a probability of <rate>." << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --binary,-b=<format>: data is packets of fixed size given by <format>" << std::endl;
+    std::cerr << "                          alternatively use --size" << std::endl;
+    std::cerr << "    --deterministic,-d: input is downsampled by a factor of int( 1 / <rate> )" << std::endl;
+    std::cerr << "                        that is, if <rate> is 0.33, output every third packet" << std::endl;
+    std::cerr << "                        default is to output each packet with a probability of <rate>" << std::endl;
     std::cerr << "    --fields=<fields>: use timestamp in fields to determine time for --period" << std::endl;
+    std::cerr << "    --invert,-i: invert selection logic; e.g. to split data" << std::endl;
     std::cerr << "    --period=<n>: output once every <n> seconds, ignores <rate>" << std::endl;
     std::cerr << "    --size,-s=<size>: data is packets of fixed size, otherwise data is expected" << std::endl;
     std::cerr << "                      line-wise. Alternatively use --binary" << std::endl;
+    std::cerr << "    --seed=[<value>]: random seed" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "csv options:" << std::endl;
+    std::cerr << "csv options" << std::endl;
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
     std::cerr << std::endl;
-    std::cerr << "examples:" << std::endl;
+    std::cerr << "examples" << std::endl;
     std::cerr << "    output 70% of data:          cat full.csv | csv-thin 0.7" << std::endl;
     std::cerr << "    output once every 2 seconds: cat full.csv | csv-thin --period 2" << std::endl;
     std::cerr << "    using timestamp from input:  cat full.csv | csv-thin --period 2 --fields t" << std::endl;
@@ -88,6 +90,8 @@ static void usage( bool verbose = false )
 
 static double rate;
 static bool deterministic;
+static bool invert;
+static boost::optional< comma::uint32 > seed;
 static boost::optional< boost::posix_time::microseconds > period;
 
 struct timestamped
@@ -107,7 +111,7 @@ template <> struct traits< timestamped >
 
 } } // namespace comma { namespace visiting {
 
-static bool ignore()
+static bool skip()
 {
     if( period )
     {
@@ -135,21 +139,19 @@ static bool ignore()
         ++count;
         if( count < ( step + 1 ) / rate ) { return true; }
         ++step;
-        if( step == size )
-        {
-            count = 0;
-            step = 0;
-        }
+        if( step == size ) { count = step = 0; }
         return false;
     }
-    static boost::mt19937 rng;
+    static boost::mt19937 rng = seed ? boost::mt19937( *seed ) : boost::mt19937();
     static boost::uniform_real<> dist( 0, 1 );
     static boost::variate_generator< boost::mt19937&, boost::uniform_real<> > random( rng, dist );
     static bool do_ignore = comma::math::less( rate, 1.0 );
     return do_ignore && random() > rate;
 }
 
-static bool ignore_by_timestamp( boost::posix_time::ptime timestamp )
+static bool keep() { return skip() == invert; } // true if the current record should be output: normally when skip() returns false, and when skip() returns true if invert is set
+
+static bool skip_by_timestamp( boost::posix_time::ptime timestamp )
 {
     static boost::posix_time::ptime next_time = timestamp;
     if( timestamp <= next_time ) { return true; }
@@ -164,6 +166,8 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         bool binary = options.exists( "--size,-s,--binary,-b" );
         deterministic = options.exists( "--deterministic,-d" );
+        invert = options.exists( "--invert,-i" );
+        seed = options.optional< comma::uint32 >( "--seed" );
         if( options.exists( "--period" )) { period = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--period" ) * 1000000 )); }
         #ifdef WIN32
         if( binary ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
@@ -177,7 +181,7 @@ int main( int ac, char** av )
             {
                 const timestamped* p = istream.read();
                 if( !p ) { break; }
-                if( ignore_by_timestamp( p->timestamp ) ) { continue; }
+                if( skip_by_timestamp( p->timestamp ) != invert ) { continue; }
                 if( istream.is_binary()) { std::cout.write( istream.binary().last(), istream.binary().size() ); }
                 else { std::cout << comma::join( istream.ascii().last(), istream.ascii().ascii().delimiter() )<< std::endl; }
             }
@@ -191,7 +195,6 @@ int main( int ac, char** av )
             rate = boost::lexical_cast< double >( v[0] );
             if( comma::math::less( rate, 0 ) || comma::math::less( 1, rate ) ) { std::cerr << "csv-thin: expected rate between 0 and 1, got " << rate << std::endl; usage(); }
         }
-
         if( binary ) // quick and dirty, improve performance by reading larger buffer
         {
             std::size_t size = options.value( "--size,-s", 0u );
@@ -213,8 +216,8 @@ int main( int ac, char** av )
                 //std::size_t e = available < int( size ) ? size : available - available % size;
                 std::cin.read( &buf[0], size ); // quick and dirty
                 if( std::cin.gcount() <= 0 ) { break; }
-                if( std::cin.gcount() < int( size ) ) { std::cerr << "csv-thin: expected " << size << " bytes; got only " << std::cin.gcount() << std::endl; exit( 1 ); }
-                { if( !ignore() ) { std::cout.write( &buf[0], size ); std::cout.flush(); } }
+                if( std::cin.gcount() < int( size ) ) { std::cerr << "csv-thin: expected " << size << " bytes; got only " << std::cin.gcount() << std::endl; return 1; }
+                if( keep() ) { std::cout.write( &buf[0], size ); std::cout.flush(); }
             }
             #else
             char* cur = &buf[0];
@@ -232,7 +235,7 @@ int main( int ac, char** av )
                 capacity -= count;
                 for( ; offset >= size; cur += size, offset -= size )
                 {
-                    if( !ignore() ) { std::cout.write( cur, size ); }
+                    if( keep() ) { std::cout.write( cur, size ); }
                 }
                 if( capacity == 0 ) { cur = &buf[0]; offset = 0; capacity = buf.size(); }
                 std::cout.flush();
@@ -245,201 +248,12 @@ int main( int ac, char** av )
             while( std::cin.good() && !std::cin.eof() )
             {
                 std::getline( std::cin, line );
-                if( !line.empty() && !ignore() ) { std::cout << line << std::endl; }
+                if( !line.empty() && keep() ) { std::cout << line << std::endl; }
             }
         }
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << "csv-size: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-size: unknown exception" << std::endl; }
-    usage();
+    return 1;
 }
-
-// // This file is part of comma, a generic and flexible library
-// // Copyright (c) 2011 The University of Sydney
-// // All rights reserved.
-// //
-// // Redistribution and use in source and binary forms, with or without
-// // modification, are permitted provided that the following conditions are met:
-// // 1. Redistributions of source code must retain the above copyright
-// //    notice, this list of conditions and the following disclaimer.
-// // 2. Redistributions in binary form must reproduce the above copyright
-// //    notice, this list of conditions and the following disclaimer in the
-// //    documentation and/or other materials provided with the distribution.
-// // 3. All advertising materials mentioning features or use of this software
-// //    must display the following acknowledgement:
-// //    This product includes software developed by the University of Sydney.
-// // 4. Neither the name of the University of Sydney nor the
-// //    names of its contributors may be used to endorse or promote products
-// //    derived from this software without specific prior written permission.
-// //
-// // NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// // GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// // HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// // WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// // MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// // DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// // BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-//
-// /// @author vsevolod vlaskine
-//
-// #ifdef WIN32
-// #include <stdio.h>
-// #include <fcntl.h>
-// #include <io.h>
-// #endif
-//
-// #include <iostream>
-// #include <boost/random/mersenne_twister.hpp>
-// #include <boost/random/uniform_real.hpp>
-// #include <boost/random/variate_generator.hpp>
-// #include <comma/application/command_line_options.h>
-// #include <comma/application/contact_info.h>
-// #include <comma/base/exception.h>
-// #include <comma/base/types.h>
-// #include <comma/io/file_descriptor.h>
-// #include <comma/math/compare.h>
-//
-// using namespace comma;
-//
-// static void usage()
-// {
-//     std::cerr << std::endl;
-//     std::cerr << "Read input data and thin them down by the given percentage;" << std::endl;
-//     std::cerr << "buffer handling optimized for a high-output producer" << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << "Usage: cat full.csv | csv-thin <rate> [<options>] > thinned.csv" << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << "e.g. output 70% of data:  cat full.csv | csv-thin 0.7 > thinned.csv" << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << "<options>" << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << "    --size,-s <size>: if given, data is packets of fixed size" << std::endl;
-//     std::cerr << "                      otherwise data is line-based" << std::endl;
-//     std::cerr << "    --deterministic,-d: if given, input is downsampled by a factor of int(1 / <rate>)." << std::endl;
-//     std::cerr << "                     That is, if <rate> is 0.33, output every third packet." << std::endl;
-//     std::cerr << "                     Default is to output each packet with a probability of <rate>." << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << comma::contact_info << std::endl;
-//     std::cerr << std::endl;
-//     exit( 1 );
-// }
-//
-// static double rate;
-// static bool deterministic;
-// static unsigned long long count_size;
-//
-// static bool ignore()
-// {
-//     if( deterministic )
-//     {
-//         static unsigned long long count = count_size - 1;
-//         if( ++count == count_size ) { count = 0; }
-//         if(rate<0.5)
-//         {
-//             return count != 0;
-//         }
-//         else
-//         {
-//             return count == 0;
-//         }
-//     }
-//     static boost::mt19937 rng;
-//     static boost::uniform_real<> dist( 0, 1 );
-//     static boost::variate_generator< boost::mt19937&, boost::uniform_real<> > random( rng, dist );
-//     static bool do_ignore = comma::math::less( rate, 1.0 );
-//     return do_ignore && random() > rate;
-//
-// }
-//
-// int main( int ac, char** av )
-// {
-//     try
-//     {
-//         comma::command_line_options options( ac, av );
-//         if( options.exists( "--help,-h" ) || ac == 1 ) { usage(); }
-//         bool binary = options.exists( "--size,-s" );
-//         deterministic = options.exists( "--deterministic,-d" );
-//         std::size_t size = options.value( "--size,-s", 0u );
-//         #ifdef WIN32
-//         if( binary ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
-//         #endif
-//         std::vector< std::string > v = options.unnamed( "--deterministic,-d", "-.*" );
-//         if( v.empty() ) { std::cerr << "csv-thin: please specify rate" << std::endl; usage(); }
-//         rate = boost::lexical_cast< double >( v[0] );
-//         if( comma::math::less( rate, 0 ) || comma::math::less( 1, rate ) ) { std::cerr << "csv-thin: expected rate between 0 and 1, got " << rate << std::endl; usage(); }
-//
-//         if( deterministic )
-//         {
-//             if(rate<0.5)
-//             {
-//                 count_size = static_cast< unsigned long long >( 1.0 / rate );
-//             }
-//             else
-//             {
-//                 count_size = static_cast< unsigned long long >( 1.0 / (1-rate) );
-//             }
-//         }
-//
-//         if( binary ) // quick and dirty, improve performance by reading larger buffer
-//         {
-//             unsigned int factor = 65536 / size; // arbitrary
-//             if( factor == 0 ) { factor = 1; }
-//             std::vector< char > buf( size * factor );
-//             #ifdef WIN32
-//             while( std::cin.good() && !std::cin.eof() )
-//             {
-//                 // it all does not seem to work: in_avail() always returns 0
-//                 //std::streamsize available = std::cin.rdbuf()->in_avail();
-//                 //if( available < 0 ) { continue; }
-//                 //if( available > 0 ) { std::cerr << "available = " << available << std::endl; }
-//                 //std::size_t e = available < int( size ) ? size : available - available % size;
-//                 std::cin.read( &buf[0], size ); // quick and dirty
-//                 if( std::cin.gcount() <= 0 ) { break; }
-//                 if( std::cin.gcount() < int( size ) ) { std::cerr << "csv-thin: expected " << size << " bytes; got only " << std::cin.gcount() << std::endl; exit( 1 ); }
-//                 { if( !ignore() ) { std::cout.write( &buf[0], size ); std::cout.flush(); } }
-//             }
-//             #else
-//             char* cur = &buf[0];
-//             unsigned int offset = 0;
-//             unsigned int capacity = buf.size();
-//             while( std::cin.good() && !std::cin.eof() )
-//             {
-//                 int count = ::read( comma::io::stdin_fd, cur + offset, capacity );
-//                 if( count <= 0 )
-//                 {
-//                     if( offset != 0 ) { std::cerr << "csv-thin: expected at least " << size << " bytes, got only " << offset << std::endl; return 1; }
-//                     break;
-//                 }
-//                 offset += count;
-//                 capacity -= count;
-//                 for( ; offset >= size; cur += size, offset -= size )
-//                 {
-//                     if( !ignore() ) { std::cout.write( cur, size ); }
-//                 }
-//                 if( capacity == 0 ) { cur = &buf[0]; offset = 0; capacity = buf.size(); }
-//                 std::cout.flush();
-//             }
-//             #endif
-//         }
-//         else
-//         {
-//             std::string line;
-//             while( std::cin.good() && !std::cin.eof() )
-//             {
-//                 std::getline( std::cin, line );
-//                 if( !line.empty() && !ignore() ) { std::cout << line << std::endl; }
-//             }
-//         }
-//         return 0;
-//     }
-//     catch( std::exception& ex ) { std::cerr << "csv-size: " << ex.what() << std::endl; }
-//     catch( ... ) { std::cerr << "csv-size: unknown exception" << std::endl; }
-//     usage();
-// }
diff --git a/csv/test/csv-thin/expected b/csv/test/csv-thin/expected
new file mode 100644
index 000000000..176eff035
--- /dev/null
+++ b/csv/test/csv-thin/expected
@@ -0,0 +1,4 @@
+random/deterministic[0]/output="1,3,5,7,9,"
+random/deterministic[0]/status=0
+random/inverted[0]/output="1,2,3,4,5,6,7,8,9,10,"
+random/inverted[0]/status=0
diff --git a/csv/test/csv-thin/input b/csv/test/csv-thin/input
new file mode 100644
index 000000000..b3d4aa61c
--- /dev/null
+++ b/csv/test/csv-thin/input
@@ -0,0 +1,2 @@
+random/deterministic[0]="seq 10 | csv-thin 0.5 --invert --deterministic | tr '\\\n' ','"
+random/inverted[0]="( seq 10 | csv-thin 0.5; seq 10 | csv-thin 0.5 --invert ) | csv-sort --fields i | tr '\\\n' ','"

From c806f3885178f5e504fa1e638b8a8bedfcc33c14 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 10 May 2019 23:51:09 +1000
Subject: [PATCH 0026/1056] packed: more signed int tests added

---
 packed/test/packed_test.cpp | 21 +++++++++++++++++++++
 1 file changed, 21 insertions(+)

diff --git a/packed/test/packed_test.cpp b/packed/test/packed_test.cpp
index 5ee680ff6..4509a38d2 100644
--- a/packed/test/packed_test.cpp
+++ b/packed/test/packed_test.cpp
@@ -81,7 +81,10 @@ template < typename T > static void test_packed_int( comma::int64 value )
     EXPECT_EQ( true, t == 0 );
     t = value;
     EXPECT_EQ( true, t == value );
+    std::cerr << "-------------------------------------------------" << std::endl;
+    std::cerr << "--> a: value: " << value << " t: " << t() << std::endl;
     EXPECT_EQ( value, t() );
+    std::cerr << "-------------------------------------------------" << std::endl;
 }
 
 template < typename T > static void test_packed_uint( comma::uint64 value )
@@ -90,7 +93,10 @@ template < typename T > static void test_packed_uint( comma::uint64 value )
     EXPECT_EQ( true, t == 0 );
     t = value;
     EXPECT_EQ( true, t == value );
+    std::cerr << "-------------------------------------------------" << std::endl;
+    std::cerr << "--> b: value: " << value << " t: " << t() << std::endl;
     EXPECT_EQ( value, t() );
+    std::cerr << "-------------------------------------------------" << std::endl;
 }
 
 TEST( test_packed_struct_test, test_little_endian )
@@ -106,12 +112,24 @@ TEST( test_packed_struct_test, test_little_endian )
     test_packed_uint< comma::packed::little_endian::uint64 >( comma::uint64( 0x1BCDEF1213141500ULL ) );
 
     test_packed_int< comma::packed::little_endian::int16 >( 1234 );
+    test_packed_int< comma::packed::little_endian::int16 >( 256 * 128 - 1 );
+    test_packed_int< comma::packed::little_endian::int16 >( 0 );
+    test_packed_int< comma::packed::little_endian::int16 >( -1 );
+    test_packed_int< comma::packed::little_endian::int16 >( -2 );
+    test_packed_int< comma::packed::little_endian::int16 >( -256 * 128 + 1 );
+    //for( comma::int16 i = 256 * 128 - 1; i > 0; --i ) { test_packed_uint< comma::packed::little_endian::int16 >( i ); }
+    //for( comma::int16 i = 256 * 128 - 1; i > 0; --i ) { test_packed_int< comma::packed::little_endian::int16 >( -i ); }
     test_packed_int< comma::packed::little_endian::int24 >( 1235 );
     test_packed_int< comma::packed::little_endian::int24 >( 8388607 );
     test_packed_int< comma::packed::little_endian::int32 >( 8388607 );
     test_packed_int< comma::packed::little_endian::int32 >( 1236 );
     test_packed_int< comma::packed::little_endian::int16 >( -1231 );
+    test_packed_int< comma::packed::little_endian::int24 >( -1 );
+    test_packed_int< comma::packed::little_endian::int24 >( -2 );
+    test_packed_int< comma::packed::little_endian::int24 >( -256 );
     test_packed_int< comma::packed::little_endian::int24 >( -1232 );
+    //for( unsigned int i = 0; i < 8388608; ++i ) { test_packed_int< comma::packed::little_endian::int24 >( -i ); }
+    test_packed_int< comma::packed::little_endian::int24 >( -1000000 );
     test_packed_int< comma::packed::little_endian::int24 >( -8388608 );
     test_packed_int< comma::packed::little_endian::int32 >( -1233 );
     test_packed_int< comma::packed::little_endian::int64 >( -4321 );
@@ -130,7 +148,10 @@ TEST( test_packed_struct_test, test_big_endian )
     test_packed_int< comma::packed::big_endian::int32 >( 1234 );
     test_packed_int< comma::packed::big_endian::int16 >( -1234 );
     test_packed_int< comma::packed::big_endian::int32 >( -1234 );
+    test_packed_int< comma::packed::big_endian::int24 >( -1 );
+    test_packed_int< comma::packed::big_endian::int24 >( -2 );
     test_packed_int< comma::packed::big_endian::int24 >( -1232 );
+    test_packed_int< comma::packed::big_endian::int24 >( -8388607 );
     test_packed_int< comma::packed::big_endian::int24 >( -8388608 );
 }
 

From c698148e2fb165172fb114af7579a09412669031 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 20 May 2019 12:01:37 +1000
Subject: [PATCH 0027/1056] csv-shape: repeat operation implemented

---
 csv/applications/csv-shape.cpp     | 52 ++++++++++++++++++++++--------
 csv/test/csv-shape/repeat/expected | 17 ++++++++++
 csv/test/csv-shape/repeat/input    |  2 ++
 3 files changed, 57 insertions(+), 14 deletions(-)
 create mode 100644 csv/test/csv-shape/repeat/expected
 create mode 100644 csv/test/csv-shape/repeat/input

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index 5218d03af..bae53b53d 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -50,6 +50,7 @@ static void usage( bool verbose=false )
     std::cerr << "    loop:        same as concatenate, but with an additional last record:" << std::endl;
     std::cerr << "                 last input record concatenated with the first record (hence, 'loop')" << std::endl;
     std::cerr << "                 this mode always uses the sliding window for overlapping groups" << std::endl;
+    std::cerr << "    repeat:      repeat input given number of times, e.g. csv-shape repeat --size 5" << std::endl;
     std::cerr << std::endl;
     std::cerr << "Usage: cat data.csv | csv-shape <operation> [<options>]" << std::endl;
     std::cerr << std::endl;
@@ -109,11 +110,11 @@ static void simple_binary_pass_through(const comma::csv::format& f, bool flush=f
 
 bool is_binary;
 
-class concatenate_impl_
+class concatenate_
 {
 public:
 
-    concatenate_impl_() 
+    concatenate_() 
         : use_sliding_window_(false)
         , bidirectional_(false)
         , reverse_(false)
@@ -139,7 +140,7 @@ class concatenate_impl_
         if( size_ < 2 ) { std::cerr <<  comma::verbose.app_name() << ": expected --size,-n= value to be greater than 1" << std::endl; return 1; }
         expected_records_ = step_ * ( size_ - 1 ) + 1;
         if( options.exists("--expected-records") ) { std::cout << expected_records_ << std::endl; return 0; };
-        comma::csv::input_stream< input_t > istream(std::cin, csv);
+        comma::csv::input_stream< input_t > istream( std::cin, csv );
         std::deque< std::string > deque;
         std::deque< std::string > first;
         bool has_block_ = csv.has_field( "block" );
@@ -169,12 +170,9 @@ class concatenate_impl_
         return 0;
     }
 
-    struct input_t {
-        comma::uint32 block = 0;
-    };
+    struct input_t { comma::uint32 block = 0; };
 
 private:
-
     bool use_sliding_window_;
     bool bidirectional_;
     bool reverse_;
@@ -234,14 +232,42 @@ class concatenate_impl_
 
 namespace comma { namespace visiting {
 
-template <> struct traits< concatenate_impl_::input_t >
+template <> struct traits< concatenate_::input_t >
 {
-    template < typename K, typename V > static void visit( const K&, const concatenate_impl_::input_t& p, V& v ) { v.apply("block", p.block); }
-    template < typename K, typename V > static void visit( const K&, concatenate_impl_::input_t& p, V& v ) { v.apply("block", p.block); }
+    template < typename K, typename V > static void visit( const K&, const concatenate_::input_t& p, V& v ) { v.apply("block", p.block); }
+    template < typename K, typename V > static void visit( const K&, concatenate_::input_t& p, V& v ) { v.apply("block", p.block); }
 };
 
 } } // namespace comma { namespace visiting {
 
+// repeat operation: write each input record to stdout --size,-n times in a row
+// ascii input is copied line by line, lines that are empty after stripping are skipped; binary input is copied record by record
+static int repeat_( const comma::command_line_options& options, const comma::csv::options& csv )
+{
+    const unsigned int repetitions = options.value< unsigned int >( "--size,-n" );
+    if( !csv.binary() )
+    {
+        while( std::cin.good() && !std::cin.eof() ) // ascii: plain text copy, no csv parsing involved
+        {
+            std::string text;
+            std::getline( std::cin, text );
+            if( !comma::strip( text ).empty() ) { for( unsigned int k = 0; k < repetitions; ++k ) { std::cout << text << std::endl; } }
+        }
+        return 0;
+    }
+    // binary: the csv stream is used only to pull records one at a time; presumably binary().last() is the raw buffer of the record just read
+    using record_t = concatenate_::input_t; // quick and dirty: borrow the record type of concatenate
+    comma::csv::input_stream< record_t > records( std::cin, csv );
+    const auto record_size = csv.format().size();
+    while( records.ready() || ( std::cin.good() && !std::cin.eof() ) )
+    {
+        if( !records.read() ) { break; }
+        for( unsigned int k = 0; k < repetitions; ++k ) { std::cout.write( records.binary().last(), record_size ); }
+        if( csv.flush ) { std::cout.flush(); }
+    }
+    return 0;
+}
+
 int main( int ac, char** av )
 {
     try
@@ -254,10 +280,8 @@ int main( int ac, char** av )
         is_binary = csv.binary();
         if( unnamed.empty() ) { std::cerr << comma::verbose.app_name() << ": please specify operations" << std::endl; exit( 1 ); }
         std::string operation = unnamed[0];
-        if( operation == "concatenate" || operation == "loop" )
-        {
-            return concatenate_impl_().run(options, csv);
-        }
+        if( operation == "concatenate" || operation == "loop" ) { return concatenate_().run(options, csv); }
+        if( operation == "repeat" ) { return repeat_( options, csv ); }
         std::cerr << comma::verbose.app_name() << ": operation not supported or unknown: '" << operation << '\'' << std::endl;
         return 1;
     }
diff --git a/csv/test/csv-shape/repeat/expected b/csv/test/csv-shape/repeat/expected
new file mode 100644
index 000000000..972463d6e
--- /dev/null
+++ b/csv/test/csv-shape/repeat/expected
@@ -0,0 +1,17 @@
+ascii/output/line[0]="hello"
+ascii/output/line[1]="hello"
+ascii/output/line[2]="hello"
+ascii/output/line[3]="world"
+ascii/output/line[4]="world"
+ascii/output/line[5]="world"
+ascii/status=0
+binary/output/line[0]="1"
+binary/output/line[1]="1"
+binary/output/line[2]="1"
+binary/output/line[3]="2"
+binary/output/line[4]="2"
+binary/output/line[5]="2"
+binary/output/line[6]="3"
+binary/output/line[7]="3"
+binary/output/line[8]="3"
+binary/status=0
diff --git a/csv/test/csv-shape/repeat/input b/csv/test/csv-shape/repeat/input
new file mode 100644
index 000000000..9d2e8c57c
--- /dev/null
+++ b/csv/test/csv-shape/repeat/input
@@ -0,0 +1,2 @@
+ascii="( echo hello; echo; echo world ) | csv-shape repeat --size 3"
+binary="( echo 1; echo 2; echo 3 ) | csv-to-bin ui | csv-shape repeat --size 3 --binary ui | csv-from-bin ui"

From 3fb92084f3b7414eabdcab1ca0e807623f9eecbd Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 27 May 2019 18:58:12 +1000
Subject: [PATCH 0028/1056] csv-interval: minor refactoring

---
 csv/applications/csv-interval.cpp | 13 +++++++++----
 1 file changed, 9 insertions(+), 4 deletions(-)

diff --git a/csv/applications/csv-interval.cpp b/csv/applications/csv-interval.cpp
index 338eaee1b..6c538c608 100644
--- a/csv/applications/csv-interval.cpp
+++ b/csv/applications/csv-interval.cpp
@@ -394,9 +394,9 @@ struct intervals
         }
     }
 
-    void run()
+    void read( std::istream& is = std::cin )
     {
-        comma::csv::input_stream< interval_t< From, To > > istream( std::cin, csv );
+        comma::csv::input_stream< interval_t< From, To > > istream( is, csv );
         comma::csv::ascii< interval_t< std::string > > ascii( csv.fields );
         if( !first_line.empty() )
         {
@@ -413,7 +413,7 @@ struct intervals
             if( verbose ) { std::cerr << app_name << ": from: " << from << " to: " << to << " payload: " << payload << std::endl; }
             add( from, to, payload );
         }
-        while( istream.ready() || std::cin.good()  )
+        while( istream.ready() || is.good()  )
         {
             const interval_t< From, To >* interval = istream.read();
             if( !interval ) { break; }
@@ -441,7 +441,12 @@ struct intervals
             if( verbose ) { std::cerr << app_name << ": from: " << from << " to: " << to << " payload: " << ( csv.binary() ? "<binary>" : payload ) << std::endl; }
             add( from, to, payload );
         }
-        write();
+    }
+
+    void run()
+    {
+        this->read();
+        this->write();
     }
 };
 

From d900b93289372ee48503bac3562cc67e2268cadb Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 28 May 2019 12:56:07 +1000
Subject: [PATCH 0029/1056] csv-interval: more refactoring

---
 csv/applications/csv-interval.cpp | 164 ++++++++++++++----------------
 1 file changed, 76 insertions(+), 88 deletions(-)

diff --git a/csv/applications/csv-interval.cpp b/csv/applications/csv-interval.cpp
index 6c538c608..41a54a662 100644
--- a/csv/applications/csv-interval.cpp
+++ b/csv/applications/csv-interval.cpp
@@ -34,6 +34,7 @@
 #include <limits>
 #include <set>
 #include <string>
+#include <tuple>
 #include <boost/icl/interval.hpp>
 #include <boost/icl/interval_map.hpp>
 #include "../../application/command_line_options.h"
@@ -46,7 +47,6 @@ static const std::string app_name = "csv-interval";
 
 static bool verbose;
 static bool debug;
-static std::string first_line;
 static bool append;
 
 template < typename T > struct limits
@@ -102,9 +102,9 @@ static void usage( bool verbose = false )
     // std::cerr << "    --input-format: print input format and exit" << std::endl;
     std::cerr << "    --output-fields: print output fields and exit" << std::endl;
     // std::cerr << "    --output-format: print output format and exit" << std::endl;
-    std::cerr << "    --empty: empty value used to signify unbounded intervals" << std::endl;
+    std::cerr << "    --empty=[<empty-value>]: empty value used to signify unbounded intervals" << std::endl;
     std::cerr << "             default for time is \"not-a-date-time\"" << std::endl;
-    std::cerr << "    --format: input format (ascii only), also affects the --limits option; if not given the format is guessed" << std::endl;
+    std::cerr << "    --format=[<format>]: input format (ascii only), also affects the --limits option; if not given the format is guessed" << std::endl;
     std::cerr << "    --intervals-only: only output the intervals, ignore payload if any" << std::endl;
     std::cerr << "    --limits,-l: replace empty bounds with type limits" << std::endl;
     std::cerr << "                 b  : " << (int)limits< char >::lowest() << " " << (int)limits< char >::max() << std::endl;
@@ -295,6 +295,7 @@ struct intervals
                                                             , intervals_only( options.exists( "--intervals-only" ) )
                                                             , use_limits( options.exists( "--limits,-l" ) )
     {
+        csv.full_xpath = false;
         if( csv.fields.empty() ) { csv.fields = comma::join( comma::csv::names< interval_t< From, To > >(), ',' ); }
         if( ocsv.fields.empty() || intervals_only )
         {
@@ -394,7 +395,7 @@ struct intervals
         }
     }
 
-    void read( std::istream& is = std::cin )
+    void read( std::istream& is, const std::string& first_line ) // preparing for adding operations
     {
         comma::csv::input_stream< interval_t< From, To > > istream( is, csv );
         comma::csv::ascii< interval_t< std::string > > ascii( csv.fields );
@@ -443,107 +444,94 @@ struct intervals
         }
     }
 
-    void run()
+    void make( const std::string& first_line )
     {
-        this->read();
+        this->read( std::cin, first_line );
         this->write();
     }
 };
 
-// template < typename From > static void run( const comma::command_line_options& options, const comma::csv::format::types_enum to_type )
-// {
-//     switch( to_type )
-//     {
-//         case comma::csv::format::int8:          intervals< From, char >( options ).run(); break;
-//         case comma::csv::format::uint8:         intervals< From, unsigned char >( options ).run(); break;
-//         case comma::csv::format::int16:         intervals< From, comma::int16 >( options ).run(); break;
-//         case comma::csv::format::uint16:        intervals< From, comma::uint16 >( options ).run(); break;
-//         case comma::csv::format::int32:         intervals< From, comma::int32 >( options ).run(); break;
-//         case comma::csv::format::uint32:        intervals< From, comma::uint32 >( options ).run(); break;
-//         case comma::csv::format::int64:         intervals< From, comma::int64 >( options ).run(); break;
-//         case comma::csv::format::uint64:        intervals< From, comma::uint64 >( options ).run(); break;
-//         case comma::csv::format::char_t:        intervals< From, char >( options ).run(); break;
-//         case comma::csv::format::float_t:       intervals< From, float >( options ).run(); break;
-//         case comma::csv::format::double_t:      intervals< From, double >( options ).run(); break;
-//         default:                                COMMA_THROW( comma::exception, "from/to type mismatch" ); break;
-//     }
-// }
+// determine the common type of the from/to fields; csv is taken by value since its fields, full_xpath, and format are adjusted locally
+// for ascii input with empty format, the format is guessed from the first non-empty line of is, which is returned alongside the type
+// throws comma::exception on missing from/to fields or time/string mismatch; exits on empty ascii input ( 0 ) or other from/to type difference ( 1 )
+static std::tuple< comma::csv::format::types_enum, std::string > interval_type( std::istream& is, comma::csv::options csv, const std::string& format )
+{
+    if( csv.fields.empty() ) { csv.fields = comma::join( comma::csv::names< interval_t< double > >(), ',' ); }
+    if( !csv.has_field( "from,to" ) ) { COMMA_THROW( comma::exception, "expected from and to fields" ); }
+    std::string first_line;
+    csv.full_xpath = false;
+    if( !csv.binary() )
+    {
+        if( format.empty() )
+        {
+            while( is.good() && first_line.empty() ) { std::getline( is, first_line ); } // check the stream we actually read from, not std::cin
+            if( first_line.empty() ) { exit( 0 ); } // quick and dirty
+            csv.format( comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter ) );
+            if( verbose ) { std::cerr << app_name << ": guessed format: " << csv.format().string() << std::endl; }
+        }
+        else { csv.format( format ); }
+    }
+    const std::vector< std::string >& fields = comma::split( csv.fields, ',' );
+    unsigned int from_index = 0;
+    unsigned int to_index = 1;
+    for( unsigned int i = 0; i < fields.size(); ++i ) { if( fields[i] == "from" ) { from_index = i; break; } }
+    for( unsigned int i = 0; i < fields.size(); ++i ) { if( fields[i] == "to" ) { to_index = i; break; } }
+    const comma::csv::format::types_enum from_type = csv.format().offset( from_index ).type;
+    const comma::csv::format::types_enum to_type = csv.format().offset( to_index ).type;
+    const bool from_is_time = from_type == comma::csv::format::time || from_type == comma::csv::format::long_time;
+    const bool to_is_time = to_type == comma::csv::format::time || to_type == comma::csv::format::long_time;
+    if( from_is_time != to_is_time ) { COMMA_THROW( comma::exception, "from/to type mismatch; time" ); } // exactly one of the bounds is time
+    if( ( from_type == comma::csv::format::fixed_string || to_type == comma::csv::format::fixed_string ) && from_type != to_type )
+    { COMMA_THROW( comma::exception, "from/to type mismatch; string" ); }
+    if( from_type != to_type ) { std::cerr << app_name << ": support only from and to of the same type, got from: " << comma::csv::format::to_format( from_type ) << ", to: " << comma::csv::format::to_format( to_type ) << std::endl; exit( 1 ); }
+    return std::make_tuple( to_type, first_line );
+}
 
 int main( int ac, char** av )
 {
     try
     {
-        comma::command_line_options options( ac, av );
+        comma::command_line_options options( ac, av, usage );
         verbose = options.exists( "--verbose,-v" );
         debug = options.exists( "--debug" );
-        append = options.exists( "--append,-a" );
-        if( options.exists( "--help,-h" ) ) { usage( verbose ); }
-        if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
-        if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
-        comma::csv::options csv( options );
-        csv.full_xpath = false;
-        if( csv.fields.empty() ) { csv.fields = comma::join( comma::csv::names< interval_t< double > >(), ',' ); }
-        if( !csv.has_field( "from,to" ) ) { COMMA_THROW( comma::exception, "expected from and to fields" ); }
         options.assert_mutually_exclusive( "--binary,--format" );
-        if( options.exists( "--binary,-b" ) ) {}
-        else if( options.exists( "--format" ) ) { csv.format( options.value< std::string >( "--format" ) ); }
-        else
+        const auto& unnamed = options.unnamed( "--append,-a,--debug,--flush,--input-fields,--output-fields,--intervals-only,--limits,-l", "-.*" );
+        std::string operation = unnamed.empty() ? "make" : unnamed[0];
+        if( operation == "make" )
         {
-            while( std::cin.good() && first_line.empty() ) { std::getline( std::cin, first_line ); }
-            if( first_line.empty() ) { return 0; }
-            csv.format( comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter ) );
-            if( verbose ) { std::cerr << app_name << ": guessed format: " << csv.format().string() << std::endl;; }
+            append = options.exists( "--append,-a" );
+            if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
+            if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
+            comma::csv::options csv( options );
+            auto t = interval_type( std::cin, comma::csv::options( options ), options.value< std::string >( "--format,-f", "" ) );
+            const comma::csv::format::types_enum to_type = std::get< 0 >( t );
+            std::string first_line = std::get< 1 >( t );
+            switch( to_type )
+            {
+                case comma::csv::format::int8:          intervals< char >( options ).make( first_line ); break;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options ).make( first_line ); break;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options ).make( first_line ); break;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).make( first_line ); break;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options ).make( first_line ); break;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).make( first_line ); break;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options ).make( first_line ); break;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).make( first_line ); break;
+                case comma::csv::format::char_t:        intervals< char >( options ).make( first_line ); break;
+                case comma::csv::format::float_t:       intervals< float >( options ).make( first_line ); break;
+                case comma::csv::format::double_t:      intervals< double >( options ).make( first_line ); break;
+                case comma::csv::format::time:
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).make( first_line ); break;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options ).make( first_line ); break;            
+                default:                                COMMA_THROW( comma::exception, "invalid type" ); break; // never here
+            }
+            return 0;
         }
-        const std::vector< std::string >& fields = comma::split( csv.fields, ',' );
-        unsigned int from_index = 0;
-        unsigned int to_index = 1;
-        for( unsigned int i = 0; i < fields.size(); ++i ) { if( fields[i] == "from" ) { from_index = i; break; } }
-        for( unsigned int i = 0; i < fields.size(); ++i ) { if( fields[i] == "to" ) { to_index = i; break; } }
-        const comma::csv::format::types_enum from_type = csv.format().offset( from_index ).type;
-        const comma::csv::format::types_enum to_type = csv.format().offset( to_index ).type;
-        if( ( ( from_type == comma::csv::format::time || from_type == comma::csv::format::long_time ) && ( to_type != comma::csv::format::time && to_type != comma::csv::format::long_time ) ) ||
-          ( ( ( from_type != comma::csv::format::time && from_type != comma::csv::format::long_time ) && ( to_type == comma::csv::format::time || to_type == comma::csv::format::long_time ) ) ) )
-        { COMMA_THROW( comma::exception, "from/to type mismatch; time" ); }
-        if( ( from_type == comma::csv::format::fixed_string || to_type == comma::csv::format::fixed_string ) && from_type != to_type )
-        { COMMA_THROW( comma::exception, "from/to type mismatch; string" ); }
-//         switch( from_type )
-//         {
-//             case comma::csv::format::int8:          run< char >( options, to_type ); break;
-//             case comma::csv::format::uint8:         run< unsigned char >( options, to_type ); break;
-//             case comma::csv::format::int16:         run< comma::int16 >( options, to_type ); break;
-//             case comma::csv::format::uint16:        run< comma::uint16 >( options, to_type ); break;
-//             case comma::csv::format::int32:         run< comma::int32 >( options, to_type ); break;
-//             case comma::csv::format::uint32:        run< comma::uint32 >( options, to_type ); break;
-//             case comma::csv::format::int64:         run< comma::int64 >( options, to_type ); break;
-//             case comma::csv::format::uint64:        run< comma::uint64 >( options, to_type ); break;
-//             case comma::csv::format::char_t:        run< char >( options, to_type ); break;
-//             case comma::csv::format::float_t:       run< float >( options, to_type ); break;
-//             case comma::csv::format::double_t:      run< double >( options, to_type ); break;
-//             case comma::csv::format::time:
-//             case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).run(); break;
-//             case comma::csv::format::fixed_string:  intervals< std::string >( options ).run(); break;
-//             default:                                COMMA_THROW( comma::exception, "unknown type" ); break;
-//         }
-        if( from_type != to_type ) { std::cerr << app_name << ": support only from and to of the same type, got from: " << comma::csv::format::to_format( from_type ) << ", to: " << comma::csv::format::to_format( to_type ) << std::endl; return 1; }
-        switch( to_type )
+        if( operation == "select" )
         {
-            case comma::csv::format::int8:          intervals< char >( options ).run(); break;
-            case comma::csv::format::uint8:         intervals< unsigned char >( options ).run(); break;
-            case comma::csv::format::int16:         intervals< comma::int16 >( options ).run(); break;
-            case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).run(); break;
-            case comma::csv::format::int32:         intervals< comma::int32 >( options ).run(); break;
-            case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).run(); break;
-            case comma::csv::format::int64:         intervals< comma::int64 >( options ).run(); break;
-            case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).run(); break;
-            case comma::csv::format::char_t:        intervals< char >( options ).run(); break;
-            case comma::csv::format::float_t:       intervals< float >( options ).run(); break;
-            case comma::csv::format::double_t:      intervals< double >( options ).run(); break;
-            case comma::csv::format::time:
-            case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).run(); break;
-            case comma::csv::format::fixed_string:  intervals< std::string >( options ).run(); break;            
-            default:                                COMMA_THROW( comma::exception, "from/to type mismatch" ); break;
+            std::cerr << "csv-interval: select: todo" << std::endl;
+            return 1;
         }
-        return 0;
+        std::cerr << "csv-interval: expected operation, got: '" << operation << "'" << std::endl;
     }
     catch( std::exception& ex ) { std::cerr << app_name << ": " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << app_name << ": unknown exception" << std::endl; }

From 02be391168c9eff33a2af4ffcf25512aac123820 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 28 May 2019 13:53:02 +1000
Subject: [PATCH 0030/1056] csv-interval: select operation: implementing...

---
 csv/applications/csv-interval.cpp | 71 ++++++++++++++++++++++++-------
 1 file changed, 55 insertions(+), 16 deletions(-)

diff --git a/csv/applications/csv-interval.cpp b/csv/applications/csv-interval.cpp
index 41a54a662..50c71bb81 100644
--- a/csv/applications/csv-interval.cpp
+++ b/csv/applications/csv-interval.cpp
@@ -40,8 +40,12 @@
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
-#include "../../visiting/traits.h"
+#include "../../csv/traits.h"
 #include "../../csv/impl/unstructured.h"
+#include "../../io/stream.h"
+#include "../../name_value/map.h"
+#include "../../name_value/parser.h"
+#include "../../visiting/traits.h"
 
 static const std::string app_name = "csv-interval";
 
@@ -444,10 +448,17 @@ struct intervals
         }
     }
 
-    void make( const std::string& first_line )
+    int make( const std::string& first_line )
     {
         this->read( std::cin, first_line );
         this->write();
+        return 0;
+    }
+    
+    int select( const std::string& first_line ) // placeholder: the select operation is not implemented yet
+    {
+        this->read( std::cin, first_line ); // load the intervals from stdin, same first step as in make()
+        std::cerr << "csv-interval select: todo" << std::endl; exit( 1 ); // exit() does not return, hence no return statement
+    }
 };
 
@@ -508,26 +519,54 @@ int main( int ac, char** av )
             std::string first_line = std::get< 1 >( t );
             switch( to_type )
             {
-                case comma::csv::format::int8:          intervals< char >( options ).make( first_line ); break;
-                case comma::csv::format::uint8:         intervals< unsigned char >( options ).make( first_line ); break;
-                case comma::csv::format::int16:         intervals< comma::int16 >( options ).make( first_line ); break;
-                case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).make( first_line ); break;
-                case comma::csv::format::int32:         intervals< comma::int32 >( options ).make( first_line ); break;
-                case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).make( first_line ); break;
-                case comma::csv::format::int64:         intervals< comma::int64 >( options ).make( first_line ); break;
-                case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).make( first_line ); break;
-                case comma::csv::format::char_t:        intervals< char >( options ).make( first_line ); break;
-                case comma::csv::format::float_t:       intervals< float >( options ).make( first_line ); break;
-                case comma::csv::format::double_t:      intervals< double >( options ).make( first_line ); break;
+                case comma::csv::format::int8:          intervals< char >( options ).make( first_line ); return 0;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options ).make( first_line ); return 0;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options ).make( first_line ); return 0;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).make( first_line ); return 0;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options ).make( first_line ); return 0;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).make( first_line ); return 0;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options ).make( first_line ); return 0;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).make( first_line ); return 0;
+                case comma::csv::format::char_t:        intervals< char >( options ).make( first_line ); return 0;
+                case comma::csv::format::float_t:       intervals< float >( options ).make( first_line ); return 0;
+                case comma::csv::format::double_t:      intervals< double >( options ).make( first_line ); return 0;
                 case comma::csv::format::time:
-                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).make( first_line ); break;
-                case comma::csv::format::fixed_string:  intervals< std::string >( options ).make( first_line ); break;            
-                default:                                COMMA_THROW( comma::exception, "invalid type" ); break; // never here
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).make( first_line ); return 0;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options ).make( first_line ); return 0;            
+                default:                                COMMA_THROW( comma::exception, "invalid type" ); return 0; // never here
             }
             return 0;
         }
         if( operation == "select" )
         {
+            // todo
+            //if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
+            //if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
+            auto i = options.value< std::string >( "--intervals" );
+            comma::csv::options csv = comma::name_value::parser().get< comma::csv::options >( i );
+            std::string format = comma::name_value::map( i ).value< std::string >( "format", "" );
+            comma::io::istream is( csv.filename );
+            auto t = interval_type( *is, csv, format );
+            const comma::csv::format::types_enum to_type = std::get< 0 >( t );
+            std::string first_line = std::get< 1 >( t );
+            switch( to_type )
+            {
+                case comma::csv::format::int8:          intervals< char >( options ).select( first_line ); return 0;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options ).select( first_line ); return 0;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options ).select( first_line ); return 0;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).select( first_line ); return 0;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options ).select( first_line ); return 0;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).select( first_line ); return 0;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options ).select( first_line ); return 0;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).select( first_line ); return 0;
+                case comma::csv::format::char_t:        intervals< char >( options ).select( first_line ); return 0;
+                case comma::csv::format::float_t:       intervals< float >( options ).select( first_line ); return 0;
+                case comma::csv::format::double_t:      intervals< double >( options ).select( first_line ); return 0;
+                case comma::csv::format::time:
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).select( first_line ); return 0;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options ).select( first_line ); return 0;            
+                default:                                COMMA_THROW( comma::exception, "invalid type" ); return 0; // never here
+            }
             std::cerr << "csv-interval: select: todo" << std::endl;
             return 1;
         }

From 0bc6759344c0cf84f8e8348f4e3739b3e8635f7d Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 28 May 2019 17:47:23 +1000
Subject: [PATCH 0031/1056] csv-interval: renamed to csv-intervals; operations
 introduced; contain operation implemented

---
 csv/applications/CMakeLists.txt               |   6 +-
 .../{csv-interval.cpp => csv-intervals.cpp}   | 118 ++++++++++++------
 csv/test/csv-interval/ascii/test              |   3 -
 csv/test/csv-interval/overlap-count/input     |  16 ---
 .../append/expected                           |   0
 .../append/input                              |   2 +-
 csv/test/csv-intervals/ascii/test             |   3 +
 .../ascii/test.01/expected                    |   0
 .../ascii/test.01/input                       |   0
 .../ascii/test.01/options                     |   0
 .../ascii/test.02/expected                    |   0
 .../ascii/test.02/input                       |   0
 .../ascii/test.02/options                     |   0
 .../ascii/test.03/expected                    |   0
 .../ascii/test.03/input                       |   0
 .../ascii/test.03/options                     |   0
 .../ascii/test.04/disabled                    |   0
 .../ascii/test.04/expected                    |   0
 .../ascii/test.04/input                       |   0
 .../ascii/test.04/options                     |   0
 .../ascii/test.05/expected                    |   0
 .../ascii/test.05/input                       |   0
 .../ascii/test.05/options                     |   0
 .../ascii/test.06/expected                    |   0
 .../ascii/test.06/input                       |   0
 .../ascii/test.06/options                     |   0
 .../ascii/test.07/expected                    |   0
 .../ascii/test.07/input                       |   0
 .../ascii/test.07/options                     |   0
 .../ascii/test.08/expected                    |   0
 .../ascii/test.08/input                       |   0
 .../ascii/test.08/options                     |   0
 .../ascii/test.09/expected                    |   0
 .../ascii/test.09/input                       |   0
 .../ascii/test.09/options                     |   0
 .../ascii/test.10/expected                    |   0
 .../ascii/test.10/input                       |   0
 .../ascii/test.10/options                     |   0
 .../ascii/test.11/expected                    |   0
 .../ascii/test.11/input                       |   0
 .../ascii/test.11/options                     |   0
 .../binary/test                               |   2 +-
 .../binary/test.01/expected                   |   0
 .../binary/test.01/input                      |   0
 .../binary/test.01/options                    |   0
 .../binary/test.02/expected                   |   0
 .../binary/test.02/input                      |   0
 .../binary/test.02/options                    |   0
 .../binary/test.03/disabled                   |   0
 .../binary/test.03/expected                   |   0
 .../binary/test.03/input                      |   0
 .../binary/test.03/options                    |   0
 .../binary/test.04/disabled                   |   0
 .../binary/test.04/expected                   |   0
 .../binary/test.04/input                      |   0
 .../binary/test.04/options                    |   0
 .../binary/test.05/expected                   |   0
 .../binary/test.05/input                      |   0
 .../binary/test.05/options                    |   0
 .../binary/test.06/expected                   |   0
 .../binary/test.06/input                      |   0
 .../binary/test.06/options                    |   0
 .../binary/test.07/expected                   |   0
 .../binary/test.07/input                      |   0
 .../binary/test.07/options                    |   0
 .../binary/test.08/expected                   |   0
 .../binary/test.08/input                      |   0
 .../binary/test.08/options                    |   0
 .../binary/test.09/expected                   |   0
 .../binary/test.09/input                      |   0
 .../binary/test.09/options                    |   0
 .../overlap-count/expected                    |   0
 csv/test/csv-intervals/overlap-count/input    |  16 +++
 73 files changed, 105 insertions(+), 61 deletions(-)
 rename csv/applications/{csv-interval.cpp => csv-intervals.cpp} (85%)
 delete mode 100755 csv/test/csv-interval/ascii/test
 delete mode 100644 csv/test/csv-interval/overlap-count/input
 rename csv/test/{csv-interval => csv-intervals}/append/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/append/input (79%)
 create mode 100755 csv/test/csv-intervals/ascii/test
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.01/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.01/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.01/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.02/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.02/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.02/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.03/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.03/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.03/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.04/disabled (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.04/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.04/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.04/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.05/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.05/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.05/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.06/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.06/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.06/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.07/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.07/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.07/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.08/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.08/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.08/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.09/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.09/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.09/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.10/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.10/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.10/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.11/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.11/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/ascii/test.11/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test (65%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.01/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.01/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.01/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.02/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.02/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.02/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.03/disabled (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.03/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.03/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.03/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.04/disabled (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.04/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.04/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.04/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.05/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.05/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.05/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.06/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.06/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.06/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.07/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.07/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.07/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.08/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.08/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.08/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.09/expected (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.09/input (100%)
 rename csv/test/{csv-interval => csv-intervals}/binary/test.09/options (100%)
 rename csv/test/{csv-interval => csv-intervals}/overlap-count/expected (100%)
 create mode 100644 csv/test/csv-intervals/overlap-count/input

diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index 7cd1fb6c4..5a76792c2 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -102,9 +102,9 @@ add_executable( csv-enumerate ${dir}/csv-enumerate.cpp )
 target_link_libraries ( csv-enumerate ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
 install( TARGETS csv-enumerate RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
-add_executable( csv-interval ${dir}/csv-interval.cpp )
-target_link_libraries ( csv-interval ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath )
-install( TARGETS csv-interval RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+add_executable( csv-intervals ${dir}/csv-intervals.cpp )
+target_link_libraries ( csv-intervals ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath )
+install( TARGETS csv-intervals RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
          
 add_executable( csv-units ${dir}/csv-units.cpp )
 target_link_libraries ( csv-units ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
diff --git a/csv/applications/csv-interval.cpp b/csv/applications/csv-intervals.cpp
similarity index 85%
rename from csv/applications/csv-interval.cpp
rename to csv/applications/csv-intervals.cpp
index 50c71bb81..dc710ed6a 100644
--- a/csv/applications/csv-interval.cpp
+++ b/csv/applications/csv-intervals.cpp
@@ -30,6 +30,7 @@
 
 /// @author Vinny Do
 
+#include <fstream>
 #include <iostream>
 #include <limits>
 #include <set>
@@ -47,7 +48,7 @@
 #include "../../name_value/parser.h"
 #include "../../visiting/traits.h"
 
-static const std::string app_name = "csv-interval";
+static const std::string app_name = "csv-intervals";
 
 static bool verbose;
 static bool debug;
@@ -95,21 +96,22 @@ static void usage( bool verbose = false )
 {
     std::cerr << "takes csv intervals and separates them at points of overlap if any" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "usage: cat intervals.csv | " << app_name << " [OPTIONS...]" << std::endl;
+    std::cerr << "usage: cat intervals.csv | csv-intervals <operation> [<options>]" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations" << std::endl;
+    std::cerr << "    contain: given a set of intervals, take scalars on stdin, append 1 if contained in the intervals, 0 if not" << std::endl;
+    std::cerr << "    make: make intervals" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: show help; --help --verbose for more help" << std::endl;
     std::cerr << "    --verbose,-v: more info" << std::endl;
-    std::cerr << "    --append,-a: append output intervals instead of outputting them in place" << std::endl;
-    std::cerr << "    --debug: print debug" << std::endl;
+    std::cerr << "    --debug: more debug output" << std::endl;
     std::cerr << "    --input-fields: print input fields and exit" << std::endl;
     // std::cerr << "    --input-format: print input format and exit" << std::endl;
     std::cerr << "    --output-fields: print output fields and exit" << std::endl;
     // std::cerr << "    --output-format: print output format and exit" << std::endl;
     std::cerr << "    --empty=[<empty-value>]: empty value used to signify unbounded intervals" << std::endl;
     std::cerr << "             default for time is \"not-a-date-time\"" << std::endl;
-    std::cerr << "    --format=[<format>]: input format (ascii only), also affects the --limits option; if not given the format is guessed" << std::endl;
-    std::cerr << "    --intervals-only: only output the intervals, ignore payload if any" << std::endl;
     std::cerr << "    --limits,-l: replace empty bounds with type limits" << std::endl;
     std::cerr << "                 b  : " << (int)limits< char >::lowest() << " " << (int)limits< char >::max() << std::endl;
     std::cerr << "                 ub : " << (int)limits< unsigned char >::lowest() << " " << (int)limits< unsigned char >::max() << std::endl;
@@ -125,9 +127,21 @@ static void usage( bool verbose = false )
     std::cerr << "                 s  : \"" << limits< std::string >::lowest() << "\" \"" << limits< std::string >::max() << "\"" << std::endl;
     std::cerr << "                 t  : " << limits< boost::posix_time::ptime >::lowest() << " " << limits< boost::posix_time::ptime >::max() << std::endl;
     std::cerr << "                 lt : " << limits< boost::posix_time::ptime >::lowest() << " " << limits< boost::posix_time::ptime >::max() << std::endl;
-    std::cerr << "    --overlap-count=[<count>]; output only intervals with <count> overlaps" << std::endl;
-    std::cerr << "    --overlap-count-min,--min-overlap-count=[<count>]; output only intervals with at least <count> overlaps" << std::endl;
-    std::cerr << "    --overlap-count-max,--max-overlap-count=[<count>]; output only intervals with not more than <count> overlaps" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operation details" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    contain" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --intervals=<filename>: file or stream name" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    make" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --append,-a: append output intervals instead of outputting them in place" << std::endl;
+    std::cerr << "            --format=[<format>]: input format (ascii only), also affects the --limits option; if not given the format is guessed" << std::endl;
+    std::cerr << "            --intervals-only: only output the intervals, ignore payload if any" << std::endl;    
+    std::cerr << "            --overlap-count=[<count>]; output only intervals with <count> overlaps" << std::endl;
+    std::cerr << "            --overlap-count-min,--min-overlap-count=[<count>]; output only intervals with at least <count> overlaps" << std::endl;
+    std::cerr << "            --overlap-count-max,--max-overlap-count=[<count>]; output only intervals with not more than <count> overlaps" << std::endl;
     std::cerr << std::endl;
     std::cerr << "ascii notes" << std::endl;
     std::cerr << "    unbounded intervals may be indicated by no value (e.g. ,3 \u2261 -\u221e,3), both sides unbounded is also supported" << std::endl;
@@ -252,6 +266,13 @@ struct interval_t
     to_t< To > to;
 };
 
+template < typename T > struct scalar_t
+{ 
+    T scalar;
+    scalar_t() {}
+    scalar_t( const T& t ): scalar( t ) {}
+};
+
 namespace comma { namespace visiting {
 
 template < typename T > struct traits< from_t< T > >
@@ -272,6 +293,12 @@ template < typename From, typename To > struct traits< interval_t< From, To > >
     template < typename K, typename V > static void visit( const K&, const interval_t< From, To >& p, V& v ) { v.apply( "", p.from ); v.apply( "", p.to ); }
 };
 
+template < typename T > struct traits< scalar_t< T > >
+{
+    template < typename K, typename V > static void visit( const K&, scalar_t< T >& p, V& v ) { v.apply( "scalar", p.scalar ); }
+    template < typename K, typename V > static void visit( const K&, const scalar_t< T >& p, V& v ) { v.apply( "scalar", p.scalar ); }
+};
+
 } } // namespace comma { namespace visiting {
 
 template < typename From, typename To = From >
@@ -455,10 +482,29 @@ struct intervals
         return 0;
     }
     
-    int select( const std::string& first_line )
+    int contain( std::istream& is, const std::string& first_line )
     {
-        this->read( std::cin, first_line );
-        std::cerr << "csv-interval select: todo" << std::endl; exit( 1 );
+        comma::csv::options icsv( options, "", false );
+        comma::csv::input_stream< scalar_t< From > > istream( std::cin, icsv );
+        comma::csv::output_stream< scalar_t< bool > > ostream( std::cout, icsv.binary() );
+        auto tied = comma::csv::make_tied( istream, ostream );
+        this->read( is, first_line ); // todo: support block
+        while( istream.ready() || std::cin.good() )
+        {
+            auto p = istream.read();
+            if( !p ) { break; }
+            bool contained = false; // todo? use boost::...::query
+            for( typename map_t::iterator it = map.begin(); it != map.end() && !contained; ++it )
+            {
+                const bound_t< bound_type >& from = it->first.lower();
+                const bound_t< bound_type >& to = it->first.upper();
+                contained = ( !from.value || p->scalar >= *from.value ) && ( !to.value || p->scalar < *to.value );
+            }
+            tied.append( scalar_t< bool >( contained ) );
+            if( icsv.flush ) { std::cout.flush(); }
+        }
+        std::cout.flush();
+        return 0;
     }
 };
 
@@ -472,7 +518,7 @@ static std::tuple< comma::csv::format::types_enum, std::string > interval_type(
     {
         if( format.empty() )
         {
-            while( std::cin.good() && first_line.empty() ) { std::getline( is, first_line ); }
+            while( is.good() && first_line.empty() ) { std::getline( is, first_line ); }
             if( first_line.empty() ) { exit( 0 ); } // quick and dirty
             csv.format( comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter ) );
             if( verbose ) { std::cerr << app_name << ": guessed format: " << csv.format().string() << std::endl;; }
@@ -537,13 +583,12 @@ int main( int ac, char** av )
             }
             return 0;
         }
-        if( operation == "select" )
+        if( operation == "contain" )
         {
-            // todo
-            //if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
-            //if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
+            if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< scalar_t< double > >(), ',' ) << std::endl; return 0; }
+            if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< scalar_t< double > >(), ',' ) << std::endl; return 0; }
             auto i = options.value< std::string >( "--intervals" );
-            comma::csv::options csv = comma::name_value::parser().get< comma::csv::options >( i );
+            comma::csv::options csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( i );
             std::string format = comma::name_value::map( i ).value< std::string >( "format", "" );
             comma::io::istream is( csv.filename );
             auto t = interval_type( *is, csv, format );
@@ -551,28 +596,27 @@ int main( int ac, char** av )
             std::string first_line = std::get< 1 >( t );
             switch( to_type )
             {
-                case comma::csv::format::int8:          intervals< char >( options ).select( first_line ); return 0;
-                case comma::csv::format::uint8:         intervals< unsigned char >( options ).select( first_line ); return 0;
-                case comma::csv::format::int16:         intervals< comma::int16 >( options ).select( first_line ); return 0;
-                case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).select( first_line ); return 0;
-                case comma::csv::format::int32:         intervals< comma::int32 >( options ).select( first_line ); return 0;
-                case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).select( first_line ); return 0;
-                case comma::csv::format::int64:         intervals< comma::int64 >( options ).select( first_line ); return 0;
-                case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).select( first_line ); return 0;
-                case comma::csv::format::char_t:        intervals< char >( options ).select( first_line ); return 0;
-                case comma::csv::format::float_t:       intervals< float >( options ).select( first_line ); return 0;
-                case comma::csv::format::double_t:      intervals< double >( options ).select( first_line ); return 0;
+                case comma::csv::format::int8:          intervals< char >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::char_t:        intervals< char >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::float_t:       intervals< float >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::double_t:      intervals< double >( options ).contain( *is, first_line ); return 0;
                 case comma::csv::format::time:
-                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).select( first_line ); return 0;
-                case comma::csv::format::fixed_string:  intervals< std::string >( options ).select( first_line ); return 0;            
-                default:                                COMMA_THROW( comma::exception, "invalid type" ); return 0; // never here
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options ).contain( *is, first_line ); return 0;            
+                default:                                COMMA_THROW( comma::exception, "invalid type" ); // never here
             }
-            std::cerr << "csv-interval: select: todo" << std::endl;
-            return 1;
+            return 0;
         }
-        std::cerr << "csv-interval: expected operation, got: '" << operation << "'" << std::endl;
+        std::cerr << "csv-intervals: expected operation, got: '" << operation << "'" << std::endl;
     }
-    catch( std::exception& ex ) { std::cerr << app_name << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << app_name << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "csv-invervals: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-invervals: unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/test/csv-interval/ascii/test b/csv/test/csv-interval/ascii/test
deleted file mode 100755
index 074ec4ca8..000000000
--- a/csv/test/csv-interval/ascii/test
+++ /dev/null
@@ -1,3 +0,0 @@
-#!/bin/bash
-
-csv-interval $( cat options ) | gawk '{ printf( "interval[%d]=%s\n", NR, $0 ); }'
diff --git a/csv/test/csv-interval/overlap-count/input b/csv/test/csv-interval/overlap-count/input
deleted file mode 100644
index f4e21571d..000000000
--- a/csv/test/csv-interval/overlap-count/input
+++ /dev/null
@@ -1,16 +0,0 @@
-min[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 0"
-min[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 1"
-min[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 2"
-min[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 3"
-
-max[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-max 0"
-max[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-max 1"
-max[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-max 2"
-max[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-max 3"
-
-min_max[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 1 --overlap-count-max 2"
-
-equal[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count 0"
-equal[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count 1"
-equal[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count 2"
-equal[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count 3"
diff --git a/csv/test/csv-interval/append/expected b/csv/test/csv-intervals/append/expected
similarity index 100%
rename from csv/test/csv-interval/append/expected
rename to csv/test/csv-intervals/append/expected
diff --git a/csv/test/csv-interval/append/input b/csv/test/csv-intervals/append/input
similarity index 79%
rename from csv/test/csv-interval/append/input
rename to csv/test/csv-intervals/append/input
index 2f584bfa3..bf97c221d 100644
--- a/csv/test/csv-interval/append/input
+++ b/csv/test/csv-intervals/append/input
@@ -1,3 +1,3 @@
-append[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --append"
+append[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --append"
 
 
diff --git a/csv/test/csv-intervals/ascii/test b/csv/test/csv-intervals/ascii/test
new file mode 100755
index 000000000..940042294
--- /dev/null
+++ b/csv/test/csv-intervals/ascii/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+csv-intervals make $( cat options ) | gawk '{ printf( "interval[%d]=%s\n", NR, $0 ); }'
diff --git a/csv/test/csv-interval/ascii/test.01/expected b/csv/test/csv-intervals/ascii/test.01/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.01/expected
rename to csv/test/csv-intervals/ascii/test.01/expected
diff --git a/csv/test/csv-interval/ascii/test.01/input b/csv/test/csv-intervals/ascii/test.01/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.01/input
rename to csv/test/csv-intervals/ascii/test.01/input
diff --git a/csv/test/csv-interval/ascii/test.01/options b/csv/test/csv-intervals/ascii/test.01/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.01/options
rename to csv/test/csv-intervals/ascii/test.01/options
diff --git a/csv/test/csv-interval/ascii/test.02/expected b/csv/test/csv-intervals/ascii/test.02/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.02/expected
rename to csv/test/csv-intervals/ascii/test.02/expected
diff --git a/csv/test/csv-interval/ascii/test.02/input b/csv/test/csv-intervals/ascii/test.02/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.02/input
rename to csv/test/csv-intervals/ascii/test.02/input
diff --git a/csv/test/csv-interval/ascii/test.02/options b/csv/test/csv-intervals/ascii/test.02/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.02/options
rename to csv/test/csv-intervals/ascii/test.02/options
diff --git a/csv/test/csv-interval/ascii/test.03/expected b/csv/test/csv-intervals/ascii/test.03/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.03/expected
rename to csv/test/csv-intervals/ascii/test.03/expected
diff --git a/csv/test/csv-interval/ascii/test.03/input b/csv/test/csv-intervals/ascii/test.03/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.03/input
rename to csv/test/csv-intervals/ascii/test.03/input
diff --git a/csv/test/csv-interval/ascii/test.03/options b/csv/test/csv-intervals/ascii/test.03/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.03/options
rename to csv/test/csv-intervals/ascii/test.03/options
diff --git a/csv/test/csv-interval/ascii/test.04/disabled b/csv/test/csv-intervals/ascii/test.04/disabled
similarity index 100%
rename from csv/test/csv-interval/ascii/test.04/disabled
rename to csv/test/csv-intervals/ascii/test.04/disabled
diff --git a/csv/test/csv-interval/ascii/test.04/expected b/csv/test/csv-intervals/ascii/test.04/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.04/expected
rename to csv/test/csv-intervals/ascii/test.04/expected
diff --git a/csv/test/csv-interval/ascii/test.04/input b/csv/test/csv-intervals/ascii/test.04/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.04/input
rename to csv/test/csv-intervals/ascii/test.04/input
diff --git a/csv/test/csv-interval/ascii/test.04/options b/csv/test/csv-intervals/ascii/test.04/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.04/options
rename to csv/test/csv-intervals/ascii/test.04/options
diff --git a/csv/test/csv-interval/ascii/test.05/expected b/csv/test/csv-intervals/ascii/test.05/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.05/expected
rename to csv/test/csv-intervals/ascii/test.05/expected
diff --git a/csv/test/csv-interval/ascii/test.05/input b/csv/test/csv-intervals/ascii/test.05/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.05/input
rename to csv/test/csv-intervals/ascii/test.05/input
diff --git a/csv/test/csv-interval/ascii/test.05/options b/csv/test/csv-intervals/ascii/test.05/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.05/options
rename to csv/test/csv-intervals/ascii/test.05/options
diff --git a/csv/test/csv-interval/ascii/test.06/expected b/csv/test/csv-intervals/ascii/test.06/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.06/expected
rename to csv/test/csv-intervals/ascii/test.06/expected
diff --git a/csv/test/csv-interval/ascii/test.06/input b/csv/test/csv-intervals/ascii/test.06/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.06/input
rename to csv/test/csv-intervals/ascii/test.06/input
diff --git a/csv/test/csv-interval/ascii/test.06/options b/csv/test/csv-intervals/ascii/test.06/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.06/options
rename to csv/test/csv-intervals/ascii/test.06/options
diff --git a/csv/test/csv-interval/ascii/test.07/expected b/csv/test/csv-intervals/ascii/test.07/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.07/expected
rename to csv/test/csv-intervals/ascii/test.07/expected
diff --git a/csv/test/csv-interval/ascii/test.07/input b/csv/test/csv-intervals/ascii/test.07/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.07/input
rename to csv/test/csv-intervals/ascii/test.07/input
diff --git a/csv/test/csv-interval/ascii/test.07/options b/csv/test/csv-intervals/ascii/test.07/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.07/options
rename to csv/test/csv-intervals/ascii/test.07/options
diff --git a/csv/test/csv-interval/ascii/test.08/expected b/csv/test/csv-intervals/ascii/test.08/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.08/expected
rename to csv/test/csv-intervals/ascii/test.08/expected
diff --git a/csv/test/csv-interval/ascii/test.08/input b/csv/test/csv-intervals/ascii/test.08/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.08/input
rename to csv/test/csv-intervals/ascii/test.08/input
diff --git a/csv/test/csv-interval/ascii/test.08/options b/csv/test/csv-intervals/ascii/test.08/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.08/options
rename to csv/test/csv-intervals/ascii/test.08/options
diff --git a/csv/test/csv-interval/ascii/test.09/expected b/csv/test/csv-intervals/ascii/test.09/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.09/expected
rename to csv/test/csv-intervals/ascii/test.09/expected
diff --git a/csv/test/csv-interval/ascii/test.09/input b/csv/test/csv-intervals/ascii/test.09/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.09/input
rename to csv/test/csv-intervals/ascii/test.09/input
diff --git a/csv/test/csv-interval/ascii/test.09/options b/csv/test/csv-intervals/ascii/test.09/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.09/options
rename to csv/test/csv-intervals/ascii/test.09/options
diff --git a/csv/test/csv-interval/ascii/test.10/expected b/csv/test/csv-intervals/ascii/test.10/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.10/expected
rename to csv/test/csv-intervals/ascii/test.10/expected
diff --git a/csv/test/csv-interval/ascii/test.10/input b/csv/test/csv-intervals/ascii/test.10/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.10/input
rename to csv/test/csv-intervals/ascii/test.10/input
diff --git a/csv/test/csv-interval/ascii/test.10/options b/csv/test/csv-intervals/ascii/test.10/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.10/options
rename to csv/test/csv-intervals/ascii/test.10/options
diff --git a/csv/test/csv-interval/ascii/test.11/expected b/csv/test/csv-intervals/ascii/test.11/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.11/expected
rename to csv/test/csv-intervals/ascii/test.11/expected
diff --git a/csv/test/csv-interval/ascii/test.11/input b/csv/test/csv-intervals/ascii/test.11/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.11/input
rename to csv/test/csv-intervals/ascii/test.11/input
diff --git a/csv/test/csv-interval/ascii/test.11/options b/csv/test/csv-intervals/ascii/test.11/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.11/options
rename to csv/test/csv-intervals/ascii/test.11/options
diff --git a/csv/test/csv-interval/binary/test b/csv/test/csv-intervals/binary/test
similarity index 65%
rename from csv/test/csv-interval/binary/test
rename to csv/test/csv-intervals/binary/test
index 4f41eb06b..93e137d9e 100755
--- a/csv/test/csv-interval/binary/test
+++ b/csv/test/csv-intervals/binary/test
@@ -7,4 +7,4 @@ format_index=$( echo $options | fmt -1 | grep -n -- '--binary' | cut -d: -f1 )
 input_format="${args[$format_index]}"
 [[ -z "$output_format" ]] && output_format=$input_format
 
-csv-to-bin $input_format | csv-interval $options | csv-from-bin $output_format | gawk '{ printf( "interval[%d]=%s\n", NR, $0 ); }'
+csv-to-bin $input_format | csv-intervals make $options | csv-from-bin $output_format | gawk '{ printf( "interval[%d]=%s\n", NR, $0 ); }'
diff --git a/csv/test/csv-interval/binary/test.01/expected b/csv/test/csv-intervals/binary/test.01/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.01/expected
rename to csv/test/csv-intervals/binary/test.01/expected
diff --git a/csv/test/csv-interval/binary/test.01/input b/csv/test/csv-intervals/binary/test.01/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.01/input
rename to csv/test/csv-intervals/binary/test.01/input
diff --git a/csv/test/csv-interval/binary/test.01/options b/csv/test/csv-intervals/binary/test.01/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.01/options
rename to csv/test/csv-intervals/binary/test.01/options
diff --git a/csv/test/csv-interval/binary/test.02/expected b/csv/test/csv-intervals/binary/test.02/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.02/expected
rename to csv/test/csv-intervals/binary/test.02/expected
diff --git a/csv/test/csv-interval/binary/test.02/input b/csv/test/csv-intervals/binary/test.02/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.02/input
rename to csv/test/csv-intervals/binary/test.02/input
diff --git a/csv/test/csv-interval/binary/test.02/options b/csv/test/csv-intervals/binary/test.02/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.02/options
rename to csv/test/csv-intervals/binary/test.02/options
diff --git a/csv/test/csv-interval/binary/test.03/disabled b/csv/test/csv-intervals/binary/test.03/disabled
similarity index 100%
rename from csv/test/csv-interval/binary/test.03/disabled
rename to csv/test/csv-intervals/binary/test.03/disabled
diff --git a/csv/test/csv-interval/binary/test.03/expected b/csv/test/csv-intervals/binary/test.03/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.03/expected
rename to csv/test/csv-intervals/binary/test.03/expected
diff --git a/csv/test/csv-interval/binary/test.03/input b/csv/test/csv-intervals/binary/test.03/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.03/input
rename to csv/test/csv-intervals/binary/test.03/input
diff --git a/csv/test/csv-interval/binary/test.03/options b/csv/test/csv-intervals/binary/test.03/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.03/options
rename to csv/test/csv-intervals/binary/test.03/options
diff --git a/csv/test/csv-interval/binary/test.04/disabled b/csv/test/csv-intervals/binary/test.04/disabled
similarity index 100%
rename from csv/test/csv-interval/binary/test.04/disabled
rename to csv/test/csv-intervals/binary/test.04/disabled
diff --git a/csv/test/csv-interval/binary/test.04/expected b/csv/test/csv-intervals/binary/test.04/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.04/expected
rename to csv/test/csv-intervals/binary/test.04/expected
diff --git a/csv/test/csv-interval/binary/test.04/input b/csv/test/csv-intervals/binary/test.04/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.04/input
rename to csv/test/csv-intervals/binary/test.04/input
diff --git a/csv/test/csv-interval/binary/test.04/options b/csv/test/csv-intervals/binary/test.04/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.04/options
rename to csv/test/csv-intervals/binary/test.04/options
diff --git a/csv/test/csv-interval/binary/test.05/expected b/csv/test/csv-intervals/binary/test.05/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.05/expected
rename to csv/test/csv-intervals/binary/test.05/expected
diff --git a/csv/test/csv-interval/binary/test.05/input b/csv/test/csv-intervals/binary/test.05/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.05/input
rename to csv/test/csv-intervals/binary/test.05/input
diff --git a/csv/test/csv-interval/binary/test.05/options b/csv/test/csv-intervals/binary/test.05/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.05/options
rename to csv/test/csv-intervals/binary/test.05/options
diff --git a/csv/test/csv-interval/binary/test.06/expected b/csv/test/csv-intervals/binary/test.06/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.06/expected
rename to csv/test/csv-intervals/binary/test.06/expected
diff --git a/csv/test/csv-interval/binary/test.06/input b/csv/test/csv-intervals/binary/test.06/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.06/input
rename to csv/test/csv-intervals/binary/test.06/input
diff --git a/csv/test/csv-interval/binary/test.06/options b/csv/test/csv-intervals/binary/test.06/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.06/options
rename to csv/test/csv-intervals/binary/test.06/options
diff --git a/csv/test/csv-interval/binary/test.07/expected b/csv/test/csv-intervals/binary/test.07/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.07/expected
rename to csv/test/csv-intervals/binary/test.07/expected
diff --git a/csv/test/csv-interval/binary/test.07/input b/csv/test/csv-intervals/binary/test.07/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.07/input
rename to csv/test/csv-intervals/binary/test.07/input
diff --git a/csv/test/csv-interval/binary/test.07/options b/csv/test/csv-intervals/binary/test.07/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.07/options
rename to csv/test/csv-intervals/binary/test.07/options
diff --git a/csv/test/csv-interval/binary/test.08/expected b/csv/test/csv-intervals/binary/test.08/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.08/expected
rename to csv/test/csv-intervals/binary/test.08/expected
diff --git a/csv/test/csv-interval/binary/test.08/input b/csv/test/csv-intervals/binary/test.08/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.08/input
rename to csv/test/csv-intervals/binary/test.08/input
diff --git a/csv/test/csv-interval/binary/test.08/options b/csv/test/csv-intervals/binary/test.08/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.08/options
rename to csv/test/csv-intervals/binary/test.08/options
diff --git a/csv/test/csv-interval/binary/test.09/expected b/csv/test/csv-intervals/binary/test.09/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.09/expected
rename to csv/test/csv-intervals/binary/test.09/expected
diff --git a/csv/test/csv-interval/binary/test.09/input b/csv/test/csv-intervals/binary/test.09/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.09/input
rename to csv/test/csv-intervals/binary/test.09/input
diff --git a/csv/test/csv-interval/binary/test.09/options b/csv/test/csv-intervals/binary/test.09/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.09/options
rename to csv/test/csv-intervals/binary/test.09/options
diff --git a/csv/test/csv-interval/overlap-count/expected b/csv/test/csv-intervals/overlap-count/expected
similarity index 100%
rename from csv/test/csv-interval/overlap-count/expected
rename to csv/test/csv-intervals/overlap-count/expected
diff --git a/csv/test/csv-intervals/overlap-count/input b/csv/test/csv-intervals/overlap-count/input
new file mode 100644
index 000000000..5fb97b7f1
--- /dev/null
+++ b/csv/test/csv-intervals/overlap-count/input
@@ -0,0 +1,16 @@
+min[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 0"
+min[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 1"
+min[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 2"
+min[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 3"
+
+max[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-max 0"
+max[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-max 1"
+max[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-max 2"
+max[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-max 3"
+
+min_max[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 1 --overlap-count-max 2"
+
+equal[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count 0"
+equal[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count 1"
+equal[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count 2"
+equal[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count 3"

From 3a9d4e021de34d0e403b8f75fb0b0ac6b72f6855 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 28 May 2019 18:28:30 +1000
Subject: [PATCH 0032/1056] csv-intervals: contain: basic unit test added

---
 csv/applications/csv-intervals.cpp      | 73 +++++++++++++------------
 csv/test/csv-intervals/contain/expected | 23 ++++++++
 csv/test/csv-intervals/contain/input    |  7 +++
 3 files changed, 68 insertions(+), 35 deletions(-)
 create mode 100644 csv/test/csv-intervals/contain/expected
 create mode 100644 csv/test/csv-intervals/contain/input

diff --git a/csv/applications/csv-intervals.cpp b/csv/applications/csv-intervals.cpp
index dc710ed6a..416e23337 100644
--- a/csv/applications/csv-intervals.cpp
+++ b/csv/applications/csv-intervals.cpp
@@ -318,13 +318,14 @@ struct intervals
     unsigned int min_overlap_count;
     unsigned int max_overlap_count;
 
-    intervals( const comma::command_line_options& options ) : options( options )
-                                                            , csv( options )
-                                                            , ocsv( options )
-                                                            , ascii_csv( options )
-                                                            , empty( traits< bound_type >::cast( options.optional< std::string >( "--empty" ) ) )
-                                                            , intervals_only( options.exists( "--intervals-only" ) )
-                                                            , use_limits( options.exists( "--limits,-l" ) )
+    intervals( const comma::command_line_options& options, const comma::csv::options& csv_ ) 
+        : options( options )
+        , csv( csv_ )
+        , ocsv( csv )
+        , ascii_csv( csv )
+        , empty( traits< bound_type >::cast( options.optional< std::string >( "--empty" ) ) )
+        , intervals_only( options.exists( "--intervals-only" ) )
+        , use_limits( options.exists( "--limits,-l" ) )
     {
         csv.full_xpath = false;
         if( csv.fields.empty() ) { csv.fields = comma::join( comma::csv::names< interval_t< From, To > >(), ',' ); }
@@ -484,7 +485,8 @@ struct intervals
     
     int contain( std::istream& is, const std::string& first_line )
     {
-        comma::csv::options icsv( options, "", false );
+        comma::csv::options icsv( options );
+        icsv.full_xpath = false;
         comma::csv::input_stream< scalar_t< From > > istream( std::cin, icsv );
         comma::csv::output_stream< scalar_t< bool > > ostream( std::cout, icsv.binary() );
         auto tied = comma::csv::make_tied( istream, ostream );
@@ -553,7 +555,8 @@ int main( int ac, char** av )
         debug = options.exists( "--debug" );
         options.assert_mutually_exclusive( "--binary,--format" );
         const auto& unnamed = options.unnamed( "--append,-a,--debug,--flush,--input-fields,--output-fields,--intervals-only,--limits,-l", "-.*" );
-        std::string operation = unnamed.empty() ? "make" : unnamed[0];
+        if( unnamed.empty() ) { std::cerr << "csv-intervals: please specify operation" << std::endl; return 1; }
+        std::string operation = unnamed[0];
         if( operation == "make" )
         {
             append = options.exists( "--append,-a" );
@@ -565,20 +568,20 @@ int main( int ac, char** av )
             std::string first_line = std::get< 1 >( t );
             switch( to_type )
             {
-                case comma::csv::format::int8:          intervals< char >( options ).make( first_line ); return 0;
-                case comma::csv::format::uint8:         intervals< unsigned char >( options ).make( first_line ); return 0;
-                case comma::csv::format::int16:         intervals< comma::int16 >( options ).make( first_line ); return 0;
-                case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).make( first_line ); return 0;
-                case comma::csv::format::int32:         intervals< comma::int32 >( options ).make( first_line ); return 0;
-                case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).make( first_line ); return 0;
-                case comma::csv::format::int64:         intervals< comma::int64 >( options ).make( first_line ); return 0;
-                case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).make( first_line ); return 0;
-                case comma::csv::format::char_t:        intervals< char >( options ).make( first_line ); return 0;
-                case comma::csv::format::float_t:       intervals< float >( options ).make( first_line ); return 0;
-                case comma::csv::format::double_t:      intervals< double >( options ).make( first_line ); return 0;
+                case comma::csv::format::int8:          intervals< char >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::char_t:        intervals< char >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::float_t:       intervals< float >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::double_t:      intervals< double >( options, csv ).make( first_line ); return 0;
                 case comma::csv::format::time:
-                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).make( first_line ); return 0;
-                case comma::csv::format::fixed_string:  intervals< std::string >( options ).make( first_line ); return 0;            
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options, csv ).make( first_line ); return 0;            
                 default:                                COMMA_THROW( comma::exception, "invalid type" ); return 0; // never here
             }
             return 0;
@@ -596,20 +599,20 @@ int main( int ac, char** av )
             std::string first_line = std::get< 1 >( t );
             switch( to_type )
             {
-                case comma::csv::format::int8:          intervals< char >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::uint8:         intervals< unsigned char >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::int16:         intervals< comma::int16 >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::int32:         intervals< comma::int32 >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::int64:         intervals< comma::int64 >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::char_t:        intervals< char >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::float_t:       intervals< float >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::double_t:      intervals< double >( options ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int8:          intervals< char >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::char_t:        intervals< char >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::float_t:       intervals< float >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::double_t:      intervals< double >( options, csv ).contain( *is, first_line ); return 0;
                 case comma::csv::format::time:
-                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).contain( *is, first_line ); return 0;
-                case comma::csv::format::fixed_string:  intervals< std::string >( options ).contain( *is, first_line ); return 0;            
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options, csv ).contain( *is, first_line ); return 0;            
                 default:                                COMMA_THROW( comma::exception, "invalid type" ); // never here
             }
             return 0;
diff --git a/csv/test/csv-intervals/contain/expected b/csv/test/csv-intervals/contain/expected
new file mode 100644
index 000000000..b307e5a5c
--- /dev/null
+++ b/csv/test/csv-intervals/contain/expected
@@ -0,0 +1,23 @@
+contain/ascii[0]/output/line[0]="1,1"
+contain/ascii[0]/output/line[1]="5,0"
+contain/ascii[0]/output/line[2]="9,1"
+contain/ascii[0]/output/line[3]="11,0"
+contain/ascii[0]/status=0
+contain/ascii[1]/output/line[0]="1,1"
+contain/ascii[1]/output/line[1]="5,0"
+contain/ascii[1]/status=0
+contain/fields[0]/output/line[0]=",1,1"
+contain/fields[0]/output/line[1]=",5,0"
+contain/fields[0]/status=0
+contain/fields[1]/output/line[0]=",1,1"
+contain/fields[1]/output/line[1]=",5,0"
+contain/fields[1]/status=0
+contain/binary[0]/output/line[0]="1,1"
+contain/binary[0]/output/line[1]="5,0"
+contain/binary[0]/status=0
+contain/binary[1]/output/line[0]="1,1"
+contain/binary[1]/output/line[1]="5,0"
+contain/binary[1]/status=0
+contain/binary[2]/output/line[0]="1,1"
+contain/binary[2]/output/line[1]="5,0"
+contain/binary[2]/status=0
diff --git a/csv/test/csv-intervals/contain/input b/csv/test/csv-intervals/contain/input
new file mode 100644
index 000000000..eac7bd818
--- /dev/null
+++ b/csv/test/csv-intervals/contain/input
@@ -0,0 +1,7 @@
+contain/ascii[0]="( echo 1; echo 5; echo 9; echo 11 ) | csv-intervals contain --intervals <( echo 0,2; echo 9,11 )"
+contain/ascii[1]="( echo 1; echo 5 ) | csv-intervals --fields scalar contain --intervals <( echo 0,2 )"
+contain/fields[0]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar contain --intervals <( echo 0,2 )"
+contain/fields[1]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar contain --intervals <( echo ,0,2 )';fields=,from,to'"
+contain/binary[0]="( echo 1; echo 5 ) | csv-to-bin ui | csv-intervals contain --binary ui --intervals <( echo 0,2; echo 9,11 ) | csv-from-bin ui,b"
+contain/binary[1]="( echo 1; echo 5 ) | csv-to-bin ui | csv-intervals contain --binary ui --intervals <( ( echo 0,2; echo 9,11 ) | csv-to-bin 2ui )';binary=2ui' | csv-from-bin ui,b"
+contain/binary[2]="( echo 1; echo 5 ) | csv-intervals contain --intervals <( ( echo 0,2; echo 9,11 ) | csv-to-bin 2ui )';binary=2ui'"

From 1be73a880e09a927e6e9f4b29aa23935e63f54fb Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 29 May 2019 19:04:59 +1000
Subject: [PATCH 0033/1056] csv-intervals: join operation: implemented (with
 somewhat suboptimal complexity); basic unit test done

---
 csv/applications/csv-intervals.cpp   | 124 +++++++++++++++++++++------
 csv/test/csv-intervals/join/expected |  15 ++++
 csv/test/csv-intervals/join/input    |   5 ++
 3 files changed, 118 insertions(+), 26 deletions(-)
 create mode 100644 csv/test/csv-intervals/join/expected
 create mode 100644 csv/test/csv-intervals/join/input

diff --git a/csv/applications/csv-intervals.cpp b/csv/applications/csv-intervals.cpp
index 416e23337..f370dd819 100644
--- a/csv/applications/csv-intervals.cpp
+++ b/csv/applications/csv-intervals.cpp
@@ -46,10 +46,9 @@
 #include "../../io/stream.h"
 #include "../../name_value/map.h"
 #include "../../name_value/parser.h"
+#include "../../string/string.h"
 #include "../../visiting/traits.h"
 
-static const std::string app_name = "csv-intervals";
-
 static bool verbose;
 static bool debug;
 static bool append;
@@ -100,6 +99,7 @@ static void usage( bool verbose = false )
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
     std::cerr << "    contain: given a set of intervals, take scalars on stdin, append 1 if contained in the intervals, 0 if not" << std::endl;
+    std::cerr << "    join: given a set of intervals, take scalars on stdin, append payloads of the intervals the scalars are contained in" << std::endl;
     std::cerr << "    make: make intervals" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
@@ -133,6 +133,9 @@ static void usage( bool verbose = false )
     std::cerr << "    contain" << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --intervals=<filename>: file or stream name" << std::endl;
+    std::cerr << "    join" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --intervals=<filename>: file or stream name" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    make" << std::endl;
     std::cerr << "        options" << std::endl;
@@ -146,7 +149,7 @@ static void usage( bool verbose = false )
     std::cerr << "ascii notes" << std::endl;
     std::cerr << "    unbounded intervals may be indicated by no value (e.g. ,3 \u2261 -\u221e,3), both sides unbounded is also supported" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "for examples see verbose help: " << app_name << " --help --verbose" << std::endl;
+    std::cerr << "for examples see verbose help: csv-intervals --help --verbose" << std::endl;
     std::cerr << std::endl;
     if( verbose )
     {
@@ -161,7 +164,7 @@ static void usage( bool verbose = false )
         std::cerr << "        B:      [2      4]"           << std::endl;
         std::cerr << "        C:           [3           6]" << std::endl;
         std::cerr << std::endl;
-        std::cerr << "        echo -e '1,5,A\\n2,4,B\\n3,6,C' | " << app_name << std::endl;
+        std::cerr << "        echo -e '1,5,A\\n2,4,B\\n3,6,C' | csv-intervals make" << std::endl;
         std::cerr << std::endl;
         std::cerr << "        A: [1 2][2 3][3 4][4 5]"      << std::endl;
         std::cerr << "        B:      [2 3][3 4]"           << std::endl;
@@ -175,7 +178,7 @@ static void usage( bool verbose = false )
         std::cerr << "        D:            [3           8]"                    << std::endl;
         std::cerr << "        Z: [-\u221e                          +\u221e]"    << std::endl;
         std::cerr << std::endl;
-        std::cerr << "        echo -e ',4,A\\n2,4,B\\n3,6,C\\n3,8,D\\n,,Z' | " << app_name << " --format 2i" << std::endl;
+        std::cerr << "        echo -e ',4,A\\n2,4,B\\n3,6,C\\n3,8,D\\n,,Z' | csv-intervals make" << " --format 2i" << std::endl;
         std::cerr << std::endl;
         std::cerr << "        A: [-\u221e 2][2 3][3 4]"                         << std::endl;
         std::cerr << "        B:       [2 3][3 4]"                              << std::endl;
@@ -190,7 +193,7 @@ static void usage( bool verbose = false )
         std::cerr << "        C:                                                                                       [20140916T190000 +\u221e]" << std::endl;
         std::cerr << "        Z: [-\u221e                                                                                                    +\u221e]" << std::endl;
         std::cerr << std::endl;
-        std::cerr << "        echo -e ',20140916T030000.000000,A\\n20140916T010000.000000,20140916T190000.000000,B\\n20140916T190000.000000,,C\\n,,Z' | " << app_name << " --format 2t" << std::endl;
+        std::cerr << "        echo -e ',20140916T030000.000000,A\\n20140916T010000.000000,20140916T190000.000000,B\\n20140916T190000.000000,,C\\n,,Z' | csv-intervals make" << " --format 2t" << std::endl;
         std::cerr << std::endl;
         std::cerr << "        A: [-\u221e 20140916T010000][20140916T010000 20140916T030000]" << std::endl;
         std::cerr << "        B:                     [20140916T010000 20140916T030000][20140916T030000 20140916T190000]" << std::endl;
@@ -336,7 +339,7 @@ struct intervals
         }
         ascii_csv.fields = ocsv.fields;
         ascii_csv.quote = boost::none;
-        if( verbose ) { std::cerr << app_name << ": empty: "; empty ? std::cerr << *empty : std::cerr << "<none>"; std::cerr << std::endl; }
+        if( verbose ) { std::cerr << "csv-intervals: empty: "; empty ? std::cerr << *empty : std::cerr << "<none>"; std::cerr << std::endl; }
         options.assert_mutually_exclusive( "overlap-count-min,overlap-count-max", "overlap-count" );
         if( options.exists( "--overlap-count" ) )
         {
@@ -443,7 +446,7 @@ struct intervals
             if( !first.to.value.empty() && ( !empty || interval.to.value != *empty  ) ) { to.value = interval.to.value; }
             payload = first_line;
             if( !intervals_only && !append ) { ascii.put( interval_t< std::string >(), payload ); } // blank out interval from payload
-            if( verbose ) { std::cerr << app_name << ": from: " << from << " to: " << to << " payload: " << payload << std::endl; }
+            if( verbose ) { std::cerr << "csv-intervals: from: " << from << " to: " << to << " payload: " << payload << std::endl; }
             add( from, to, payload );
         }
         while( istream.ready() || is.good()  )
@@ -471,18 +474,11 @@ struct intervals
                 if( !intervals_only && !append ) { ascii.put( interval_t< std::string >(), buf ); } // blank out interval from payload
                 payload = comma::join( buf, csv.delimiter );
             }
-            if( verbose ) { std::cerr << app_name << ": from: " << from << " to: " << to << " payload: " << ( csv.binary() ? "<binary>" : payload ) << std::endl; }
+            if( verbose ) { std::cerr << "csv-intervals: from: " << from << " to: " << to << " payload: " << ( csv.binary() ? "<binary>" : payload ) << std::endl; }
             add( from, to, payload );
         }
     }
 
-    int make( const std::string& first_line )
-    {
-        this->read( std::cin, first_line );
-        this->write();
-        return 0;
-    }
-    
     int contain( std::istream& is, const std::string& first_line )
     {
         comma::csv::options icsv( options );
@@ -495,8 +491,8 @@ struct intervals
         {
             auto p = istream.read();
             if( !p ) { break; }
-            bool contained = false; // todo? use boost::...::query
-            for( typename map_t::iterator it = map.begin(); it != map.end() && !contained; ++it )
+            bool contained = false;
+            for( typename map_t::iterator it = map.begin(); it != map.end() && !contained; ++it ) // todo! quadratic complexity; how the heck to query icl map? use boost::...::query?
             {
                 const bound_t< bound_type >& from = it->first.lower();
                 const bound_t< bound_type >& to = it->first.upper();
@@ -505,7 +501,52 @@ struct intervals
             tied.append( scalar_t< bool >( contained ) );
             if( icsv.flush ) { std::cout.flush(); }
         }
-        std::cout.flush();
+        return 0;
+    }
+    
+    int join( std::istream& is, const std::string& first_line )
+    {
+        comma::csv::options icsv( options );
+        if( csv.binary() != icsv.binary() ) { COMMA_THROW( comma::exception, "expected both inputs ascii or both binary; got stdin " << ( icsv.binary() ? "binary" : "ascii" ) << " while --intervals " << ( csv.binary() ? "binary" : "ascii" ) ); }
+        icsv.full_xpath = false;
+        comma::csv::input_stream< scalar_t< From > > istream( std::cin, icsv );
+        append = true;
+        this->read( is, first_line ); // todo: support block
+        while( istream.ready() || std::cin.good() )
+        {
+            auto p = istream.read();
+            if( !p ) { break; }
+            for( typename map_t::iterator it = map.begin(); it != map.end(); ++it ) // todo! quadratic complexity; how the heck to query icl map? use boost::...::query?
+            {
+                const bound_t< bound_type >& from = it->first.lower();
+                const bound_t< bound_type >& to = it->first.upper();
+                if( ( !from.value || p->scalar >= *from.value ) && ( !to.value || p->scalar < *to.value ) )
+                {
+                    std::string joined = csv.binary() ? "" : comma::join( istream.ascii().last(), icsv.delimiter );
+                    for( const auto& s: it->second )
+                    {
+                        if( csv.binary() )
+                        {
+                            std::cout.write( istream.binary().last(), icsv.format().size() );
+                            std::cout.write( &s[0], s.size() );
+                        }
+                        else
+                        {
+                            std::cout << joined << icsv.delimiter << s << std::endl;
+                        }
+                    }
+                    break;
+                }
+            }
+            if( icsv.flush ) { std::cout.flush(); }
+        }
+        return 0;
+    }
+    
+    int make( const std::string& first_line )
+    {
+        this->read( std::cin, first_line );
+        this->write();
         return 0;
     }
 };
@@ -523,7 +564,7 @@ static std::tuple< comma::csv::format::types_enum, std::string > interval_type(
             while( is.good() && first_line.empty() ) { std::getline( is, first_line ); }
             if( first_line.empty() ) { exit( 0 ); } // quick and dirty
             csv.format( comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter ) );
-            if( verbose ) { std::cerr << app_name << ": guessed format: " << csv.format().string() << std::endl;; }
+            if( verbose ) { std::cerr << "csv-intervals: guessed format: " << csv.format().string() << std::endl;; }
         }
         else
         {
@@ -538,11 +579,11 @@ static std::tuple< comma::csv::format::types_enum, std::string > interval_type(
     const comma::csv::format::types_enum from_type = csv.format().offset( from_index ).type;
     const comma::csv::format::types_enum to_type = csv.format().offset( to_index ).type;
     if( ( ( from_type == comma::csv::format::time || from_type == comma::csv::format::long_time ) && ( to_type != comma::csv::format::time && to_type != comma::csv::format::long_time ) ) ||
-    ( ( ( from_type != comma::csv::format::time && from_type != comma::csv::format::long_time ) && ( to_type == comma::csv::format::time || to_type == comma::csv::format::long_time ) ) ) )
-    { COMMA_THROW( comma::exception, "from/to type mismatch; time" ); }
+        ( ( ( from_type != comma::csv::format::time && from_type != comma::csv::format::long_time ) && ( to_type == comma::csv::format::time || to_type == comma::csv::format::long_time ) ) ) )
+        { COMMA_THROW( comma::exception, "from/to type mismatch; time" ); }
     if( ( from_type == comma::csv::format::fixed_string || to_type == comma::csv::format::fixed_string ) && from_type != to_type )
-    { COMMA_THROW( comma::exception, "from/to type mismatch; string" ); }
-    if( from_type != to_type ) { std::cerr << app_name << ": support only from and to of the same type, got from: " << comma::csv::format::to_format( from_type ) << ", to: " << comma::csv::format::to_format( to_type ) << std::endl; exit( 1 ); }
+        { COMMA_THROW( comma::exception, "from/to type mismatch; string" ); }
+    if( from_type != to_type ) { std::cerr << "csv-intervals: support only from and to of the same type, got from: " << comma::csv::format::to_format( from_type ) << ", to: " << comma::csv::format::to_format( to_type ) << std::endl; exit( 1 ); }
     return std::tie( to_type, first_line );
 }
 
@@ -617,9 +658,40 @@ int main( int ac, char** av )
             }
             return 0;
         }
+        if( operation == "join" )
+        {
+            if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< scalar_t< double > >(), ',' ) << std::endl; return 0; }
+            if( options.exists( "--output-fields" ) ) { std::cerr << "csv-intervals join: does not have --output-fields" << std::endl; return 1; }
+            auto i = options.value< std::string >( "--intervals" );
+            comma::csv::options csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( i );
+            std::string format = comma::name_value::map( i ).value< std::string >( "format", "" );
+            comma::io::istream is( csv.filename );
+            auto t = interval_type( *is, csv, format );
+            const comma::csv::format::types_enum to_type = std::get< 0 >( t );
+            std::string first_line = std::get< 1 >( t );
+            switch( to_type )
+            {
+                case comma::csv::format::int8:          intervals< char >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::char_t:        intervals< char >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::float_t:       intervals< float >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::double_t:      intervals< double >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::time:
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options, csv ).join( *is, first_line ); return 0;            
+                default:                                COMMA_THROW( comma::exception, "invalid type" ); // never here
+            }
+            return 0;
+        }
         std::cerr << "csv-intervals: expected operation, got: '" << operation << "'" << std::endl;
     }
-    catch( std::exception& ex ) { std::cerr << "csv-invervals: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-invervals: unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "csv-intervals: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-intervals: unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/test/csv-intervals/join/expected b/csv/test/csv-intervals/join/expected
new file mode 100644
index 000000000..d78db3ead
--- /dev/null
+++ b/csv/test/csv-intervals/join/expected
@@ -0,0 +1,15 @@
+join/ascii[0]/output/line[0]="1,0,2,a"
+join/ascii[0]/output/line[1]="9,9,11,b"
+join/ascii[0]/status=0
+join/ascii[1]/output/line[0]="9,0,10,b"
+join/ascii[1]/output/line[1]="9,0,10,c"
+join/ascii[1]/output/line[2]="9,0,20,d"
+join/ascii[1]/status=0
+join/fields[0]/output=",1,0,2,a"
+join/fields[0]/status=0
+join/fields[1]/output=",1,a,0,2,b"
+join/fields[1]/status=0
+join/binary[0]/output/line[0]="9,0,10,0"
+join/binary[0]/output/line[1]="9,0,10,1"
+join/binary[0]/output/line[2]="9,5,20,2"
+join/binary[0]/status=0
diff --git a/csv/test/csv-intervals/join/input b/csv/test/csv-intervals/join/input
new file mode 100644
index 000000000..9cd53fe1a
--- /dev/null
+++ b/csv/test/csv-intervals/join/input
@@ -0,0 +1,5 @@
+join/ascii[0]="( echo 1; echo 5; echo 9; echo 11 ) | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b )"
+join/ascii[1]="( echo 9 ) | csv-intervals join --intervals <( echo 0,2,a; echo 0,10,b; echo 0,10,c; echo 0,20,d )"
+join/fields[0]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar join --intervals <( echo 0,2,a )"
+join/fields[1]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar join --intervals <( echo a,0,2,b )';fields=,from,to'"
+join/binary[0]="( echo 9 ) | csv-to-bin ui | csv-intervals join --binary ui --intervals <( ( echo 0,10,0; echo 0,10,1; echo 5,20,2 ) | csv-to-bin 3ui )';binary=3ui' | csv-from-bin 4ui"

From 162d39b2d0c241d632bd1d2a7b0704162d9c61db Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 30 May 2019 19:16:57 +1000
Subject: [PATCH 0034/1056] cmake: boost::iostreams added

---
 CMakeLists.txt | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 167b087db..980e1a74e 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -171,9 +171,9 @@ IF( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
     SET( Python_ADDITIONAL_VERSIONS 2.7 )
     FIND_PACKAGE( PythonLibs REQUIRED )
     INCLUDE_DIRECTORIES( ${PYTHON_INCLUDE_DIRS} )
-    FIND_PACKAGE( Boost COMPONENTS thread filesystem system date_time program_options regex python )
+    FIND_PACKAGE( Boost COMPONENTS thread filesystem system date_time iostreams program_options regex python )
 ELSE( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
-    FIND_PACKAGE( Boost COMPONENTS thread filesystem system date_time program_options regex )
+    FIND_PACKAGE( Boost COMPONENTS thread filesystem system date_time iostreams program_options regex )
 ENDIF( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
 INCLUDE_DIRECTORIES( ${Boost_INCLUDE_DIRS} )
 LINK_DIRECTORIES( ${Boost_LIBRARY_DIRS} )

From d4c8b1304d3e3d7b2d0f556cd6bcf5ee0b71df24 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 31 May 2019 13:48:05 +1000
Subject: [PATCH 0035/1056] io-tee: --dry-run made exiting before checking
 whether output file is writable; output filename quoted in command to support
 filenames with special characters

---
 io/applications/io-tee.cpp | 70 ++++++++++++++++++--------------------
 1 file changed, 34 insertions(+), 36 deletions(-)

diff --git a/io/applications/io-tee.cpp b/io/applications/io-tee.cpp
index c15efb20d..a0188585a 100644
--- a/io/applications/io-tee.cpp
+++ b/io/applications/io-tee.cpp
@@ -41,11 +41,9 @@
 #include "../../io/select.h"
 #include "../../io/stream.h"
 
-static const char *app_name = "io-tee";
-
 static void show_usage()
 {
-    std::cerr << "Usage: " << app_name << " <output file> [options ... --] <command ...>\n";
+    std::cerr << "Usage: io-tee <output file> [options ... --] <command ...>\n";
 }
 
 static void show_help( bool verbose = false )
@@ -63,14 +61,14 @@ static void show_help( bool verbose = false )
         << "    --verbose,-v: more output" << std::endl
         << std::endl
         << "Note that only single commands are supported; to run multiple commands (or a pipeline), put them inside a bash function:" << std::endl
-        << "*** IMPORTANT *** use \"export -f function_name\" to make the function visible to " << app_name << "." << std::endl
-        << "Remember that " << app_name << " will not have access to the unexported variables, so pass any required values as function arguments." << std::endl
+        << "*** IMPORTANT *** use \"export -f function_name\" to make the function visible to io-tee." << std::endl
+        << "Remember that io-tee will not have access to the unexported variables, so pass any required values as function arguments." << std::endl
         << "On Ubuntu 16.04, io-tee might fail to discover a bash function even if it is exported." << std::endl
         << "In this case, comma_tee_function defined in comma-application-util should be used." << std::endl
         << std::endl
         << "If any options are used (such as --unbuffered), \"--\" must precede the command." << std::endl
         << std::endl
-        << "A note about using \"grep\": be aware grep returns 1 if the pattern is not found, which will make " << app_name << " think the command failed." << std::endl
+        << "A note about using \"grep\": be aware grep returns 1 if the pattern is not found, which will make io-tee think the command failed." << std::endl
         << "To avoid this, call grep inside a function like this: grep (pattern) || true." << std::endl
         << std::endl
         << "Example 1:" << std::endl
@@ -127,19 +125,19 @@ int main( int ac, char **av )
             else if ( av[n] == std::string( "--help" ) || av[n] == std::string( "-h" ) ) { show_help(); exit( 0 ); }
         }
         int command_offset = ( dashdash_pos == -1 ? 2 : dashdash_pos + 1 );
-        if ( command_offset >= ac ) { std::cerr << app_name << ": missing command; "; show_usage(); exit( 1 ); }
+        if ( command_offset >= ac ) { std::cerr << "io-tee: missing command; "; show_usage(); exit( 1 ); }
         // if there is no "--", there can be no command line options, just the output filename
         int options_ac = ( dashdash_pos == -1 ? 2 : dashdash_pos );
         if ( debug )
         {
-            std::cerr << app_name << ": options_ac=" << options_ac << "; command line: " << app_name;
+            std::cerr << "io-tee: options_ac=" << options_ac << "; command line: io-tee";
             for ( int m = 1; m < ac; ++m ) { std::cerr << ' ' << av[m]; }
             std::cerr << std::endl;
         }
         comma::command_line_options options( options_ac, av );
         const std::vector< std::string >& unnamed = options.unnamed( "--unbuffered,-u,--verbose,-v,--debug,--dry-run,--dry,--append,-a", "-.*" );
-        if( unnamed.empty() ) { std::cerr << app_name << ": please specify output file name" << std::endl; return 1; }
-        if( unnamed.size() > 1 ) { std::cerr << app_name << ": expected one output filename, got: " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
+        if( unnamed.empty() ) { std::cerr << "io-tee: please specify output file name" << std::endl; return 1; }
+        if( unnamed.size() > 1 ) { std::cerr << "io-tee: expected one output filename, got: " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
         std::string outfile = unnamed[0];
         // bash -c only takes a single argument, so put the whole command in single quotes, then double quote each individual argument
         std::string command = "bash -c '" + escape_quotes( av[command_offset] );
@@ -147,24 +145,24 @@ int main( int ac, char **av )
         bool append_to_outfile = options.exists( "--append,-a" );
         if( append_to_outfile ) { command += " >> "; }
         else { command += " > "; }
-        command += outfile;
+        command += '"' + outfile + '"';
         command += "'";
         bool unbuffered = options.exists( "--unbuffered,-u" );
         bool verbose = options.exists( "--verbose,-v" );
         if ( debug ) { verbose = true; }
-        if( !file_is_writable( outfile, append_to_outfile ) ) { std::cerr << app_name << ": cannot write to " << outfile << std::endl; exit( 1 ); }
         if( options.exists( "--dry-run,--dry" ) ) { std::cout << command << std::endl; return 0; }
-        if( verbose ) { std::cerr << app_name << ": will run command: " << command << std::endl; }
+        if( verbose ) { std::cerr << "io-tee: will run command: " << command << std::endl; }
+        if( !file_is_writable( outfile, append_to_outfile ) ) { std::cerr << "io-tee: cannot write to " << outfile << std::endl; exit( 1 ); }
         std::cout.flush();
         pipe = ::popen( &command[0], "w" );
-        if( pipe == NULL ) { std::cerr << app_name << ": failed to open pipe; command: " << command << std::endl; return 1; }
+        if( pipe == NULL ) { std::cerr << "io-tee: failed to open pipe; command: " << command << std::endl; return 1; }
         boost::array< char, 0xffff > buffer;
-        if ( debug ) { std::cerr << app_name << ": created buffer" << std::endl; }
+        if ( debug ) { std::cerr << "io-tee: created buffer" << std::endl; }
         comma::io::select stdin_select;
-        if ( debug ) { std::cerr << app_name << ": constructed comma::io::select" << std::endl; }
-        if( unbuffered ) { stdin_select.read().add( 0 ); if ( debug ) { std::cerr << app_name << ": did initial unbuffered read" << std::endl; } }
+        if ( debug ) { std::cerr << "io-tee: constructed comma::io::select" << std::endl; }
+        if( unbuffered ) { stdin_select.read().add( 0 ); if ( debug ) { std::cerr << "io-tee: did initial unbuffered read" << std::endl; } }
         comma::io::istream is( "-", comma::io::mode::binary );
-        if ( debug ) { std::cerr << app_name << ": opened input stream" << std::endl; }
+        if ( debug ) { std::cerr << "io-tee: opened input stream" << std::endl; }
         if( unbuffered )
         {
             std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
@@ -172,51 +170,51 @@ int main( int ac, char **av )
         }
         while( std::cin.good() )
         {
-            if ( debug ) { std::cerr << app_name << ": loop" << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: loop" << std::endl; }
             std::size_t bytes_to_read = buffer.size();
             if( unbuffered )
             {
-                if ( debug ) { std::cerr << app_name << ": calling stdin_select.wait(1)" << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: calling stdin_select.wait(1)" << std::endl; }
                 if( stdin_select.wait( boost::posix_time::seconds( 1 ) ) == 0 ) { continue; }
-                if ( debug ) { std::cerr << app_name << ": after stdin_select.wait" << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: after stdin_select.wait" << std::endl; }
                 std::size_t available = is.available_on_file_descriptor();
-                if ( debug ) { std::cerr << app_name << ": " << available << " bytes available" << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: " << available << " bytes available" << std::endl; }
                 bytes_to_read = std::min( available, buffer.size() );
             }
-            if ( debug ) { std::cerr << app_name << ": bytes_to_read = " << bytes_to_read << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: bytes_to_read = " << bytes_to_read << std::endl; }
             std::cin.read( &buffer[0], bytes_to_read );
-            if ( debug ) { std::cerr << app_name << ": cin.gcount is " << std::cin.gcount() << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: cin.gcount is " << std::cin.gcount() << std::endl; }
             if( std::cin.gcount() <= 0 ) { break; }
             std::size_t gcount = std::cin.gcount();
-            if ( debug ) { std::cerr << app_name << ": writing " << gcount << " bytes to stdout" << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: writing " << gcount << " bytes to stdout" << std::endl; }
             std::cout.write( &buffer[0], gcount );
-            if ( debug ) { std::cerr << app_name << ": writing " << gcount << " bytes to pipe" << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: writing " << gcount << " bytes to pipe" << std::endl; }
             int r = ::fwrite( &buffer[0], sizeof( char ), gcount, pipe );
-            if ( debug ) { std::cerr << app_name << ": fwrite to pipe returned " << r << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: fwrite to pipe returned " << r << std::endl; }
             if( r != (int) gcount )
             { 
-                std::cerr << app_name << ": error on pipe: " << std::strerror( errno ) <<  std::endl;
+                std::cerr << "io-tee: error on pipe: " << std::strerror( errno ) <<  std::endl;
                 ::pclose( pipe );
                 return 1;
             }
             if( unbuffered )
             { 
-                if ( debug ) { std::cerr << app_name << ": flushing stdout" << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: flushing stdout" << std::endl; }
                 std::cout.flush();
-                if ( debug ) { std::cerr << app_name << ": flushing pipe" << std::endl; }
-                if ( ::fflush( pipe ) != 0 ) { std::cerr << app_name << ": flushing pipe failed: " << std::strerror( errno ) << "; command was: " << command << std::endl; ::pclose( pipe ); exit( 1 ); }
-                if ( debug ) { std::cerr << app_name << ": flushed stdout and pipe " << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: flushing pipe" << std::endl; }
+                if ( ::fflush( pipe ) != 0 ) { std::cerr << "io-tee: flushing pipe failed: " << std::strerror( errno ) << "; command was: " << command << std::endl; ::pclose( pipe ); exit( 1 ); }
+                if ( debug ) { std::cerr << "io-tee: flushed stdout and pipe " << std::endl; }
             }
         }
         std::cout.flush();
         ::fflush( pipe );
         int result = ::pclose( pipe );
-        if ( result == -1 ) { std::cerr << app_name << ": pipe error: " << std::strerror( errno ) << "; command was: " << command << std::endl; exit( 1 ); }
-        else if ( result != 0 ) { std::cerr << app_name << ": command failed: " << command << std::endl; return 1; }
+        if ( result == -1 ) { std::cerr << "io-tee: pipe error: " << std::strerror( errno ) << "; command was: " << command << std::endl; exit( 1 ); }
+        else if ( result != 0 ) { std::cerr << "io-tee: command failed: " << command << std::endl; return 1; }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << app_name << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << app_name << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "io-tee: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "io-tee: unknown exception" << std::endl; }
     if( pipe ) { ::pclose( pipe ); }
     return 1;
 }

From 9c66ea9d92ee67137b1d6dadfd9b382c5fb50f58 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 31 May 2019 13:52:21 +1000
Subject: [PATCH 0036/1056] io-tee: unit test fixed

---
 io/test/io-tee/comma_tee_function/expected | 10 +++++-----
 io/test/io-tee/simple/expected             |  6 +++---
 2 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/io/test/io-tee/comma_tee_function/expected b/io/test/io-tee/comma_tee_function/expected
index 9dfe99951..79d21019b 100644
--- a/io/test/io-tee/comma_tee_function/expected
+++ b/io/test/io-tee/comma_tee_function/expected
@@ -20,9 +20,9 @@ pipeline/stdout/matches="true"
 
 # commands (with quotes transformed to strings)
 
-basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > out(SQUOTE)"
-function_call_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > out(SQUOTE)"
-unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > out(SQUOTE)"
-unbuffered_fn_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > out(SQUOTE)"
-pipeline/command="bash -c (SQUOTE)grep (SQUOTE)\(SQUOTE)(SQUOTE)^t(SQUOTE)\(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > out(SQUOTE)"
+basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+function_call_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+unbuffered_fn_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+pipeline/command="bash -c (SQUOTE)grep (SQUOTE)\(SQUOTE)(SQUOTE)^t(SQUOTE)\(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
 
diff --git a/io/test/io-tee/simple/expected b/io/test/io-tee/simple/expected
index 6b47dcb31..36ad9793b 100644
--- a/io/test/io-tee/simple/expected
+++ b/io/test/io-tee/simple/expected
@@ -12,7 +12,7 @@ pipeline/stdout/matches="true"
 
 # commands (with quotes transformed to strings)
 
-basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > out(SQUOTE)"
-unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > out(SQUOTE)"
-pipeline/command="bash -c (SQUOTE)grep (SQUOTE)\(SQUOTE)(SQUOTE)^t(SQUOTE)\(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > out(SQUOTE)"
+basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+pipeline/command="bash -c (SQUOTE)grep (SQUOTE)\(SQUOTE)(SQUOTE)^t(SQUOTE)\(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
 

From 8b55df1425f400cc65f5c72b28c2972eb6cb6c29 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 6 Jun 2019 15:50:49 +1000
Subject: [PATCH 0037/1056] csv-paste: signature: 'line-number;binary=ui'
 support added

---
 csv/applications/csv-paste.cpp | 15 +++++++++------
 csv/test/csv-paste/expected    |  6 ++++++
 csv/test/csv-paste/input       |  2 ++
 3 files changed, 17 insertions(+), 6 deletions(-)

diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index ef711b9da..56d26dbb7 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -114,7 +114,7 @@ class source
         virtual const std::string* read() = 0;
         virtual const char* read( char* buf ) = 0;
         bool binary() const { return binary_; }
-        virtual const bool is_stream() const { return false; }
+        virtual bool is_stream() const { return false; }
         const std::string& properties() const { return properties_; }
         std::size_t size() const { return value_.size(); }
         
@@ -151,7 +151,7 @@ class stream : public source
             return stream_->gcount() == int( value_.size() ) ? buf : NULL;
         }
         
-        const bool is_stream() { return true; }
+        bool is_stream() const { return true; }
         
     private:
         comma::io::istream stream_;
@@ -180,6 +180,7 @@ class line_number : public source
                 bool index;
                 bool reverse;
                 comma::uint32 begin;
+                std::string format;
                 
                 options( boost::optional< comma::uint32 > b = boost::optional< comma::uint32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false )
                     : size( size )
@@ -199,6 +200,8 @@ class line_number : public source
                     auto b = map.optional< comma::uint32 >( "begin" );
                     if( !b ) { b = o.optional< comma::uint32 >( "--begin" ); }
                     begin = begin_( b );
+                    format = map.value< std::string >( "binary", "" );
+                    if( !format.empty() && format != "ui" ) { std::cerr << "csv-paste: currently only ui supported for line-number; got: '" << format << "'" << std::endl; exit( 1 ); } // quick and dirty for now
                 }
                 
             private:
@@ -210,7 +213,7 @@ class line_number : public source
         };
         
         line_number( bool is_binary, const options& options )
-            : source( is_binary ? "binary=ui" : "" )
+            : source( options.format.empty() ? ( is_binary ? "binary=ui" : "" ) : "binary=" + options.format ) // quick and dirty
             , options_( options )
             , count_( 0 )
             , value_( options_.begin )
@@ -261,11 +264,11 @@ int main( int ac, char** av )
         std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--block-size" );
         boost::ptr_vector< source > sources;
         bool is_binary = false;
-        for( unsigned int i = 0; i < unnamed.size(); ++i ) // quick and dirty
+        for( unsigned int i = 0; i < unnamed.size(); ++i ) // quick and dirty; really lousy code duplication
         {
             if( unnamed[i].substr( 0, 6 ) == "value=" ) { if( value( unnamed[i] ).binary() ) { is_binary = true; } }
-            else if( unnamed[i] == "line-number" || unnamed[i].substr( 0, 12 ) == "line-number;" ) { continue; } // quick and dirty
-            if( stream( unnamed[i] ).binary() ) { is_binary = true; }
+            else if( unnamed[i] == "line-number" || unnamed[i].substr( 0, 12 ) == "line-number;" ) { if( line_number( is_binary, line_number::options( unnamed[i], options ) ).binary() ) { is_binary = true; } } // quick and dirty
+            else if( stream( unnamed[i] ).binary() ) { is_binary = true; }
         }
         for( unsigned int i = 0; i < unnamed.size(); ++i )
         {
diff --git a/csv/test/csv-paste/expected b/csv/test/csv-paste/expected
index ad48b2ffa..95f7b8c23 100644
--- a/csv/test/csv-paste/expected
+++ b/csv/test/csv-paste/expected
@@ -47,3 +47,9 @@ line_number/multiple[1]/output="0,0;0,0;0,0;0,0;0,0;0,1;1,1;1,1;1,1;1,1;"
 line_number/multiple[1]/status=0
 line_number/multiple[2]/output="0,0;0,1;0,2;0,3;0,4;1,0;1,1;1,2;1,3;1,4;"
 line_number/multiple[2]/status=0
+
+line_number/binary[0]/output/line[0]="0"
+line_number/binary[0]/output/line[1]="1"
+line_number/binary[0]/output/line[2]="2"
+line_number/binary[0]/output/line[3]="3"
+line_number/binary[0]/status=0
diff --git a/csv/test/csv-paste/input b/csv/test/csv-paste/input
index fb5037a14..f6ef59556 100644
--- a/csv/test/csv-paste/input
+++ b/csv/test/csv-paste/input
@@ -24,3 +24,5 @@ line_number/parametrized[8]="csv-paste 'line-number;size=5;index;reverse;begin=3
 line_number/multiple[0]="csv-paste line-number 'line-number;begin=4' --begin=5 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
 line_number/multiple[1]="csv-paste line-number 'line-number;size=5' --size=6 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
 line_number/multiple[2]="csv-paste line-number 'line-number;index' --size=5 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+
+line_number/binary[0]="csv-paste 'line-number;binary=ui' | csv-from-bin ui | head -n4; comma_status_ok && exit 0 || exit 1"

From d97d04166a70a1f5cf80822629585c3100a4942a Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 7 Jun 2019 18:59:33 +1000
Subject: [PATCH 0038/1056] csv-intervals: join: --matching, --not-matching
 implemented

---
 csv/applications/csv-intervals.cpp   | 28 ++++++++++++++++++++++------
 csv/test/csv-intervals/join/expected | 12 ++++++++++++
 csv/test/csv-intervals/join/input    |  4 ++++
 3 files changed, 38 insertions(+), 6 deletions(-)

diff --git a/csv/applications/csv-intervals.cpp b/csv/applications/csv-intervals.cpp
index f370dd819..01e02c6de 100644
--- a/csv/applications/csv-intervals.cpp
+++ b/csv/applications/csv-intervals.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author Vinny Do
 
 #include <fstream>
@@ -136,6 +135,8 @@ static void usage( bool verbose = false )
     std::cerr << "    join" << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --intervals=<filename>: file or stream name" << std::endl;
+    std::cerr << "            --matching: output matching input records, do not append the intervals" << std::endl;
+    std::cerr << "            --not-matching: output not matching input records" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    make" << std::endl;
     std::cerr << "        options" << std::endl;
@@ -506,8 +507,12 @@ struct intervals
     
     int join( std::istream& is, const std::string& first_line )
     {
+        options.assert_mutually_exclusive( "--matching,--not-matching" );
+        bool matching = options.exists( "--matching" );
+        bool not_matching = options.exists( "--not-matching" );
+        bool output_joined = !matching && !not_matching;
         comma::csv::options icsv( options );
-        if( csv.binary() != icsv.binary() ) { COMMA_THROW( comma::exception, "expected both inputs ascii or both binary; got stdin " << ( icsv.binary() ? "binary" : "ascii" ) << " while --intervals " << ( csv.binary() ? "binary" : "ascii" ) ); }
+        if( output_joined && csv.binary() != icsv.binary() ) { std::cerr << "csv-intervals: join: expected both inputs ascii or both binary; got stdin " << ( icsv.binary() ? "binary" : "ascii" ) << " while --intervals " << ( csv.binary() ? "binary" : "ascii" ) << std::endl; return 1; }
         icsv.full_xpath = false;
         comma::csv::input_stream< scalar_t< From > > istream( std::cin, icsv );
         append = true;
@@ -516,11 +521,18 @@ struct intervals
         {
             auto p = istream.read();
             if( !p ) { break; }
-            for( typename map_t::iterator it = map.begin(); it != map.end(); ++it ) // todo! quadratic complexity; how the heck to query icl map? use boost::...::query?
+            bool found = false;
+            typename map_t::iterator it;
+            for( it = map.begin(); it != map.end(); ++it ) // todo! quadratic complexity; how the heck to query icl map? use boost::...::query?
             {
                 const bound_t< bound_type >& from = it->first.lower();
                 const bound_t< bound_type >& to = it->first.upper();
-                if( ( !from.value || p->scalar >= *from.value ) && ( !to.value || p->scalar < *to.value ) )
+                found = ( !from.value || p->scalar >= *from.value ) && ( !to.value || p->scalar < *to.value );
+                if( found ) { break; }
+            }
+            if( output_joined )
+            {
+                if( found )
                 {
                     std::string joined = csv.binary() ? "" : comma::join( istream.ascii().last(), icsv.delimiter );
                     for( const auto& s: it->second )
@@ -535,9 +547,13 @@ struct intervals
                             std::cout << joined << icsv.delimiter << s << std::endl;
                         }
                     }
-                    break;
                 }
             }
+            else if( matching == found )
+            {
+                if( icsv.binary() ) { std::cout.write( istream.binary().last(), icsv.format().size() ); }
+                else { std::cout << comma::join( istream.ascii().last(), icsv.delimiter ) << std::endl; }
+            }
             if( icsv.flush ) { std::cout.flush(); }
         }
         return 0;
@@ -595,7 +611,7 @@ int main( int ac, char** av )
         verbose = options.exists( "--verbose,-v" );
         debug = options.exists( "--debug" );
         options.assert_mutually_exclusive( "--binary,--format" );
-        const auto& unnamed = options.unnamed( "--append,-a,--debug,--flush,--input-fields,--output-fields,--intervals-only,--limits,-l", "-.*" );
+        const auto& unnamed = options.unnamed( "--append,-a,--debug,--flush,--input-fields,--matching,--not-matching,--output-fields,--intervals-only,--limits,-l", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-intervals: please specify operation" << std::endl; return 1; }
         std::string operation = unnamed[0];
         if( operation == "make" )
diff --git a/csv/test/csv-intervals/join/expected b/csv/test/csv-intervals/join/expected
index d78db3ead..2d0a5a80e 100644
--- a/csv/test/csv-intervals/join/expected
+++ b/csv/test/csv-intervals/join/expected
@@ -13,3 +13,15 @@ join/binary[0]/output/line[0]="9,0,10,0"
 join/binary[0]/output/line[1]="9,0,10,1"
 join/binary[0]/output/line[2]="9,5,20,2"
 join/binary[0]/status=0
+join/matching[0]/output/line[0]="1"
+join/matching[0]/output/line[1]="9"
+join/matching[0]/status=0
+join/matching[1]/output/line[0]="1"
+join/matching[1]/output/line[1]="9"
+join/matching[1]/status=0
+join/not_matching[0]/output/line[0]="5"
+join/not_matching[0]/output/line[1]="11"
+join/not_matching[0]/status=0
+join/not_matching[1]/output/line[0]="5"
+join/not_matching[1]/output/line[1]="11"
+join/not_matching[1]/status=0
diff --git a/csv/test/csv-intervals/join/input b/csv/test/csv-intervals/join/input
index 9cd53fe1a..4ffbfd8aa 100644
--- a/csv/test/csv-intervals/join/input
+++ b/csv/test/csv-intervals/join/input
@@ -3,3 +3,7 @@ join/ascii[1]="( echo 9 ) | csv-intervals join --intervals <( echo 0,2,a; echo 0
 join/fields[0]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar join --intervals <( echo 0,2,a )"
 join/fields[1]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar join --intervals <( echo a,0,2,b )';fields=,from,to'"
 join/binary[0]="( echo 9 ) | csv-to-bin ui | csv-intervals join --binary ui --intervals <( ( echo 0,10,0; echo 0,10,1; echo 5,20,2 ) | csv-to-bin 3ui )';binary=3ui' | csv-from-bin 4ui"
+join/matching[0]="( echo 1; echo 5; echo 9; echo 11 ) | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b ) --matching"
+join/matching[1]="( echo 1; echo 5; echo 9; echo 11 ) | csv-to-bin ui | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b ) --matching --binary ui | csv-from-bin ui"
+join/not_matching[0]="( echo 1; echo 5; echo 9; echo 11 ) | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b ) --not-matching"
+join/not_matching[1]="( echo 1; echo 5; echo 9; echo 11 ) | csv-to-bin ui | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b ) --not-matching --binary ui | csv-from-bin ui"

From 7e8f4ee3867a0fb38315c5ea3ab74d3a3f061df5 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 25 Jun 2019 12:34:38 +1000
Subject: [PATCH 0039/1056] contact_info updated

---
 application/contact_info.h | 8 ++------
 1 file changed, 2 insertions(+), 6 deletions(-)

diff --git a/application/contact_info.h b/application/contact_info.h
index 23aae6929..d4154064c 100644
--- a/application/contact_info.h
+++ b/application/contact_info.h
@@ -27,16 +27,12 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_APPLICATION_CONTACT_INFO_H_
-#define COMMA_APPLICATION_CONTACT_INFO_H_
+#pragma once
 
 namespace comma {
 
-static const char* contact_info = "more info: https://github.com/acfr/comma#readme";
+static const char* contact_info = "more info: https://gitlab.com/orthographic/comma#readme";
     
 } // namespace comma {
-    
-#endif // #ifndef COMMA_APPLICATION_CONTACT_INFO_H_

From 8bd8db3c5676e447a13896bc9efa5528b193ae88 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 25 Jun 2019 12:34:51 +1000
Subject: [PATCH 0040/1056] csv-analyse: minor brush-up

---
 csv/applications/csv-analyse.cpp | 39 +++++++++-----------------------
 1 file changed, 11 insertions(+), 28 deletions(-)

diff --git a/csv/applications/csv-analyse.cpp b/csv/applications/csv-analyse.cpp
index d07a38c4b..a551673ca 100644
--- a/csv/applications/csv-analyse.cpp
+++ b/csv/applications/csv-analyse.cpp
@@ -63,18 +63,15 @@ class histogram
         //sort, ugly
         std::multimap< std::size_t, std::size_t > sorted;
         std::size_t sum=0;
-        
         for(std::map< std::size_t, std::size_t >::const_iterator it=histogram_.begin(), end=histogram_.end(); it!=end; ++it )
         {
             sorted.insert( std::make_pair(it->second,it->first) );
             sum += it->second;
-        }
-        
+        }        
         for(std::multimap< std::size_t, std::size_t >::const_reverse_iterator it=sorted.rbegin(), end=sorted.rend(); it!=end; ++it )
         {
             os << it->second << "," << it->first << "," << (double)((double)(it->first)/(double)sum) << std::endl;
         }
-    
         return os;
     }
 
@@ -84,12 +81,9 @@ class histogram
     std::map< std::size_t, std::size_t > histogram_; //length, count
 };
 
-std::ostream& operator<<(std::ostream& os, const histogram & h)
-{
-    return h.print_sorted(os);
-}
+std::ostream& operator<<(std::ostream& os, const histogram & h) { return h.print_sorted(os); }
 
-static void usage()
+static void usage( bool )
 {
     std::cerr << std::endl;
     std::cerr << "Analyse binary data to guess message lengths in unknown binary stream: output candidate lengths, repeat counts and normalised probabilities" << std::endl;
@@ -133,33 +127,22 @@ int main( int ac, char** av )
         #ifdef WIN32
             _setmode( _fileno( stdin ), _O_BINARY );
         #endif
-
-        command_line_options options( ac, av );
-        if( ac > 1 || options.exists( "--help" ) || options.exists( "-h" ) ) { usage(); } //could just say ac > 1... but leave for future args
-
-        histogram h;
-
-        const std::size_t read_size=65535; //todo: better way?
+        command_line_options options( ac, av, usage );
+        const std::size_t read_size = 65535; // todo? better way?
         std::vector< unsigned char > data( read_size );
-        std::size_t offset=0;
-
-        //read as many bytes as available on stdin
-        while( std::cin.good() && !std::cin.eof() )
+        std::size_t offset = 0;
+        histogram h;
+        while( std::cin.good() && !std::cin.eof() ) //read as many bytes as available on stdin
         {
             int bytes_read = ::read( 0, &data[0], read_size );
             if( bytes_read <= 0 ) { break; }
-                        
-            for( int i=0; i<bytes_read; ++i )
-            {
-                h.observe(data[i],offset+i);
-            }
-            offset+=bytes_read;
+            for( int i = 0; i < bytes_read; ++i ) { h.observe( data[i], offset + i ); }
+            offset += bytes_read;
         }
-       
         std::cout << h;
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << "csv-analyse: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-analyse: unknown exception" << std::endl; }
-    usage();
+    return 1;
 }

From fe03376727d51b8af9bc5be5d365f939469951d5 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 28 Jun 2019 10:57:21 +1000
Subject: [PATCH 0041/1056] comma-build: quick and dirty handling python
 installation added

---
 util/applications/comma-build | 42 ++++++++++++++++++++++++++---------
 1 file changed, 31 insertions(+), 11 deletions(-)

diff --git a/util/applications/comma-build b/util/applications/comma-build
index 0f1ea188b..487624c58 100755
--- a/util/applications/comma-build
+++ b/util/applications/comma-build
@@ -33,6 +33,9 @@
 
 source $( type -p comma-application-util ) || { echo "$basename: cannot source 'comma-application-util'" >&2; exit 1; }
 
+function say() { echo "comma-build: $@" >&2; }
+function die() { say $@; exit 1; }
+
 function description()
 {
     cat <<eof
@@ -216,12 +219,29 @@ function sudo_make_install() { cmake "../../src/$( basename $( pwd ) )" $@ && ma
 
 function run_build_command()
 {
-    local build_dir="../../build/$1"
     local src_dir="../../src/$1"
     local command=$2
-    mkdir "$build_dir" -p || { echo "comma-build: $command: failed to create '$build_dir'" >&2 ; exit 1 ; }
-    echo "comma-build: $command: running in $build_dir: ${@:2}" >&2
-    ( cd "$build_dir" && ${@:2} )
+    if [[ -f "$src_dir/CMakeLists.txt" ]]; then
+        local build_dir="../../build/$1"
+        mkdir "$build_dir" -p || { echo "comma-build: $command: failed to create '$build_dir'" >&2 ; exit 1 ; }
+        echo "comma-build: $command: running in $build_dir: ${@:2}" >&2
+        ( cd "$build_dir" && ${@:2} )
+    elif [[ -f "$src_dir/setup.py" ]]; then # quick and dirty
+        case "$command" in
+            make_install) echo "comma-build: $command: running in $src_dir on python3 setup: ${@:2}" >&2
+                          ( cd "$src_dir" && python3 setup.py install ) 
+                          ;;
+            make_only) echo "comma-build: $command: no CMakeLists.txt in $src_dir, but found setup.py; skipped" >&2
+                       ;;
+            sudo_make_install) echo "comma-build: $command: running in $src_dir on python3 setup: ${@:2}" >&2
+                               ( cd "$src_dir" && sudo python3 setup.py install ) 
+                               ;;
+            *) die "$command: on $src_dir: do not know how to handle command for python3 installations"
+               ;;
+        esac
+    else
+        die "$command: on $src_dir: CMakeLists.txt or setup.py not found; don't know how to handle"
+    fi
 }
 
 function run_cmake()
@@ -312,13 +332,13 @@ function run_pack() # quick and dirty
         [[ ! -f $src_dir/dependencies.cmake-cache ]] || cmake_options+=( -C$src_dir/dependencies.cmake-cache )
         comma-build install ${cmake_options[@]}
         if [[ -f $src_dir/dependencies.cpack-options ]]; then
-		cpack_make_opts=$(cat $src_dir/dependencies.cpack-options )
-		# The user specified different options for packing. Re-run the make so that the Cmake files are regenerated.
-		# This is primarily done so that software can be built as a standard user, and installations that would otherwise go into system directories (eg /etc/systemd) can be redirected to /usr/local/...
-		# When the software is packed however, you'd want it to go to install location (/etc).
-		comma-build make ${cpack_make_opts}
-	fi		
-	comma-build cpack -G RPM ${@:3} || exit 1 #-D CPACK_RPM_PACKAGE_RELOCATABLE=ON || exit 1 #-D CPACK_PACKAGING_INSTALL_PREFIX=$pack_dir/rpm
+            cpack_make_opts=$(cat $src_dir/dependencies.cpack-options )
+            # The user specified different options for packing. Re-run the make so that the Cmake files are regenerated.
+            # This is primarily done so that software can be built as a standard user, and installations that would otherwise go into system directories (eg /etc/systemd) can be redirected to /usr/local/...
+            # When the software is packed however, you'd want it to go to install location (/etc).
+            comma-build make ${cpack_make_opts}
+        fi
+        comma-build cpack -G RPM ${@:3} || exit 1 #-D CPACK_RPM_PACKAGE_RELOCATABLE=ON || exit 1 #-D CPACK_PACKAGING_INSTALL_PREFIX=$pack_dir/rpm
     ) || { echo "comma-build: pack failed" >&2 ; exit 1 ; }
     cat dependencies.commits | while IFS=, read what commit ; do cp $pack_dir/build/$what/*.rpm $pack_dir/rpm ; done
     cp $pack_dir/build/$top_repository/*.rpm $pack_dir/rpm

From dcb7d4465fcf5dd731cffc0c1a80ead2eef9c3a0 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 9 Jul 2019 11:00:14 +1000
Subject: [PATCH 0042/1056] name-value-apply: --unquote-numbers implemented

---
 name_value/applications/name-value-apply | 38 +++++++++++-------------
 1 file changed, 17 insertions(+), 21 deletions(-)

diff --git a/name_value/applications/name-value-apply b/name_value/applications/name-value-apply
index 2b064142b..d6d8a5ca3 100755
--- a/name_value/applications/name-value-apply
+++ b/name_value/applications/name-value-apply
@@ -3,7 +3,7 @@
 
 source $( type -p comma-application-util )
 
-function say() { echo "$scriptname: $@" >&2; }
+function say() { echo "name-value-apply: $@" >&2; }
 function die() { say "$@"; exit 1; }
 function bye() { say "$@"; exit 0; }
 function mangle_options() { comma-options-to-name-value "$@" | { grep '='; :; } | comma_path_value_mangle | sed 's/^/local options_/g'; comma_status_ok; }
@@ -11,8 +11,9 @@ function mangle_options() { comma-options-to-name-value "$@" | { grep '='; :; }
 function description()
 {
     cat <<EOF
---help,-h; output instructions for using this program and exit.
---source; for each name, show the source config instead of its value.
+--help,-h; output instructions for using this program and exit
+--source; for each name, show the source config instead of its value
+--unquote-numbers,-u; unquote numbers
 EOF
 }
 
@@ -22,23 +23,23 @@ function usage()
 {
     cat >&2 <<EOF
 
-Derive a config from multiple input configs.
+derive a config from multiple input configs
 
-Usage:
-    $scriptname [<options>] <files...>
+usage
+    name-value-apply [<options>] <files...>
 
-Options:
+options
 $( description | sed 's/^/    /' )
 
-Example:
+example
     > ( echo a=5; echo b=7 ) > cfg1.pv; ( echo a=6; echo c=8 ) > cfg2.pv
 
-    > $scriptname cfg1.pv cfg2.pv
+    > name-value-apply cfg1.pv cfg2.pv
     a="6"
     b="7"
     c="8"
 
-    > $scriptname --source cfg*
+    > name-value-apply --source cfg*
     a="cfg2.pv"
     b="cfg1.pv"
     c="cfg2.pv"
@@ -51,23 +52,18 @@ function combine_files() { for ff in "${files[@]}"; do cat "$ff" | name-value-co
 
 function execute()
 {
-    local -r scriptname=$( basename "$0" )
-
     (( $( comma_options_has --bash-completion $@ ) )) && { bash_completion; exit 0; }
     (( $( comma_options_has --help $@ ) || $( comma_options_has -h $@ ) )) && usage
-
     local mangle_text ff
     local -a files
     mangle_text=$( description | mangle_options "$@"; comma_status_ok ) || die "Invalid arguments."; eval "$mangle_text"
     mangle_text="files=( $( description | comma-options-to-name-value "$@" | grep '^"' ) )"; eval "$mangle_text"; unset mangle_text
-
-    for ff in "${files[@]}"
-    do
-        { name-value-convert < "$ff" |
-            { [[ -z $options_source ]] &&  cat - || cut -d = -f1 |  sed "s~$~=\"$ff\"~g";}
-        }
-    done | name-value-convert --take-last
+    local unquote_numbers_option
+    (( !options_unquote_numbers )) || unquote_numbers_option="--unquote-numbers"
+    
+    for ff in "${files[@]}"; do
+        name-value-convert < "$ff" | { [[ -z $options_source ]] &&  cat - || cut -d = -f1 |  sed "s~$~=\"$ff\"~g"; }
+    done | name-value-convert --take-last $unquote_numbers_option
 }
 
 [[ $( basename $0 ) != "name-value-apply" ]] || execute "$@"
-

From 2963d5dee81bc6ebf672595b368a8faa87be9a08 Mon Sep 17 00:00:00 2001
From: James McColl <jamiemccoll1@gmail.com>
Date: Wed, 10 Jul 2019 13:03:56 +1000
Subject: [PATCH 0043/1056] csv-calc: --precision implemented

---
 csv/applications/csv-calc.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 5a5b8af5d..eea012c5b 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -1079,7 +1079,7 @@ struct Operation : public Operationbase
         for( std::size_t i = 0; i < input_elements_.size(); ++i )
         {
             comma::csv::format::types_enum output_type = input_elements_[i].type;
-            switch( E ) // quick and dirty, implement in operations::traits, just no time
+            switch( E ) // quick and dirty, operations::traits would be better, but likely to be optimized by compiler anyway
             {
                 case Operations::Enum::radius:
                 case Operations::Enum::diameter:
@@ -1215,7 +1215,7 @@ static void calculate( const comma::csv::options& csv, OperationsMap& operations
         {
             ( *it->second )[i].calculate();
             if( csv.binary() ) { r.append( ( *it->second )[i].buffer(), ( *it->second )[i].output_format().size() ); }
-            else { if( i > 0 ) { r += csv.delimiter; } r.append(( *it->second )[i].output_format().bin_to_csv( ( *it->second )[i].buffer(), csv.delimiter, 12 )); }
+            else { if( i > 0 ) { r += csv.delimiter; } r.append(( *it->second )[i].output_format().bin_to_csv( ( *it->second )[i].buffer(), csv.delimiter, csv.precision )); }
         }
         results[it->first] = r;
     }
@@ -1232,6 +1232,7 @@ int main( int ac, char** av )
         std::vector< std::string > unnamed = options.unnamed( "", "--binary,-b,--delimiter,-d,--format,--fields,-f,--output-fields" );
         comma::csv::options csv( options );
         csv.full_xpath = false;
+        std::cout.precision( csv.precision );
         #ifdef WIN32
         if( csv.binary() ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif

From 6e20b573cc91fc7072b93509ebc2561cfc08a79a Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 29 Jul 2019 13:03:19 +1000
Subject: [PATCH 0044/1056] csv-paste: block-size implemented for input streams

---
 csv/applications/csv-paste.cpp | 177 ++++++++-------------------------
 csv/test/csv-paste/expected    |  20 ++++
 csv/test/csv-paste/input       |  23 +++--
 3 files changed, 72 insertions(+), 148 deletions(-)

diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index 56d26dbb7..3258ec73e 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -75,14 +75,19 @@ static void usage( bool verbose )
     std::cerr << "    --verbose,-v; more debug output" << std::endl;
     std::cerr << std::endl;
     std::cerr << "inputs" << std::endl;
-    std::cerr << "    <file> : <filename>[;size=<size>|binary=<format>]: file name or \"-\" for stdin; specify size or format, if binary" << std::endl;
+    std::cerr << "    <file> : <filename>[;<properties>]: file name or \"-\" for stdin; specify size or format, if binary" << std::endl;
+    std::cerr << "        properties" << std::endl;
+    std::cerr << "            binary=<format>: if input is binary, record binary format; or use 'size'" << std::endl;
+    std::cerr << "            block-size=<block-size>; repeat each record <block-size> times" << std::endl;
+    std::cerr << "            size=<size>; if input is binary, record size in bytes; or use 'binary'" << std::endl;
     std::cerr << "    value : value=<csv values>[;binary=<format>]; specify size or format, if binary" << std::endl;
     std::cerr << "    line-number[;<options>] : add the line number; as ui, if binary (quick and dirty, will override the file named \"line-number\")" << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --begin <index>: start line number count at <index>; default: 0" << std::endl;
+    std::cerr << "            --block-size,--size=<size>: number of records with the same line number; default: 1" << std::endl;
+    std::cerr << "                 WARNING: --size: deprecated, since it is confusing for files" << std::endl;
     std::cerr << "            --index; instead of block number output record index in the block" << std::endl;
-    std::cerr << "            --reverse; if --index, output index in descending order" << std::endl;
-    std::cerr << "            --size,--block-size <size>: number of records with the same line number; default: 1" << std::endl;
+    std::cerr << "            --reverse; if --index, output index in descending order" << std::endl;    
     std::cerr << "        examples (try them)" << std::endl;
     std::cerr << "            line number" << std::endl;
     std::cerr << "                seq 0 20 | csv-paste - line-number --begin 5 --size 3" << std::endl;
@@ -102,13 +107,14 @@ static void usage( bool verbose )
 class source
 {
     public:
-        source( const std::string& properties = "" ) : properties_( properties )
+        source( const std::string& properties = "" ) : properties_( properties ), block_count_( 0 ), buf_( nullptr )
         {
             comma::name_value::map map( properties, ';', '=' );
             format_ = comma::csv::format( map.value< std::string >( "binary", "" ) );
             unsigned int size = map.value< unsigned int >( "size", format_.size() );
             binary_ = size > 0;
             value_ = std::string( size, 0 );
+            block_size_ = map.value< unsigned int >( "block-size", 1 );
         }
         virtual ~source() {}
         virtual const std::string* read() = 0;
@@ -123,6 +129,9 @@ class source
         bool binary_;
         comma::csv::format format_;
         std::string properties_;
+        unsigned int block_size_;
+        unsigned int block_count_;
+        const char* buf_;
 };
 
 class stream : public source
@@ -136,19 +145,32 @@ class stream : public source
         
         const std::string* read()
         {
-            while( stream_->good() && !stream_->eof() )
+            if( block_count_ == block_size_ || value_.empty() )
             {
-                std::getline( *stream_, value_ );
-                if( !value_.empty() && *value_.rbegin() == '\r' ) { value_ = value_.substr( 0, value_.length() - 1 ); } // windows... sigh...
-                if( !value_.empty() ) { return &value_; }
+                block_count_ = 1;
+                while( stream_->good() && !stream_->eof() )
+                {
+                    std::getline( *stream_, value_ );
+                    if( !value_.empty() && *value_.rbegin() == '\r' ) { value_ = value_.substr( 0, value_.length() - 1 ); } // windows... sigh...
+                    if( !value_.empty() ) { return &value_; }
+                }
+                return nullptr;
             }
-            return NULL;
+            ++block_count_;
+            return &value_;
         }
 
         const char* read( char* buf )
         {
-            stream_->read( buf, value_.size() );
-            return stream_->gcount() == int( value_.size() ) ? buf : NULL;
+            if( block_count_ == block_size_ || buf_ == nullptr )
+            {
+                block_count_ = 1;
+                buf_ = buf; // quick and dirty
+                stream_->read( buf, value_.size() );
+                return stream_->gcount() == int( value_.size() ) ? buf : nullptr;
+            }
+            ++block_count_;
+            return buf_;
         }
         
         bool is_stream() const { return true; }
@@ -192,9 +214,9 @@ class line_number : public source
                 
                 options( const std::string& properties, const comma::command_line_options& o ) // quick and dirty: use visiting instead
                 {
-                    options defaults( boost::optional< comma::uint32 >(), o.value< comma::uint32 >( "--size,--block-size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ) );
+                    options defaults( boost::optional< comma::uint32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ) );
                     comma::name_value::map map( properties, ';', '=' );
-                    size = map.value< comma::uint32 >( "size", defaults.size );
+                    size = map.value< comma::uint32 >( map.get().find( "block-size" ) != map.get().end() ? "block-size" : "size", defaults.size ); // quick and dirty
                     index = map.value< bool >( "index", defaults.index );
                     reverse = map.value< bool >( "reverse", defaults.reverse );
                     auto b = map.optional< comma::uint32 >( "begin" );
@@ -261,7 +283,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         char delimiter = options.value( "--delimiter,-d", ',' );
-        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--block-size" );
+        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "-.*" );
         boost::ptr_vector< source > sources;
         bool is_binary = false;
         for( unsigned int i = 0; i < unnamed.size(); ++i ) // quick and dirty; really lousy code duplication
@@ -304,7 +326,7 @@ int main( int ac, char** av )
                 char* p = &buffer[0];
                 for( unsigned int i = 0; i < sources.size(); p += sources[i].size(), ++i )
                 {
-                    if( sources[i].read( p ) == NULL )
+                    if( sources[i].read( p ) == nullptr )
                     {
                         if( streams == 0 ) { return 0; }
                         std::cerr << "csv-paste: unexpected end of file in " << unnamed[i] << std::endl;
@@ -325,12 +347,12 @@ int main( int ac, char** av )
                 for( unsigned int i = 0; i < sources.size(); ++i )
                 {
                     const std::string* s = sources[i].read();
-                    if( s == NULL )
+                    if( s == nullptr )
                     {
                         if( streams == 0 ) { return 0; }
                         std::cerr << "csv-paste: unexpected end of file in " << unnamed[i] << std::endl; return 1;
                     }
-                    if (sources[i].is_stream()) ++streams;
+                    if( sources[i].is_stream() ) { ++streams; }
                     if( i > 0 ) { oss << delimiter; }
                     oss << *s;
                 }
@@ -343,124 +365,3 @@ int main( int ac, char** av )
     catch( ... ) { std::cerr << "csv-paste: unknown exception" << std::endl; }
     return 1;
 }
-
-
-// int main( int ac, char** av )
-// {
-//     bool show_usage = true;
-//     try
-//     {
-//         comma::command_line_options options( ac, av );
-//         if( options.exists( "--help,-h" ) ) { usage(); }
-//         char delimiter = options.value( "--delimiter,-d", ',' );
-//         std::vector< std::string > unnamed = options.unnamed( "", "--delimiter,-d" );
-//         boost::ptr_vector< std::istream > files;
-//         std::vector< std::pair< std::istream*, std::size_t > > sources;
-//         bool binary = false;
-//         for( unsigned int i = 0; i < unnamed.size(); ++i )
-//         {
-//             std::string filename = unnamed[i];
-//             std::size_t size = 0;
-//             std::vector< std::string > v = comma::split( unnamed[i], ';' );
-//             filename = v[0];
-//             for( std::size_t j = 1; j < v.size(); ++j )
-//             {
-//                 std::vector< std::string > w = comma::split( v[j], '=' );
-//                 if( w.size() != 2 ) { COMMA_THROW( comma::exception, "expected filename and options, got \"" << unnamed[i] << "\"" ); }
-//                 if( w[0] == "binary" )
-//                 {
-//                     if( i == 0 ) { binary = true; }
-//                     else if( !binary ) { COMMA_THROW( comma::exception, unnamed[0] << " is ascii, but " << filename << " is binary" ); }
-//                     size = comma::csv::format( w[1] ).size();
-//                 }
-//                 else if( w[0] == "size" )
-//                 {
-//                     if( i == 0 ) { binary = true; }
-//                     else if( !binary ) { COMMA_THROW( comma::exception, unnamed[0] << " is ascii, but " << filename << " is binary" ); }
-//                     size = boost::lexical_cast< std::size_t >( w[1] );
-//                 }
-//             }
-//             if( binary && size == 0 ) { COMMA_THROW( comma::exception, "in binary mode, please specify size or format for \"" << filename << "\"" ); }
-//             if( filename == "-" )
-//             {
-//                 sources.push_back( std::make_pair( &std::cin, size ) );
-//             }
-//             else
-//             {
-//                 files.push_back( new std::ifstream( filename.c_str() ) );
-//                 if( !files.back().good() || files.back().eof() ) { COMMA_THROW( comma::exception, "failed to open " << unnamed[i] ); }
-//                 sources.push_back( std::make_pair( &files.back(), size ) );
-//             }
-//         }
-//         if( sources.empty() ) { usage(); }
-//         #ifdef WIN32
-//         if( binary ) { _setmode( _fileno( stdin ), _O_BINARY ); }
-//         #endif
-//         show_usage = false;
-//         if( binary )
-//         {
-//             std::size_t size = 0;
-//             for( unsigned int i = 0; i < sources.size(); ++i ) { size += sources[i].second; }
-//             while( true )
-//             {
-//                 for( unsigned int i = 0; i < sources.size(); ++i )
-//                 {
-//                     std::string s( sources[i].second, 0 );
-//                     char* buf = &s[0];
-//                     sources[i].first->read( buf, sources[i].second );
-//                     int count = sources[i].first->gcount();
-//                     if( count != 0 && (unsigned int)count != sources[i].second ) { COMMA_THROW( comma::exception, unnamed[i] << ": expected " << sources[i].second << " bytes, got " << count ); }
-//                     if( !sources[i].first->good() || sources[i].first->eof() )
-//                     {
-//                         bool ok = true;
-//                         for( unsigned int j = 0; j < sources.size() && ok; ++j )
-//                         {
-//                             if( j > i ) { sources[j].first->peek(); }
-//                             ok = !sources[j].first->good() || sources[j].first->eof();
-//                         }
-//                         if( ok ) { return 0; }
-//                         else { COMMA_THROW( comma::exception, unnamed[i] << ": unexpected end of file" ); }
-//                     }
-//                     std::cout << s;
-//                 }
-//             }
-//         }
-//         else
-//         {
-//             while( true )
-//             {
-//                 bool first = true;
-//                 for( unsigned int i = 0; i < sources.size(); ++i )
-//                 {
-//                     std::string s;
-//                     std::getline( *sources[i].first, s );
-//                     if( !sources[i].first->good() || sources[i].first->eof() )
-//                     {
-//                         bool ok = true;
-//                         for( unsigned int j = 0; j < sources.size() && ok; ++j )
-//                         {
-//                             if( j > i ) { sources[j].first->peek(); }
-//                             ok = !sources[j].first->good() || sources[j].first->eof();
-//                         }
-//                         if( ok ) { return 0; }
-//                         else { COMMA_THROW( comma::exception, unnamed[i] << ": unexpected end of file" ); }
-//                     }
-//                     if( !s.empty() && *s.rbegin() == '\r' ) { s = s.substr( 0, s.length() - 1 ); } // windows... sigh...
-//                     if( s.empty() ) { continue; }
-//                     if( !first ) { std::cout << delimiter; } else { first = false; }
-//                     std::cout << s;
-//                 }
-//                 std::cout << std::endl;
-//             }
-//         }
-//     }
-//     catch( std::exception& ex )
-//     {
-//         std::cerr << "csv-paste: " << ex.what() << std::endl;
-//     }
-//     catch( ... )
-//     {
-//         std::cerr << "csv-paste: unknown exception" << std::endl;
-//     }
-//     if( show_usage ) { usage(); }
-// }
diff --git a/csv/test/csv-paste/expected b/csv/test/csv-paste/expected
index 95f7b8c23..46ff006b9 100644
--- a/csv/test/csv-paste/expected
+++ b/csv/test/csv-paste/expected
@@ -53,3 +53,23 @@ line_number/binary[0]/output/line[1]="1"
 line_number/binary[0]/output/line[2]="2"
 line_number/binary[0]/output/line[3]="3"
 line_number/binary[0]/status=0
+
+block_size/ascii[0]/output/line[0]="a,0"
+block_size/ascii[0]/output/line[1]="a,0"
+block_size/ascii[0]/output/line[2]="a,1"
+block_size/ascii[0]/output/line[3]="a,1"
+block_size/ascii[0]/output/line[4]="b,2"
+block_size/ascii[0]/output/line[5]="b,2"
+block_size/ascii[0]/output/line[6]="b,3"
+block_size/ascii[0]/output/line[7]="b,3"
+block_size/ascii[0]/status=0
+
+block_size/binary[0]/output/line[0]="0,0"
+block_size/binary[0]/output/line[1]="0,0"
+block_size/binary[0]/output/line[2]="0,1"
+block_size/binary[0]/output/line[3]="0,1"
+block_size/binary[0]/output/line[4]="1,2"
+block_size/binary[0]/output/line[5]="1,2"
+block_size/binary[0]/output/line[6]="1,3"
+block_size/binary[0]/output/line[7]="1,3"
+block_size/binary[0]/status=0
diff --git a/csv/test/csv-paste/input b/csv/test/csv-paste/input
index f6ef59556..d00c48ad2 100644
--- a/csv/test/csv-paste/input
+++ b/csv/test/csv-paste/input
@@ -12,17 +12,20 @@ line_number/command_line_options[6]="csv-paste line-number --size 5 --index --re
 line_number/command_line_options[7]="csv-paste line-number --size 5 --index --reverse --begin 3 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
 
 line_number/parametrized[0]="csv-paste 'line-number;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[1]="csv-paste 'line-number;size=5' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[2]="csv-paste 'line-number;size=5;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[3]="csv-paste 'line-number;size=5;index' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[4]="csv-paste 'line-number;size=5;index;reverse' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[5]="csv-paste 'line-number;size=5;index;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[6]="csv-paste 'line-number;size=5;index;reverse;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[7]="csv-paste 'line-number;size=5;index;reverse;begin=10' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[8]="csv-paste 'line-number;size=5;index;reverse;begin=3' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[1]="csv-paste 'line-number;block-size=5' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[2]="csv-paste 'line-number;block-size=5;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[3]="csv-paste 'line-number;block-size=5;index' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[4]="csv-paste 'line-number;block-size=5;index;reverse' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[5]="csv-paste 'line-number;block-size=5;index;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[6]="csv-paste 'line-number;block-size=5;index;reverse;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[7]="csv-paste 'line-number;block-size=5;index;reverse;begin=10' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[8]="csv-paste 'line-number;block-size=5;index;reverse;begin=3' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
 
 line_number/multiple[0]="csv-paste line-number 'line-number;begin=4' --begin=5 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/multiple[1]="csv-paste line-number 'line-number;size=5' --size=6 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/multiple[2]="csv-paste line-number 'line-number;index' --size=5 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/multiple[1]="csv-paste line-number 'line-number;block-size=5' --block-size=6 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/multiple[2]="csv-paste line-number 'line-number;index' --block-size=5 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
 
 line_number/binary[0]="csv-paste 'line-number;binary=ui' | csv-from-bin ui | head -n4; comma_status_ok && exit 0 || exit 1"
+
+block_size/ascii[0]="csv-paste <( echo a; echo b )';block-size=4' <( echo 0; echo 1; echo 2; echo 3 )';block-size=2'"
+block_size/binary[0]="csv-paste <( { echo 0; echo 1; } | csv-to-bin ui )';size=4;block-size=4' <( { echo 0; echo 1; echo 2; echo 3; } | csv-to-bin ui )';size=4;block-size=2' | csv-from-bin 2ui"

From a48edf4bc3317655161641eee28fbcc91e8a3358 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 29 Jul 2019 17:34:09 +1000
Subject: [PATCH 0045/1056] csv-paste: bug fixed

---
 csv/applications/csv-paste.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index 3258ec73e..f9043e4e8 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -283,7 +283,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         char delimiter = options.value( "--delimiter,-d", ',' );
-        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--block-size" );
         boost::ptr_vector< source > sources;
         bool is_binary = false;
         for( unsigned int i = 0; i < unnamed.size(); ++i ) // quick and dirty; really lousy code duplication

From aa202a3ddaac0bb1198949a4717b9d2f2b017468 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 Aug 2019 13:44:17 +1000
Subject: [PATCH 0046/1056] csv-split: --files implemented for block field

---
 csv/applications/csv-split.cpp   |  37 +++++------
 csv/applications/split/split.cpp | 106 +++++++++++++++++--------------
 csv/applications/split/split.h   |  21 +++---
 3 files changed, 84 insertions(+), 80 deletions(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index 6defbc18e..ab3a68c15 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #ifdef WIN32
@@ -43,17 +42,17 @@
 #include "../../csv/traits.h"
 #include "split/split.h"
 
-comma::csv::options csv;
-std::vector< std::string > streams;
-boost::optional< boost::posix_time::time_duration > duration;
-std::string suffix;
-unsigned int size = 0;
-bool passthrough;
+static comma::csv::options csv;
+static std::vector< std::string > streams;
+static boost::optional< boost::posix_time::time_duration > duration;
+static std::string suffix;
+static unsigned int size = 0;
+static bool passthrough;
+static std::string files;
 
-template < typename T >
-void run()
+template < typename T > static void run()
 {
-    comma::csv::applications::split< T > split( duration, suffix, csv, streams, passthrough );
+    comma::csv::applications::split< T > split( duration, suffix, csv, streams, passthrough, files );
     if( size == 0 )
     {
         std::string line;
@@ -87,16 +86,17 @@ int main( int argc, char** argv )
         boost::program_options::options_description description( "options" );
         description.add_options()
             ( "help,h", "display help message" )
-            ( "size,c", boost::program_options::value< unsigned int >( &size ), "packet size, only full packets will be written" )
+            ( "files", boost::program_options::value< std::string >( &files ), "if 'block' field present, list of files to save blocks; todo: --files for id field" )
+            ( "passthrough,pass", "pass data through to stdout" )
             ( "period,t", boost::program_options::value< double >( &period ), "period in seconds after which a new file is created" )
-            ( "suffix,s", boost::program_options::value< std::string >( &extension ), "filename extension; default will be csv or bin, depending whether it is ascii or binary" )
+            ( "size,c", boost::program_options::value< unsigned int >( &size ), "packet size, only full packets will be written" )
             ( "string", "id is string; default: 32-bit integer" )
-            ( "time", "id is time; default: 32-bit integer" )
-            ( "passthrough,pass", "pass data through to stdout" );
+            ( "suffix,s", boost::program_options::value< std::string >( &extension ), "filename extension; default will be csv or bin, depending whether it is ascii or binary" )
+            ( "time", "id is time; default: 32-bit integer" );
         description.add( comma::csv::program_options::description() );
         boost::program_options::variables_map vm;
         boost::program_options::store( boost::program_options::parse_command_line( argc, argv, description), vm );
-        boost::program_options::parsed_options parsed = boost::program_options::command_line_parser(argc, argv).options( description ).allow_unregistered().run();
+        boost::program_options::parsed_options parsed = boost::program_options::command_line_parser( argc, argv ).options( description ).allow_unregistered().run();
         boost::program_options::notify( vm );
         if ( vm.count( "help" ) || vm.count( "long-help" ) )
         {
@@ -154,16 +154,13 @@ int main( int argc, char** argv )
         if( csv.binary() ) { size = csv.format().size(); }
         bool id_is_string = vm.count( "string" );
         bool id_is_time = vm.count( "time" );
-        passthrough = vm.count("passthrough");
-        
+        passthrough = vm.count("passthrough");        
         if( id_is_string && id_is_time ) { std::cerr << "csv-split: either --string or --time" << std::endl; }
-        if( period > 0 ) { duration = boost::posix_time::microseconds( static_cast<unsigned int> (period * 1e6 )); }
+        if( period > 0 ) { duration = boost::posix_time::microseconds( static_cast< long long >( period * 1e6 )); } // 64-bit: unsigned int overflows for periods above ~4294 seconds
         if( extension.empty() ) { suffix = csv.binary() || size > 0 ? ".bin" : ".csv"; }
         else { suffix += "."; suffix += extension; }
-
         streams = boost::program_options::collect_unrecognized( parsed.options, boost::program_options::include_positional );
         if( !streams.empty() && ( csv.has_field( "block" ) || id_is_time ) ) { std::cerr << "publisher streams are not compatible with splitting by block or timestamp." << std::endl; return 1; }
-
         if( id_is_string ) { run< std::string >(); }
         else if( id_is_time ) { run< boost::posix_time::ptime >(); }
         else { run< comma::uint32 >(); }
diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 71f7f8a62..1132e9912 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #ifdef WIN32
@@ -39,9 +38,10 @@
 #include <sys/resource.h>
 #endif
 
+#include <boost/filesystem.hpp>
 #include <boost/lexical_cast.hpp>
-#include "../../../io/file_descriptor.h"
 #include "../../../base/exception.h"
+#include "../../../io/file_descriptor.h"
 #include "split.h"
 
 namespace comma { namespace csv { namespace applications {
@@ -50,7 +50,8 @@ template < typename T >
 split< T >::split( boost::optional< boost::posix_time::time_duration > period
             , const std::string& suffix
             , const comma::csv::options& csv
-            , bool pass )
+            , bool pass
+            , const std::string& filenames )
     : ofstream_( std::bind( &split< T >::ofstream_by_time_, this ) )
     , period_( period )
     , suffix_( suffix )
@@ -62,8 +63,20 @@ split< T >::split( boost::optional< boost::posix_time::time_duration > period
     if( csv.fields.empty() ) { return; }
     if( csv.binary() ) { binary_.reset( new comma::csv::binary< input >( csv ) ); }
     else { ascii_.reset( new comma::csv::ascii< input >( csv ) ); }
-    if( csv.has_field( "block" ) ) { ofstream_ = std::bind( &split< T >::ofstream_by_block_, this ); }
-    else if( csv.has_field( "id" ) ) { ofstream_ = std::bind( &split< T >::ofstream_by_id_, this ); }
+    if( csv.has_field( "block" ) )
+    {
+        ofstream_ = std::bind( &split< T >::ofstream_by_block_, this );
+        if( !filenames.empty() )
+        {
+            filenames_.reset( new std::ifstream( filenames ) );
+            if( !filenames_->is_open() ) { COMMA_THROW( comma::exception, "failed to open '" << filenames << "'" ); }
+        }
+    }
+    else
+    {
+        if( !filenames.empty() ) { COMMA_THROW( comma::exception, "--files given, but no block field specified in --fields" ); }
+        if( csv.has_field( "id" ) ) { ofstream_ = std::bind( &split< T >::ofstream_by_id_, this ); }
+    }
 }
 
 //to-do
@@ -72,46 +85,39 @@ split< T >::split( boost::optional< boost::posix_time::time_duration > period
                  , const std::string& suffix
                  , const comma::csv::options& csv
                  , const std::vector< std::string >& streams //to-do
-                 , bool pass )
-    : split( period, suffix, csv, pass )
+                 , bool pass
+                 , const std::string& filenames )
+    : split( period, suffix, csv, pass, filenames )
 {
-    if( 0 < streams.size() )
+    if( streams.empty() ) { return; }
+    auto const io_mode = csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii;
+    for( auto const& si : streams )
     {
-        auto const io_mode = csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii;
-
-        for( auto const& si : streams )
+        auto const stream_values = comma::split( si, ';' );
+        if( 2 > stream_values.size() || stream_values[ 0 ].empty() || stream_values[ 1 ].empty() ) { COMMA_THROW( comma::exception, "please specify <id> and output <stream> in format <id>;<stream>, got: " << si ); }
+        transaction t( publishers_ );
+        std::unique_ptr< comma::io::publisher > publisher( new comma::io::publisher( stream_values[1], io_mode, false, csv.flush ) );
+        if( "..." == stream_values[0] )
         {
-            auto const stream_values = comma::split( si, ';' );
-            if( 2 > stream_values.size() || stream_values[ 0 ].empty() || stream_values[ 1 ].empty() )
-            {
-                COMMA_THROW( comma::exception, "please specify <id> and output <stream> in format <id>;<stream>, got: " << si );
-            }
-
-            transaction t( publishers_ );
-            std::unique_ptr< comma::io::publisher > publisher( new comma::io::publisher( stream_values[1], io_mode, false, csv.flush ) );
+            if( default_publisher_ ) { COMMA_THROW( comma::exception, "multiple output streams have the id: ..." ); }
+            default_publisher_ = std::move( publisher );
+        }
+        else
+        {
+            auto publisher_pos = t->insert( std::move( publisher ) );
+            auto const keys = comma::split( stream_values[0], ',' );
 
-            if( "..." == stream_values[0] )
-            {
-                if( default_publisher_ ) { COMMA_THROW( comma::exception, "multiple output streams have the id: ..." ); }
-                default_publisher_ = std::move( publisher );
-            }
-            else
+            for( auto const& ki : keys )
             {
-                auto publisher_pos = t->insert( std::move( publisher ) );
-                auto const keys = comma::split( stream_values[0], ',' );
+                auto const kii = boost::lexical_cast< T >( ki );
+                if( seen_ids_.end() !=  seen_ids_.find( kii ) ) { COMMA_THROW( comma::exception, "multiple output streams have the id: " << ki ); }
+                seen_ids_.insert( kii );
 
-                for( auto const& ki : keys )
-                {
-                    auto const kii = boost::lexical_cast< T >( ki );
-                    if( seen_ids_.end() !=  seen_ids_.find( kii ) ) { COMMA_THROW( comma::exception, "multiple output streams have the id: " << ki ); }
-                    seen_ids_.insert( kii );
-
-                    mapped_publishers_.insert( std::make_pair( kii, publisher_pos.first->get() ) );
-                }
+                mapped_publishers_.insert( std::make_pair( kii, publisher_pos.first->get() ) );
             }
         }
-        acceptor_thread_ = std::thread( std::bind( &split< T >::accept_, std::ref( *this )));
     }
+    acceptor_thread_ = std::thread( std::bind( &split< T >::accept_, std::ref( *this )));
 }
 
 template < typename T >
@@ -208,23 +214,29 @@ std::ofstream& split< T >::ofstream_by_block_()
     if( !last_ || last_->block != current_.block )
     {
         file_.close();
-        std::string name = boost::lexical_cast< std::string >( current_.block ) + suffix_;
-        file_.open( name.c_str(), mode_ );
+        std::string filename;
+        if( filenames_ )
+        {
+            while( filenames_->good() && !is_shutdown_ ) // poll the name list itself, not std::cin: once the list is exhausted, fall through to the default <block><suffix> name instead of spinning forever
+            {
+                std::getline( *filenames_, filename );
+                if( filename.empty() ) { continue; }
+                const auto& dirname = boost::filesystem::path( filename ).parent_path();
+                if( dirname.empty() || boost::filesystem::is_directory( dirname ) || boost::filesystem::create_directories( dirname ) ) { break; }
+                COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << filename << "'" );
+            }
+        }
+        if( filename.empty() ) { filename = boost::lexical_cast< std::string >( current_.block ) + suffix_; }
+        file_.open( &filename[0], mode_ );
+        if( !file_.is_open() ) { COMMA_THROW( comma::exception, "failed to open '" << filename << "'" ); }
         last_ = current_;
     }
     return file_;
 }
 
-template < typename T >
-static std::string make_filename_from_id(const T& id, std::string suffix )
-{
-    return boost::lexical_cast< std::string >( id ) + suffix;
-}
+template < typename T > static std::string make_filename_from_id( const T& id, const std::string& suffix ) { return boost::lexical_cast< std::string >( id ) + suffix; }
 
-static std::string make_filename_from_id(const boost::posix_time::ptime& id, std::string suffix )
-{
-    return boost::posix_time::to_iso_string( id ) + suffix;
-}
+static std::string make_filename_from_id( const boost::posix_time::ptime& id, const std::string& suffix ) { return boost::posix_time::to_iso_string( id ) + suffix; }
 
 template < typename T >
 std::ofstream& split< T >::ofstream_by_id_()
diff --git a/csv/applications/split/split.h b/csv/applications/split/split.h
index 053097a31..53c4a2580 100644
--- a/csv/applications/split/split.h
+++ b/csv/applications/split/split.h
@@ -30,8 +30,7 @@
 /// @author vsevolod vlaskine
 /// @author cedric wohlleber
 
-#ifndef COMMA_CSV_SPLIT_H
-#define COMMA_CSV_SPLIT_H
+#pragma once
 
 #include <fstream>
 #include <fstream>
@@ -119,23 +118,20 @@ class split
 {
     public:
         typedef applications::input< T > input;
-
         split( boost::optional< boost::posix_time::time_duration > period
              , const std::string& suffix
              , const comma::csv::options& csv
-             , bool passthrough );
-
-        void write( const char* data, unsigned int size );
-        void write( std::string line );
-
-        //to-do
+             , bool passthrough
+             , const std::string& filenames );
         split( boost::optional< boost::posix_time::time_duration > period
              , const std::string& suffix
              , const comma::csv::options& csv
              , const std::vector< std::string >& streams
-             , bool passthrough );
+             , bool passthrough
+             , const std::string& filenames );
         ~split();
-
+        void write( const char* data, unsigned int size );
+        void write( std::string line );
     private:
         std::ofstream& ofstream_by_time_();
         std::ofstream& ofstream_by_block_();
@@ -162,6 +158,7 @@ class split
         ids_type_ seen_ids_;
         bool pass_;
         bool flush_;
+        std::unique_ptr< std::ifstream > filenames_;
 
         //to-do
         bool published_on_stream( const char* data, unsigned int size );
@@ -174,5 +171,3 @@ class split
 };
 
 } } } // namespace comma { namespace csv { namespace applications {
-
-#endif // COMMA_CSV_SPLIT_H

From a9c3d51f0b4feeaf4dae385037f81f879a315b33 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 Aug 2019 17:42:55 +1000
Subject: [PATCH 0047/1056] csv-paste: line-number: --step implemented

---
 csv/applications/csv-paste.cpp | 22 +++++++-----
 csv/test/csv-paste/expected    | 61 ++++++++++++++++++++++++++++++++++
 csv/test/csv-paste/input       |  9 +++++
 3 files changed, 83 insertions(+), 9 deletions(-)

diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index f9043e4e8..75c736079 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -87,7 +87,8 @@ static void usage( bool verbose )
     std::cerr << "            --block-size,--size=<size>: number of records with the same line number; default: 1" << std::endl;
     std::cerr << "                 WARNING: --size: deprecated, since it is confusing for files" << std::endl;
     std::cerr << "            --index; instead of block number output record index in the block" << std::endl;
-    std::cerr << "            --reverse; if --index, output index in descending order" << std::endl;    
+    std::cerr << "            --reverse; if --index, output index in descending order" << std::endl;
+    std::cerr << "            --step=<value>; default=1; line number increment/decrement step" << std::endl;        
     std::cerr << "        examples (try them)" << std::endl;
     std::cerr << "            line number" << std::endl;
     std::cerr << "                seq 0 20 | csv-paste - line-number --begin 5 --size 3" << std::endl;
@@ -201,24 +202,27 @@ class line_number : public source
                 comma::uint32 size;
                 bool index;
                 bool reverse;
+                comma::uint32 step;
                 comma::uint32 begin;
                 std::string format;
                 
-                options( boost::optional< comma::uint32 > b = boost::optional< comma::uint32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false )
+                options( boost::optional< comma::uint32 > b = boost::optional< comma::uint32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false, unsigned int s = 1 )
                     : size( size )
                     , index( index )
                     , reverse( reverse )
+                    , step( s )
                     , begin( begin_( b ) )
                 {
                 }
                 
                 options( const std::string& properties, const comma::command_line_options& o ) // quick and dirty: use visiting instead
                 {
-                    options defaults( boost::optional< comma::uint32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ) );
+                    options defaults( boost::optional< comma::uint32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ), o.value< comma::uint32 >( "--step", 1 ) );
                     comma::name_value::map map( properties, ';', '=' );
                     size = map.value< comma::uint32 >( map.get().find( "block-size" ) != map.get().end() ? "block-size" : "size", defaults.size ); // quick and dirty
                     index = map.value< bool >( "index", defaults.index );
                     reverse = map.value< bool >( "reverse", defaults.reverse );
+                    step = map.value< comma::uint32 >( "step", defaults.step );
                     auto b = map.optional< comma::uint32 >( "begin" );
                     if( !b ) { b = o.optional< comma::uint32 >( "--begin" ); }
                     begin = begin_( b );
@@ -229,8 +233,8 @@ class line_number : public source
             private:
                 comma::uint32 begin_( const boost::optional< comma::uint32 >& b )
                 {
-                    if( index && reverse && b && ( *b + 1 ) < size ) { COMMA_THROW( comma::exception, "for --reverse --index, for --size " << size << " expected --begin not less than " << ( size - 1 ) << "; got: " << *b ); }
-                    return b ? *b : reverse ? size - 1 : 0;
+                    if( index && reverse && b && ( *b + step ) < size * step ) { COMMA_THROW( comma::exception, "for --reverse --index, for --size " << size << " and --step " << step << " expected --begin not less than " << ( size - 1 ) * step << "; got: " << *b ); } // i.e. reject *b < ( size - 1 ) * step; report the same bound that is checked
+                    return b ? *b : reverse ? ( size - 1 ) * step : 0; // default begin: ( size - 1 ) * step if reverse, otherwise 0
                 }
         };
         
@@ -264,14 +268,14 @@ class line_number : public source
         
         void update_()
         {
-            ++count_;
+            ++count_; // count_ is compared against options_.size and reset to 0 below, so it advances by 1 per call, not by step
             if( count_ < options_.size )
             {
-                if( options_.index ) { value_ += options_.reverse ? -1 : 1; }
+                if( options_.index ) { value_ += options_.reverse ? -options_.step : options_.step; }
             }
             else
             {
-                value_ = options_.index ? options_.begin : ( value_ + 1 );
+                value_ = options_.index ? options_.begin : ( value_ + options_.step );
                 count_ = 0;
             }
         }
@@ -283,7 +287,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         char delimiter = options.value( "--delimiter,-d", ',' );
-        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--block-size" );
+        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--step,--block-size" );
         boost::ptr_vector< source > sources;
         bool is_binary = false;
         for( unsigned int i = 0; i < unnamed.size(); ++i ) // quick and dirty; really lousy code duplication
diff --git a/csv/test/csv-paste/expected b/csv/test/csv-paste/expected
index 46ff006b9..ae81fcb6c 100644
--- a/csv/test/csv-paste/expected
+++ b/csv/test/csv-paste/expected
@@ -73,3 +73,64 @@ block_size/binary[0]/output/line[5]="1,2"
 block_size/binary[0]/output/line[6]="1,3"
 block_size/binary[0]/output/line[7]="1,3"
 block_size/binary[0]/status=0
+
+line_number/step[0]/output/line[0]="0"
+line_number/step[0]/output/line[1]="2"
+line_number/step[0]/output/line[2]="4"
+line_number/step[0]/output/line[3]="6"
+line_number/step[0]/status=0
+line_number/step[1]/output/line[0]="0"
+line_number/step[1]/output/line[1]="2"
+line_number/step[1]/output/line[2]="4"
+line_number/step[1]/output/line[3]="6"
+line_number/step[1]/status=0
+line_number/step[2]/output/line[0]="0"
+line_number/step[2]/output/line[1]="2"
+line_number/step[2]/output/line[2]="4"
+line_number/step[2]/output/line[3]="6"
+line_number/step[2]/status=0
+line_number/step[3]/output/line[0]="0"
+line_number/step[3]/output/line[1]="0"
+line_number/step[3]/output/line[2]="0"
+line_number/step[3]/output/line[3]="0"
+line_number/step[3]/output/line[4]="0"
+line_number/step[3]/output/line[5]="2"
+line_number/step[3]/output/line[6]="2"
+line_number/step[3]/output/line[7]="2"
+line_number/step[3]/output/line[8]="2"
+line_number/step[3]/output/line[9]="2"
+line_number/step[3]/status=0
+line_number/step[4]/output/line[0]="0"
+line_number/step[4]/output/line[1]="2"
+line_number/step[4]/output/line[2]="4"
+line_number/step[4]/output/line[3]="6"
+line_number/step[4]/output/line[4]="8"
+line_number/step[4]/output/line[5]="0"
+line_number/step[4]/output/line[6]="2"
+line_number/step[4]/output/line[7]="4"
+line_number/step[4]/output/line[8]="6"
+line_number/step[4]/output/line[9]="8"
+line_number/step[4]/status=0
+line_number/step[5]/output/line[0]="8"
+line_number/step[5]/output/line[1]="6"
+line_number/step[5]/output/line[2]="4"
+line_number/step[5]/output/line[3]="2"
+line_number/step[5]/output/line[4]="0"
+line_number/step[5]/output/line[5]="8"
+line_number/step[5]/output/line[6]="6"
+line_number/step[5]/output/line[7]="4"
+line_number/step[5]/output/line[8]="2"
+line_number/step[5]/output/line[9]="0"
+line_number/step[5]/status=0
+line_number/step[6]/output/line[0]="20"
+line_number/step[6]/output/line[1]="18"
+line_number/step[6]/output/line[2]="16"
+line_number/step[6]/output/line[3]="14"
+line_number/step[6]/output/line[4]="12"
+line_number/step[6]/output/line[5]="20"
+line_number/step[6]/output/line[6]="18"
+line_number/step[6]/output/line[7]="16"
+line_number/step[6]/output/line[8]="14"
+line_number/step[6]/output/line[9]="12"
+line_number/step[6]/status=0
+line_number/step[7]/status=1
diff --git a/csv/test/csv-paste/input b/csv/test/csv-paste/input
index d00c48ad2..331ba378d 100644
--- a/csv/test/csv-paste/input
+++ b/csv/test/csv-paste/input
@@ -29,3 +29,12 @@ line_number/binary[0]="csv-paste 'line-number;binary=ui' | csv-from-bin ui | hea
 
 block_size/ascii[0]="csv-paste <( echo a; echo b )';block-size=4' <( echo 0; echo 1; echo 2; echo 3 )';block-size=2'"
 block_size/binary[0]="csv-paste <( { echo 0; echo 1; } | csv-to-bin ui )';size=4;block-size=4' <( { echo 0; echo 1; echo 2; echo 3; } | csv-to-bin ui )';size=4;block-size=2' | csv-from-bin 2ui"
+
+line_number/step[0]="csv-paste line-number --step 2 | head -n4; comma_status_ok && exit 0 || exit 1"
+line_number/step[1]="csv-paste "line-number;step=2" | head -n4; comma_status_ok && exit 0 || exit 1"
+line_number/step[2]="csv-paste "line-number;step=2" --step 3 | head -n4; comma_status_ok && exit 0 || exit 1"
+line_number/step[3]="csv-paste "line-number;block-size=5;step=2" | head; comma_status_ok && exit 0 || exit 1"
+line_number/step[4]="csv-paste "line-number;block-size=5;index;step=2" | head; comma_status_ok && exit 0 || exit 1"
+line_number/step[5]="csv-paste "line-number;block-size=5;index;reverse;step=2" | head; comma_status_ok && exit 0 || exit 1"
+line_number/step[6]="csv-paste "line-number;block-size=5;index;reverse;begin=20;step=2" | head; comma_status_ok && exit 0 || exit 1"
+line_number/step[7]="csv-paste "line-number;block-size=5;index;reverse;begin=4;step=2" | head; comma_status_ok && exit 0 || exit 1"

From 96d13e377160bafe8bba03bd1ab4e64c288982fb Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 27 Aug 2019 18:49:19 +1000
Subject: [PATCH 0048/1056] csv-sort: --random, --random-seed implemented

---
 csv/applications/csv-sort.cpp | 86 ++++++++++++++++++++++++++++++++---
 1 file changed, 80 insertions(+), 6 deletions(-)

diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index 48d216abf..c2665e071 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -29,10 +29,13 @@
 
 /// @authors matthew imhoff, dewey nguyen, vsevolod vlaskine
 
+#include <algorithm>
 #include <string.h>
 #include <deque>
 #include <iostream>
 #include <map>
+#include <memory>
+#include <random>
 #include <sstream>
 #include <string>
 #include <vector>
@@ -73,7 +76,9 @@ static void usage( bool more )
     std::cerr << "    --max: output record(s) with maximum value, same semantics as --min" << std::endl;
     std::cerr << "           --min and --max may be used together." << std::endl;
     std::cerr << "    --numeric-keys-are-floats,--floats; in ascii, if --format not present, assume that numeric fields are floating point numbers" << std::endl;
-    std::cerr << "    --order <fields>: order in which to sort fields; default is input field order" << std::endl;
+    std::cerr << "    --order=<fields>: order in which to sort fields; default is input field order" << std::endl;
+    std::cerr << "    --random: output input records in pseudo-random order" << std::endl;
+    std::cerr << "    --random-seed,--seed=[<int>]; random seed for --random" << std::endl;
     std::cerr << "    --reverse,--descending,-r: sort in reverse order" << std::endl;
     std::cerr << "    --sliding-window,--window=<size>: sort last <size> entries" << std::endl;
     std::cerr << "    --string,-s: keys are strings; a quick and dirty option to support strings" << std::endl;
@@ -577,9 +582,74 @@ int handle_operations_with_ids( const comma::command_line_options& options )
         }
         
     }
-    
     output_current_block( min_map, max_map );
-    
+    return 0;
+}
+
+static int random( const comma::command_line_options& options ) // output stdin records in pseudo-random order; if block field is present, shuffle each block separately; returns 0 on success, 1 on truncated binary input
+{
+    auto seed = options.optional< int >( "--random-seed,--seed" );
+    std::default_random_engine generator = seed ? std::default_random_engine( *seed ) : std::default_random_engine();
+    std::deque< std::string > records;
+    if( csv.has_field( "block" ) )
+    {
+        comma::csv::input_stream< input_with_block > is( std::cin, csv );
+        comma::uint32 block = 0;
+        while( is.ready() || std::cin.good() )
+        {
+            const input_with_block* p = is.read();
+            if( !p || p->block != block )
+            {
+                // std::shuffle is uniform and well-defined on an empty block; std::random_shuffle required r(n) in [0,n) and is removed in c++17
+                std::shuffle( records.begin(), records.end(), generator );
+                for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
+                if( csv.flush ) { std::cout.flush(); }
+                records.clear();
+                if( p ) { block = p->block; }
+            }
+            if( !p ) { break; }
+            if( csv.binary() )
+            {
+                records.push_back( std::string() );
+                records.back().resize( csv.format().size() );
+                std::memcpy( &records.back()[0], is.binary().last(), csv.format().size() );
+            }
+            else
+            {
+                records.push_back( comma::join( is.ascii().last(), csv.delimiter ) + "\n" );
+            }
+        }
+    }
+    else
+    {
+        // todo: quick and dirty, code duplication
+        // todo: implement --sliding-window
+        if( csv.binary() )
+        {
+            std::string s( csv.format().size(), 0 );
+            while( std::cin.good() )
+            {
+                std::cin.read( &s[0], s.size() );
+                if( std::cin.gcount() == 0 ) { break; }
+                if( std::cin.gcount() != int( s.size() ) ) { std::cerr << "csv-sort: --random: expected " << s.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
+                records.push_back( std::string() );
+                records.back().resize( csv.format().size() );
+                std::memcpy( &records.back()[0], &s[0], csv.format().size() );
+            }
+        }
+        else
+        {
+            while( std::cin.good() )
+            {
+                std::string s;
+                std::getline( std::cin, s );
+                if( !s.empty() ) { records.push_back( s + "\n" ); }
+            }
+        }
+        // std::shuffle is uniform and well-defined on empty input; std::random_shuffle required r(n) in [0,n) and is removed in c++17
+        std::shuffle( records.begin(), records.end(), generator );
+        for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
+    }
     return 0;
 }
 
@@ -674,11 +744,15 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--min,--sliding-window,--window,--unique" );
-        options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--max,--sliding-window,--window,--unique" );
+        options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--min,--sliding-window,--window,--unique,--random" );
+        options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--max,--sliding-window,--window,--unique,--random" );
         verbose = options.exists( "--verbose,-v" );
         csv = comma::csv::options( options );
-        return options.exists( "--first,--min,--max" ) ? handle_operations_with_ids( options ) : sort( options );
+        return   options.exists( "--first,--min,--max" )
+               ? handle_operations_with_ids( options )
+               : options.exists( "--random" )
+               ? random( options )
+               : sort( options );
     }
     catch( std::exception& ex ) { std::cerr << "csv-sort: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-sort: unknown exception" << std::endl; }

From 2dde8cd4a78051a5dda4fc67102ff5a6bdbf2e54 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 28 Aug 2019 10:57:02 +1000
Subject: [PATCH 0049/1056] packed/detail/endian: license fixed

---
 packed/detail/endian.h | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/packed/detail/endian.h b/packed/detail/endian.h
index 80b1b9b75..b27ac37e0 100644
--- a/packed/detail/endian.h
+++ b/packed/detail/endian.h
@@ -1,5 +1,5 @@
-// This file is provided in addition to snark and is not an integral
-// part of snark library.
+// This file is provided in addition to comma and is not an integral
+// part of comma library.
 // Copyright (c) 2018 Vsevolod Vlaskine
 // All rights reserved.
 //
@@ -25,7 +25,7 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-// snark is a generic and flexible library for robotics research
+// comma is a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
 //

From 1c9bdf192198ecf417f2737b74c3fea8bc9f9fe7 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 28 Aug 2019 11:29:59 +1000
Subject: [PATCH 0050/1056] csv-random: first cut of shuffle operation
 implemented

---
 csv/applications/CMakeLists.txt |   4 +
 csv/applications/csv-random.cpp | 253 ++++++++++++++++++++++++++++++++
 2 files changed, 257 insertions(+)
 create mode 100644 csv/applications/csv-random.cpp

diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index 5a76792c2..a165fa65c 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -110,6 +110,10 @@ add_executable( csv-units ${dir}/csv-units.cpp )
 target_link_libraries ( csv-units ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
 install( TARGETS csv-units RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
+add_executable( csv-random ${dir}/csv-random.cpp )
+target_link_libraries ( csv-random ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+install( TARGETS csv-random RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
 add_executable( csv-update ${dir}/csv-update.cpp )
 target_link_libraries ( csv-update ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
 install( TARGETS csv-update RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
new file mode 100644
index 000000000..b01b7e827
--- /dev/null
+++ b/csv/applications/csv-random.cpp
@@ -0,0 +1,253 @@
+// This file is provided in addition to comma and is not an integral
+// part of comma library.
+// Copyright (c) 2018 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+// comma is a generic and flexible library
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+/// @author vsevolod vlaskine
+
+#include <algorithm>
+#include <string.h>
+#include <deque>
+#include <iostream>
+#include <map>
+#include <memory>
+#include <random>
+#include <sstream>
+#include <string>
+#include <vector>
+#include "../../application/command_line_options.h"
+#include "../../base/exception.h"
+#include "../../base/types.h"
+#include "../../csv/stream.h"
+#include "../../csv/traits.h"
+#include "../../string/string.h"
+#include "../../visiting/traits.h"
+
+static void usage( bool more )
+{
+    std::cerr << std::endl;
+    std::cerr << "Sort a csv file using one or several keys" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "Usage: cat something.csv | csv-random [<options>]" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "Options:" << std::endl;
+    std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
+    std::cerr << "    --discard-out-of-order,--discard-unsorted: instead of sorting, discard records out of order" << std::endl;
+    std::cerr << "    --first: first line matching given keys; first line in the block, if block field present; no sorting will be done; if sorting required, use unique instead" << std::endl;
+    std::cerr << "           fields" << std::endl;
+    std::cerr << "               id: if present, multiple id fields accepted; output first record for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;
+    std::cerr << "               block: if present; output minimum for each contiguous block" << std::endl;
+    std::cerr << "    --min: output only record(s) with minimum value for a given field." << std::endl;
+    std::cerr << "           fields" << std::endl;
+    std::cerr << "               id: if present, multiple id fields accepted; output minimum for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;
+    std::cerr << "               block: if present; output minimum for each contiguous block" << std::endl;
+    std::cerr << "    --max: output record(s) with maximum value, same semantics as --min" << std::endl;
+    std::cerr << "           --min and --max may be used together." << std::endl;
+    std::cerr << "    --numeric-keys-are-floats,--floats; in ascii, if --format not present, assume that numeric fields are floating point numbers" << std::endl;
+    std::cerr << "    --order=<fields>: order in which to sort fields; default is input field order" << std::endl;
+    std::cerr << "    --random: output input records in pseudo-random order" << std::endl;
+    std::cerr << "    --random-seed,--seed=[<int>]; random seed for --random" << std::endl;
+    std::cerr << "    --reverse,--descending,-r: sort in reverse order" << std::endl;
+    std::cerr << "    --sliding-window,--window=<size>: sort last <size> entries" << std::endl;
+    std::cerr << "    --string,-s: keys are strings; a quick and dirty option to support strings" << std::endl;
+    std::cerr << "                 default: double" << std::endl;
+    std::cerr << "    --unique,-u: sort input, output only the first line matching given keys; if no sorting required, use --first for better performance" << std::endl;
+    std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "examples" << std::endl;
+    std::cerr << "    sort by first field:" << std::endl;
+    std::cerr << "        echo -e \"2\\n1\\n3\" | csv-random --fields=a" << std::endl;
+    std::cerr << "    sort by second field:" << std::endl;
+    std::cerr << "        echo -e \"2,3\\n1,1\\n3,2\" | csv-random --fields=,b" << std::endl;
+    std::cerr << "    sort by second field then first field:" << std::endl;
+    std::cerr << "        echo -e \"2,3\\n3,1\\n1,1\\n2,2\\n1,3\" | csv-random --fields=a,b --order=b,a" << std::endl;
+    std::cerr << "    minimum (using maximum would be the same):" << std::endl;
+    std::cerr << "        basic use" << std::endl;
+    std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,a,3; ) | csv-random --min --fields=,,a" << std::endl;
+    std::cerr << "        using single id" << std::endl;
+    std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,b,3; ) | csv-random --min --fields=a,id" << std::endl;
+    std::cerr << "        using multiple id fields" << std::endl;
+    std::cerr << "            ( echo 1,a,1; echo 1,b,1; echo 3,b,5; echo 3,b,5; ) | csv-random --min --fields=id,a,id" << std::endl;
+    std::cerr << "        using block" << std::endl;
+    std::cerr << "            ( echo 0,a,2; echo 0,a,2; echo 0,b,3; echo 0,b,1; echo 1,c,3; echo 1,c,2; ) | csv-random --min --fields=block,,a" << std::endl;
+    std::cerr << "        using block and id" << std::endl;
+    std::cerr << "            ( echo 0,a,2; echo 0,a,2; echo 0,b,3; echo 0,b,1; echo 1,c,3; echo 1,c,2; ) | csv-random --min --fields=block,id,a" << std::endl;
+    std::cerr << "    minimum and maximum:" << std::endl;
+    std::cerr << "        basic use" << std::endl;
+    std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,b,3; echo 5,b,7; echo 3,b,9 ) | csv-random --max --min --fields=,,a" << std::endl;
+    std::cerr << "        using id" << std::endl;
+    std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,b,3; echo 5,b,7; echo 3,b,9 ) | csv-random --max --min --fields=,id,a" << std::endl;
+    std::cerr << std::endl;
+    if( more )
+    {
+        std::cerr << std::endl;
+        std::cerr << "csv options:" << std::endl;
+        std::cerr << comma::csv::options::usage() << std::endl;
+    }
+    exit( 0 );
+}
+
+static bool verbose;
+static comma::csv::options csv;
+static boost::optional< int > seed;
+
+namespace comma { namespace applications { namespace random { namespace shuffle {
+
+struct input
+{
+    comma::uint32 block;
+    input(): block( 0 ) {}
+};
+
+} } } } // namespace comma { namespace applications { namespace random { namespace shuffle {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::applications::random::shuffle::input >
+{
+    template < typename K, typename V > static void visit( const K&, const comma::applications::random::shuffle::input& p, V& v ) { v.apply( "block", p.block ); }
+    template < typename K, typename V > static void visit( const K&, comma::applications::random::shuffle::input& p, V& v ) { v.apply( "block", p.block ); }
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace applications { namespace random { namespace shuffle {
+
+static int run( const comma::command_line_options& options ) // output stdin records in pseudo-random order; if block field is present, shuffle each block separately; returns 0 on success, 1 on truncated binary input
+{
+    std::default_random_engine generator = seed ? std::default_random_engine( *seed ) : std::default_random_engine();
+    std::deque< std::string > records;
+    if( ::csv.has_field( "block" ) )
+    {
+        comma::csv::input_stream< input > is( std::cin, ::csv );
+        comma::uint32 block = 0;
+        while( is.ready() || std::cin.good() )
+        {
+            const input* p = is.read();
+            if( !p || p->block != block )
+            {
+                // std::shuffle is uniform and well-defined on an empty block; std::random_shuffle required r(n) in [0,n) and is removed in c++17
+                std::shuffle( records.begin(), records.end(), generator );
+                for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
+                if( ::csv.flush ) { std::cout.flush(); }
+                records.clear();
+                if( p ) { block = p->block; }
+            }
+            if( !p ) { break; }
+            if( ::csv.binary() )
+            {
+                records.push_back( std::string() );
+                records.back().resize( ::csv.format().size() );
+                std::memcpy( &records.back()[0], is.binary().last(), ::csv.format().size() );
+            }
+            else
+            {
+                records.push_back( comma::join( is.ascii().last(), ::csv.delimiter ) + "\n" );
+            }
+        }
+    }
+    else
+    {
+        // todo: quick and dirty, code duplication
+        // todo: implement --sliding-window
+        if( ::csv.binary() )
+        {
+            std::string s( ::csv.format().size(), 0 );
+            while( std::cin.good() )
+            {
+                std::cin.read( &s[0], s.size() );
+                if( std::cin.gcount() == 0 ) { break; }
+                if( std::cin.gcount() != int( s.size() ) ) { std::cerr << "csv-random: random: expected " << s.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
+                records.push_back( std::string() );
+                records.back().resize( ::csv.format().size() );
+                std::memcpy( &records.back()[0], &s[0], ::csv.format().size() );
+            }
+        }
+        else
+        {
+            while( std::cin.good() )
+            {
+                std::string s;
+                std::getline( std::cin, s );
+                if( !s.empty() ) { records.push_back( s + "\n" ); }
+            }
+        }
+        // std::shuffle is uniform and well-defined on empty input; std::random_shuffle required r(n) in [0,n) and is removed in c++17
+        std::shuffle( records.begin(), records.end(), generator );
+        for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
+    }
+    return 0;
+}
+
+} } } } // namespace comma { namespace applications { namespace random { namespace shuffle {
+
+int main( int ac, char** av ) // parse command line and dispatch to the requested operation; returns the operation's exit code, or 1 on error
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        const auto& unnamed = options.unnamed( "--flush,--verbose,-v", "-.*" );
+        if( unnamed.empty() ) { std::cerr << "csv-random: please specify operation" << std::endl; return 1; }
+        csv = comma::csv::options( options );
+        seed = options.optional< int >( "--seed" );
+        verbose = options.exists( "--verbose,-v" );
+        std::string operation = unnamed[0]; // the first unnamed argument selects the operation
+        if( operation == "shuffle" ) { return comma::applications::random::shuffle::run( options ); }
+        std::cerr << "csv-random: expected operation; got: '" << operation << "'" << std::endl;
+        return 1;
+    }
+    catch( std::exception& ex ) { std::cerr << "csv-random: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-random: unknown exception" << std::endl; }
+    return 1;
+}

From 9018f4531685e69929e52be86ea33fd8631c8d1b Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 28 Aug 2019 18:09:26 +1000
Subject: [PATCH 0051/1056] csv-random: shuffle: help added

---
 csv/applications/csv-random.cpp | 85 +++++++++------------------------
 1 file changed, 23 insertions(+), 62 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index b01b7e827..2ca8b3bd5 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -74,67 +74,23 @@
 #include "../../string/string.h"
 #include "../../visiting/traits.h"
 
-static void usage( bool more )
+static void usage( bool verbose )
 {
     std::cerr << std::endl;
-    std::cerr << "Sort a csv file using one or several keys" << std::endl;
+    std::cerr << "random operations on input stream" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "Usage: cat something.csv | csv-random [<options>]" << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --seed=[<int>]; random seed" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "Options:" << std::endl;
-    std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
-    std::cerr << "    --discard-out-of-order,--discard-unsorted: instead of sorting, discard records out of order" << std::endl;
-    std::cerr << "    --first: first line matching given keys; first line in the block, if block field present; no sorting will be done; if sorting required, use unique instead" << std::endl;
-    std::cerr << "           fields" << std::endl;
-    std::cerr << "               id: if present, multiple id fields accepted; output first record for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;
-    std::cerr << "               block: if present; output minimum for each contiguous block" << std::endl;
-    std::cerr << "    --min: output only record(s) with minimum value for a given field." << std::endl;
-    std::cerr << "           fields" << std::endl;
-    std::cerr << "               id: if present, multiple id fields accepted; output minimum for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;
-    std::cerr << "               block: if present; output minimum for each contiguous block" << std::endl;
-    std::cerr << "    --max: output record(s) with maximum value, same semantics as --min" << std::endl;
-    std::cerr << "           --min and --max may be used together." << std::endl;
-    std::cerr << "    --numeric-keys-are-floats,--floats; in ascii, if --format not present, assume that numeric fields are floating point numbers" << std::endl;
-    std::cerr << "    --order=<fields>: order in which to sort fields; default is input field order" << std::endl;
-    std::cerr << "    --random: output input records in pseudo-random order" << std::endl;
-    std::cerr << "    --random-seed,--seed=[<int>]; random seed for --random" << std::endl;
-    std::cerr << "    --reverse,--descending,-r: sort in reverse order" << std::endl;
-    std::cerr << "    --sliding-window,--window=<size>: sort last <size> entries" << std::endl;
-    std::cerr << "    --string,-s: keys are strings; a quick and dirty option to support strings" << std::endl;
-    std::cerr << "                 default: double" << std::endl;
-    std::cerr << "    --unique,-u: sort input, output only the first line matching given keys; if no sorting required, use --first for better performance" << std::endl;
-    std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
+    std::cerr << "operations" << std::endl;
+    std::cerr << "    shuffle: output input records in pseudo-random order" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --fields=[<fields>]; if 'block' field present shuffle each block, otherwise read whole input and then shuffle" << std::endl;
+    std::cerr << "            --sliding-window,--window=[<size>]; shuffle on sliding window of <size> records" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << "    sort by first field:" << std::endl;
-    std::cerr << "        echo -e \"2\\n1\\n3\" | csv-random --fields=a" << std::endl;
-    std::cerr << "    sort by second field:" << std::endl;
-    std::cerr << "        echo -e \"2,3\\n1,1\\n3,2\" | csv-random --fields=,b" << std::endl;
-    std::cerr << "    sort by second field then first field:" << std::endl;
-    std::cerr << "        echo -e \"2,3\\n3,1\\n1,1\\n2,2\\n1,3\" | csv-random --fields=a,b --order=b,a" << std::endl;
-    std::cerr << "    minimum (using maximum would be the same):" << std::endl;
-    std::cerr << "        basic use" << std::endl;
-    std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,a,3; ) | csv-random --min --fields=,,a" << std::endl;
-    std::cerr << "        using single id" << std::endl;
-    std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,b,3; ) | csv-random --min --fields=a,id" << std::endl;
-    std::cerr << "        using multiple id fields" << std::endl;
-    std::cerr << "            ( echo 1,a,1; echo 1,b,1; echo 3,b,5; echo 3,b,5; ) | csv-random --min --fields=id,a,id" << std::endl;
-    std::cerr << "        using block" << std::endl;
-    std::cerr << "            ( echo 0,a,2; echo 0,a,2; echo 0,b,3; echo 0,b,1; echo 1,c,3; echo 1,c,2; ) | csv-random --min --fields=block,,a" << std::endl;
-    std::cerr << "        using block and id" << std::endl;
-    std::cerr << "            ( echo 0,a,2; echo 0,a,2; echo 0,b,3; echo 0,b,1; echo 1,c,3; echo 1,c,2; ) | csv-random --min --fields=block,id,a" << std::endl;
-    std::cerr << "    minimum and maximum:" << std::endl;
-    std::cerr << "        basic use" << std::endl;
-    std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,b,3; echo 5,b,7; echo 3,b,9 ) | csv-random --max --min --fields=,,a" << std::endl;
-    std::cerr << "        using id" << std::endl;
-    std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,b,3; echo 5,b,7; echo 3,b,9 ) | csv-random --max --min --fields=,id,a" << std::endl;
+    std::cerr << "csv options:" << std::endl;
+    std::cerr << comma::csv::options::usage( "", verbose ) << std::endl;
     std::cerr << std::endl;
-    if( more )
-    {
-        std::cerr << std::endl;
-        std::cerr << "csv options:" << std::endl;
-        std::cerr << comma::csv::options::usage() << std::endl;
-    }
     exit( 0 );
 }
 
@@ -168,8 +124,16 @@ static int run( const comma::command_line_options& options )
 {
     std::default_random_engine generator = seed ? std::default_random_engine( *seed ) : std::default_random_engine();
     std::deque< std::string > records;
+    auto output = []( std::deque< std::string >& records )
+    { 
+        for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
+        records.clear();
+        if( ::csv.flush ) { std::cout.flush(); }
+    };
+    auto sliding_window = options.optional< unsigned int >( "--sliding-window,--window" );
     if( ::csv.has_field( "block" ) )
     {
+        if( sliding_window ) { std::cerr << "csv-random: shuffle: expected either block field or --sliding-window; got both" << std::endl; return 1; }
         comma::csv::input_stream< input > is( std::cin, ::csv );
         comma::uint32 block = 0;
         while( is.ready() || std::cin.good() )
@@ -179,9 +143,7 @@ static int run( const comma::command_line_options& options )
             {
                 std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
                 std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( generator ); } ); // quick and dirty, watch performance
-                for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
-                if( ::csv.flush ) { std::cout.flush(); }
-                records.clear();
+                output( records );
                 if( p ) { block = p->block; }
             }
             if( !p ) { break; }
@@ -197,10 +159,9 @@ static int run( const comma::command_line_options& options )
             }
         }
     }
-    else
+    else // quick and dirty
     {
-        // todo: quick and dirty, code duplication
-        // todo: implement --sliding-window
+        if( sliding_window ) { std::cerr << "csv-random: shuffle: --sliding-window: todo" << std::endl; return 1; }
         if( ::csv.binary() )
         {
             std::string s( ::csv.format().size(), 0 );
@@ -225,7 +186,7 @@ static int run( const comma::command_line_options& options )
         }
         std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
         std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( generator ); } ); // quick and dirty, watch performance
-        for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
+        output( records );
     }
     return 0;
 }

From aeaeb8d43b7e248d6899497dd0515900272ddacc Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 28 Aug 2019 18:17:23 +1000
Subject: [PATCH 0052/1056] csv-random: shuffle: usage added

---
 csv/applications/csv-random.cpp | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 2ca8b3bd5..aa5e5b038 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -84,9 +84,12 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
     std::cerr << "    shuffle: output input records in pseudo-random order" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "        usage: cat records.csv | csv-random shuffle [<options>] > shuffled.csv" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --fields=[<fields>]; if 'block' field present shuffle each block, otherwise read whole input and then shuffle" << std::endl;
-    std::cerr << "            --sliding-window,--window=[<size>]; shuffle on sliding window of <size> records" << std::endl;
+    std::cerr << "            --sliding-window,--window=[<size>]; todo: shuffle on sliding window of <size> records" << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options:" << std::endl;
     std::cerr << comma::csv::options::usage( "", verbose ) << std::endl;

From 7afae910910f9e97e7f3824df21d27ce8eda9fc1 Mon Sep 17 00:00:00 2001
From: Toby Dunne <toby@abysssolutions.com.au>
Date: Tue, 22 Oct 2019 13:53:57 +1100
Subject: [PATCH 0053/1056] zero-cat: compilation error with new boost fixed:
 milliseconds cast to long explicitly

---
 io/applications/zero-cat.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/io/applications/zero-cat.cpp b/io/applications/zero-cat.cpp
index fef48ef75..52ac3750a 100644
--- a/io/applications/zero-cat.cpp
+++ b/io/applications/zero-cat.cpp
@@ -272,7 +272,7 @@ int main(int argc, char* argv[])
                 else { socket.bind( &endpoints[i][0] ); }
             }
             // we convert to milliseconds as converting to second floors the number so 0.99 becomes 0
-            if( wait_after_connect > 0 ) { boost::this_thread::sleep(boost::posix_time::milliseconds(wait_after_connect * 1000.0)); }
+            if( wait_after_connect > 0 ) { boost::this_thread::sleep(boost::posix_time::milliseconds( static_cast< long >( wait_after_connect * 1000.0 ) ) ); }
             
             std::string buffer;
             if( binary ) { buffer.resize( size ); }
@@ -311,7 +311,7 @@ int main(int argc, char* argv[])
                 else { socket.connect( endpoints[i].c_str() ); }
             }
             socket.setsockopt( ZMQ_SUBSCRIBE, "", 0 );
-            if( wait_after_connect > 0 ) { boost::this_thread::sleep( boost::posix_time::milliseconds( wait_after_connect * 1000.0 ) ); }
+            if( wait_after_connect > 0 ) { boost::this_thread::sleep( boost::posix_time::milliseconds( static_cast< long >( wait_after_connect * 1000.0 ) ) ); }
             if( vm.count( "server" ) )
             {
                 comma::io::publisher publisher( server, comma::io::mode::binary, true, false );

From d44da1e42d3969309f5c8fafb2ad743f9158eb9c Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 22 Oct 2019 14:39:05 +1100
Subject: [PATCH 0054/1056] io/test/stream_test: missing include added
 (compilation failed with boost 1.67 using more consistent includes)

---
 io/test/stream_test.cpp | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/io/test/stream_test.cpp b/io/test/stream_test.cpp
index 388702229..27133a78b 100644
--- a/io/test/stream_test.cpp
+++ b/io/test/stream_test.cpp
@@ -30,6 +30,7 @@
 #include <cstdio>
 #include <fstream>
 #include <gtest/gtest.h>
+#include <boost/asio/io_service.hpp>
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
 #include <boost/filesystem/operations.hpp>
@@ -146,4 +147,5 @@ int main( int argc, char* argv[] )
 {
     ::testing::InitGoogleTest(&argc, argv);
     return RUN_ALL_TESTS();
-}
\ No newline at end of file
+}
+

From cc89ca7d091685c534de5e3272edde6f3f67710d Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 14 Nov 2019 14:18:12 +1100
Subject: [PATCH 0055/1056] python/setup.py: fixed url

---
 python/setup.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/setup.py b/python/setup.py
index eaf1d4e55..9f31132c5 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -6,7 +6,7 @@
         name                = 'comma',
         version             = open('comma/version.py').readlines()[-1].strip().split()[-1].strip('\"'),
         description         = 'comma python utilties',
-        url                 = 'https://github.com/acfr/comma',
+        url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma.cpp_bindings': 'comma/cpp_bindings' },

From c951bfd8c1325fed4bf55c846b88d11849e6eea7 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 14 Nov 2019 14:29:38 +1100
Subject: [PATCH 0056/1056] python: small steps to port to python3

---
 python/comma/numpy/functions.py           | 20 ++++++------
 python/comma/numpy/test/test_functions.py | 37 ++++++++++++-----------
 2 files changed, 29 insertions(+), 28 deletions(-)

diff --git a/python/comma/numpy/functions.py b/python/comma/numpy/functions.py
index 277e9c8a3..3ea7fbabd 100644
--- a/python/comma/numpy/functions.py
+++ b/python/comma/numpy/functions.py
@@ -28,6 +28,7 @@
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import absolute_import
+from __future__ import print_function
 import numpy as np
 import operator
 import re
@@ -114,14 +115,14 @@ def types_of_dtype(dtype, unroll=False):
         return tuple(types)
     except ValueError:
         import sys
-        print >>sys.stderr
-        print >>sys.stderr, "ATTENTION: types_of_dtype failed due to the version of numpy on this computer"
-        print >>sys.stderr, "           your applications using comma.csv will mostly work; sometimes they will fail"
-        print >>sys.stderr, "           early (meaning you will know straight away) until types_of_dtype is rewritten"
-        print >>sys.stderr, "           See todo comment in python/comma/numpy/functions.py"
-        print >>sys.stderr
-        for s in sys.exc_info(): print >>sys.stderr, "           " + str( s )
-        print >>sys.stderr
+        print( file = sys.stderr )
+        print( "ATTENTION: types_of_dtype failed due to the version of numpy on this computer", file = sys.stderr )
+        print( "           your applications using comma.csv will mostly work; sometimes they will fail", file = sys.stderr )
+        print( "           early (meaning you will know straight away) until types_of_dtype is rewritten", file = sys.stderr )
+        print( "           See todo comment in python/comma/numpy/functions.py", file = sys.stderr )
+        print( file = sys.stderr )
+        for s in sys.exc_info(): print( "           " + str( s ), file = sys.stderr )
+        print( file = sys.stderr )
         raise
 
 def structured_dtype(format_or_type):
@@ -140,8 +141,7 @@ def structured_dtype(format_or_type):
     >>> np.dtype('f8').names
     """
     dtype = np.dtype(format_or_type)
-    if len(dtype) != 0:
-        return dtype
+    if len(dtype) != 0: return dtype
     return np.dtype([('', format_or_type)])
 
 
diff --git a/python/comma/numpy/test/test_functions.py b/python/comma/numpy/test/test_functions.py
index 6a7f184fd..685f3d6bd 100644
--- a/python/comma/numpy/test/test_functions.py
+++ b/python/comma/numpy/test/test_functions.py
@@ -1,3 +1,4 @@
+from __future__ import print_function
 import unittest
 import numpy as np
 from comma.numpy import *
@@ -177,34 +178,34 @@ def test_structure_out_of_order(self):
             self.assertEqual( len( functions.types_of_dtype( ndtype2 ) ), 5 )  # shall be 4
         except ValueError:
             import sys
-            print >>sys.stderr
-            print >>sys.stderr, "ATTENTION: test_structure_out_of_order failed due to the version of numpy on this computer"
-            print >>sys.stderr, "           your applications using comma.csv will mostly work; sometimes they will fail"
-            print >>sys.stderr, "           early (meaning you will know straight away) until types_of_dtype is rewritten"
-            print >>sys.stderr, "           See todo comment in python/comma/numpy/functions.py"
-            print >>sys.stderr
-            for s in sys.exc_info(): print >>sys.stderr, "           " + str( s )
-            print >>sys.stderr
+            print( file = sys.stderr )
+            print( "ATTENTION: test_structure_out_of_order failed due to the version of numpy on this computer", file = sys.stderr )
+            print( "           your applications using comma.csv will mostly work; sometimes they will fail", file = sys.stderr )
+            print( "           early (meaning you will know straight away) until types_of_dtype is rewritten", file = sys.stderr )
+            print( "           See todo comment in python/comma/numpy/functions.py", file = sys.stderr )
+            print( file = sys.stderr )
+            for s in sys.exc_info(): print( "           " + str( s ), file = sys.stderr )
+            print( file = sys.stderr )
 
         if False:
             import sys
             self.assertEqual( sorted( ndtype1.descr ), sorted( ndtype2.descr ) )
             self.assertEqual( sorted( functions.types_of_dtype( ndtype1 ) ), sorted( functions.types_of_dtype( ndtype2 ) ) )
 
-            print >>sys.stderr, "observe the differences:"
+            print( "observe the differences:", file = sys.stderr )
 
-            print >>sys.stderr, "ndtype1: ", ndtype1
-            print >>sys.stderr, "ndtype2: ", ndtype2
+            print( "ndtype1: " + str( ndtype1 ), file = sys.stderr )
+            print( "ndtype2: " + str( ndtype2 ), file = sys.stderr )
 
-            print >>sys.stderr, "ndtype1.fields: ", ndtype1.fields
-            print >>sys.stderr, "ndtype2.fields: ", ndtype2.fields
-            print >>sys.stderr, "fields identical: ", sorted_fields1 == sorted_fields2
+            print( "ndtype1.fields: " + str( ndtype1.fields ), file = sys.stderr )
+            print( "ndtype2.fields: " + str( ndtype2.fields ), file = sys.stderr )
+            print( "fields identical: " + str( sorted_fields1 == sorted_fields2 ), file = sys.stderr )
 
-            print >>sys.stderr, "ndtype1.descr: ", ndtype1.descr
-            print >>sys.stderr, "ndtype2.descr: ", ndtype2.descr
+            print( "ndtype1.descr: " + str( ndtype1.descr ), file = sys.stderr )
+            print( "ndtype2.descr: " + str( ndtype2.descr ), file = sys.stderr )
 
-            print >>sys.stderr, "types_of_dtype( ndtype1 ): ", comma.numpy.functions.types_of_dtype( ndtype1 )
-            print >>sys.stderr, "types_of_dtype( ndtype2 ): ", comma.numpy.functions.types_of_dtype( ndtype2 )
+            print( "types_of_dtype( ndtype1 ): " + str( comma.numpy.functions.types_of_dtype( ndtype1 ) ), file = sys.stderr )
+            print( "types_of_dtype( ndtype2 ): " + str( comma.numpy.functions.types_of_dtype( ndtype2 ) ), file = sys.stderr )
 
 
 if __name__ == '__main__':

From dcfe6f954a77e750f3f3a10d9d47d5cbfcac6baa Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 14 Nov 2019 14:55:10 +1100
Subject: [PATCH 0057/1056] python: more small steps to port to python3

---
 python/comma/csv/test/numpy_format/test       |  3 +-
 python/comma/csv/test/numpy_guess_format/test |  3 +-
 python/comma/csv/test/numpy_time/test         |  3 +-
 python/comma/csv/test/stream/buffer_size/test |  7 ++--
 .../stream/stdin/corrupt_input/ascii/test     |  3 +-
 .../stream/stdin/corrupt_input/binary/test    |  3 +-
 python/comma/csv/test/struct/test             | 40 ++++++++++---------
 7 files changed, 36 insertions(+), 26 deletions(-)

diff --git a/python/comma/csv/test/numpy_format/test b/python/comma/csv/test/numpy_format/test
index 54ff41831..876acea0e 100755
--- a/python/comma/csv/test/numpy_format/test
+++ b/python/comma/csv/test/numpy_format/test
@@ -5,12 +5,13 @@ function comma_format_to_numpy
     local compress=$2
     compress=${compress:+", $compress"}
     python -c "$( cat <<END
+from __future__ import print_function
 import comma
 import numpy
 
 numpy_format = comma.csv.format.to_numpy( '$1' $compress )
 numpy.dtype( ','.join( numpy_format ) )
-print ','.join( numpy_format )
+print( ','.join( numpy_format ) )
 END
 )"
 }
diff --git a/python/comma/csv/test/numpy_guess_format/test b/python/comma/csv/test/numpy_guess_format/test
index 31df8eac3..29df57222 100755
--- a/python/comma/csv/test/numpy_guess_format/test
+++ b/python/comma/csv/test/numpy_guess_format/test
@@ -3,11 +3,12 @@
 function comma_guess_format
 {
     python -c "$( cat <<END
+from __future__ import print_function
 import comma
 import numpy
 
 guessed_format = comma.csv.format.guess_format( ['$1'] )
-print guessed_format
+print( guessed_format )
 END
 )"
 }
diff --git a/python/comma/csv/test/numpy_time/test b/python/comma/csv/test/numpy_time/test
index d71e39510..90a84acb0 100755
--- a/python/comma/csv/test/numpy_time/test
+++ b/python/comma/csv/test/numpy_time/test
@@ -2,13 +2,14 @@
 
 function comma_time_roundabout {
     python -c "$( cat <<END
+from __future__ import print_function
 import numpy
 import comma
 
 comma_time = '$@'
 numpy_time = comma.csv.time.to_numpy( comma_time )
 if isinstance( numpy_time, numpy.datetime64 ):
-  print comma.csv.time.from_numpy( numpy_time )
+  print( comma.csv.time.from_numpy( numpy_time ) )
 END
 )"
 }
diff --git a/python/comma/csv/test/stream/buffer_size/test b/python/comma/csv/test/stream/buffer_size/test
index a71d36f9c..c2da902de 100755
--- a/python/comma/csv/test/stream/buffer_size/test
+++ b/python/comma/csv/test/stream/buffer_size/test
@@ -1,16 +1,17 @@
 #!/bin/bash
 
-function get_buffer_size_in_bytes { python -c "import comma; print comma.csv.stream.buffer_size_in_bytes"; }
+function get_buffer_size_in_bytes { python -c "from __future__ import print_function; import comma; print( comma.csv.stream.buffer_size_in_bytes )"; }
 
 function get_default_size
 {
     local fields=$1
     local type=$2
     python -c "$( cat <<END
+from __future__ import print_function
 import comma
 fields='$fields'
 types = ('$type',) * len( fields.split(',') )
-print comma.csv.stream( comma.csv.struct( fields, *types ) ).size
+print( comma.csv.stream( comma.csv.struct( fields, *types ) ).size )
 END
 )"
 }
@@ -18,6 +19,6 @@ END
 echo "buffer_size_in_bytes=$( get_buffer_size_in_bytes )"
 
 fields="x,y"
-echo "number_of_fields=$( python -c "s = '$fields'; print len( s.split(',') )" )"
+echo "number_of_fields=$( python -c "from __future__ import print_function; s = '$fields'; print( len( s.split(',') ) )" )"
 echo "size/uint8=$( get_default_size $fields uint8 )"
 echo "size/float64=$( get_default_size $fields float64 )"
diff --git a/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test b/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test
index 7eba8e0ce..a4754d1e1 100755
--- a/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test
+++ b/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test
@@ -5,6 +5,7 @@ source $( which comma-application-util )
 function process_records
 {
     python -c "$( cat <<END
+from __future__ import print_function
 import comma
 import numpy
 
@@ -17,7 +18,7 @@ try:
     for r in record_stream.iter( size=-1 ):
         pass
 except ValueError:
-    print "exception=ValueError"
+    print( "exception=ValueError" )
 END
 )"
 }
diff --git a/python/comma/csv/test/stream/stdin/corrupt_input/binary/test b/python/comma/csv/test/stream/stdin/corrupt_input/binary/test
index d7ed00bbd..ec1cd6000 100755
--- a/python/comma/csv/test/stream/stdin/corrupt_input/binary/test
+++ b/python/comma/csv/test/stream/stdin/corrupt_input/binary/test
@@ -5,6 +5,7 @@ source $( which comma-application-util )
 function process_records
 {
     python -c "$( cat <<END
+from __future__ import print_function
 import comma
 import numpy
 
@@ -17,7 +18,7 @@ try:
     for r in record_stream.iter( size=-1 ):
         pass
 except ValueError:
-    print "exception=ValueError"
+    print( "exception=ValueError" )
 END
 )"
 }
diff --git a/python/comma/csv/test/struct/test b/python/comma/csv/test/struct/test
index 5e9980a19..fba303d46 100755
--- a/python/comma/csv/test/struct/test
+++ b/python/comma/csv/test/struct/test
@@ -52,14 +52,15 @@ END
 function shorthand
 {
     python -c "$( cat <<END
+from __future__ import print_function
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
 timestamped_point_t = comma.csv.struct( 't,coordinates', 'datetime64[us]', point_t )
 record_t = comma.csv.struct( 'observer,event', 'S3', timestamped_point_t )
 for i,name in enumerate( [ 'event', 'event/coordinates' ] ):
-  print "shorthand[{}]/name={}".format( i, name )
-  print "shorthand[{}]/value={}".format( i, ','.join( record_t.shorthand[name] ) )
+  print( "shorthand[{}]/name={}".format( i, name ) )
+  print( "shorthand[{}]/value={}".format( i, ','.join( record_t.shorthand[name] ) ) )
 END
 )"
 }
@@ -67,6 +68,7 @@ END
 function leaves
 {
     python -c "$( cat <<END
+from __future__ import print_function
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
@@ -74,7 +76,7 @@ timestamped_point_t = comma.csv.struct( 't,coordinates', 'datetime64[us]', point
 observer_t = comma.csv.struct( 'name,id', 'S3', 'uint32' )
 record_t = comma.csv.struct( 'observer,event,value', observer_t, timestamped_point_t, 'float64' )
 for leaf,xpath in record_t.xpath_of_leaf.iteritems():
-  print "leaves/{}={}".format( leaf, record_t.xpath_of_leaf.get( leaf ) )
+  print( "leaves/{}={}".format( leaf, record_t.xpath_of_leaf.get( leaf ) ) )
 END
 )"
 }
@@ -83,12 +85,13 @@ function record
 {
     local what=$1
     python -c "$( cat <<END
+from __future__ import print_function
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
 timestamped_point_t = comma.csv.struct( 't,coordinates', 'datetime64[us]', point_t )
 record_t = comma.csv.struct( 'observer,event', 'S3', timestamped_point_t )
-print ','.join( record_t.$what )
+print( ','.join( record_t.$what ) )
 END
 )"
 }
@@ -97,6 +100,7 @@ function assign()
 {
     local what=$1
     python -c "
+from __future__ import print_function
 import sys
 import numpy as np
 import time
@@ -131,23 +135,23 @@ t['e']['a'] = 40
 c = test_class()
 assign = test_struct.assign( c )
 assign( t[0] )
-print 'assign/basic/output/a=' + str( c.a )
-print 'assign/basic/output/b=' + str( c.b )
-print 'assign/basic/output/c=\"' + str( c.c ).split( '+' )[0] + '\"'
-print 'assign/basic/output/d=\"' + str( c.d ) + '\"'
-print 'assign/basic/output/e/a=' + str( c.e.a )
-#print 'assign/basic/output/f[0]=' + str( c.f[0] )
-#print 'assign/basic/output/f[1]=' + str( c.f[1] )
-#print 'assign/basic/output/g[0]/a=' + str( c.g[0].a )
-#print 'assign/basic/output/g[1]/a=' + str( c.g[1].a )
+print( 'assign/basic/output/a=' + str( c.a ) )
+print( 'assign/basic/output/b=' + str( c.b ) )
+print( 'assign/basic/output/c=\"' + str( c.c ).split( '+' )[0] + '\"' )
+print( 'assign/basic/output/d=\"' + str( c.d ) + '\"' )
+print( 'assign/basic/output/e/a=' + str( c.e.a ) )
+#print( 'assign/basic/output/f[0]=' + str( c.f[0] ) )
+#print( 'assign/basic/output/f[1]=' + str( c.f[1] ) )
+#print( 'assign/basic/output/g[0]/a=' + str( c.g[0].a ) )
+#print( 'assign/basic/output/g[1]/a=' + str( c.g[1].a ) )
 def convert( v ): return 'customized time: ' + str( v ).split( '+' )[0] if type( v ) == np.datetime64 else v
 assign = test_struct.assign( c, convert )
 assign( t[0] )
-print 'assign/convert/output/a=' + str( c.a )
-print 'assign/convert/output/b=' + str( c.b )
-print 'assign/convert/output/c=\"' + str( c.c ) + '\"'
-print 'assign/convert/output/d=\"' + str( c.d ) + '\"'
-print 'assign/convert/output/e/a=' + str( c.e.a )
+print( 'assign/convert/output/a=' + str( c.a ) )
+print( 'assign/convert/output/b=' + str( c.b ) )
+print( 'assign/convert/output/c=\"' + str( c.c ) + '\"' )
+print( 'assign/convert/output/d=\"' + str( c.d ) + '\"' )
+print( 'assign/convert/output/e/a=' + str( c.e.a ) )
 "
 }
 

From ea048c61acb6b215a1568ef10aed2f40116896df Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 14 Nov 2019 17:13:35 +1100
Subject: [PATCH 0058/1056] python: yet more small steps to port to python3

---
 python/comma/application/test/dict/test       |  3 ++-
 python/comma/csv/applications/csv_eval.py     | 27 ++++++++++---------
 .../test/csv-eval/permissive/ascii/test       |  4 +--
 .../test/csv-eval/permissive/binary/test      |  2 +-
 python/comma/csv/stream.py                    | 11 ++++----
 python/comma/signal/signal.py                 |  3 ++-
 6 files changed, 27 insertions(+), 23 deletions(-)

diff --git a/python/comma/application/test/dict/test b/python/comma/application/test/dict/test
index 70625e611..d3740e88d 100755
--- a/python/comma/application/test/dict/test
+++ b/python/comma/application/test/dict/test
@@ -11,6 +11,7 @@ function main()
     local value_type
     value_type=${input_value_type:+"value_type=$input_value_type, "}
     python -c "
+from __future__ import print_function
 import comma.application
 import argparse
 
@@ -23,7 +24,7 @@ for k, v in args.dict.iteritems():
             return '\"%s\"' % v
         else:
             return v
-    print '%s=%s' % ( k, quote_if_string( v ) )
+    print( '%s=%s' % ( k, quote_if_string( v ) ) )
 " $input_args
 }
 
diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index c634e2cb2..4ea78b482 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -27,6 +27,7 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+from __future__ import print_function
 import sys
 import os
 import argparse
@@ -253,7 +254,7 @@ def get_args():
         parser.print_help()
         parser.exit(0)
     if args.fields is None or args.fields == "": sys.exit( "csv-eval: please specify --fields" )
-    if args.init_values == '' and args.verbose: print >>sys.stderr, "csv-eval: --init currently reads one record at a time, which may be slow"
+    if args.init_values == '' and args.verbose: print( "csv-eval: --init currently reads one record at a time, which may be slow", file = sys.stderr )
     return args
 
 def ingest_deprecated_options(args):
@@ -419,7 +420,7 @@ def prepare_options(args):
         args.format = comma.csv.format.guess_format(args.first_line)
         args.binary = False
         if args.verbose:
-            print >> sys.stderr, "{}: guessed format: {}".format(__name__, args.format)
+            print( "{}: guessed format: {}".format(__name__, args.format), file = sys.stderr )
     if args.select or args.exit_if:
         return
     var_names = assignment_variable_names(args.expressions)
@@ -496,20 +497,20 @@ def initialize_update_and_output(self):
     def print_info(self, file=sys.stderr):
         fields = ','.join(self.input_t.nondefault_fields)
         format = self.input_t.format
-        print >> file, "expressions: '{}'".format(self.args.expressions)
-        print >> file, "select: '{}'".format(self.args.select)
-        print >> file, "exit_if: '{}'".format(self.args.exit_if)
-        print >> file, "default values: '{}'".format(self.args.default_values)
-        print >> file, "input fields: '{}'".format(fields)
-        print >> file, "input format: '{}'".format(format)
+        print( "expressions: '{}'".format(self.args.expressions), file = file )
+        print( "select: '{}'".format(self.args.select), file = file )
+        print( "exit_if: '{}'".format(self.args.exit_if), file = file )
+        print( "default values: '{}'".format(self.args.default_values), file = file )
+        print( "input fields: '{}'".format(fields), file = file )
+        print( "input format: '{}'".format(format), file = file )
         if self.args.select or self.args.exit_if:
             return
         update_fields = ','.join(self.update_t.fields) if self.args.update_fields else ''
         output_fields = ','.join(self.output_t.fields) if self.args.output_fields else ''
         output_format = self.output_t.format if self.args.output_fields else ''
-        print >> file, "update fields: '{}'".format(update_fields)
-        print >> file, "output fields: '{}'".format(output_fields)
-        print >> file, "output format: '{}'".format(output_format)
+        print( "update fields: '{}'".format(update_fields), file = file )
+        print( "output fields: '{}'".format(output_fields), file = file )
+        print( "output format: '{}'".format(output_format), file = file )
 
 
 def check_fields(fields, allow_numpy_names=True):
@@ -598,7 +599,7 @@ def exit_if(stream):
             if mask:
                 if not stream.args.with_error: sys.exit()
                 name = os.path.basename(sys.argv[0])
-                print >> sys.stderr, "{} error: {}".format(name, stream.args.with_error)
+                print( "{} error: {}".format(name, stream.args.with_error), file = sys.stderr )
                 sys.exit(1)
             stream.input.dump()
         input = stream.input.read()
@@ -618,7 +619,7 @@ def main():
             evaluate(stream(args))
     except csv_eval_error as e:
         name = os.path.basename(sys.argv[0])
-        print >> sys.stderr, "{} error: {}".format(name, e)
+        print( "{} error: {}".format(name, e), file = sys.stderr )
         sys.exit(1)
     except StandardError as e:
         import traceback
diff --git a/python/comma/csv/applications/test/csv-eval/permissive/ascii/test b/python/comma/csv/applications/test/csv-eval/permissive/ascii/test
index 0f4f67398..8418fab95 100755
--- a/python/comma/csv/applications/test/csv-eval/permissive/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/permissive/ascii/test
@@ -5,13 +5,13 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function csv_eval()
 {
-    csv-eval "$@" --fields=x,y 'import sys; print >> sys.stderr, "Python builtins are present!"; a=x+y'
+    csv-eval "$@" --fields=x,y 'import sys; print( "python builtins are present!" ); a=x+y'
 }
 
 function reformat_output()
 {
     prefix=$1
-    name-value-from-csv x,y,a --line-number --prefix $prefix/output | sed 's/"//g'
+    grep -v "python" | name-value-from-csv x,y,a --line-number --prefix $prefix/output | sed 's/"//g'
 }
 
 input=$( cat )
diff --git a/python/comma/csv/applications/test/csv-eval/permissive/binary/test b/python/comma/csv/applications/test/csv-eval/permissive/binary/test
index b068816d6..51bd6937d 100755
--- a/python/comma/csv/applications/test/csv-eval/permissive/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/permissive/binary/test
@@ -5,7 +5,7 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function csv_eval()
 {
-    csv-eval "$@" --fields=x,y --binary=2d 'import sys; print >> sys.stderr, "Python builtins are present!"; a=x+y'
+    csv-eval "$@" --fields=x,y --binary=2d 'import sys; sys.stderr.write( "python builtins are present!\n" ); a=x+y'
 }
 
 function reformat_output()
diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index a950b86e1..f4509acf2 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -27,6 +27,7 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+from __future__ import print_function
 import numpy as np
 import sys
 import itertools
@@ -95,8 +96,8 @@ def __init__(self,
                                                 self.data_extraction_fields)
         #self.write_dtype = self._write_dtype()
         #self.unrolled_write_dtype = structured_dtype( ','.join( types_of_dtype( self.write_dtype, unroll=True ) ) )
-        #print >>sys.stderr, "self.write_dtype.descr = %s" % str(self.write_dtype.descr)
-        #print >>sys.stderr, "self.unrolled_write_dtype = %s" % str(self.unrolled_write_dtype)
+        #print( "self.write_dtype.descr = %s" % str(self.write_dtype.descr), file = sys.stderr )
+        #print( "self.unrolled_write_dtype = %s" % str(self.unrolled_write_dtype), file = sys.stderr )
         self._input_array = None
         self._ascii_buffer = None
         self._strings = functools.partial(map, self.numpy_scalar_to_string)
@@ -217,7 +218,7 @@ def write(self, s):
             #unrolled_array = s.view( self.unrolled_write_dtype )
             if self.tied: lines = self._tie_ascii(self.tied._ascii_buffer, unrolled_array)
             else: lines = (self._toline(scalars) for scalars in unrolled_array)
-            for line in lines: print >> self.target, line
+            for line in lines: print( line, file = self.target )
         self.target.flush()
 
     def _tie_binary(self, tied_array, array): return merge_arrays(tied_array, array)
@@ -238,7 +239,7 @@ def _dump(self):
         if self.binary:
             self._input_array.tofile(self.target)
         else:
-            for line in self._ascii_buffer: print >> self.target, line
+            for line in self._ascii_buffer: print( line, file = self.target )
         self.target.flush()
 
     def _dump_with_mask(self, mask):
@@ -257,7 +258,7 @@ def _dump_with_mask(self, mask):
             self._input_array[mask].tofile(self.target)
         else:
             for line, allowed in itertools.izip(self._ascii_buffer, mask):
-                if allowed: print >> self.target, line
+                if allowed: print( line, file = self.target )
         self.target.flush()
 
     def _warn(self, msg, verbose=True):
diff --git a/python/comma/signal/signal.py b/python/comma/signal/signal.py
index 209ba511c..efbdb0358 100644
--- a/python/comma/signal/signal.py
+++ b/python/comma/signal/signal.py
@@ -28,6 +28,7 @@
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import absolute_import
+from __future__ import print_function
 import signal
 import sys
 import os
@@ -42,7 +43,7 @@ def __init__( self, verbose = False ):
 
     def switch_on( self, signum, frame ):
         self.state = True
-        if self.verbose: print >> sys.stderr, os.path.basename(sys.argv[0]), "caught signal:", signum
+        if self.verbose: print( os.path.basename(sys.argv[0]), "caught signal:", signum, file = sys.stderr )
 
     def __nonzero__( self ): return self.state
 

From 1b784d63227f553382e480ac1019c3c32e84e35c Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 14 Nov 2019 17:16:58 +1100
Subject: [PATCH 0059/1056] python: and yet more small steps to port to python3

---
 python/comma/csv/applications/csv-eval | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/comma/csv/applications/csv-eval b/python/comma/csv/applications/csv-eval
index 506d1e7d4..f170b3a22 100644
--- a/python/comma/csv/applications/csv-eval
+++ b/python/comma/csv/applications/csv-eval
@@ -1,4 +1,4 @@
-#!/usr/bin/python
+#!/usr/bin/env python
 
 # This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney

From 8bf46eb624bedbbdfe96c8118733584b63178c83 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 14 Nov 2019 19:25:49 +1100
Subject: [PATCH 0060/1056] name-value-eval*: steps to make it working with
 python3...

---
 name_value/applications/name-value-eval       |  3 +-
 .../applications/name-value-eval-preparse.cpp | 46 ++++++-------------
 2 files changed, 16 insertions(+), 33 deletions(-)

diff --git a/name_value/applications/name-value-eval b/name_value/applications/name-value-eval
index d1eb5709d..0cbaa47b0 100755
--- a/name_value/applications/name-value-eval
+++ b/name_value/applications/name-value-eval
@@ -191,7 +191,8 @@ else name-value-eval-preparse --assign > $tmp_vars; fi
 preparse_options=$output_vars_option
 if (( test_option )); then preparse_options+=" --test"; fi
 
-( cat "$tmp_vars";
+( echo "from __future__ import print_function" # uber quick and dirty
+  cat "$tmp_vars";
   if [[ -n "$input" ]]; then name-value-eval-preparse $preparse_options "$input"
   else name-value-eval-preparse $preparse_options; fi ) > $python_input
   
diff --git a/name_value/applications/name-value-eval-preparse.cpp b/name_value/applications/name-value-eval-preparse.cpp
index f1f72db67..49c968946 100644
--- a/name_value/applications/name-value-eval-preparse.cpp
+++ b/name_value/applications/name-value-eval-preparse.cpp
@@ -43,7 +43,7 @@
 static const char *exec_name = "";
 static std::string kwd_expect = "expect";
 
-void usage()
+void usage(bool)
 {
     std::cerr << "Usage: " << exec_name << " [-h|--help] [-a|--assign] [-t|--test] [-o|--output-variables=<file>] [-d|--demangle] [<input_file>]\n"
 "\n"
@@ -133,6 +133,7 @@ void usage()
 "    rules. Normally all variables that are assigned any value in the rules are output, but this can be\n"
 "    restricted to the variables listed in a file (one per line) using --output-variables.\n"
 "\n";
+exit( 0 );
 }
 
 // command line options
@@ -957,22 +958,22 @@ void process_test(std::vector<Token> &tokens, const std::string &original_line,
 
             std::cout
                 << spaces(leading_spaces)
-                << "    print '" << i->first << "/expected=" << quote(expr_str, '"') << "'\n"
+                << "    print( '" << i->first << "/expected=" << quote(expr_str, '"') << "' )\n"
                 << spaces(leading_spaces)
                 << "    sys.stdout.write('" << i->first << "/actual=\"')\n"
                 << spaces(leading_spaces)
-                << "    if __builtin__.type(" << i->second << ") == __builtin__.type({}): print dict_str(" << i->second << ")+'\"'\n"
+                << "    if __builtin__.type(" << i->second << ") == __builtin__.type({}): print( dict_str(" << i->second << ")+'\"' )\n"
                 << spaces(leading_spaces)
                 // use a Python trick to force repr() to use double quotes instead of single
                 // (for an explanation, see: http://www.gossamer-threads.com/lists/python/python/157285
                 // -- search that page for "Python delimits a string it by single quotes preferably")
-                << "    else: print repr(\"'\\0\"+str(" << i->second << "))[6:]\n";
+                << "    else: print( repr(\"'\\0\"+str(" << i->second << "))[6:] )\n";
         }
     }
     else
     {
         std::cout << spaces(leading_spaces)
-            << "    print 'false=" << quote(input_line, '\"') << "'\n";
+            << "    print( 'false=" << quote(input_line, '\"') << "' )\n";
     }
 }
 
@@ -1023,8 +1024,8 @@ void print_header()
         << "    res_val = math.sin(lat_delta / 2.0) * math.sin(lat_delta / 2.0) + math.cos(phi1) * math.cos(phi2) * math.sin(lon_delta / 2.0) * math.sin(lon_delta / 2.0)\n"
         << "    return 6366.70702 * 2.0 * math.atan2(math.sqrt(res_val), math.sqrt(1.0 - res_val))\n"
         << "def sphere_distance_nm(lat1, lon1, lat2, lon2): return km_to_nm(sphere_distance_km(lat1, lon1, lat2, lon2))\n"
-        << "def err_expr_not_bool(): print >> sys.stderr, 'File \"?\", line ' + str(inspect.currentframe().f_back.f_lineno) + '\\nTypeError: expected a true or false expression'\n"
-        << "def err_var_is_obj(v_name): print >> sys.stderr, 'TypeError: variable \"' + v_name + '\" is used in an expression but is an object (example: \"a/b = 3; a < 0\")'\n"
+        << "def err_expr_not_bool(): print( 'File \"?\", line ' + str(inspect.currentframe().f_back.f_lineno) + '\\nTypeError: expected a true or false expression', file = sys.stderr )\n"
+        << "def err_var_is_obj(v_name): print( 'TypeError: variable \"' + v_name + '\" is used in an expression but is an object (example: \"a/b = 3; a < 0\")', file = sys.stderr )\n"
         << "def dict_str(d): return \"<array of size \" + str(len(d.keys())) + \">\"\n";
         // note: err_expr_not_bool() imitates standard Python error printing:
         // 'File "name", line n' on one line, followed by the error message
@@ -1039,7 +1040,7 @@ void print_assigned_variables(const Varmap &assigned_vars)
     {
         // i->first is the demangled (original) name, i->second is the mangled name
         // (repr() puts single quotes around strings; replace with double quotes)
-        std::cout << "print '" << i->first << "='+repr(" << i->second << ").replace(\"'\", '\"')\n";
+        std::cout << "print( '" << i->first << "='+repr(" << i->second << ").replace(\"'\", '\"') )\n";
     }
 }
 
@@ -1123,49 +1124,32 @@ void process(const std::string &filename, const Options &opt, const std::set<std
 void read_restrict_vars(const std::string &filename, std::set<std::string> &restrict_vars)
 {
     std::ifstream file(filename.c_str());
-
-    if (!file)
-    {
-        std::cerr << exec_name << ": cannot open " << filename << '\n';
-        exit(1);
-    }
-
+    if (!file.is_open()) { std::cerr << exec_name << ": cannot open " << filename << '\n'; exit(1); }
     std::string line;
     while (std::getline(file, line))
     {
         std::string var_name = trim_spaces(line);
         if (!var_name.empty()) { restrict_vars.insert(mangle_id(var_name)); }
     }
-
-    if (restrict_vars.size() == 0)
-    {
-        std::cerr << exec_name << ": empty --output-variables file: " << filename << '\n';
-        exit(1);
-    }
+    if(restrict_vars.size() == 0) { std::cerr << exec_name << ": empty --output-variables file: " << filename << '\n'; exit(1); }
 }
 
 int main(int argc, char* argv[])
 {
     exec_name = argv[0];
-    comma::command_line_options options(argc, argv);
-    if (options.exists("-h,--help")) { usage(); return 0; }
-
-    // get flags
+    comma::command_line_options options(argc, argv, usage);
     Options opt;
     opt.assign = options.exists("-a,--assign");
     opt.test = options.exists("-t,--test");
     opt.restrict_vars = options.exists("-o,--output-variables");
     opt.command = !(opt.assign || opt.test);
     opt.demangle = options.exists("-d,--demangle");
-
     if (opt.test)
     {
         if (opt.assign) { std::cerr << exec_name << ": cannot have --assign and --test\n"; exit(1); }
         if (opt.restrict_vars) { std::cerr << exec_name << ": cannot have --output-variables and --test\n"; exit(1); }
     }
-
-    if (opt.demangle && (opt.assign || opt.test))
-    { std::cerr << exec_name << ": cannot use --demangle with --assign or --test\n"; exit(1); }
+    if (opt.demangle && (opt.assign || opt.test)) { std::cerr << exec_name << ": cannot use --demangle with --assign or --test\n"; exit(1); }
 
     // get unnamed options
     const char *valueless_options = "-a,--assign,-t,--test,-d,--demangle";
@@ -1173,21 +1157,19 @@ int main(int argc, char* argv[])
     std::vector<std::string> unnamed = options.unnamed(valueless_options, options_with_values);
     std::set<std::string> restrict_vars;
     std::string filename;
-
     for (size_t i = 0;i < unnamed.size();++i)
     {
         if (unnamed[i][0] == '-') { std::cerr << exec_name << ": unknown option \"" << unnamed[i] << "\"\n"; exit(1); }
         else if (filename.empty()) { filename = unnamed[i]; }
         else { std::cerr << exec_name << ": unexpected argument \"" << unnamed[i] << "\"\n"; exit(1); }
     }
-
+    
     if (opt.restrict_vars)
     {
         std::string restrict_filename = options.value<std::string> ("-o,--output-variables");
         if (restrict_filename.empty()) { std::cerr << exec_name << ": expected filename for --output-variables\n"; exit(1); }
         read_restrict_vars(restrict_filename, restrict_vars);
     }
-
     if (!opt.assign && !opt.demangle) { print_header(); }
     process(filename, opt, restrict_vars);
     return 0;

From 97416b65f496496525a4051aed267ceeefe9edc7 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Nov 2019 12:11:25 +1100
Subject: [PATCH 0061/1056] csv-eval: porting to python3...

---
 python/comma/csv/applications/csv_eval.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 4ea78b482..2afc18c24 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -561,8 +561,8 @@ def collect(var, fields): return '\n'.join("{v}['{f}'] = {f}".format(v=var, f=f)
                 size = input.size
                 if stream.args.update_fields: update = stream.update_t(size)
                 if stream.args.output_fields: output = stream.output_t(size)
-                exec init_code in env, {'_input': input, '_update': update, '_output': output}
-            exec code in env, {'_input': input, '_update': update, '_output': output}
+                exec( init_code, env, {'_input': input, '_update': update, '_output': output} )
+            exec( code, env, {'_input': input, '_update': update, '_output': output} )
             if stream.args.update_fields: update_buffer(stream.input, update)
             if stream.args.output_fields: stream.output.write(output)
             else: stream.input.dump()
@@ -572,7 +572,7 @@ def collect(var, fields): return '\n'.join("{v}['{f}'] = {f}".format(v=var, f=f)
 def select(stream):
     input = None
     env = restricted_numpy_env()
-    exec stream.args.default_values in env
+    exec( stream.args.default_values, env )
     fields = stream.input.fields
     code = compile(stream.args.select, '<string>', 'eval')
     is_shutdown = comma.signal.is_shutdown()
@@ -588,7 +588,7 @@ def select(stream):
 def exit_if(stream):
     input = None
     env = restricted_numpy_env()
-    exec stream.args.default_values in env
+    exec( stream.args.default_values, env )
     fields = stream.input.fields
     code = compile(stream.args.exit_if, '<string>', 'eval')
     is_shutdown = comma.signal.is_shutdown()

From 71c6c2c9d70cb0847d8b567c587fd95a2cdb8764 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Nov 2019 13:10:40 +1100
Subject: [PATCH 0062/1056] csv-eval: a lot of porting to python3...

---
 name_value/applications/name-value-calc       | 57 ++++++++++---------
 name_value/applications/name-value-eval       |  3 +
 .../applications/name-value-eval-preparse.cpp |  8 ++-
 .../test_run/black_subdirs/test.2/expected    |  4 +-
 4 files changed, 41 insertions(+), 31 deletions(-)

diff --git a/name_value/applications/name-value-calc b/name_value/applications/name-value-calc
index 638c11719..0dc525d72 100755
--- a/name_value/applications/name-value-calc
+++ b/name_value/applications/name-value-calc
@@ -156,7 +156,10 @@ function logical_op()
 function python_converter()
 {
     # todo? python2 -c "import operator...
-    python -c "import operator
+    python -c "
+from __future__ import division
+from __future__ import print_function
+import operator
 from sys import stdin
 filesep = '$file_separator'
 what = '$operation'
@@ -174,11 +177,12 @@ operands = {
              '==' : operator.eq,
              '<>' : operator.ne,
              '!=' : operator.ne,
-             '/'  : operator.div,
+             '/'  : operator.truediv,
+             '//' : operator.floordiv,
              '*'  : operator.mul,
            }
 
-arithmetic = [ '+', '-', '/', '*' ]
+arithmetic = [ '+', '-', '/', '//', '*' ]
 
 names = {}
 ordered_names = []
@@ -216,7 +220,7 @@ while True:
             names[n] = ( False, v )
             ordered_names.append( n )
     else:
-        if names.has_key( n ):
+        if n in names:
             try:
                 names[n] = ( True, op(names[n][1], v) )
             except TypeError:
@@ -225,7 +229,7 @@ while True:
 
 for n in ordered_names:
     v = names[n]
-    print '%s=\"%s\"' % ( n, str(output(v[0], v[1], logical)) )
+    print( '%s=\"%s\"' % ( n, str(output(v[0], v[1], logical)) ) )
 "
 }
 
@@ -249,31 +253,32 @@ debug=1
 
 while [[ $# -gt 0 ]]; do
     case "$1" in
-        -h|--help)               usage 0;;
-        --add)                   operation="+";;
-        --sub|--subtract)        operation="-";;
-        --mul|--mult|--multiply) operation="*";;
-        --div|--divide)          operation="/";;
-        --less)                  operation="<";;
-        --less-or-equal)         operation="<=";;
-        --more)                  operation=">";;
-        --more-or-equal)         operation=">=";;
-        --equal)                 operation="==";;
-        --non-equal)             operation="!=";;
-        --not-equal)             operation="!=";;
-        --json)                  json_format=1;;
-        --strict)                strict=1;;
-        --detailed)              detailed=1;;
-        --debug)                 debug=1;;
-        --no-debug)              debug=0;;
-        --exclude)               shift; if [[ $# == 0 ]] ; then echo "$name: --exclude lack argument" >&2; exit 1; fi; excluded+=( "$1" );;
-        -*)                      echo "$name: unrecognized option '$1'" >&2; exit 1;;
-        *)                       input_files+=( "$1" );;
+        -h|--help)                usage 0;;
+        --add)                    operation="+";;
+        --sub|--subtract)         operation="-";;
+        --mul|--mult|--multiply)  operation="*";;
+        --div|--divide|--truediv) operation="/";;
+        --floordiv)               operation="//";;
+        --less)                   operation="<";;
+        --less-or-equal)          operation="<=";;
+        --more)                   operation=">";;
+        --more-or-equal)          operation=">=";;
+        --equal)                  operation="==";;
+        --non-equal)              operation="!=";;
+        --not-equal)              operation="!=";;
+        --json)                   json_format=1;;
+        --strict)                 strict=1;;
+        --detailed)               detailed=1;;
+        --debug)                  debug=1;;
+        --no-debug)               debug=0;;
+        --exclude)                shift; if [[ $# == 0 ]] ; then echo "$name: --exclude lack argument" >&2; exit 1; fi; excluded+=( "$1" );;
+        -*)                       echo "$name: unrecognized option '$1'" >&2; exit 1;;
+        *)                        input_files+=( "$1" );;
     esac
     shift
 done
 
-binary_operands=( "-" "/" "<" "<=" ">" ">=" "==" "!=" )
+binary_operands=( "-" "/" "//" "<" "<=" ">" ">=" "==" "!=" )
 logical_operands=( "<" "<=" ">" ">=" "==" "!=" )
 
 if [[ ${#input_files[@]} == 0 ]]; then simple_usage 1; fi
diff --git a/name_value/applications/name-value-eval b/name_value/applications/name-value-eval
index 0cbaa47b0..4fadac7e3 100755
--- a/name_value/applications/name-value-eval
+++ b/name_value/applications/name-value-eval
@@ -197,6 +197,9 @@ if (( test_option )); then preparse_options+=" --test"; fi
   else name-value-eval-preparse $preparse_options; fi ) > $python_input
   
 if (( debug )); then cat $python_input | sed 's/^/debug: /g' > /dev/tty; fi
+
+#cat "$python_input" > ./python_input
+
 $python_cmd $python_input 2> $err > $out
 
 exit_code=0
diff --git a/name_value/applications/name-value-eval-preparse.cpp b/name_value/applications/name-value-eval-preparse.cpp
index 49c968946..068824190 100644
--- a/name_value/applications/name-value-eval-preparse.cpp
+++ b/name_value/applications/name-value-eval-preparse.cpp
@@ -936,7 +936,7 @@ void process_test(std::vector<Token> &tokens, const std::string &original_line,
 
     std::cout << "# SRCLINE " << line_num << " " << input_line_prefix << input_line << '\n'
         << spaces(leading_spaces) << "_result_ = (" << tokens << ")\n"
-        << spaces(leading_spaces) << "if __builtin__.type(_result_) != bool: err_expr_not_bool()\n"
+        << spaces(leading_spaces) << "if builtins_module.type(_result_) != bool: err_expr_not_bool()\n"
         << spaces(leading_spaces) << "elif not _result_:\n";
 
     if (vars.size() != 0)
@@ -962,7 +962,7 @@ void process_test(std::vector<Token> &tokens, const std::string &original_line,
                 << spaces(leading_spaces)
                 << "    sys.stdout.write('" << i->first << "/actual=\"')\n"
                 << spaces(leading_spaces)
-                << "    if __builtin__.type(" << i->second << ") == __builtin__.type({}): print( dict_str(" << i->second << ")+'\"' )\n"
+                << "    if builtins_module.type(" << i->second << ") == builtins_module.type({}): print( dict_str(" << i->second << ")+'\"' )\n"
                 << spaces(leading_spaces)
                 // use a Python trick to force repr() to use double quotes instead of single
                 // (for an explanation, see: http://www.gossamer-threads.com/lists/python/python/157285
@@ -1000,7 +1000,9 @@ void process_command(const std::vector<Token> &tokens, Varmap &assigned_vars, co
 void print_header()
 {
     std::cout
-        << "import sys, re, inspect, math, __builtin__\n"
+        << "import sys, re, inspect, math\n"
+        << "if sys.version_info.major == 2: import __builtin__; builtins_module=__builtin__\n"
+        << "else: import builtins; builtins_module=builtins\n"
         << "def near(x, y, eps): return abs(x - y) <= eps\n"
         << "def near_percent(x, y, percent): return abs(x - y) <= abs(x) * percent * 0.01\n"
         << "def max_index(dict) : return max(dict.keys())\n"
diff --git a/util/test/test_run/black_subdirs/test.2/expected b/util/test/test_run/black_subdirs/test.2/expected
index 6c0055604..936856dee 100644
--- a/util/test/test_run/black_subdirs/test.2/expected
+++ b/util/test/test_run/black_subdirs/test.2/expected
@@ -1,5 +1,5 @@
 #python
 
 expect len(expected) == 9
-expect locals().has_key('output') == False
-expect locals().has_key('stdout_log') == False
+expect ( 'output' in locals() ) == False
+expect ( 'stdout_log' in locals() ) == False

From a157ca8f3260d4bcdd3461e7649d659e15ab037a Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Nov 2019 21:01:04 +1100
Subject: [PATCH 0063/1056] tests: porting to python3...

---
 bash/test/comma_background/signature/basic/test | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bash/test/comma_background/signature/basic/test b/bash/test/comma_background/signature/basic/test
index ad66984bf..7e2f3b335 100755
--- a/bash/test/comma_background/signature/basic/test
+++ b/bash/test/comma_background/signature/basic/test
@@ -19,7 +19,7 @@ echo "clock_ticks_per_second=$ticks"
 comma_process_exec_and_validate "$fifo" sleep 100 || { echo "$scriptname: fatal system error, wrong background PID" >&2; exit 1; }
 background_pid=$!
 
-now=$( python -c "import sys; from numpy import int64; a = sys.stdin.readline().split()[0]; print int64(float(a) * $ticks)" < /proc/uptime )
+now=$( python -c "from __future__ import print_function; import sys; from numpy import int64; a = sys.stdin.readline().split()[0]; print( int64(float(a) * $ticks) )" < /proc/uptime )
 echo "time/now=$now"
 
 signature=$( comma_process_signature "$background_pid" )

From a4486a63d37a5a9424390572671354501078842b Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Nov 2019 21:37:09 +1100
Subject: [PATCH 0064/1056] tests: porting to python3...

---
 bash/test/comma_background/signature/args/expected | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/bash/test/comma_background/signature/args/expected b/bash/test/comma_background/signature/args/expected
index 4e62e0068..5acb607de 100644
--- a/bash/test/comma_background/signature/args/expected
+++ b/bash/test/comma_background/signature/args/expected
@@ -1,5 +1,7 @@
 #python
 
+from functools import reduce
+
 # iterate through a path of attributes: "obj/data/member/value"
 def deepgetattr(obj, attr):
     """Recurses through an attribute chain to get the ultimate value."""

From fdbdab08ffcc908c79263bfba6ed451179f3c804 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Nov 2019 21:45:29 +1100
Subject: [PATCH 0065/1056] tests: porting to python3...

---
 python/comma/numpy/functions.py           | 1 +
 python/comma/numpy/test/test_functions.py | 4 ++--
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/python/comma/numpy/functions.py b/python/comma/numpy/functions.py
index 3ea7fbabd..b0214c298 100644
--- a/python/comma/numpy/functions.py
+++ b/python/comma/numpy/functions.py
@@ -32,6 +32,7 @@
 import numpy as np
 import operator
 import re
+from functools import reduce
 
 
 def merge_arrays(first, second):
diff --git a/python/comma/numpy/test/test_functions.py b/python/comma/numpy/test/test_functions.py
index 685f3d6bd..d049183fd 100644
--- a/python/comma/numpy/test/test_functions.py
+++ b/python/comma/numpy/test/test_functions.py
@@ -162,14 +162,14 @@ def test_structure_out_of_order(self):
             itemsize = 43
 
             ndtype1 = np.dtype( dict( names=names1, formats=formats1, offsets=offsets1, itemsize=itemsize ) )
-            sorted_fields1 = sorted( list( ndtype1.fields.iteritems() ), key = lambda t: t[1] )
+            sorted_fields1 = sorted( list( ndtype1.fields.items() ), key = lambda t: t[1] )
 
             names2 = ['a3', 'word', 'a2', 'byte' ]
             formats2 = [np.dtype(('<f8', (3,))), np.dtype('uint16'), np.dtype(('<f8', (2,))), np.dtype('uint8') ]
             offsets2 = [2, 0, 27, 26 ]
 
             ndtype2 = np.dtype( dict( names=names2, formats=formats2, offsets=offsets2, itemsize=itemsize ) )
-            sorted_fields2 = sorted( list( ndtype2.fields.iteritems() ), key = lambda t: t[1] )
+            sorted_fields2 = sorted( list( ndtype2.fields.items() ), key = lambda t: t[1] )
 
             self.assertEqual( sorted_fields1, sorted_fields2 )
             self.assertEqual( len( ndtype1.descr ), 4 )

From 441ebac62d820e74412ca180e9be29a95985faaf Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Nov 2019 21:59:37 +1100
Subject: [PATCH 0066/1056] tests: porting to python3...

---
 python/comma/application/test/dict/test | 2 +-
 python/comma/csv/stream.py              | 2 +-
 python/comma/csv/struct.py              | 6 +++---
 python/comma/csv/test/struct/test       | 2 +-
 4 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/python/comma/application/test/dict/test b/python/comma/application/test/dict/test
index d3740e88d..b5ec5c40c 100755
--- a/python/comma/application/test/dict/test
+++ b/python/comma/application/test/dict/test
@@ -18,7 +18,7 @@ import argparse
 parser = argparse.ArgumentParser( )
 parser.add_argument( '--dict', metavar='DICT', help='populate a dictionary of given type', type=str, action=comma.application.set_dictionary_action, $value_type delimiter=';', default={} )
 args = parser.parse_args()
-for k, v in args.dict.iteritems():
+for k, v in args.dict.items():
     def quote_if_string( v ):
         if type( v ) == str:
             return '\"%s\"' % v
diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index f4509acf2..c13f3a3db 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -184,7 +184,7 @@ def _missing_values(self):
         missing = np.zeros(1, dtype=self.missing_dtype)
         if self.default_values:
             dtype_name_of = dict(zip(self.missing_fields, self.missing_dtype.names))
-            for field, value in self.default_values.iteritems():
+            for field, value in self.default_values.items():
                 name = dtype_name_of[field]
                 if self.missing_dtype[name] == csv_time.DTYPE:
                     try: missing[name] = csv_time.to_numpy(value)
diff --git a/python/comma/csv/struct.py b/python/comma/csv/struct.py
index cb8eae907..514438741 100644
--- a/python/comma/csv/struct.py
+++ b/python/comma/csv/struct.py
@@ -107,7 +107,7 @@ def _make_fields_map( m, fields ):
 
     def _assign( self, data, fields_map, convert ):
         functors = {}
-        for k, v in fields_map.iteritems():
+        for k, v in fields_map.items():
             if len( v ) > 0:
                 functors[k] = self._assign( getattr( data, k ), v, convert )
             else:
@@ -115,7 +115,7 @@ def functor( value, key = k ):
                     setattr( data, key, value if convert is None else convert( value ) )
                 functors[k] = functor
         def apply_functors( record ):
-            for k, f in functors.iteritems(): f( record[k] )
+            for k, f in functors.items(): f( record[k] )
         return apply_functors
     
     def _nondefault_fields(self):
@@ -172,7 +172,7 @@ def _shorthand(self):
                 continue
             fields_of_type = [name + '/' + field for field in type.fields]
             shorthand[name] = tuple(fields_of_type)
-            for subname, subfields in type.shorthand.iteritems():
+            for subname, subfields in type.shorthand.items():
                 xpath = name + '/' + subname
                 shorthand[xpath] = tuple(name + '/' + field for field in subfields)
         return shorthand
diff --git a/python/comma/csv/test/struct/test b/python/comma/csv/test/struct/test
index fba303d46..961e7525d 100755
--- a/python/comma/csv/test/struct/test
+++ b/python/comma/csv/test/struct/test
@@ -75,7 +75,7 @@ point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
 timestamped_point_t = comma.csv.struct( 't,coordinates', 'datetime64[us]', point_t )
 observer_t = comma.csv.struct( 'name,id', 'S3', 'uint32' )
 record_t = comma.csv.struct( 'observer,event,value', observer_t, timestamped_point_t, 'float64' )
-for leaf,xpath in record_t.xpath_of_leaf.iteritems():
+for leaf,xpath in record_t.xpath_of_leaf.items():
   print( "leaves/{}={}".format( leaf, record_t.xpath_of_leaf.get( leaf ) ) )
 END
 )"

From 812dd67783fd3e5a1bdcb6abc80b04de21b0305a Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 16 Nov 2019 02:14:12 +1100
Subject: [PATCH 0067/1056] python/comma/csv/struct: porting to python3...

---
 python/comma/csv/struct.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/python/comma/csv/struct.py b/python/comma/csv/struct.py
index 514438741..b7cfce4f6 100644
--- a/python/comma/csv/struct.py
+++ b/python/comma/csv/struct.py
@@ -87,7 +87,7 @@ def expand_shorthand(self, compressed_fields):
         >>> outer.expand_shorthand('in')
         ('in/i', 'in/j')
         """
-        if isinstance(compressed_fields, basestring):
+        if isinstance(compressed_fields, str): #if isinstance(compressed_fields, basestring):
             compressed_fields = compressed_fields.split(',')
         expand = self.shorthand.get
         field_tuples = map(lambda name: expand(name) or (name,), compressed_fields)
@@ -123,7 +123,7 @@ def _nondefault_fields(self):
         return tuple(map(lambda f: '' if f.startswith(default_name) else f, self.fields))
 
     def _fill_blanks(self, fields):
-        if isinstance(fields, basestring):
+        if isinstance(fields, str): # if isinstance(fields, basestring):
             fields = fields.split(',')
         ntypes = len(self.concise_types)
         if len(fields) > ntypes:

From e3cd52df105935d973dc538180c591612ef3efad Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 16 Nov 2019 12:36:49 +1100
Subject: [PATCH 0068/1056] python/comma: porting to python3

---
 python/comma/csv/applications/csv_eval.py | 4 ++--
 python/comma/csv/stream.py                | 2 +-
 python/comma/csv/struct.py                | 4 ++--
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 2afc18c24..6537f4721 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -334,7 +334,7 @@ def comma_type(maybe_type, field, default_type='d', type_of_unnamed_field='s[0]'
         if len(maybe_types) > len(fields):
             msg = "format '{}' is longer than fields '{}'".format(format, ','.join(fields))
             raise ValueError(msg)
-    maybe_typed_fields = itertools.izip_longest(maybe_types, fields)
+    maybe_typed_fields = itertools.zip_longest(maybe_types, fields) if sys.version_info.major > 2 else itertools.izip_longest(maybe_types, fields) # uber quick and dirty
     types = [comma_type(maybe_type, field) for maybe_type, field in maybe_typed_fields]
     return ','.join(types)
 
@@ -621,7 +621,7 @@ def main():
         name = os.path.basename(sys.argv[0])
         print( "{} error: {}".format(name, e), file = sys.stderr )
         sys.exit(1)
-    except StandardError as e:
+    except Exception as e: #except StandardError as e:
         import traceback
         traceback.print_exc(file=sys.stderr)
         sys.exit(1)
diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index c13f3a3db..78505d855 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -289,7 +289,7 @@ def _fields(self, fields):
         return tuple(xpath(name) or name for name in fields.split(','))
 
     def _format(self, binary, format):
-        if isinstance(binary, basestring):
+        if isinstance(binary, str): # if isinstance(binary, basestring):
             if self.verbose and binary and format and binary != format:
                 msg = "ignoring '{}' and using '{}' since binary keyword has priority" \
                     .format(format, binary)
diff --git a/python/comma/csv/struct.py b/python/comma/csv/struct.py
index b7cfce4f6..f4fe66887 100644
--- a/python/comma/csv/struct.py
+++ b/python/comma/csv/struct.py
@@ -40,13 +40,13 @@ def __init__(self, concise_fields, *concise_types):
         self.concise_types = concise_types
         self.concise_fields = self._fill_blanks(concise_fields)
         self._check_fields_conciseness()
-        self.dtype = np.dtype(zip(self.concise_fields, self.concise_types))
+        self.dtype = np.dtype(list(zip(self.concise_fields, self.concise_types)))
         self.fields = self._full_xpath_fields()
         self.nondefault_fields = self._nondefault_fields()
         self.types = self._basic_types()
         self.shorthand = self._shorthand()
         self.format = ','.join(self.types)
-        self.flat_dtype = np.dtype(zip(self.fields, self.types))
+        self.flat_dtype = np.dtype(list(zip(self.fields, self.types)))
         unrolled_types = types_of_dtype(self.flat_dtype, unroll=True)
         self.unrolled_flat_dtype = structured_dtype(','.join(unrolled_types))
         self.type_of_field = dict(zip(self.fields, self.types))

From b7c7df88b50a5a115f8e8a0e386b86904eb6ef26 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 16 Nov 2019 13:47:54 +1100
Subject: [PATCH 0069/1056] python/comma: porting to python3; stream and time

---
 python/comma/csv/stream.py                | 8 ++++----
 python/comma/csv/test/unit/test_stream.py | 4 +++-
 python/comma/csv/time.py                  | 8 ++++++--
 3 files changed, 13 insertions(+), 7 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 78505d855..eb51072ef 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -361,10 +361,10 @@ def _missing_fields(self):
     def _missing_dtype(self):
         if not self.missing_fields: return
         n = len(self.input_dtype.names)
-        missing_names = ['f{}'.format(n + i) for i in xrange(len(self.missing_fields))]
+        missing_names = ['f{}'.format(n + i) for i in range(len(self.missing_fields))] # missing_names = ['f{}'.format(n + i) for i in xrange(len(self.missing_fields))]
         type_of = self.struct.type_of_field.get
         missing_types = [type_of(name) for name in self.missing_fields]
-        return np.dtype(zip(missing_names, missing_types))
+        return np.dtype(list(zip(missing_names, missing_types)))
 
     def _complete_dtype(self):
         if self.missing_dtype: return np.dtype(self.input_dtype.descr + self.missing_dtype.descr)
@@ -438,12 +438,12 @@ def numpy_scalar_to_string(scalar, precision=DEFAULT_PRECISION):
     '20150102T123456.123456'
     >>> numpy_scalar_to_string(np.timedelta64(-123, 's'))
     '-123'
-    """
-    
+    """    
     if scalar.dtype.char in np.typecodes['AllInteger']: return str(scalar)
     elif scalar.dtype.char in np.typecodes['Float']: return "{scalar:.{precision}g}".format(scalar=scalar, precision=precision)
     elif scalar.dtype.char in np.typecodes['Datetime']: return csv_time.from_numpy(scalar)
     elif scalar.dtype.char in 'S': return scalar
+    elif scalar.dtype.char in 'U': return scalar
     elif scalar.dtype.char in '?': return str( int( scalar ) ) #elif scalar.dtype.char in '?': return str( map( int, scalar ) )
     msg = "converting {} to string is not implemented".format(repr(scalar.dtype))
     raise NotImplementedError(msg)
diff --git a/python/comma/csv/test/unit/test_stream.py b/python/comma/csv/test/unit/test_stream.py
index 191a1c58b..528b72982 100644
--- a/python/comma/csv/test/unit/test_stream.py
+++ b/python/comma/csv/test/unit/test_stream.py
@@ -1,3 +1,4 @@
+from __future__ import print_function
 import unittest
 import numpy as np
 import sys
@@ -16,7 +17,8 @@ def test_use_defaults(self):
         self.assertTrue(s.full_xpath)
 
     def test_override_defaults(self):
-        from cStringIO import StringIO
+        if sys.version_info.major < 3: from cStringIO import StringIO # quick and dirty, sigh...
+        else: from io import StringIO
         source = StringIO("")
         target = StringIO("")
         t = comma.csv.stream(comma.csv.struct('id', 'S4'), delimiter=';')
diff --git a/python/comma/csv/time.py b/python/comma/csv/time.py
index 611cf6183..39c33ad3b 100644
--- a/python/comma/csv/time.py
+++ b/python/comma/csv/time.py
@@ -31,6 +31,7 @@
 import numpy as np
 import re
 import os
+import sys
 import time
 
 UNIT = 'us'
@@ -40,6 +41,7 @@
 NOT_A_DATE_TIME = np.datetime64('NaT')
 POSITIVE_INFINITY = np.datetime64('294247-01-09T04:00:54.775807')
 NEGATIVE_INFINITY = np.datetime64('-290308-12-22T19:59:05.224191')
+BASESTRING = basestring if sys.version_info.major < 3 else str # sigh...
 
 def is_undefined(numpy_time): return str(numpy_time) == str(NOT_A_DATE_TIME)
 
@@ -65,7 +67,7 @@ def to_numpy(t):
     if t in ['', 'not-a-date-time']: return NOT_A_DATE_TIME
     if t in ['+infinity', '+inf', 'infinity', 'inf']: return POSITIVE_INFINITY
     if t in ['-infinity', '-inf']: return NEGATIVE_INFINITY
-    if not (isinstance(t, basestring) and re.match(r'^(\d{8}T\d{6}(\.\d{0,6})?)$', t)):
+    if not (isinstance(t, BASESTRING) and re.match(r'^(\d{8}T\d{6}(\.\d{0,6})?)$', t)):
         msg = "expected comma time, got '{}'".format(repr(t))
         raise TypeError(msg)
     v = list(t)
@@ -100,7 +102,9 @@ def from_numpy(t):
     if is_undefined(t): return 'not-a-date-time'
     if is_negative_infinity(t): return '-infinity'
     if is_positive_infinity(t): return '+infinity'
-    return re.sub(r'(\.0{6})?([-+]\d{4}|Z)?$', '', str(t)).translate(None, ':-')
+    s = re.sub(r'(\.0{6})?([-+]\d{4}|Z)?$', '', str(t))
+    #return re.sub(r'(\.0{6})?([-+]\d{4}|Z)?$', '', str(t)).translate(None, ':-')
+    return s.translate(str.maketrans('', '', ':-')) if sys.version_info.major > 2 else s.translate(None, ':-') # sigh... cannot believe i am going this...
 
 def ascii_converters(types):
     converters = {}

From f6c81a4be74af1df269a105d4a91e56aa0091e0f Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 16 Nov 2019 14:37:04 +1100
Subject: [PATCH 0070/1056] python/comma: porting to python3; stream: floor
 division, explicit conversion of string types to str

---
 python/comma/csv/stream.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index eb51072ef..57d1fabdb 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -348,7 +348,7 @@ def _input_dtype(self):
     def _default_buffer_size(self):
         if self.tied: return self.tied.size
         elif self.flush: return 1
-        return max( 1, stream.buffer_size_in_bytes / self.input_dtype.itemsize ) # todo? too arbitrary for ascii?
+        return max( 1, stream.buffer_size_in_bytes // self.input_dtype.itemsize ) # todo? too arbitrary for ascii?
 
     def _missing_fields(self):
         missing_fields = [field for field in self.struct.fields if field not in self.fields]
@@ -442,8 +442,8 @@ def numpy_scalar_to_string(scalar, precision=DEFAULT_PRECISION):
     if scalar.dtype.char in np.typecodes['AllInteger']: return str(scalar)
     elif scalar.dtype.char in np.typecodes['Float']: return "{scalar:.{precision}g}".format(scalar=scalar, precision=precision)
     elif scalar.dtype.char in np.typecodes['Datetime']: return csv_time.from_numpy(scalar)
-    elif scalar.dtype.char in 'S': return scalar
-    elif scalar.dtype.char in 'U': return scalar
+    elif scalar.dtype.char in 'S': return str(scalar) # quick and dirty, python3, sigh...
+    elif scalar.dtype.char in 'U': return str(scalar) # quick and dirty, python3, sigh...
     elif scalar.dtype.char in '?': return str( int( scalar ) ) #elif scalar.dtype.char in '?': return str( map( int, scalar ) )
     msg = "converting {} to string is not implemented".format(repr(scalar.dtype))
     raise NotImplementedError(msg)

From d168150267d1ff8ee0993e80c00e5ab12d79f7ad Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 17 Nov 2019 12:29:45 +1100
Subject: [PATCH 0071/1056] python/comma: porting to python3; stream: reading
 and writing binary data (it still outputs strings with binary decorator); in
 progress...

---
 python/comma/csv/stream.py | 34 ++++++++++++++++++++++++++--------
 1 file changed, 26 insertions(+), 8 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 57d1fabdb..eb82e631f 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -28,10 +28,11 @@
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import print_function
+import functools
+import itertools
 import numpy as np
+import os
 import sys
-import itertools
-import functools
 import warnings
 from ..util import warning
 from ..io import readlines_unbuffered
@@ -69,6 +70,7 @@ def __init__(self,
         self.flush = flush
         self.source = source
         self.target = target
+        if target == sys.stdout: self.stdout = os.fdopen( sys.stdout.fileno(), "wb" )
         self.tied = tied
         self.full_xpath = full_xpath
         self.verbose = verbose
@@ -156,11 +158,24 @@ def read_from_line(self, line):
 
     def _read(self, size):
         if self.binary:
-            if size < 0 and self.source == sys.stdin:
-                return np.fromstring(self.source.read(), dtype=self.input_dtype)
+            if np.__version__ >= '1.16.0': # sigh...
+                if self.source == sys.stdin:
+                    if size < 0:
+                        return np.fromstring( self.source.read(), dtype = self.input_dtype )
+                    else:
+                        b = sys.stdin.buffer.read( self.input_dtype.itemsize * size )
+                        # print( "--> a: len(b):", len(b), "size:", size, "self.input_dtype.itemsize:", self.input_dtype.itemsize, file = sys.stderr )
+                        # todo! test on streams where bytes come with irregular delays!
+                        if len(b) % self.input_dtype.itemsize != 0: raise TypeError( "expected records of size {}, got {} bytes, which is not divisible by record size".format( self.input_dtype.itemsize, len( b ) ) )
+                        return np.frombuffer( b, dtype = self.input_dtype, count = len( b ) // self.input_dtype.itemsize )
+                else:
+                    return np.fromfile( self.source, dtype = self.input_dtype, count = -1 if size < 0 else size ) # this line may not be covered by regression test
             else:
-                count = -1 if size < 0 else size
-                return np.fromfile(self.source, dtype=self.input_dtype, count=count)
+                if size < 0 and self.source == sys.stdin:
+                    return np.fromstring(self.source.read(), dtype=self.input_dtype)
+                else:
+                    count = -1 if size < 0 else size
+                    return np.fromfile(self.source, dtype=self.input_dtype, count=count)
         else:
             with warnings.catch_warnings():
                 warnings.simplefilter('ignore')
@@ -211,8 +226,11 @@ def write(self, s):
             msg = "size {} not equal to tied size {}".format(s.size, tied_size)
             raise ValueError(msg)
         if self.binary:
-            if self.tied: self._tie_binary(self.tied._input_array, s).tofile(self.target)
-            else: s.tofile(self.target)
+            if np.__version__ >= '1.16.0' and self.target == sys.stdout: # sigh...
+                self.stdout.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
+            else:
+                if self.tied: self._tie_binary(self.tied._input_array, s).tofile(self.target)
+                else: s.tofile(self.target)
         else:
             unrolled_array = s.view(self.struct.unrolled_flat_dtype)
             #unrolled_array = s.view( self.unrolled_write_dtype )

From 741507dec7de440e5ce3db5821cbeb9ceb7f6b2c Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 17 Nov 2019 12:52:05 +1100
Subject: [PATCH 0072/1056] python/comma: porting to python3; struct: test: S4
 replaced with U4 string definition; in progress...

---
 python/comma/csv/test/struct/test | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/python/comma/csv/test/struct/test b/python/comma/csv/test/struct/test
index 961e7525d..2ca45ac28 100755
--- a/python/comma/csv/test/struct/test
+++ b/python/comma/csv/test/struct/test
@@ -122,7 +122,7 @@ class test_class:
 
 nested_struct = comma.csv.struct( 'a', 'uint32' )
 #test_struct = comma.csv.struct( 'a,b,c,d,e,f,g', 'uint32', 'float32', 'datetime64[us]', 'S4', nested_struct, 'uint32', ( nested_struct, ( 2, ) ) )
-test_struct = comma.csv.struct( 'a,b,c,d,e', 'uint32', 'float32', 'datetime64[us]', 'S4', nested_struct )
+test_struct = comma.csv.struct( 'a,b,c,d,e', 'uint32', 'float32', 'datetime64[us]', 'U4', nested_struct )
 t = test_struct()
 t['a'] = 10
 t['b'] = 20
@@ -135,6 +135,7 @@ t['e']['a'] = 40
 c = test_class()
 assign = test_struct.assign( c )
 assign( t[0] )
+
 print( 'assign/basic/output/a=' + str( c.a ) )
 print( 'assign/basic/output/b=' + str( c.b ) )
 print( 'assign/basic/output/c=\"' + str( c.c ).split( '+' )[0] + '\"' )

From 7d4571a82fbaea3212879f6c58bea6997de1f64a Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 17 Nov 2019 21:06:55 +1100
Subject: [PATCH 0073/1056] python/comma: porting to python3; stream: decode(
 'utf-8' ) added to ascii output for strings; in progress...

---
 python/comma/csv/stream.py                        | 3 +--
 python/comma/csv/test/stream/basic/test           | 6 ++++--
 python/comma/csv/test/stream/buffer_size/expected | 4 ++--
 python/comma/csv/test/stream/buffer_size/test     | 2 ++
 4 files changed, 9 insertions(+), 6 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index eb82e631f..c9f84d5df 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -164,7 +164,6 @@ def _read(self, size):
                         return np.fromstring( self.source.read(), dtype = self.input_dtype )
                     else:
                         b = sys.stdin.buffer.read( self.input_dtype.itemsize * size )
-                        # print( "--> a: len(b):", len(b), "size:", size, "self.input_dtype.itemsize:", self.input_dtype.itemsize, file = sys.stderr )
                         # todo! test on streams where bytes come with irregular delays!
                         if len(b) % self.input_dtype.itemsize != 0: raise TypeError( "expected records of size {}, got {} bytes, which is not divisible by record size".format( self.input_dtype.itemsize, len( b ) ) )
                         return np.frombuffer( b, dtype = self.input_dtype, count = len( b ) // self.input_dtype.itemsize )
@@ -460,7 +459,7 @@ def numpy_scalar_to_string(scalar, precision=DEFAULT_PRECISION):
     if scalar.dtype.char in np.typecodes['AllInteger']: return str(scalar)
     elif scalar.dtype.char in np.typecodes['Float']: return "{scalar:.{precision}g}".format(scalar=scalar, precision=precision)
     elif scalar.dtype.char in np.typecodes['Datetime']: return csv_time.from_numpy(scalar)
-    elif scalar.dtype.char in 'S': return str(scalar) # quick and dirty, python3, sigh...
+    elif scalar.dtype.char in 'Sa': return scalar.decode('UTF-8') # quick and dirty, python3, sigh...
     elif scalar.dtype.char in 'U': return str(scalar) # quick and dirty, python3, sigh...
     elif scalar.dtype.char in '?': return str( int( scalar ) ) #elif scalar.dtype.char in '?': return str( map( int, scalar ) )
     msg = "converting {} to string is not implemented".format(repr(scalar.dtype))
diff --git a/python/comma/csv/test/stream/basic/test b/python/comma/csv/test/stream/basic/test
index 6391c34d9..8307292ec 100755
--- a/python/comma/csv/test/stream/basic/test
+++ b/python/comma/csv/test/stream/basic/test
@@ -14,7 +14,9 @@ import numpy
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
 timestamped_point_t = comma.csv.struct( 'time,coordinates', 'datetime64[us]', point_t )
-record_t = comma.csv.struct( 'observer,event', 'S3', timestamped_point_t )
+#record_t = comma.csv.struct( 'observer,event', 'U3', timestamped_point_t 
+#record_t = comma.csv.struct( 'observer,event', 'S3', timestamped_point_t )
+record_t = comma.csv.struct( 'observer,event', 'S8', timestamped_point_t )
 record_stream = comma.csv.stream( record_t, binary=$binary )
 
 for i,r in enumerate( record_stream.iter(), start=1 ):
@@ -31,6 +33,6 @@ echo "$input" | process_records | output ascii
 comma_status_ok
 echo "ascii/status=$?"
 
-echo "$input" | csv-to-bin s[3],t,3d | process_records binary | csv-from-bin s[3],t,3d | output binary
+echo "$input" | csv-to-bin s[8],t,3d | process_records binary | csv-from-bin s[8],t,3d | output binary
 comma_status_ok
 echo "binary/status=$?"
diff --git a/python/comma/csv/test/stream/buffer_size/expected b/python/comma/csv/test/stream/buffer_size/expected
index 5f647e531..c0a29afba 100644
--- a/python/comma/csv/test/stream/buffer_size/expected
+++ b/python/comma/csv/test/stream/buffer_size/expected
@@ -1,5 +1,5 @@
 #python
 
 expect buffer_size_in_bytes = 65536
-expect size/uint8 = buffer_size_in_bytes / number_of_fields
-expect size/float64 = buffer_size_in_bytes / ( 8 * number_of_fields )
+expect size/uint8 = buffer_size_in_bytes // number_of_fields
+expect size/float64 = buffer_size_in_bytes // ( 8 * number_of_fields )
diff --git a/python/comma/csv/test/stream/buffer_size/test b/python/comma/csv/test/stream/buffer_size/test
index c2da902de..5598de759 100755
--- a/python/comma/csv/test/stream/buffer_size/test
+++ b/python/comma/csv/test/stream/buffer_size/test
@@ -8,10 +8,12 @@ function get_default_size
     local type=$2
     python -c "$( cat <<END
 from __future__ import print_function
+import sys
 import comma
 fields='$fields'
 types = ('$type',) * len( fields.split(',') )
 print( comma.csv.stream( comma.csv.struct( fields, *types ) ).size )
+sys.stdout.flush() # have to flush, since stdout gets highjacked by comma.csv.stream (which kind of make sense)
 END
 )"
 }

From 5dcc41c135b783aed46c390e83532c34c2d66977 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 17 Nov 2019 21:15:51 +1100
Subject: [PATCH 0074/1056] python/comma: porting to python3; stream: call
 fdopen on stdout only on numpy version >= 1.16.0; in progress...

---
 python/comma/csv/stream.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index c9f84d5df..745655cab 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -70,7 +70,7 @@ def __init__(self,
         self.flush = flush
         self.source = source
         self.target = target
-        if target == sys.stdout: self.stdout = os.fdopen( sys.stdout.fileno(), "wb" )
+        if np.__version__ >= '1.16.0' and target == sys.stdout: self.stdout = os.fdopen( sys.stdout.fileno(), "wb" )
         self.tied = tied
         self.full_xpath = full_xpath
         self.verbose = verbose

From fc91e995d494ff3b26e03ff691136b88b965e2b6 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 17 Nov 2019 21:24:34 +1100
Subject: [PATCH 0075/1056] python/comma: porting to python3; stream: removed
 calling fdopen on stdout on numpy version >= 1.16.0, write bytes directly to
 sys.stdout instead; in progress...

---
 python/comma/csv/stream.py | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 745655cab..c2879513f 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -70,7 +70,7 @@ def __init__(self,
         self.flush = flush
         self.source = source
         self.target = target
-        if np.__version__ >= '1.16.0' and target == sys.stdout: self.stdout = os.fdopen( sys.stdout.fileno(), "wb" )
+        #if np.__version__ >= '1.16.0' and target == sys.stdout: self.stdout = os.fdopen( sys.stdout.fileno(), "wb" )
         self.tied = tied
         self.full_xpath = full_xpath
         self.verbose = verbose
@@ -226,7 +226,8 @@ def write(self, s):
             raise ValueError(msg)
         if self.binary:
             if np.__version__ >= '1.16.0' and self.target == sys.stdout: # sigh...
-                self.stdout.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
+                #self.stdout.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
+                sys.stdout.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
             else:
                 if self.tied: self._tie_binary(self.tied._input_array, s).tofile(self.target)
                 else: s.tofile(self.target)

From 374388d968c1ef98ff3ebbed4778bfdda09e5774 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 17 Nov 2019 21:25:10 +1100
Subject: [PATCH 0076/1056] python/comma: porting to python3; test_stream: use
 // instead of / for division; in progress...

---
 python/comma/csv/test/unit/test_stream.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/python/comma/csv/test/unit/test_stream.py b/python/comma/csv/test/unit/test_stream.py
index 528b72982..d17ef8b3c 100644
--- a/python/comma/csv/test/unit/test_stream.py
+++ b/python/comma/csv/test/unit/test_stream.py
@@ -135,11 +135,11 @@ def test_size(self):
         s = comma.csv.struct('x,id', 'f8', 'u4')
         tied = comma.csv.stream(comma.csv.struct('i', 'u2'))
         t1 = comma.csv.stream(s)
-        self.assertEqual(t1.size, comma.csv.stream.buffer_size_in_bytes / 12)
+        self.assertEqual(t1.size, comma.csv.stream.buffer_size_in_bytes // 12)
         t2 = comma.csv.stream(s, flush=True)
         self.assertEqual(t2.size, 1)
         t3 = comma.csv.stream(s, tied=tied)
-        self.assertEqual(t3.size, comma.csv.stream.buffer_size_in_bytes / 2)
+        self.assertEqual(t3.size, comma.csv.stream.buffer_size_in_bytes // 2)
 
     def test_ascii_simple_single_field(self):
         s = comma.csv.struct('x', 'f8')

From c816c8eb4a60f52e636988a6effe9f07122efc99 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 17 Nov 2019 21:48:54 +1100
Subject: [PATCH 0077/1056] python/comma: porting to python3; stream: using
 sys.stdout.buffer.write() instead of sys.stdout.write(); in progress...

---
 python/comma/csv/stream.py              | 2 +-
 python/comma/io/readlines_unbuffered.py | 5 +++--
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index c2879513f..89ed2b663 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -227,7 +227,7 @@ def write(self, s):
         if self.binary:
             if np.__version__ >= '1.16.0' and self.target == sys.stdout: # sigh...
                 #self.stdout.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
-                sys.stdout.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
+                sys.stdout.buffer.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
             else:
                 if self.tied: self._tie_binary(self.tied._input_array, s).tofile(self.target)
                 else: s.tofile(self.target)
diff --git a/python/comma/io/readlines_unbuffered.py b/python/comma/io/readlines_unbuffered.py
index 5d34e1561..6e6d5d286 100644
--- a/python/comma/io/readlines_unbuffered.py
+++ b/python/comma/io/readlines_unbuffered.py
@@ -28,7 +28,8 @@
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 import sys
-import itertools
+if sys.version_info.major < 3: from itertools import ifilter
+else: ifilter = filter # quick and dirty, tired of googling...
 
 
 def readlines_unbuffered(size, source=sys.stdin, skip_blank_lines=True):
@@ -54,7 +55,7 @@ def readlines_unbuffered(size, source=sys.stdin, skip_blank_lines=True):
             number_of_lines += 1
         return lines
     if skip_blank_lines:
-        source_ = itertools.ifilter(lambda line: line.strip(), source)
+        source_ = ifilter(lambda line: line.strip(), source)
     else:
         source_ = source
     return [line.rstrip('\n') for line in source_]

From a6f29c56edf05f96dbaa2fbee3cfc25a4d59d41a Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 17 Nov 2019 22:06:36 +1100
Subject: [PATCH 0078/1056] python/comma: porting to python3; stream: handling
 size -1 in _read()... not necessarily correctly...; in progress...

---
 python/comma/csv/stream.py | 11 ++++-------
 1 file changed, 4 insertions(+), 7 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 89ed2b663..6674934c3 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -160,13 +160,10 @@ def _read(self, size):
         if self.binary:
             if np.__version__ >= '1.16.0': # sigh...
                 if self.source == sys.stdin:
-                    if size < 0:
-                        return np.fromstring( self.source.read(), dtype = self.input_dtype )
-                    else:
-                        b = sys.stdin.buffer.read( self.input_dtype.itemsize * size )
-                        # todo! test on streams where bytes come with irregular delays!
-                        if len(b) % self.input_dtype.itemsize != 0: raise TypeError( "expected records of size {}, got {} bytes, which is not divisible by record size".format( self.input_dtype.itemsize, len( b ) ) )
-                        return np.frombuffer( b, dtype = self.input_dtype, count = len( b ) // self.input_dtype.itemsize )
+                    b = sys.stdin.buffer.read( self.input_dtype.itemsize * ( size if size > 0 else self.size ) )
+                    # todo! test on streams where bytes come with irregular delays!
+                    if len(b) % self.input_dtype.itemsize != 0: raise TypeError( "expected records of size {}, got {} bytes, which is not divisible by record size".format( self.input_dtype.itemsize, len( b ) ) )
+                    return np.frombuffer( b, dtype = self.input_dtype, count = len( b ) // self.input_dtype.itemsize )
                 else:
                     return np.fromfile( self.source, dtype = self.input_dtype, count = -1 if size < 0 else size ) # this line may not be covered by regression test
             else:

From f50a03f572f66845017ec82c18f06d5971e76368 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 17 Nov 2019 22:11:18 +1100
Subject: [PATCH 0079/1056] python/comma: porting to python3; stream: throwing
 ValueError instead of TypeError; in progress...

---
 python/comma/csv/stream.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 6674934c3..0ca19e6f0 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -162,7 +162,7 @@ def _read(self, size):
                 if self.source == sys.stdin:
                     b = sys.stdin.buffer.read( self.input_dtype.itemsize * ( size if size > 0 else self.size ) )
                     # todo! test on streams where bytes come with irregular delays!
-                    if len(b) % self.input_dtype.itemsize != 0: raise TypeError( "expected records of size {}, got {} bytes, which is not divisible by record size".format( self.input_dtype.itemsize, len( b ) ) )
+                    if len(b) % self.input_dtype.itemsize != 0: raise ValueError( "expected records of size {}, got {} bytes, which is not divisible by record size".format( self.input_dtype.itemsize, len( b ) ) )
                     return np.frombuffer( b, dtype = self.input_dtype, count = len( b ) // self.input_dtype.itemsize )
                 else:
                     return np.fromfile( self.source, dtype = self.input_dtype, count = -1 if size < 0 else size ) # this line may not be covered by regression test

From 687c884aca569b4486890348f2a7a8311c2622d0 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Mon, 18 Nov 2019 10:50:18 +1100
Subject: [PATCH 0080/1056] csv-eval: !/usr/bin/env python replaced with
 /usr/bin/python until fully ported to python3

---
 python/comma/csv/applications/csv-eval | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/python/comma/csv/applications/csv-eval b/python/comma/csv/applications/csv-eval
index f170b3a22..340655a02 100644
--- a/python/comma/csv/applications/csv-eval
+++ b/python/comma/csv/applications/csv-eval
@@ -1,4 +1,5 @@
-#!/usr/bin/env python
+#!/usr/bin/python
+# todo: once fully ported to python3: !/usr/bin/env python
 
 # This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney

From 0abbe1fd5a0d396044f0f316ba2072cedf9ce241 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Mon, 18 Nov 2019 13:54:11 +1100
Subject: [PATCH 0081/1056] python/comma: porting to python3; stream: reading
 stdin conditioned on python version instead of numpy version; in progress...

---
 python/comma/csv/stream.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 0ca19e6f0..af273094d 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -158,7 +158,8 @@ def read_from_line(self, line):
 
     def _read(self, size):
         if self.binary:
-            if np.__version__ >= '1.16.0': # sigh...
+            #if np.__version__ >= '1.16.0': # sigh...
+            if sys.version_info.major > 2:
                 if self.source == sys.stdin:
                     b = sys.stdin.buffer.read( self.input_dtype.itemsize * ( size if size > 0 else self.size ) )
                     # todo! test on streams where bytes come with irregular delays!

From 87574731c73423cf1cc454ce1ff71b6f9aedfad1 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 18 Nov 2019 16:26:39 +1100
Subject: [PATCH 0082/1056] python/comma: porting to python3; stream: write():
 checking numpy version replaced with checking python version; in progress...

---
 python/comma/csv/stream.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index af273094d..1b3e5f37b 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -223,7 +223,7 @@ def write(self, s):
             msg = "size {} not equal to tied size {}".format(s.size, tied_size)
             raise ValueError(msg)
         if self.binary:
-            if np.__version__ >= '1.16.0' and self.target == sys.stdout: # sigh...
+            if sys.version_info > 2 and self.target == sys.stdout: # sigh...
                 #self.stdout.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
                 sys.stdout.buffer.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
             else:

From be459087195bca376d5961673de9275163e43612 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 18 Nov 2019 19:52:25 +1100
Subject: [PATCH 0083/1056] python/comma: porting to python3; signal: ported to
 python3; in progress...

---
 python/comma/csv/applications/csv_eval.py | 6 +++++-
 python/comma/signal/signal.py             | 6 ++++--
 2 files changed, 9 insertions(+), 3 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 6537f4721..df54118ec 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -553,9 +553,12 @@ def collect(var, fields): return '\n'.join("{v}['{f}'] = {f}".format(v=var, f=f)
     update = None
     output = None
     input = None
-    is_shutdown = comma.signal.is_shutdown()
+    is_shutdown = comma.signal.is_shutdown( verbose = stream.args.verbose )
+    if is_shutdown: print( '--> a: is shutdown', file = sys.stderr )
     if stream.args.first_line: input = stream.input.read_from_line(stream.args.first_line)
+    print( '--> b', file = sys.stderr )
     while not is_shutdown:
+        print( '--> c', file = sys.stderr )
         if input is not None:
             if size != input.size:
                 size = input.size
@@ -568,6 +571,7 @@ def collect(var, fields): return '\n'.join("{v}['{f}'] = {f}".format(v=var, f=f)
             else: stream.input.dump()
         input = stream.input.read( read_size )
         if input is None: break
+    print( '--> d', file = sys.stderr )
 
 def select(stream):
     input = None
diff --git a/python/comma/signal/signal.py b/python/comma/signal/signal.py
index efbdb0358..34ed994bb 100644
--- a/python/comma/signal/signal.py
+++ b/python/comma/signal/signal.py
@@ -43,8 +43,10 @@ def __init__( self, verbose = False ):
 
     def switch_on( self, signum, frame ):
         self.state = True
-        if self.verbose: print( os.path.basename(sys.argv[0]), "caught signal:", signum, file = sys.stderr )
+        if self.verbose: print( os.path.basename( sys.argv[0] ), ": caught signal:", signum, file = sys.stderr )
 
-    def __nonzero__( self ): return self.state
+    def __bool__( self ): return self.state
+
+    __nonzero__ = __bool__
 
 signal.signal( signal.SIGPIPE, signal.SIG_DFL )

From a877fef6bc1b94a2f6adff676f60afbc68b34365 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 18 Nov 2019 19:53:01 +1100
Subject: [PATCH 0084/1056] python/comma: porting to python3; debug output
 commented; in progress...

---
 python/comma/csv/applications/csv_eval.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index df54118ec..003cfd4ef 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -554,11 +554,11 @@ def collect(var, fields): return '\n'.join("{v}['{f}'] = {f}".format(v=var, f=f)
     output = None
     input = None
     is_shutdown = comma.signal.is_shutdown( verbose = stream.args.verbose )
-    if is_shutdown: print( '--> a: is shutdown', file = sys.stderr )
+    #if is_shutdown: print( '--> a: is shutdown', file = sys.stderr )
     if stream.args.first_line: input = stream.input.read_from_line(stream.args.first_line)
-    print( '--> b', file = sys.stderr )
+    #print( '--> b', file = sys.stderr )
     while not is_shutdown:
-        print( '--> c', file = sys.stderr )
+        #print( '--> c', file = sys.stderr )
         if input is not None:
             if size != input.size:
                 size = input.size
@@ -571,7 +571,7 @@ def collect(var, fields): return '\n'.join("{v}['{f}'] = {f}".format(v=var, f=f)
             else: stream.input.dump()
         input = stream.input.read( read_size )
         if input is None: break
-    print( '--> d', file = sys.stderr )
+    #print( '--> d', file = sys.stderr )
 
 def select(stream):
     input = None

From c761e82bd9bd3336f0f6122dbb9d8399ae329249 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 18 Nov 2019 20:19:38 +1100
Subject: [PATCH 0085/1056] python/comma: porting to python3; csv_eval: fixed
 non-backward compatible python3 change in filter semantics; in progress...

---
 python/comma/csv/applications/csv_eval.py | 44 +++++++++++------------
 1 file changed, 20 insertions(+), 24 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 003cfd4ef..1387a56c4 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -472,7 +472,7 @@ def __init__(self, args):
         if self.args.verbose: self.print_info()
 
     def initialize_input(self):
-        self.nonblank_input_fields = filter(None, self.args.fields)
+        self.nonblank_input_fields = list( filter( None, self.args.fields ) )
         if not self.nonblank_input_fields: raise csv_eval_error("please specify input stream fields, e.g. --fields=x,y")
         check_fields(self.nonblank_input_fields)
         types = comma.csv.format.to_numpy(self.args.format)
@@ -528,50 +528,46 @@ def check_output_fields(fields, input_fields):
         raise csv_eval_error(msg)
 
 def evaluate(stream):
-    def disperse(var, fields): return '\n'.join("{f} = {v}['{f}']".format(v=var, f=f) for f in fields)
-    def collect(var, fields): return '\n'.join("{v}['{f}'] = {f}".format(v=var, f=f) for f in fields)
+    def disperse( var, fields ): return '\n'.join("{f} = {v}['{f}']".format( v = var, f = f ) for f in fields )
+    def collect( var, fields ): return '\n'.join("{v}['{f}'] = {f}".format( v = var, f = f ) for f in fields )
     if stream.args.init_values == '':
         read_size = None
         init_code_string = ''
     else:
         read_size = 1
-        init_code_string = '\n'.join([stream.args.default_values,
-                                stream.args.init_values,
-                                disperse('_input', stream.nonblank_input_fields),
-                                collect('_update', stream.args.update_fields),
-                                collect('_output', stream.args.output_fields)])
-    code_string = '\n'.join([stream.args.default_values,
-                             disperse('_input', stream.nonblank_input_fields),
-                             disperse('_output', stream.args.output_fields),
-                             stream.args.expressions,
-                             collect('_update', stream.args.update_fields),
-                             collect('_output', stream.args.output_fields)])
-    init_code = compile(init_code_string, '<string>', 'exec')
-    code = compile(code_string, '<string>', 'exec')
-    env = np.__dict__ if stream.args.permissive else restricted_numpy_env()
+        init_code_string = '\n'.join( [ stream.args.default_values,
+                                        stream.args.init_values,
+                                        disperse( '_input', stream.nonblank_input_fields ),
+                                        collect( '_update', stream.args.update_fields ),
+                                        collect( '_output', stream.args.output_fields ) ] )
+    code_string = '\n'.join( [ stream.args.default_values,
+                               disperse( '_input', stream.nonblank_input_fields ),
+                               disperse( '_output', stream.args.output_fields ),
+                               stream.args.expressions,
+                               collect( '_update', stream.args.update_fields ),
+                               collect( '_output', stream.args.output_fields ) ] )
+    init_code = compile( init_code_string, '<string>', 'exec' )
+    code = compile( code_string, '<string>', 'exec' )
+    env = np.__dict__ if stream.args.permissive else restricted_numpy_env()    
     size = None
     update = None
     output = None
     input = None
     is_shutdown = comma.signal.is_shutdown( verbose = stream.args.verbose )
-    #if is_shutdown: print( '--> a: is shutdown', file = sys.stderr )
-    if stream.args.first_line: input = stream.input.read_from_line(stream.args.first_line)
-    #print( '--> b', file = sys.stderr )
+    if stream.args.first_line: input = stream.input.read_from_line( stream.args.first_line )
     while not is_shutdown:
-        #print( '--> c', file = sys.stderr )
         if input is not None:
             if size != input.size:
                 size = input.size
                 if stream.args.update_fields: update = stream.update_t(size)
                 if stream.args.output_fields: output = stream.output_t(size)
-                exec( init_code, env, {'_input': input, '_update': update, '_output': output} )
-            exec( code, env, {'_input': input, '_update': update, '_output': output} )
+                exec( init_code, env, { '_input': input, '_update': update, '_output': output } )
+            exec( code, env, { '_input': input, '_update': update, '_output': output } )
             if stream.args.update_fields: update_buffer(stream.input, update)
             if stream.args.output_fields: stream.output.write(output)
             else: stream.input.dump()
         input = stream.input.read( read_size )
         if input is None: break
-    #print( '--> d', file = sys.stderr )
 
 def select(stream):
     input = None

From 41b7c3dfbc5ab13ce0a363d8d0946fc394626e18 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 18 Nov 2019 20:30:50 +1100
Subject: [PATCH 0086/1056] python/comma: porting to python3; csv_eval, stream:
 using zip instead of itertools.izip, with potential performance deterioration;
 in progress...

---
 python/comma/csv/applications/csv_eval.py | 12 +++++++-----
 python/comma/csv/stream.py                |  6 ++++--
 2 files changed, 11 insertions(+), 7 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 1387a56c4..8582b1e05 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -28,13 +28,15 @@
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import print_function
-import sys
-import os
 import argparse
+import ast
+import itertools
 import numpy as np
+import os
 import re
-import itertools
-import ast
+import sys
+if sys.version_info.major < 3: from itertools import izip
+else: izip = zip # todo! watch performance! it's reported python3 zip is some 30% slower than izip
 import comma
 
 description = """
@@ -449,7 +451,7 @@ def update_buffer(stream, update_array):
             stream._input_array[fields[index(f)]] = update_array[f]
     else:
         def updated_lines():
-            for line, scalars in itertools.izip(stream._ascii_buffer, update_array):
+            for line, scalars in izip(stream._ascii_buffer, update_array):
                 values = line.split(stream.delimiter)
                 for f, s in zip(update_array.dtype.names, stream._strings(scalars)):
                     values[index(f)] = s
diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 1b3e5f37b..cbfc59438 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -34,6 +34,8 @@
 import os
 import sys
 import warnings
+if sys.version_info.major < 3: from itertools import izip
+else: izip = zip # todo! watch performance! it's reported python3 zip is some 30% slower than izip
 from ..util import warning
 from ..io import readlines_unbuffered
 from ..numpy import merge_arrays, types_of_dtype, structured_dtype
@@ -240,7 +242,7 @@ def write(self, s):
     def _tie_binary(self, tied_array, array): return merge_arrays(tied_array, array)
 
     def _tie_ascii(self, tied_buffer, unrolled_array):
-        for tied_line, scalars in itertools.izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + self._strings(scalars))
+        for tied_line, scalars in izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + self._strings(scalars))
 
     def _toline(self, scalars): return self.delimiter.join(self._strings(scalars))
 
@@ -273,7 +275,7 @@ def _dump_with_mask(self, mask):
         if self.binary:
             self._input_array[mask].tofile(self.target)
         else:
-            for line, allowed in itertools.izip(self._ascii_buffer, mask):
+            for line, allowed in izip(self._ascii_buffer, mask):
                 if allowed: print( line, file = self.target )
         self.target.flush()
 

From dd5882ed9ff4838041955d62f7c71f229b995176 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 18 Nov 2019 20:57:24 +1100
Subject: [PATCH 0087/1056] python/comma: porting to python3; stream: convert
 mapped results to a list, with potential performance deterioration; in
 progress...

---
 python/comma/csv/stream.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index cbfc59438..a363f31ff 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -242,9 +242,9 @@ def write(self, s):
     def _tie_binary(self, tied_array, array): return merge_arrays(tied_array, array)
 
     def _tie_ascii(self, tied_buffer, unrolled_array):
-        for tied_line, scalars in izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + self._strings(scalars))
+        for tied_line, scalars in izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + list(self._strings(scalars)))
 
-    def _toline(self, scalars): return self.delimiter.join(self._strings(scalars))
+    def _toline(self, scalars): return list(self.delimiter.join(self._strings(scalars)))
 
     def dump(self, mask=None):
         """

From d22dfa6d344f5bd03b6c85aaba0d35fee1c461e7 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 18 Nov 2019 21:13:21 +1100
Subject: [PATCH 0088/1056] python/comma: porting to python3; stream: typo
 fixed; in progress...

---
 python/comma/csv/stream.py | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index a363f31ff..cb000045f 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -160,8 +160,7 @@ def read_from_line(self, line):
 
     def _read(self, size):
         if self.binary:
-            #if np.__version__ >= '1.16.0': # sigh...
-            if sys.version_info.major > 2:
+            if sys.version_info.major > 2: #if np.__version__ >= '1.16.0': # sigh...
                 if self.source == sys.stdin:
                     b = sys.stdin.buffer.read( self.input_dtype.itemsize * ( size if size > 0 else self.size ) )
                     # todo! test on streams where bytes come with irregular delays!
@@ -225,7 +224,7 @@ def write(self, s):
             msg = "size {} not equal to tied size {}".format(s.size, tied_size)
             raise ValueError(msg)
         if self.binary:
-            if sys.version_info > 2 and self.target == sys.stdout: # sigh...
+            if sys.version_info.major > 2 and self.target == sys.stdout: # sigh...
                 #self.stdout.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
                 sys.stdout.buffer.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
             else:

From 95a9240fbe8eeed2d5a113741aa024cc9180c254 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 18 Nov 2019 22:09:46 +1100
Subject: [PATCH 0089/1056] python/comma: porting to python3; stream: _toline()
 fixed, which seems to have fixed most of the ascii tests; in progress...

---
 python/comma/csv/stream.py | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index cb000045f..a17e5443e 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -240,10 +240,14 @@ def write(self, s):
 
     def _tie_binary(self, tied_array, array): return merge_arrays(tied_array, array)
 
-    def _tie_ascii(self, tied_buffer, unrolled_array):
-        for tied_line, scalars in izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + list(self._strings(scalars)))
-
-    def _toline(self, scalars): return list(self.delimiter.join(self._strings(scalars)))
+    if sys.version_info.major < 3: # python3, sigh... don't ask
+        def _tie_ascii(self, tied_buffer, unrolled_array):
+            for tied_line, scalars in izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + self._strings(scalars))
+    else:
+        def _tie_ascii(self, tied_buffer, unrolled_array):
+            for tied_line, scalars in izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + list(self._strings(scalars)))
+
+    def _toline(self, scalars): return self.delimiter.join(self._strings(scalars))
 
     def dump(self, mask=None):
         """

From 5dd2ab16962850ee336bd6c73781f46ee32bbe38 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 19 Nov 2019 17:54:44 +1100
Subject: [PATCH 0090/1056] python/comma: porting to python3; stream: dump()
 and update_fields fixed (tobytes() and deepcopy() used respectively); in
 progress...

---
 python/comma/csv/stream.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index a17e5443e..5e685c55e 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -28,6 +28,7 @@
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import print_function
+import copy
 import functools
 import itertools
 import numpy as np
@@ -129,7 +130,7 @@ def read(self, size=None):
         if no records have been read, return None
         """
         if size is None: size = self.size
-        self._input_array = self._read(size)
+        self._input_array = copy.deepcopy( self._read( size ) ) if sys.version_info.major > 2 else self._read( size ) # todo! watch performance in python3!
         if self._input_array.size == 0: return
         return self._struct_array(self._input_array, self.missing_values)
 
@@ -258,7 +259,10 @@ def dump(self, mask=None):
 
     def _dump(self):
         if self.binary:
-            self._input_array.tofile(self.target)
+            if sys.version_info.major > 2 and self.target == sys.stdout: # sigh...
+                sys.stdout.buffer.write( self._input_array.tobytes() )
+            else:
+                self._input_array.tofile( self.target )
         else:
             for line in self._ascii_buffer: print( line, file = self.target )
         self.target.flush()

From 4d3c4dfb670dec5d1a65daf1b263822da650b4c1 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 19 Nov 2019 21:48:34 +1100
Subject: [PATCH 0091/1056] python/comma: porting to python3; stream: zip...
 replaced with list(zip...), since in python3 it returns an iterator, not a
 container; dump: tobytes used instead of tofile for stdout output; in
 progress...

---
 python/comma/csv/stream.py | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 5e685c55e..2e4ac9931 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -97,8 +97,7 @@ def __init__(self,
         self.default_values = self._default_values(default_values)
         self.missing_values = self._missing_values()
         self.data_extraction_fields = self._data_extraction_fields()
-        self.struct_and_extraction_fields = zip(self.struct.flat_dtype.names,
-                                                self.data_extraction_fields)
+        self.struct_and_extraction_fields = list( zip( self.struct.flat_dtype.names, self.data_extraction_fields ) )
         #self.write_dtype = self._write_dtype()
         #self.unrolled_write_dtype = structured_dtype( ','.join( types_of_dtype( self.write_dtype, unroll=True ) ) )
         #print( "self.write_dtype.descr = %s" % str(self.write_dtype.descr), file = sys.stderr )
@@ -280,7 +279,10 @@ def _dump_with_mask(self, mask):
             msg = "mask size {} not equal to data size {}".format(mask.size, data_size)
             raise ValueError(msg)
         if self.binary:
-            self._input_array[mask].tofile(self.target)
+            if sys.version_info.major > 2 and self.target == sys.stdout: # sigh...
+                sys.stdout.buffer.write( self._input_array[mask].tobytes() )
+            else:
+                self._input_array[mask].tofile(self.target)
         else:
             for line, allowed in izip(self._ascii_buffer, mask):
                 if allowed: print( line, file = self.target )

From 804bf7038b0af0087339cb801b28bb2e20a33d31 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 19 Nov 2019 22:44:28 +1100
Subject: [PATCH 0092/1056] python/comma: porting to python3; stream._read():
 bug fixed: if size is 0, keep it 0; in progress...

---
 python/comma/csv/stream.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 2e4ac9931..aa60094dd 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -162,7 +162,7 @@ def _read(self, size):
         if self.binary:
             if sys.version_info.major > 2: #if np.__version__ >= '1.16.0': # sigh...
                 if self.source == sys.stdin:
-                    b = sys.stdin.buffer.read( self.input_dtype.itemsize * ( size if size > 0 else self.size ) )
+                    b = sys.stdin.buffer.read( self.input_dtype.itemsize * ( size if size >= 0 else self.size ) )
                     # todo! test on streams where bytes come with irregular delays!
                     if len(b) % self.input_dtype.itemsize != 0: raise ValueError( "expected records of size {}, got {} bytes, which is not divisible by record size".format( self.input_dtype.itemsize, len( b ) ) )
                     return np.frombuffer( b, dtype = self.input_dtype, count = len( b ) // self.input_dtype.itemsize )

From 1517f75f4c5255f13db55e9fd281559872346f10 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 20 Nov 2019 21:43:12 +1100
Subject: [PATCH 0093/1056] python/comma: porting to python3;
 io.readlines_unbuffered: bug fixed: filter replaced with list( filter ); in
 progress...

---
 python/comma/io/readlines_unbuffered.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/python/comma/io/readlines_unbuffered.py b/python/comma/io/readlines_unbuffered.py
index 6e6d5d286..5e94259b7 100644
--- a/python/comma/io/readlines_unbuffered.py
+++ b/python/comma/io/readlines_unbuffered.py
@@ -42,6 +42,7 @@ def readlines_unbuffered(size, source=sys.stdin, skip_blank_lines=True):
         - a blank line is a line that has only whitespace characters or no characters
         - blank lines are not counted towards size
     """
+    print( '--> readlines_unbuffered(): size:', size, file=sys.stderr )
     if size >= 0:
         lines = []
         number_of_lines = 0
@@ -55,7 +56,7 @@ def readlines_unbuffered(size, source=sys.stdin, skip_blank_lines=True):
             number_of_lines += 1
         return lines
     if skip_blank_lines:
-        source_ = ifilter(lambda line: line.strip(), source)
+        source_ = list( ifilter(lambda line: line.strip(), source) )
     else:
         source_ = source
     return [line.rstrip('\n') for line in source_]

From cdaf88466a9191092c8a2be95ea1c9d8ca3a0803 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 20 Nov 2019 22:14:52 +1100
Subject: [PATCH 0094/1056] python/comma: porting to python3;
 io.readlines_unbuffered: debug print removed; in progress...

---
 python/comma/io/readlines_unbuffered.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/python/comma/io/readlines_unbuffered.py b/python/comma/io/readlines_unbuffered.py
index 5e94259b7..94ec2a389 100644
--- a/python/comma/io/readlines_unbuffered.py
+++ b/python/comma/io/readlines_unbuffered.py
@@ -42,7 +42,6 @@ def readlines_unbuffered(size, source=sys.stdin, skip_blank_lines=True):
         - a blank line is a line that has only whitespace characters or no characters
         - blank lines are not counted towards size
     """
-    print( '--> readlines_unbuffered(): size:', size, file=sys.stderr )
     if size >= 0:
         lines = []
         number_of_lines = 0

From c1635349618e4b41fc87253e8d20ccdceb7ca5ff Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 20 Nov 2019 22:38:36 +1100
Subject: [PATCH 0095/1056] python/comma: porting to python3; unicode string vs
 bytes: limitation resolved and documented in --help; in progress...

---
 python/comma/csv/applications/csv_eval.py                  | 7 ++++++-
 .../csv/applications/test/csv-eval/select/basic/ascii/test | 2 +-
 .../applications/test/csv-eval/select/basic/binary/test    | 2 +-
 .../applications/test/csv-eval/select/fields/ascii/test    | 2 +-
 .../applications/test/csv-eval/select/fields/binary/test   | 2 +-
 .../test/csv-eval/select/select_all/ascii/test             | 2 +-
 .../test/csv-eval/select/select_all/binary/test            | 2 +-
 7 files changed, 12 insertions(+), 7 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 8582b1e05..6acdd6a5b 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -142,9 +142,14 @@
 
 string functions:
     http://docs.scipy.org/doc/numpy/reference/routines.char.html
-
+    
     ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'n=char.count(path,"/")' --output-format=ui
     ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'r=char.replace(path,"/","_")' --output-format=s[36]
+    
+    LIMITATION: in python3, csv-eval represents strings as np.bytes_ (for consistent binary support)
+        python2: you could write: ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'n=char.count(path,"/")' --output-format=ui
+        python3: you should write: ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'n=char.count(char.decode(path),"/")' --output-format=ui
+                 for backward compatibility, use the latter variant
 
 time arithmetic:
     http://docs.scipy.org/doc/numpy/reference/arrays.datetime.html#datetime-and-timedelta-arithmetic
diff --git a/python/comma/csv/applications/test/csv-eval/select/basic/ascii/test b/python/comma/csv/applications/test/csv-eval/select/basic/ascii/test
index 714e7a66b..595d55549 100755
--- a/python/comma/csv/applications/test/csv-eval/select/basic/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/select/basic/ascii/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-eval -v --fields=a,b,name --format=2i,s[1] --select "(a < b - 1) & (name == 'y')" \
+csv-eval -v --fields=a,b,name --format=2i,s[1] --select "logical_and( a < b - 1, char.decode( name ) == 'y' )" \
     | name-value-from-csv a,b,allow --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/basic/binary/test b/python/comma/csv/applications/test/csv-eval/select/basic/binary/test
index 12baee557..cd3dafd9d 100755
--- a/python/comma/csv/applications/test/csv-eval/select/basic/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/select/basic/binary/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-to-bin 2i,s[1] | csv-eval --fields=a,b,name --binary=2i,s[1] --select "(a < b - 1) & (name == 'y')" | csv-from-bin 2i,s[1] \
+csv-to-bin 2i,s[1] | csv-eval --fields=a,b,name --binary=2i,s[1] --select "logical_and( a < b - 1, char.decode( name ) == 'y' )" | csv-from-bin 2i,s[1] \
     | name-value-from-csv a,b,allow --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/fields/ascii/test b/python/comma/csv/applications/test/csv-eval/select/fields/ascii/test
index 151033cd8..c6cc4ce90 100755
--- a/python/comma/csv/applications/test/csv-eval/select/fields/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/select/fields/ascii/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-eval -v --fields=a,b,,name --format=2i,,s[1] --select "(a < b - 1) & (name == 'y')" \
+csv-eval -v --fields=a,b,,name --format=2i,,s[1] --select "logical_and(a < b - 1, char.decode(name) == 'y')" \
     | name-value-from-csv a,b,dummy,allow,payload --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/fields/binary/test b/python/comma/csv/applications/test/csv-eval/select/fields/binary/test
index 53c017294..2bd0f5714 100755
--- a/python/comma/csv/applications/test/csv-eval/select/fields/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/select/fields/binary/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-to-bin 2i,2s[1],ui | csv-eval -v --fields=a,b,,name --binary=2i,2s[1],ui --select "(a < b - 1) & (name == 'y')" | csv-from-bin 2i,2s[1],ui \
+csv-to-bin 2i,2s[1],ui | csv-eval -v --fields=a,b,,name --binary=2i,2s[1],ui --select "logical_and(a < b - 1, char.decode(name) == 'y')" | csv-from-bin 2i,2s[1],ui \
     | name-value-from-csv a,b,dummy,allow,payload --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/select_all/ascii/test b/python/comma/csv/applications/test/csv-eval/select/select_all/ascii/test
index a7ba750aa..581b09f4f 100755
--- a/python/comma/csv/applications/test/csv-eval/select/select_all/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/select/select_all/ascii/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-eval --fields=a,b,name --format=2i,s[1] --select "(a < b) & ( name == 'y')" \
+csv-eval --fields=a,b,name --format=2i,s[1] --select "(a < b) & ( char.decode(name) == 'y')" \
     | name-value-from-csv a,b,allow --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/select_all/binary/test b/python/comma/csv/applications/test/csv-eval/select/select_all/binary/test
index 6f22710aa..5d339db17 100755
--- a/python/comma/csv/applications/test/csv-eval/select/select_all/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/select/select_all/binary/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-to-bin 2i,s[1] | csv-eval --fields=a,b,name --binary=2i,s[1] --select "(a < b) & ( name == 'y')" | csv-from-bin 2i,s[1] \
+csv-to-bin 2i,s[1] | csv-eval --fields=a,b,name --binary=2i,s[1] --select "(a < b) & ( char.decode(name) == 'y')" | csv-from-bin 2i,s[1] \
     | name-value-from-csv a,b,allow --line-number --prefix output | sed 's/"//g'

From eec858c3e687de0b052b9e42d7c3bf4871ce7f79 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 20 Nov 2019 22:59:57 +1100
Subject: [PATCH 0096/1056] python/comma: porting to python3; unicode string vs
 bytes: more tests fixed and examples added to --help; in progress...

---
 python/comma/csv/applications/csv_eval.py                     | 4 ++++
 .../csv/applications/test/csv-eval/default_format/ascii/test  | 2 +-
 .../csv/applications/test/csv-eval/strings/count/ascii/test   | 2 +-
 .../csv/applications/test/csv-eval/strings/count/binary/test  | 2 +-
 4 files changed, 7 insertions(+), 3 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 6acdd6a5b..7e2ad7a07 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -150,6 +150,10 @@
         python2: you could write: ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'n=char.count(path,"/")' --output-format=ui
         python3: you should write: ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'n=char.count(char.decode(path),"/")' --output-format=ui
                  for backward compatibility, use the latter variant
+        it may lead to ugly constructs for python3:
+            python2: csv-eval --fields=s --format s[36] 'u=char.upper(name)' --output-format=s[36]
+            python3: csv-eval --fields=s --format s[36] 'u=char.encode(char.upper(char.decode(name)))' --output-format=s[36]
+        but unfortunately, this limitation is unlikely to go away
 
 time arithmetic:
     http://docs.scipy.org/doc/numpy/reference/arrays.datetime.html#datetime-and-timedelta-arithmetic
diff --git a/python/comma/csv/applications/test/csv-eval/default_format/ascii/test b/python/comma/csv/applications/test/csv-eval/default_format/ascii/test
index 4c5bc4761..33e23bfaa 100755
--- a/python/comma/csv/applications/test/csv-eval/default_format/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/default_format/ascii/test
@@ -1,3 +1,3 @@
 #!/bin/bash
 
-csv-eval --fields=,path,x,name --format ,s[36],,s[4] 'n=char.count(path,"/");y=x+1;uname=char.upper(name)' --output-format=s[36],,s[4] | name-value-from-csv blank,path,x,name,n,y,uname --line-number --prefix output | tr -d '"'
+csv-eval --fields=,path,x,name --format ,s[36],,s[4] 'n=char.count(char.decode(path),"/");y=x+1;uname=char.encode(char.upper(char.decode(name)))' --output-format=s[36],,s[4] | name-value-from-csv blank,path,x,name,n,y,uname --line-number --prefix output | tr -d '"'
diff --git a/python/comma/csv/applications/test/csv-eval/strings/count/ascii/test b/python/comma/csv/applications/test/csv-eval/strings/count/ascii/test
index 95fb5eaca..8b3efe3b6 100755
--- a/python/comma/csv/applications/test/csv-eval/strings/count/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/strings/count/ascii/test
@@ -1,3 +1,3 @@
 #!/bin/bash
 
-csv-eval --fields=,path --format i,s[36],ui,s[4] 'n=char.count(path,"/")' --output-format=s[36] | name-value-from-csv x,path,num,string,n --line-number --prefix output | tr -d '"'
+csv-eval --fields=,path --format i,s[36],ui,s[4] 'n=char.count(char.decode(path),"/")' --output-format=s[36] | name-value-from-csv x,path,num,string,n --line-number --prefix output | tr -d '"'
diff --git a/python/comma/csv/applications/test/csv-eval/strings/count/binary/test b/python/comma/csv/applications/test/csv-eval/strings/count/binary/test
index 0cf2f3691..e44699078 100755
--- a/python/comma/csv/applications/test/csv-eval/strings/count/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/strings/count/binary/test
@@ -1,3 +1,3 @@
 #!/bin/bash
 
-csv-to-bin i,s[36],ui,s[4] | csv-eval --fields=,path --binary i,s[36],ui,s[4] 'n=char.count(path,"/")' --output-format=s[36] | csv-from-bin i,s[36],ui,s[4],s[36] | name-value-from-csv x,path,num,string,n --line-number --prefix output | tr -d '"'
+csv-to-bin i,s[36],ui,s[4] | csv-eval --fields=,path --binary i,s[36],ui,s[4] 'n=char.count(char.decode(path),"/")' --output-format=s[36] | csv-from-bin i,s[36],ui,s[4],s[36] | name-value-from-csv x,path,num,string,n --line-number --prefix output | tr -d '"'

From a7f8742e269fa30e561ba426afae201bb8532fab Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 21 Nov 2019 09:16:53 +1100
Subject: [PATCH 0097/1056] python/comma: porting to python3;
 name_value/test/eval: test case fixed: integer division: // used instead of
 /; in progress...

---
 name_value/test/eval/data/input_3 | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/name_value/test/eval/data/input_3 b/name_value/test/eval/data/input_3
index 936c66d69..e3bd4042d 100644
--- a/name_value/test/eval/data/input_3
+++ b/name_value/test/eval/data/input_3
@@ -7,4 +7,4 @@ x != 3
 x != "some string"
 
 # integer division
-x = 11 / 5
+x = 11 // 5

From 66d328dc4717b4f5bf896ebffd71689960c7c4fa Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 21 Nov 2019 09:35:32 +1100
Subject: [PATCH 0098/1056] python/comma: porting to python3; stream.py:
 warnings seem to be buggy in python3.7; use print for now; in progress...

---
 python/comma/csv/stream.py | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index aa60094dd..afa5c7e64 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -290,8 +290,10 @@ def _dump_with_mask(self, mask):
 
     def _warn(self, msg, verbose=True):
         if verbose:
-            with warning(custom_formatwarning) as warn:
-                warn(msg)
+            if sys.version_info.major < 3: # sigh, something is broken at least in python3.7; dumb it down for now
+                with warning(custom_formatwarning) as warn: warn(msg)
+            else:
+                print( 'stream.py: warning:', msg, file=sys.stderr )
 
     def _struct(self, s):
         if not isinstance(s, struct):

From 15e703a21c5e5f607a71a8b9e9f9d0c6d836b46c Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 22 Nov 2019 12:10:48 +1100
Subject: [PATCH 0099/1056] python/comma: porting to python3; name-value-eval:
 test fixed in a quick and dirty manner; by rights, the whole test is too rigid
 and needs to be fully rewritten; porting more or less done

---
 name_value/test/eval/data/stderr_13 |  3 ++-
 name_value/test/eval/data/stderr_14 |  3 ++-
 name_value/test/eval/data/stderr_27 |  3 ++-
 name_value/test/eval/data/stderr_8  |  3 ++-
 name_value/test/eval/test           | 16 ++++++++++++----
 5 files changed, 20 insertions(+), 8 deletions(-)

diff --git a/name_value/test/eval/data/stderr_13 b/name_value/test/eval/data/stderr_13
index 49a434b97..ec96e98a6 100644
--- a/name_value/test/eval/data/stderr_13
+++ b/name_value/test/eval/data/stderr_13
@@ -1 +1,2 @@
-name-value-eval: line 1: AttributeError: OBJ instance has no attribute 'whatever'
+python2:name-value-eval: line 1: AttributeError: OBJ instance has no attribute 'whatever'
+python3:name-value-eval: line 1: AttributeError: 'OBJ' object has no attribute 'whatever'
\ No newline at end of file
diff --git a/name_value/test/eval/data/stderr_14 b/name_value/test/eval/data/stderr_14
index 224f578e7..cfa22eede 100644
--- a/name_value/test/eval/data/stderr_14
+++ b/name_value/test/eval/data/stderr_14
@@ -1 +1,2 @@
-name-value-eval: line 2: AttributeError: OBJ instance has no attribute '__getitem__'
+python2:name-value-eval: line 2: AttributeError: OBJ instance has no attribute '__getitem__'
+python3:name-value-eval: line 2: TypeError: 'OBJ' object does not support indexing
\ No newline at end of file
diff --git a/name_value/test/eval/data/stderr_27 b/name_value/test/eval/data/stderr_27
index 811dc83b2..e2105bdbe 100644
--- a/name_value/test/eval/data/stderr_27
+++ b/name_value/test/eval/data/stderr_27
@@ -1 +1,2 @@
-name-value-eval: TypeError: variable "route" is used in an expression but is an object (example: "a/b = 3; a < 0")
+python2:name-value-eval: TypeError: variable "route" is used in an expression but is an object (example: "a/b = 3; a < 0")
+python3:name-value-eval: line 1: TypeError: unorderable types: OBJ() > int()
\ No newline at end of file
diff --git a/name_value/test/eval/data/stderr_8 b/name_value/test/eval/data/stderr_8
index 790deb67b..0570fd918 100644
--- a/name_value/test/eval/data/stderr_8
+++ b/name_value/test/eval/data/stderr_8
@@ -1 +1,2 @@
-name-value-eval: line 1: TypeError: cannot concatenate 'str' and 'int' objects
+python2:name-value-eval: line 1: TypeError: cannot concatenate 'str' and 'int' objects
+python3:name-value-eval: line 1: TypeError: Can't convert 'int' object to str implicitly
\ No newline at end of file
diff --git a/name_value/test/eval/test b/name_value/test/eval/test
index b6f7de6e9..580bdc23a 100755
--- a/name_value/test/eval/test
+++ b/name_value/test/eval/test
@@ -11,7 +11,8 @@ if [[ ! -d "$data_dir" ]]; then
 fi
 
 tmpdir="output/tmp"
-mkdir $tmpdir
+rm -rf $tmpdir
+mkdir $tmpdir -p
 verbose=0
 
 while [[ $# -gt 0 ]]; do
@@ -27,6 +28,8 @@ done
 variables="$data_dir/variable_vals"
 pass_count=0
 total_count=0
+python_version="$( python -c "from __future__ import print_function; import sys; print( sys.version_info.major )" )" # sigh...
+python_prefix="python${python_version}:"
 
 for input in $data_dir/input*; do
     (( ++total_count ))
@@ -34,13 +37,18 @@ for input in $data_dir/input*; do
     if (( verbose )); then echo "$name: running test $suffix" >&2; fi
     stdout="$tmpdir/stdout.$suffix"
     stderr="$tmpdir/stderr.$suffix"
+    if grep -q "$python_prefix" < "$data_dir/stderr_$suffix"; then
+        expected_stderr="$( grep "^$python_prefix" < "$data_dir/stderr_$suffix" | sed "s#^$python_prefix##" )" # quick and dirty; sigh...
+    else
+        expected_stderr="$( cat "$data_dir/stderr_$suffix" )"
+    fi
     cat $input | name-value-eval --variables=$variables --test > $stdout 2> $stderr
+    actual_stderr=$( cat $stderr )
     if ! cmp --quiet $stdout $data_dir/stdout_$suffix; then
         echo "$name: test failed for input_$suffix (stdout is different):" >&2
         diff $stdout $data_dir/stdout_$suffix >&2
-    elif ! cmp --quiet $stderr $data_dir/stderr_$suffix; then
-        echo "$name: test failed for input_$suffix (stderr is different):" >&2
-        diff $stderr $data_dir/stderr_$suffix >&2
+    elif ! cmp --quiet <( echo "$actual_stderr" ) <( echo "$expected_stderr" ); then
+        diff <( echo "$actual_stderr" ) <( echo "$expected_stderr" ) >&2
     else
         (( ++pass_count ))
         if (( verbose )); then echo "$name: test $suffix passed" >&2; fi

From ad42b42793f9c928106bc833996e743cba96bc97 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 10 Dec 2019 13:04:03 +1100
Subject: [PATCH 0100/1056] application/command_line_options: bug fixed: now
 allows unnamed values; unit test added

---
 .../test/comma-options-validate/expected      | 18 ++++++++++++++++++
 .../test/comma-options-validate/input         | 19 +++++++++++++++++++
 application/command_line_options.cpp          |  1 +
 3 files changed, 38 insertions(+)
 create mode 100644 application/applications/test/comma-options-validate/expected
 create mode 100644 application/applications/test/comma-options-validate/input

diff --git a/application/applications/test/comma-options-validate/expected b/application/applications/test/comma-options-validate/expected
new file mode 100644
index 000000000..5840f904e
--- /dev/null
+++ b/application/applications/test/comma-options-validate/expected
@@ -0,0 +1,18 @@
+valid_options/valueless[0]/status=0
+valid_options/valueless[1]/status=0
+valid_options/valueless[2]/status=0
+valid_options/valueless[3]/status=0
+valid_options/valueless[4]/status=0
+valid_options/valueless[5]/status=0
+valid_options/valued[0]/status=0
+valid_options/valued[1]/status=0
+valid_options/valued[2]/status=0
+valid_options/valued[3]/status=0
+valid_options/valued[4]/status=0
+valid_options/valued[5]/status=0
+invalid_options/valueless[0]/status=1
+invalid_options/valueless[1]/status=1
+invalid_options/valueless[2]/status=1
+invalid_options/valueless[3]/status=1
+invalid_options/valued[0]/status=1
+invalid_options/valued[1]/status=1
diff --git a/application/applications/test/comma-options-validate/input b/application/applications/test/comma-options-validate/input
new file mode 100644
index 000000000..4782830e9
--- /dev/null
+++ b/application/applications/test/comma-options-validate/input
@@ -0,0 +1,19 @@
+valid_options/valueless[0]="echo '--verbose,-v' | comma-options-validate -v"
+valid_options/valueless[1]="echo '--verbose,-v' | comma-options-validate hello -v"
+valid_options/valueless[2]="echo '--verbose,-v' | comma-options-validate -v world"
+valid_options/valueless[3]="echo '--verbose,-v' | comma-options-validate -v hello world"
+valid_options/valueless[4]="echo '--verbose,-v' | comma-options-validate -v -"
+valid_options/valueless[5]="echo '--verbose,-v' | comma-options-validate - -v"
+valid_options/valued[0]="echo '--file,-f=<v>' | comma-options-validate -f -5"
+valid_options/valued[1]="echo '--file,-f=<v>' | comma-options-validate -f -5 6"
+valid_options/valued[2]="echo '--file,-f=<v>' | comma-options-validate 4 -f -5"
+valid_options/valued[3]="echo '--file,-f=<v>' | comma-options-validate 4 -f -5 6"
+valid_options/valued[4]="echo '--file,-f=<v>' | comma-options-validate -f -5 -"
+valid_options/valued[5]="echo '--file,-f=<v>' | comma-options-validate - -f -5"
+
+invalid_options/valueless[0]="echo '--verbose,-v' | comma-options-validate -v -g"
+invalid_options/valueless[1]="echo '--verbose,-v' | comma-options-validate hello -g -v"
+invalid_options/valueless[2]="echo '--verbose,-v' | comma-options-validate -v -g world"
+invalid_options/valueless[3]="echo '--verbose,-v' | comma-options-validate -v world -g"
+invalid_options/valued[0]="echo '--file,-f=<v>' | comma-options-validate -g -f 5"
+invalid_options/valued[1]="echo '--file,-f=<v>' | comma-options-validate -f 5 -g"
diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index f7b3e601d..ecbff9b45 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -195,6 +195,7 @@ void command_line_options::assert_valid( const std::vector< description >& d, bo
     for( unsigned int i = 0; i < d.size(); ++i ) { for( unsigned int j = 0; j < d[i].names.size(); ++j ) { m[ d[i].names[j] ] = d[i].has_value; } }
     for( unsigned int i = 1; i < argv_.size(); ++i )
     {
+        if( !boost::regex_match( argv_[i], boost::regex( "-.+" ) ) ) { continue; }
         auto it = m.find( argv_[i] );
         if( it == m.end() ) { COMMA_THROW( comma::exception, "unknown option " << argv_[i] ); }
         if( it->second ) { ++i; }

From 7638273ebb70d980986747d1330e4e70167455ac Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 10 Dec 2019 17:28:59 +1100
Subject: [PATCH 0101/1056] application/applications/test/test added

---
 application/applications/test/test | 6 ++++++
 1 file changed, 6 insertions(+)
 create mode 100755 application/applications/test/test

diff --git a/application/applications/test/test b/application/applications/test/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/application/applications/test/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands

From cc5acabe3391f03749a3a1abeb05a94ab8226db4 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 19 Dec 2019 17:38:08 +1100
Subject: [PATCH 0102/1056] csv/stream: passed::write( v ) implemented

---
 csv/stream.h             | 91 +++++++++++++++++++++++++++++-----------
 csv/test/stream_test.cpp | 26 +++++++++++-
 2 files changed, 91 insertions(+), 26 deletions(-)

diff --git a/csv/stream.h b/csv/stream.h
index c862c011b..2f7ba849e 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -436,11 +436,26 @@ template < typename S >
 class passed
 {
     public:
-        passed( const input_stream< S >& is, std::ostream& os, bool flush=false ) : is_( is ), os_( os ), flush(flush)
-        {
-            #ifdef WIN32
-            if( is_.is_binary() && os == std::cout ) { _setmode( _fileno( stdout ), _O_BINARY ); }
-            #endif // #ifdef WIN32
+        passed( const input_stream< S >& is, std::ostream& os, bool flush = false );
+
+        void write();
+        
+        void write( const S& s );
+
+    private:
+        const input_stream< S >& is_;
+        std::ostream& os_;
+        std::string buffer_;
+        bool flush;
+        bool is_stdout_;
+};
+
+template < typename S >
+inline passed< S >::passed( const input_stream< S >& is, std::ostream& os, bool flush ) : is_( is ), os_( os ), flush( flush )
+{
+    #ifdef WIN32
+    if( is_.is_binary() && os == std::cout ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+    #endif // #ifdef WIN32
 // In using view-points in 'pass' mode there were issues with the write method.
 // How to reproduce: take some nav data in t,6d format. Store as in.bin and other.bin.
 //
@@ -485,29 +500,57 @@ class passed
 //  - according to git grep, only view-points was using this class template at the moment; therefore,
 //    the change is very localized and we preserve it in this class
 //  - however, all the other similar modifications have been commented out using /// symbol
-            is_stdout_ = os.rdbuf() == std::cout.rdbuf();
-        }
+    is_stdout_ = os.rdbuf() == std::cout.rdbuf();
+}
 
-        void write()
+template < typename S >
+inline void passed< S >::write()
+{
+    if( is_.is_binary() )
+    {
+        if( is_stdout_ )
         {
-            if( is_.is_binary() ) {
-                if ( is_stdout_ ) {
-                    ::write( 1, is_.binary().last(), is_.binary().size() );
-                    if(flush) { ::fflush( stdout ); }
-                } else {
-                    os_.write( is_.binary().last(), is_.binary().size() );
-                    if(flush) { os_.flush(); }
-                }
-            }
-            else os_ << comma::join( is_.ascii().last(), is_.ascii().ascii().delimiter() ) << std::endl;
+            ::write( 1, is_.binary().last(), is_.binary().size() );
+            if( flush ) { ::fflush( stdout ); }
         }
+        else
+        {
+            os_.write( is_.binary().last(), is_.binary().size() );
+            if( flush ) { os_.flush(); }
+        }
+    }
+    else
+    {
+        os_ << comma::join( is_.ascii().last(), is_.ascii().ascii().delimiter() ) << std::endl;
+    }
+}
 
-    private:
-        const input_stream< S >& is_;
-        std::ostream& os_;
-        bool flush;
-        bool is_stdout_;
-};
+template < typename S >
+inline void passed< S >::write( const S& s )
+{
+    if( is_.is_binary() )
+    {
+        buffer_.resize( is_.binary().size() );
+        ::memcpy( &buffer_[0], is_.binary().last(), is_.binary().size() ); // quick and dirty
+        is_.binary().binary().put( s, &buffer_[0] );
+        if( is_stdout_ )
+        {
+            ::write( 1, &buffer_[0], is_.binary().size() );
+            if( flush ) { ::fflush( stdout ); }
+        }
+        else
+        {
+            os_.write( &buffer_[0], is_.binary().size() );
+            if( flush ) { os_.flush(); }
+        }
+    }
+    else
+    {
+        std::vector< std::string > v = is_.ascii().last();
+        is_.ascii().ascii().put( s, v );
+        os_ << comma::join( v, is_.ascii().ascii().delimiter() ) << std::endl;
+    }
+}
 
 template < typename S >
 inline ascii_input_stream< S >::ascii_input_stream( std::istream& is, const std::string& column_names, char delimiter, bool full_path_as_name, const S& sample )
diff --git a/csv/test/stream_test.cpp b/csv/test/stream_test.cpp
index bef1731db..04a788baf 100644
--- a/csv/test/stream_test.cpp
+++ b/csv/test/stream_test.cpp
@@ -100,7 +100,7 @@ TEST( csv, container )
         test_container sample; sample.vector = std::vector< int >( 5, 1 );
         comma::csv::input_stream< test_container > istream( iss, csv, sample );
         const test_container *c = istream.read();
-        EXPECT_EQ( c->vector.size(), 5 );
+        EXPECT_EQ( int( c->vector.size() ), 5 );
         std::string so = comma::join( c->vector, ',' );
         EXPECT_EQ( so, "2,3,1,1,6" );
     }
@@ -111,11 +111,33 @@ TEST( csv, container )
         c.vector[1] = 5;
         c.vector[2] = 3;
         ostream.write( c );
-        EXPECT_EQ( c.vector.size(), 5 );
+        EXPECT_EQ( int( c.vector.size() ), 5 );
         EXPECT_EQ( oss.str(), "1,5,3,1,1\n" );
     }
 }
 
+TEST( csv, passed_ascii )
+{
+    {
+        std::istringstream iss( "1,2\n3,4" );
+        comma::csv::input_stream< test_struct > is( iss );
+        std::ostringstream oss;
+        comma::csv::passed< test_struct > p( is, oss );
+        is.read();
+        p.write();
+        EXPECT_EQ( "1,2\n", oss.str() );
+        is.read();
+        p.write();
+        EXPECT_EQ( "1,2\n3,4\n", oss.str() );
+        is.read();
+        p.write( test_struct( 10, 20 ) );
+        EXPECT_EQ( "1,2\n3,4\n10,20\n", oss.str() );
+    }
+    {
+        // todo! binary test
+    }
+}
+
 } } } // namespace comma { namespace csv { namespace stream_test {
 
 namespace comma { namespace csv { namespace stream_test {

From c180f35d35062cb38c43008def19c895785912a5 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Mon, 30 Dec 2019 12:10:59 +1100
Subject: [PATCH 0103/1056] application: unit test added

---
 application/test/application_test.cpp | 36 +++++++++++++++++++++++----
 1 file changed, 31 insertions(+), 5 deletions(-)

diff --git a/application/test/application_test.cpp b/application/test/application_test.cpp
index 037ae84e0..f3cfd2481 100644
--- a/application/test/application_test.cpp
+++ b/application/test/application_test.cpp
@@ -118,6 +118,32 @@ TEST( application, unnamed )
             EXPECT_EQ( free[5], "free5" );
         }
     }
+    {
+        std::vector< std::string > argv;
+        argv.push_back( "application" );
+        argv.push_back( "--no-value" );
+        argv.push_back( "--value" );
+        argv.push_back( "some-value" );
+        comma::command_line_options options( argv );
+        {
+            std::vector< std::string > unnamed = options.unnamed( "--no-value", "-.*" );
+            EXPECT_EQ( 0u, unnamed.size() );
+        }
+    }
+    {
+        std::vector< std::string > argv;
+        argv.push_back( "application" );
+        argv.push_back( "unnamed" );
+        argv.push_back( "--no-value" );
+        argv.push_back( "--value" );
+        argv.push_back( "x,y,z" );
+        comma::command_line_options options( argv );
+        {
+            std::vector< std::string > unnamed = options.unnamed( "--no-value", "-.*" );
+            EXPECT_EQ( 1u, unnamed.size() );
+            EXPECT_EQ( "unnamed", unnamed[0] );
+        }
+    }
     // TODO: definitely more tests!
 }
 
@@ -180,7 +206,7 @@ TEST( application, command_line_options_description_parsing )
 {
     {
         comma::command_line_options::description d = comma::command_line_options::description::from_string( "--verbose" );
-        EXPECT_EQ( 1, d.names.size() );
+        EXPECT_EQ( 1u, d.names.size() );
         EXPECT_EQ( "--verbose", d.names[0] );
         EXPECT_FALSE( d.has_value );
         EXPECT_TRUE( d.is_optional );
@@ -188,7 +214,7 @@ TEST( application, command_line_options_description_parsing )
     }
     {
         comma::command_line_options::description d = comma::command_line_options::description::from_string( "--verbose,-v" );
-        EXPECT_EQ( 2, d.names.size() );
+        EXPECT_EQ( 2u, d.names.size() );
         EXPECT_EQ( "--verbose", d.names[0] );
         EXPECT_EQ( "-v", d.names[1] );
         EXPECT_FALSE( d.has_value );
@@ -197,7 +223,7 @@ TEST( application, command_line_options_description_parsing )
     }
     {
         comma::command_line_options::description d = comma::command_line_options::description::from_string( "--filename,-f=<filename>; some filename" );
-        EXPECT_EQ( 2, d.names.size() );
+        EXPECT_EQ( 2u, d.names.size() );
         EXPECT_EQ( "--filename", d.names[0] );
         EXPECT_EQ( "-f", d.names[1] );
         EXPECT_TRUE( d.has_value );
@@ -207,7 +233,7 @@ TEST( application, command_line_options_description_parsing )
     }
     {
         comma::command_line_options::description d = comma::command_line_options::description::from_string( "--filename,-f=[<filename>]; some filename" );
-        EXPECT_EQ( 2, d.names.size() );
+        EXPECT_EQ( 2u, d.names.size() );
         EXPECT_EQ( "--filename", d.names[0] );
         EXPECT_EQ( "-f", d.names[1] );
         EXPECT_TRUE( d.has_value );
@@ -226,7 +252,7 @@ void check_default_value( const std::string& line, const std::string& default_va
 {
     typedef comma::command_line_options::description description;
     description d = description::from_string( line );
-    EXPECT_EQ( 2, d.names.size() );
+    EXPECT_EQ( 2u, d.names.size() );
     EXPECT_EQ( "--filename", d.names[0] );
     EXPECT_EQ( "-f", d.names[1] );
     EXPECT_TRUE( d.has_value );

From 889b42ac28c44a0280304f6556c936d2db88a6ef Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 7 Jan 2020 12:18:19 +1100
Subject: [PATCH 0104/1056] csv-enumerate: refactored to make adding more
 output features easier

---
 csv/applications/csv-enumerate.cpp | 53 +++++++++++++++++-------------
 1 file changed, 31 insertions(+), 22 deletions(-)

diff --git a/csv/applications/csv-enumerate.cpp b/csv/applications/csv-enumerate.cpp
index ff5d4955a..3fd3ee910 100644
--- a/csv/applications/csv-enumerate.cpp
+++ b/csv/applications/csv-enumerate.cpp
@@ -61,6 +61,22 @@ static void usage( bool verbose )
     exit( 0 );
 }
 
+struct output
+{
+    comma::uint32 id;
+    output( comma::uint32 id = 0 ): id( id ) {}
+};
+
+namespace comma { namespace visiting {
+
+template <> struct traits< output >
+{
+    template < typename K, typename V > static void visit( const K&, const output& p, V& v ) { v.apply( "id", p.id ); }
+    template < typename K, typename V > static void visit( const K&, output& p, V& v ) { v.apply( "id", p.id ); }
+};
+
+} } // namespace comma { namespace visiting {
+
 int main( int ac, char** av )
 {
     typedef comma::csv::impl::unstructured input_t;
@@ -94,10 +110,6 @@ int main( int ac, char** av )
         }
         if( verbose ) { std::cerr << "csv-enumerate: fields " << csv.fields << " interpreted as: " << comma::join( v, ',' ) << std::endl; }
         csv.fields = comma::join( v, ',' );
-        comma::csv::input_stream< input_t > istream( std::cin, csv, default_input );
-        #ifdef WIN32
-        if( istream.is_binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
-        #endif
         static map_t map;
         comma::uint32 id = 0;
         if( !first_line.empty() )
@@ -106,6 +118,15 @@ int main( int ac, char** av )
             map[ comma::csv::ascii< input_t >( csv, default_input ).get( first_line ) ] = std::make_pair( id++, 1 );
             if( !output_map ) { std::cout << first_line << csv.delimiter << 0 << std::endl; }
         }
+        comma::csv::options output_csv;
+        output_csv.delimiter = csv.delimiter;
+        if( csv.binary() ) { output_csv.format( comma::csv::format::value< output >() ); }
+        comma::csv::input_stream< input_t > istream( std::cin, csv, default_input );
+        comma::csv::output_stream< output > ostream( std::cout, output_csv );
+        comma::csv::tied< input_t, output > tied( istream, ostream );
+        #ifdef WIN32
+        if( istream.is_binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        #endif
         while( istream.ready() || std::cin.good() )
         {
             const input_t* p = istream.read();
@@ -113,26 +134,14 @@ int main( int ac, char** av )
             map_t::iterator it = map.find( *p );
             comma::uint32 cur = id;
             if( it == map.end() ) { map[ *p ] = std::make_pair( id++, 1 ); } else { cur = it->second.first; ++( it->second.second ); }
-            if( !output_map )
-            {
-                if( csv.binary() )
-                {
-                    std::cout.write( istream.binary().last(), csv.format().size() );
-                    std::cout.write( reinterpret_cast< const char* >( &cur ), sizeof( comma::uint32 ) );
-                    if( csv.flush ) { std::cout.flush(); }
-                }
-                else
-                {
-                    std::cout << comma::join( istream.ascii().last(), csv.delimiter ) << csv.delimiter << cur << std::endl;
-                }
-            }
+            if( !output_map ) { tied.append( output( cur ) ); }
         }
         if( !output_map ) { return 0; }
-        comma::csv::options output_csv;
-        output_csv.delimiter = csv.delimiter;
-        if( csv.binary() ) { output_csv.format( comma::csv::format::value< input_t >( default_input ) + ",2ui" ); }
-        comma::csv::output_stream< map_t::value_type > ostream( std::cout, output_csv, std::make_pair( default_input, std::make_pair( 0, 0 ) ) );
-        for( map_t::const_iterator it = map.begin(); it != map.end(); ++it ) { ostream.write( *it ); }
+        comma::csv::options output_map_csv;
+        output_map_csv.delimiter = csv.delimiter;
+        if( csv.binary() ) { output_map_csv.format( comma::csv::format::value< input_t >( default_input ) + ",2ui" ); }
+        comma::csv::output_stream< map_t::value_type > omstream( std::cout, output_map_csv, std::make_pair( default_input, std::make_pair( 0, 0 ) ) );
+        for( map_t::const_iterator it = map.begin(); it != map.end(); ++it ) { omstream.write( *it ); }
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << "csv-enumerate: " << ex.what() << std::endl; }

From 777bfd1adea19d91d712958eeaf006469b3a431e Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 7 Jan 2020 12:22:04 +1100
Subject: [PATCH 0105/1056] csv-enumerate: --verbose documented

---
 csv/applications/csv-enumerate.cpp | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-enumerate.cpp b/csv/applications/csv-enumerate.cpp
index 3fd3ee910..82a3e89c9 100644
--- a/csv/applications/csv-enumerate.cpp
+++ b/csv/applications/csv-enumerate.cpp
@@ -54,9 +54,10 @@ static void usage( bool verbose )
     std::cerr << "                            - list of input key values; in same binary as input" << std::endl;
     std::cerr << "                            - corresponding enumeration index as ui" << std::endl;
     std::cerr << "                            - number of values for this enumeration index as ui" << std::endl;
+    std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options" << std::endl;
-    if( verbose ) { std::cerr << comma::csv::options::usage() << std::endl; } else { std::cerr << "    run csv-enumerate --help --verbose for more..." << std::endl; }
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }

From 7cfc1c7ee7c8bc7c5e2edecd132cf198dd55bae8 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 8 Jan 2020 14:33:24 +1100
Subject: [PATCH 0106/1056] csv-split: --files: explicit mapping of ids to
 filenames implemented

---
 csv/applications/csv-split.cpp   | 26 +++++-----
 csv/applications/split/split.cpp | 83 ++++++++++++++++++++++++++------
 csv/applications/split/split.h   |  3 +-
 3 files changed, 84 insertions(+), 28 deletions(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index ab3a68c15..c9cfc9477 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -37,7 +37,6 @@
 
 #include <boost/optional.hpp>
 #include <boost/program_options.hpp>
-#include "../../application/contact_info.h"
 #include "../../csv/impl/program_options.h"
 #include "../../csv/traits.h"
 #include "split/split.h"
@@ -115,7 +114,12 @@ int main( int argc, char** argv )
             std::cerr << "    split by block field, output to files" << std::endl;
             std::cerr << "        if block field present in --fields:" << std::endl;
             std::cerr << "        output records with this block to a separate file, on change of block, open a new file, e.g. 0.csv, 1.csv, etc" << std::endl;
-            std::cerr << "        example: ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block" << std::endl;
+            std::cerr << "        by block with default filenames, e.g:" << std::endl;
+            std::cerr << "            ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block" << std::endl;
+            std::cerr << "        by block with specified filenames" << std::endl;
+            std::cerr << "            ( echo 0; echo 1; echo 2 ) | csv-split --fields block --files <( echo a; echo b; echo c )" << std::endl;
+            std::cerr << "        by block with filenames mapped to block ids" << std::endl;
+            std::cerr << "            ( echo 0; echo 1; echo 2 ) | csv-split --fields block --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'" << std::endl;
             std::cerr << std::endl;
             std::cerr << "    split by t field, output to files" << std::endl;
             std::cerr << "        if t (timestamp) field present in --fields:" << std::endl;
@@ -126,17 +130,17 @@ int main( int argc, char** argv )
             std::cerr << "        if output streams (see example below) are present on the command line and id field present in --fields:" << std::endl;
             std::cerr << "        output records with the given ids to the corresponding streams, while outputing the rest into files" << std::endl;
             std::cerr << "        records with ids for which output stream is not specified will be discarded, unless ... stream is specified:" << std::endl;
-	    std::cerr << std::endl;
-	    std::cerr << "        outputs: <keys>;<stream>; to send records with a given set of ids to this stream" << std::endl;
+            std::cerr << std::endl;
+            std::cerr << "        outputs: <keys>;<stream>; to send records with a given set of ids to this stream" << std::endl;
             std::cerr << "            keys:" << std::endl;
             std::cerr << "                <id>[,<id>]*: comma-separated list of ids, e.g: '5' or '2,5,7', etc" << std::endl;
             std::cerr << "                ...: three dots mean: send to this stream all the records with ids for which no other stream is specified (see example below)" << std::endl;
             std::cerr << "            stream:" << std::endl;
-	    std::cerr << "                tcp:<port>: e.g. tcp:1234" << std::endl;
-	    std::cerr << "                udp:<port>: e.g. udp:1234 (todo)" << std::endl;
-	    std::cerr << "                local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket" << std::endl;
-	    std::cerr << "                <named pipe name>: named pipe, which will be re-opened, if client reconnects" << std::endl;
-	    std::cerr << "                <filename>: a regular file" << std::endl;
+            std::cerr << "                tcp:<port>: e.g. tcp:1234" << std::endl;
+            std::cerr << "                udp:<port>: e.g. udp:1234 (todo)" << std::endl;
+            std::cerr << "                local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket" << std::endl;
+            std::cerr << "                <named pipe name>: named pipe, which will be re-opened, if client reconnects" << std::endl;
+            std::cerr << "                <filename>: a regular file" << std::endl;
             std::cerr << "        example: ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) | csv-split --fields id \"0,1;tcp:5999\" \"...;local:/tmp/named_fifo\"" << std::endl;
             std::cerr << std::endl;
             std::cerr << description << std::endl;
@@ -145,10 +149,8 @@ int main( int argc, char** argv )
             std::cerr << "    block: split on the block number change" << std::endl;
             std::cerr << "    id: split by id (same as block, except does not have to be contiguous by the price of worse performance)" << std::endl;
             std::cerr << "    t: if present, use timestamp from the packet; if absent, use system time" << std::endl;
-	    std::cerr << std::endl;
-            std::cerr << comma::contact_info << std::endl;
             std::cerr << std::endl;
-            return 1;
+            return 0;
         }
         csv = comma::csv::program_options::get( vm );
         if( csv.binary() ) { size = csv.format().size(); }
diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 1132e9912..2714a6665 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -38,20 +38,75 @@
 #include <sys/resource.h>
 #endif
 
+#include <unordered_map>
 #include <boost/filesystem.hpp>
 #include <boost/lexical_cast.hpp>
 #include "../../../base/exception.h"
+#include "../../../csv/stream.h"
+#include "../../../csv/traits.h"
 #include "../../../io/file_descriptor.h"
+#include "../../../name_value/parser.h"
+#include "../../../visiting/traits.h"
 #include "split.h"
 
 namespace comma { namespace csv { namespace applications {
 
+struct filename_record
+{
+    comma::uint32 id;
+    std::string filename;
+    filename_record( comma::uint32 id = 0, const std::string& filename = "" ): id( id ), filename( filename ) {}
+};
+
+} } } // namespace comma { namespace csv { namespace applications {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::csv::applications::filename_record >
+{
+    template< typename K, typename V > static void visit( const K& k, comma::csv::applications::filename_record& t, V& v )
+    {
+        v.apply( "id", t.id );
+        v.apply( "filename", t.filename );
+    }
+
+    template< typename K, typename V > static void visit( const K& k, const comma::csv::applications::filename_record& t, V& v )
+    {
+        v.apply( "id", t.id );
+        v.apply( "filename", t.filename );
+    }
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace csv { namespace applications {
+
+std::pair< std::unordered_map< comma::uint32, std::string >, bool > static filenames( const std::string& filename )
+{
+    auto csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( filename );
+    if( csv.fields.empty() ) { csv.fields = "filename"; }
+    std::ifstream ifs( csv.filename );
+    if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "could not open --files='" << csv.filename << "'" ); }
+    comma::csv::input_stream< filename_record > is( ifs, csv );
+    comma::uint32 id = 0;
+    std::pair< std::unordered_map< comma::uint32, std::string >, bool > r;
+    r.second = csv.has_field( "id" );
+    while( is.ready() || ifs.good() )
+    {
+        auto p = is.read();
+        if( p == nullptr ) { break; }
+        r.first[ r.second ? p->id : id++ ] = p->filename; // quick and dirty
+    }
+    if( r.first.empty() ) { COMMA_THROW( comma::exception, "got no filenames from '" << csv.filename << "'" ); }
+    return r;
+}
+    
 template < typename T >
 split< T >::split( boost::optional< boost::posix_time::time_duration > period
-            , const std::string& suffix
-            , const comma::csv::options& csv
-            , bool pass
-            , const std::string& filenames )
+                 , const std::string& suffix
+                 , const comma::csv::options& csv
+                 , bool pass
+                 , const std::string& filenames )
     : ofstream_( std::bind( &split< T >::ofstream_by_time_, this ) )
     , period_( period )
     , suffix_( suffix )
@@ -66,11 +121,7 @@ split< T >::split( boost::optional< boost::posix_time::time_duration > period
     if( csv.has_field( "block" ) )
     {
         ofstream_ = std::bind( &split< T >::ofstream_by_block_, this );
-        if( !filenames.empty() )
-        {
-            filenames_.reset( new std::ifstream( filenames ) );
-            if( !filenames_->is_open() ) { COMMA_THROW( comma::exception, "failed to open '" << filenames << "'" ); }
-        }
+        if( !filenames.empty() ) { boost::tie( filenames_, filenames_with_id_ ) = applications::filenames( filenames ); }
     }
     else
     {
@@ -211,18 +262,19 @@ std::ofstream& split< T >::ofstream_by_time_()
 template < typename T >
 std::ofstream& split< T >::ofstream_by_block_()
 {
+    static comma::uint32 id = 0;
     if( !last_ || last_->block != current_.block )
     {
         file_.close();
         std::string filename;
-        if( filenames_ )
+        if( !filenames_.empty() )
         {
-            while( std::cin.good() && !is_shutdown_ )
+            auto it = filenames_.find( filenames_with_id_ ? current_.block : id );
+            if( it == filenames_.end() ) { COMMA_THROW( comma::exception, "filename not found for block " << current_.block << "; todo: skipping blocks with no matching filenames" ); }
+            filename = it->second;
+            const auto& dirname = boost::filesystem::path( filename ).parent_path();
+            if( !( dirname.empty() || boost::filesystem::is_directory( dirname ) || boost::filesystem::create_directories( dirname ) ) )
             {
-                std::getline( *filenames_, filename );
-                if( filename.empty() ) { continue; }
-                const auto& dirname = boost::filesystem::path( filename ).parent_path();
-                if( dirname.empty() || boost::filesystem::is_directory( dirname ) || boost::filesystem::create_directories( dirname ) ) { break; }
                 COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << filename << "'" );
             }
         }
@@ -230,6 +282,7 @@ std::ofstream& split< T >::ofstream_by_block_()
         file_.open( &filename[0], mode_ );
         if( !file_.is_open() ) { COMMA_THROW( comma::exception, "failed to open '" << filename << "'" ); }
         last_ = current_;
+        ++id;
     }
     return file_;
 }
diff --git a/csv/applications/split/split.h b/csv/applications/split/split.h
index 53c4a2580..3322e8b72 100644
--- a/csv/applications/split/split.h
+++ b/csv/applications/split/split.h
@@ -158,7 +158,8 @@ class split
         ids_type_ seen_ids_;
         bool pass_;
         bool flush_;
-        std::unique_ptr< std::ifstream > filenames_;
+        std::unordered_map< comma::uint32, std::string > filenames_;
+        bool filenames_with_id_;
 
         //to-do
         bool published_on_stream( const char* data, unsigned int size );

From 7b3d52d656a64280ea9ae2696ba2c01376944fc0 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 8 Jan 2020 14:52:41 +1100
Subject: [PATCH 0107/1056] csv-split: minor refactoring to prepare for more
 generic use of --files

---
 csv/applications/split/split.cpp | 14 ++++++++------
 csv/applications/split/split.h   |  1 +
 2 files changed, 9 insertions(+), 6 deletions(-)

diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 2714a6665..541eabf99 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -130,7 +130,6 @@ split< T >::split( boost::optional< boost::posix_time::time_duration > period
     }
 }
 
-//to-do
 template < typename T >
 split< T >::split( boost::optional< boost::posix_time::time_duration > period
                  , const std::string& suffix
@@ -157,13 +156,11 @@ split< T >::split( boost::optional< boost::posix_time::time_duration > period
         {
             auto publisher_pos = t->insert( std::move( publisher ) );
             auto const keys = comma::split( stream_values[0], ',' );
-
             for( auto const& ki : keys )
             {
                 auto const kii = boost::lexical_cast< T >( ki );
                 if( seen_ids_.end() !=  seen_ids_.find( kii ) ) { COMMA_THROW( comma::exception, "multiple output streams have the id: " << ki ); }
                 seen_ids_.insert( kii );
-
                 mapped_publishers_.insert( std::make_pair( kii, publisher_pos.first->get() ) );
             }
         }
@@ -287,9 +284,14 @@ std::ofstream& split< T >::ofstream_by_block_()
     return file_;
 }
 
-template < typename T > static std::string make_filename_from_id( const T& id, const std::string& suffix ) { return boost::lexical_cast< std::string >( id ) + suffix; }
+template < typename T > std::string to_string( const T& v ) { return boost::lexical_cast< std::string >( v ); }
+template <> std::string to_string< boost::posix_time::ptime >( const boost::posix_time::ptime& v ) { return boost::posix_time::to_iso_string( v ); }
 
-static std::string make_filename_from_id( const boost::posix_time::ptime& id, const std::string& suffix ) { return boost::posix_time::to_iso_string( id ) + suffix; }
+template < typename T >
+std::string split< T >::filename_from_id_( const T& id )
+{ 
+    return to_string( id ) + suffix_;
+}
 
 template < typename T >
 std::ofstream& split< T >::ofstream_by_id_()
@@ -309,7 +311,7 @@ std::ofstream& split< T >::ofstream_by_id_()
         std::ios_base::openmode mode = mode_;
         if( seen_ids_.find( current_.id ) == seen_ids_.end() ) { seen_ids_.insert( current_.id ); }
         else { mode |= std::ofstream::app; }
-        std::string name = make_filename_from_id( current_.id, suffix_);
+        std::string name = filename_from_id_( current_.id );
         std::shared_ptr< std::ofstream > stmp( new std::ofstream( name.c_str(), mode ) );
         it = files_.insert( std::make_pair( current_.id, stmp ) ).first;
     }
diff --git a/csv/applications/split/split.h b/csv/applications/split/split.h
index 3322e8b72..7799a1c47 100644
--- a/csv/applications/split/split.h
+++ b/csv/applications/split/split.h
@@ -136,6 +136,7 @@ class split
         std::ofstream& ofstream_by_time_();
         std::ofstream& ofstream_by_block_();
         std::ofstream& ofstream_by_id_();
+        std::string filename_from_id_( const T& id );
         void update_( const char* data, unsigned int size );
         void update_( const std::string& line );
         void accept_();

From 4e3b7fd676e6d72216660403ed53fef33bcef6ee Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 8 Jan 2020 18:24:20 +1100
Subject: [PATCH 0108/1056] csv-split: id field: --files implemented

---
 csv/applications/split/split.cpp | 51 +++++++++++++++++++++-----------
 csv/applications/split/split.h   |  2 +-
 2 files changed, 34 insertions(+), 19 deletions(-)

diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 541eabf99..d039e3cc8 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -51,26 +51,26 @@
 
 namespace comma { namespace csv { namespace applications {
 
-struct filename_record
+template < typename T > struct filename_record
 {
-    comma::uint32 id;
+    T id;
     std::string filename;
-    filename_record( comma::uint32 id = 0, const std::string& filename = "" ): id( id ), filename( filename ) {}
+    filename_record( const T& id = 0, const std::string& filename = "" ): id( id ), filename( filename ) {}
 };
 
 } } } // namespace comma { namespace csv { namespace applications {
 
 namespace comma { namespace visiting {
 
-template <> struct traits< comma::csv::applications::filename_record >
+template < typename T > struct traits< comma::csv::applications::filename_record< T > >
 {
-    template< typename K, typename V > static void visit( const K& k, comma::csv::applications::filename_record& t, V& v )
+    template< typename K, typename V > static void visit( const K& k, comma::csv::applications::filename_record< T >& t, V& v )
     {
         v.apply( "id", t.id );
         v.apply( "filename", t.filename );
     }
 
-    template< typename K, typename V > static void visit( const K& k, const comma::csv::applications::filename_record& t, V& v )
+    template< typename K, typename V > static void visit( const K& k, const comma::csv::applications::filename_record< T >& t, V& v )
     {
         v.apply( "id", t.id );
         v.apply( "filename", t.filename );
@@ -83,13 +83,15 @@ namespace comma { namespace csv { namespace applications {
 
 std::pair< std::unordered_map< comma::uint32, std::string >, bool > static filenames( const std::string& filename )
 {
+    std::pair< std::unordered_map< comma::uint32, std::string >, bool > r;
+    r.second = false;
+    if( filename.empty() ) { return r; }
     auto csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( filename );
     if( csv.fields.empty() ) { csv.fields = "filename"; }
     std::ifstream ifs( csv.filename );
     if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "could not open --files='" << csv.filename << "'" ); }
-    comma::csv::input_stream< filename_record > is( ifs, csv );
+    comma::csv::input_stream< filename_record< comma::uint32 > > is( ifs, csv ); // quick and dirty; todo: support templated map
     comma::uint32 id = 0;
-    std::pair< std::unordered_map< comma::uint32, std::string >, bool > r;
     r.second = csv.has_field( "id" );
     while( is.ready() || ifs.good() )
     {
@@ -118,15 +120,21 @@ split< T >::split( boost::optional< boost::posix_time::time_duration > period
     if( csv.fields.empty() ) { return; }
     if( csv.binary() ) { binary_.reset( new comma::csv::binary< input >( csv ) ); }
     else { ascii_.reset( new comma::csv::ascii< input >( csv ) ); }
+    boost::tie( filenames_, filenames_have_id_ ) = applications::filenames( filenames );
     if( csv.has_field( "block" ) )
     {
         ofstream_ = std::bind( &split< T >::ofstream_by_block_, this );
-        if( !filenames.empty() ) { boost::tie( filenames_, filenames_with_id_ ) = applications::filenames( filenames ); }
     }
     else
     {
-        if( !filenames.empty() ) { COMMA_THROW( comma::exception, "--files given, but no block field specified in --fields" ); }
-        if( csv.has_field( "id" ) ) { ofstream_ = std::bind( &split< T >::ofstream_by_id_, this ); }
+        if( csv.has_field( "id" ) )
+        { 
+            ofstream_ = std::bind( &split< T >::ofstream_by_id_, this );
+        }
+        else
+        {    
+            if( !filenames_.empty() ) { COMMA_THROW( comma::exception, "--files given, but no block field specified in --fields" ); }
+        }
     }
 }
 
@@ -266,7 +274,7 @@ std::ofstream& split< T >::ofstream_by_block_()
         std::string filename;
         if( !filenames_.empty() )
         {
-            auto it = filenames_.find( filenames_with_id_ ? current_.block : id );
+            auto it = filenames_.find( filenames_have_id_ ? current_.block : id );
             if( it == filenames_.end() ) { COMMA_THROW( comma::exception, "filename not found for block " << current_.block << "; todo: skipping blocks with no matching filenames" ); }
             filename = it->second;
             const auto& dirname = boost::filesystem::path( filename ).parent_path();
@@ -284,15 +292,22 @@ std::ofstream& split< T >::ofstream_by_block_()
     return file_;
 }
 
-template < typename T > std::string to_string( const T& v ) { return boost::lexical_cast< std::string >( v ); }
+template < typename T > static std::string to_string( const T& v ) { return boost::lexical_cast< std::string >( v ); }
+
 template <> std::string to_string< boost::posix_time::ptime >( const boost::posix_time::ptime& v ) { return boost::posix_time::to_iso_string( v ); }
 
-template < typename T >
-std::string split< T >::filename_from_id_( const T& id )
-{ 
-    return to_string( id ) + suffix_;
+template < typename T, typename M > static std::string find_( const M& m, const T& id ) { COMMA_THROW( comma::exception, "id-to-filename map not implemented for this type" ); }
+
+template <> std::string find_< comma::uint32, std::unordered_map< comma::uint32, std::string > >( const std::unordered_map< comma::uint32, std::string >& m, const comma::uint32& id )
+{
+    auto it = m.find( id );
+    if( it == m.end() ) { COMMA_THROW( comma::exception, "filename not found for id " << id << "; todo: skipping id with no matching filenames" ); }
+    return it->second;
 }
 
+template < typename T >
+std::string split< T >::filename_from_id_( const T& id ) { return filenames_.empty() ? to_string( id ) + suffix_ : find_( filenames_, id ); }
+
 template < typename T >
 std::ofstream& split< T >::ofstream_by_id_()
 {
@@ -312,7 +327,7 @@ std::ofstream& split< T >::ofstream_by_id_()
         if( seen_ids_.find( current_.id ) == seen_ids_.end() ) { seen_ids_.insert( current_.id ); }
         else { mode |= std::ofstream::app; }
         std::string name = filename_from_id_( current_.id );
-        std::shared_ptr< std::ofstream > stmp( new std::ofstream( name.c_str(), mode ) );
+        std::shared_ptr< std::ofstream > stmp( new std::ofstream( &name[0], mode ) );
         it = files_.insert( std::make_pair( current_.id, stmp ) ).first;
     }
     return *it->second;
diff --git a/csv/applications/split/split.h b/csv/applications/split/split.h
index 7799a1c47..2f0e9b57f 100644
--- a/csv/applications/split/split.h
+++ b/csv/applications/split/split.h
@@ -160,7 +160,7 @@ class split
         bool pass_;
         bool flush_;
         std::unordered_map< comma::uint32, std::string > filenames_;
-        bool filenames_with_id_;
+        bool filenames_have_id_;
 
         //to-do
         bool published_on_stream( const char* data, unsigned int size );

From de04cf74caff4c6d259965742dd2b78d9817490f Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 8 Jan 2020 20:10:11 +1100
Subject: [PATCH 0109/1056] csv-split: --files: discarding unmatched ids added;
 --default-file: placeholder added, left for later

---
 csv/applications/csv-split.cpp   | 24 ++++++++++------
 csv/applications/split/split.cpp | 49 +++++++++++++++++++-------------
 csv/applications/split/split.h   | 19 +++++++------
 3 files changed, 56 insertions(+), 36 deletions(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index c9cfc9477..c9df78092 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -48,6 +48,7 @@ static std::string suffix;
 static unsigned int size = 0;
 static bool passthrough;
 static std::string files;
+static std::string default_filename;
 
 template < typename T > static void run()
 {
@@ -85,7 +86,8 @@ int main( int argc, char** argv )
         boost::program_options::options_description description( "options" );
         description.add_options()
             ( "help,h", "display help message" )
-            ( "files", boost::program_options::value< std::string >( &files ), "if 'block' field present, list of files to save blocks; todo: --files for id field" )
+            ( "default-file", boost::program_options::value< std::string >( &default_filename ), "todo: if --files present, unmatched ids will be put in the file with a given name; otherwise, unmatched values will be ignored" )
+            ( "files", boost::program_options::value< std::string >( &files ), "if 'block' or 'id' field present, list of output files (see examples below)" )
             ( "passthrough,pass", "pass data through to stdout" )
             ( "period,t", boost::program_options::value< double >( &period ), "period in seconds after which a new file is created" )
             ( "size,c", boost::program_options::value< unsigned int >( &size ), "packet size, only full packets will be written" )
@@ -109,17 +111,22 @@ int main( int argc, char** argv )
             std::cerr << "    split by id field, output to files" << std::endl;
             std::cerr << "        if id field present in --fields:" << std::endl;
             std::cerr << "        for each id value, output records with this id to a separate file, e.g. 0.csv, 1.csv, etc" << std::endl;
-            std::cerr << "        example: ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) | csv-split --fields id" << std::endl;
+            std::cerr << "        - by id with default filenames, e.g:" << std::endl;
+            std::cerr << "              ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields id" << std::endl;
+            std::cerr << "        - by id with specified filenames" << std::endl;
+            std::cerr << "              ( echo 0; echo 1; echo 2 ) | csv-split --fields id --files <( echo a; echo b; echo c )" << std::endl;
+            std::cerr << "        - by id with filenames mapped to block ids" << std::endl;
+            std::cerr << "              ( echo 0; echo 1; echo 2 ) | csv-split --fields id --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'" << std::endl;
             std::cerr << std::endl;
             std::cerr << "    split by block field, output to files" << std::endl;
             std::cerr << "        if block field present in --fields:" << std::endl;
             std::cerr << "        output records with this block to a separate file, on change of block, open a new file, e.g. 0.csv, 1.csv, etc" << std::endl;
-            std::cerr << "        by block with default filenames, e.g:" << std::endl;
-            std::cerr << "            ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block" << std::endl;
-            std::cerr << "        by block with specified filenames" << std::endl;
-            std::cerr << "            ( echo 0; echo 1; echo 2 ) | csv-split --fields block --files <( echo a; echo b; echo c )" << std::endl;
-            std::cerr << "        by block with filenames mapped to block ids" << std::endl;
-            std::cerr << "            ( echo 0; echo 1; echo 2 ) | csv-split --fields block --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'" << std::endl;
+            std::cerr << "        - by block with default filenames, e.g:" << std::endl;
+            std::cerr << "              ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block" << std::endl;
+            std::cerr << "        - by block with specified filenames" << std::endl;
+            std::cerr << "              ( echo 0; echo 1; echo 2 ) | csv-split --fields block --files <( echo a; echo b; echo c )" << std::endl;
+            std::cerr << "        - by block with filenames mapped to block ids" << std::endl;
+            std::cerr << "              ( echo 0; echo 1; echo 2 ) | csv-split --fields block --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'" << std::endl;
             std::cerr << std::endl;
             std::cerr << "    split by t field, output to files" << std::endl;
             std::cerr << "        if t (timestamp) field present in --fields:" << std::endl;
@@ -153,6 +160,7 @@ int main( int argc, char** argv )
             return 0;
         }
         csv = comma::csv::program_options::get( vm );
+        if( !default_filename.empty() ) { std::cerr << "csv-split: --default-filename: todo, just ask" << std::endl; }
         if( csv.binary() ) { size = csv.format().size(); }
         bool id_is_string = vm.count( "string" );
         bool id_is_time = vm.count( "time" );
diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index d039e3cc8..31e93695e 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -104,11 +104,12 @@ std::pair< std::unordered_map< comma::uint32, std::string >, bool > static filen
 }
     
 template < typename T >
-split< T >::split( boost::optional< boost::posix_time::time_duration > period
+split< T >::split( const boost::optional< boost::posix_time::time_duration >& period
                  , const std::string& suffix
                  , const comma::csv::options& csv
                  , bool pass
-                 , const std::string& filenames )
+                 , const std::string& filenames
+                 , const std::string& default_filename )
     : ofstream_( std::bind( &split< T >::ofstream_by_time_, this ) )
     , period_( period )
     , suffix_( suffix )
@@ -139,13 +140,14 @@ split< T >::split( boost::optional< boost::posix_time::time_duration > period
 }
 
 template < typename T >
-split< T >::split( boost::optional< boost::posix_time::time_duration > period
+split< T >::split( const boost::optional< boost::posix_time::time_duration >& period
                  , const std::string& suffix
                  , const comma::csv::options& csv
                  , const std::vector< std::string >& streams //to-do
                  , bool pass
-                 , const std::string& filenames )
-    : split( period, suffix, csv, pass, filenames )
+                 , const std::string& filenames
+                 , const std::string& default_filename )
+    : split( period, suffix, csv, pass, filenames, default_filename )
 {
     if( streams.empty() ) { return; }
     auto const io_mode = csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii;
@@ -227,8 +229,12 @@ void split< T >::write( const char* data, unsigned int size )
     else { current_.timestamp = boost::get_system_time(); }
     if( !published_on_stream( data, size ) ) // todo? or bind write function on initialisation and call it here?
     {
-        ofstream_().write( data, size );
-        if( flush_ ) { ofstream_().flush(); }
+        auto ofs = ofstream_();
+        if( ofs )
+        {
+            ofs->write( data, size );
+            if( flush_ ) { ofs->flush(); }
+        }
     }
     if ( pass_ ) { std::cout.write( data, size ); std::cout.flush(); }
 }
@@ -242,16 +248,19 @@ void split< T >::write ( std::string line )
     line += '\n';
     if( !published_on_stream( &line[0], line.size()) ) // todo? or bind write function on initialisation and call it here?
     {
-        std::ofstream& ofs = ofstream_();
-        ofs.write( &line[0], line.size() );
-        //ofs.put( '\n' );
-        if( flush_ ) { ofs.flush(); }
+        auto ofs = ofstream_();
+        if( ofs )
+        {
+            ofs->write( &line[0], line.size() );
+            //ofs.put( '\n' );
+            if( flush_ ) { ofs->flush(); }
+        }
     }
     if ( pass_ ) { std::cout.write( &line[0], line.size() ); /*std::cout.put('\n');*/ std::cout.flush(); }
 }
 
 template < typename T >
-std::ofstream& split< T >::ofstream_by_time_()
+std::ofstream* split< T >::ofstream_by_time_()
 {
     if( !last_ || current_.timestamp > ( last_->timestamp + *period_ ) )
     {
@@ -261,11 +270,11 @@ std::ofstream& split< T >::ofstream_by_time_()
         file_.open( ( time + suffix_ ).c_str(), mode_ );
         last_ = current_;
     }
-    return file_;
+    return &file_;
 }
 
 template < typename T >
-std::ofstream& split< T >::ofstream_by_block_()
+std::ofstream* split< T >::ofstream_by_block_()
 {
     static comma::uint32 id = 0;
     if( !last_ || last_->block != current_.block )
@@ -275,7 +284,7 @@ std::ofstream& split< T >::ofstream_by_block_()
         if( !filenames_.empty() )
         {
             auto it = filenames_.find( filenames_have_id_ ? current_.block : id );
-            if( it == filenames_.end() ) { COMMA_THROW( comma::exception, "filename not found for block " << current_.block << "; todo: skipping blocks with no matching filenames" ); }
+            if( it == filenames_.end() ) { return nullptr; }
             filename = it->second;
             const auto& dirname = boost::filesystem::path( filename ).parent_path();
             if( !( dirname.empty() || boost::filesystem::is_directory( dirname ) || boost::filesystem::create_directories( dirname ) ) )
@@ -289,7 +298,7 @@ std::ofstream& split< T >::ofstream_by_block_()
         last_ = current_;
         ++id;
     }
-    return file_;
+    return &file_;
 }
 
 template < typename T > static std::string to_string( const T& v ) { return boost::lexical_cast< std::string >( v ); }
@@ -301,15 +310,14 @@ template < typename T, typename M > static std::string find_( const M& m, const
 template <> std::string find_< comma::uint32, std::unordered_map< comma::uint32, std::string > >( const std::unordered_map< comma::uint32, std::string >& m, const comma::uint32& id )
 {
     auto it = m.find( id );
-    if( it == m.end() ) { COMMA_THROW( comma::exception, "filename not found for id " << id << "; todo: skipping id with no matching filenames" ); }
-    return it->second;
+    return it == m.end() ? std::string() : it->second;
 }
 
 template < typename T >
 std::string split< T >::filename_from_id_( const T& id ) { return filenames_.empty() ? to_string( id ) + suffix_ : find_( filenames_, id ); }
 
 template < typename T >
-std::ofstream& split< T >::ofstream_by_id_()
+std::ofstream* split< T >::ofstream_by_id_()
 {
     typename Files::iterator it = files_.find( current_.id );
     if( it == files_.end() )
@@ -327,10 +335,11 @@ std::ofstream& split< T >::ofstream_by_id_()
         if( seen_ids_.find( current_.id ) == seen_ids_.end() ) { seen_ids_.insert( current_.id ); }
         else { mode |= std::ofstream::app; }
         std::string name = filename_from_id_( current_.id );
+        if( name.empty() ) { return nullptr; }
         std::shared_ptr< std::ofstream > stmp( new std::ofstream( &name[0], mode ) );
         it = files_.insert( std::make_pair( current_.id, stmp ) ).first;
     }
-    return *it->second;
+    return it->second.get();
 }
 
 template class split< comma::uint32 >;
diff --git a/csv/applications/split/split.h b/csv/applications/split/split.h
index 2f0e9b57f..7fb36b57d 100644
--- a/csv/applications/split/split.h
+++ b/csv/applications/split/split.h
@@ -118,30 +118,32 @@ class split
 {
     public:
         typedef applications::input< T > input;
-        split( boost::optional< boost::posix_time::time_duration > period
+        split( const boost::optional< boost::posix_time::time_duration >& period
              , const std::string& suffix
              , const comma::csv::options& csv
              , bool passthrough
-             , const std::string& filenames );
-        split( boost::optional< boost::posix_time::time_duration > period
+             , const std::string& filenames
+             , const std::string& default_filename = "" );
+        split( const boost::optional< boost::posix_time::time_duration >& period
              , const std::string& suffix
              , const comma::csv::options& csv
              , const std::vector< std::string >& streams
              , bool passthrough
-             , const std::string& filenames );
+             , const std::string& filenames
+             , const std::string& default_filename = "" );
         ~split();
         void write( const char* data, unsigned int size );
         void write( std::string line );
     private:
-        std::ofstream& ofstream_by_time_();
-        std::ofstream& ofstream_by_block_();
-        std::ofstream& ofstream_by_id_();
+        std::ofstream* ofstream_by_time_();
+        std::ofstream* ofstream_by_block_();
+        std::ofstream* ofstream_by_id_();
         std::string filename_from_id_( const T& id );
         void update_( const char* data, unsigned int size );
         void update_( const std::string& line );
         void accept_();
 
-        std::function< std::ofstream&() > ofstream_;
+        std::function< std::ofstream*() > ofstream_;
         std::unique_ptr< comma::csv::ascii< input > > ascii_;
         std::unique_ptr< comma::csv::binary< input > > binary_;
         boost::optional< boost::posix_time::time_duration > period_;
@@ -160,6 +162,7 @@ class split
         bool pass_;
         bool flush_;
         std::unordered_map< comma::uint32, std::string > filenames_;
+        // todo? std::unique_ptr< comma::io::publisher > default_file_;
         bool filenames_have_id_;
 
         //to-do

From df6c53ca531c300076b21d1ea9b51dc61dfd482e Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 9 Jan 2020 12:49:57 +1100
Subject: [PATCH 0110/1056] csv::ascii::sample() added

---
 csv/ascii.h | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/csv/ascii.h b/csv/ascii.h
index 0e1fdf3ed..cb653b627 100644
--- a/csv/ascii.h
+++ b/csv/ascii.h
@@ -87,6 +87,9 @@ class ascii
         
         /// return quote sign
         boost::optional< char > quote() const { return quote_; }
+        
+        /// return default value
+        const S& sample() const { return sample_; }
 
     private:
         char delimiter_;

From 405fb8f363da1ca0558da95afc21c8547786ad19 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 23 Jan 2020 19:22:45 +1100
Subject: [PATCH 0111/1056] csv-strings: in progress...

---
 csv/applications/CMakeLists.txt  |   4 +
 csv/applications/csv-strings.cpp | 199 +++++++++++++++++++++++++++++++
 2 files changed, 203 insertions(+)
 create mode 100644 csv/applications/csv-strings.cpp

diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index a165fa65c..f615f4c5c 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -114,6 +114,10 @@ add_executable( csv-random ${dir}/csv-random.cpp )
 target_link_libraries ( csv-random ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
 install( TARGETS csv-random RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
+add_executable( csv-strings ${dir}/csv-strings.cpp )
+target_link_libraries ( csv-strings ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+install( TARGETS csv-strings RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
 add_executable( csv-update ${dir}/csv-update.cpp )
 target_link_libraries ( csv-update ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
 install( TARGETS csv-update RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
new file mode 100644
index 000000000..b42e5a86d
--- /dev/null
+++ b/csv/applications/csv-strings.cpp
@@ -0,0 +1,199 @@
+// This file is provided in addition to comma and is not an integral
+// part of comma library.
+// Copyright (c) 2018 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+// comma is a generic and flexible library
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+/// @author vsevolod vlaskine
+
+#include <functional>
+#include <iostream>
+#include <boost/lexical_cast.hpp>
+#include "../../application/command_line_options.h"
+#include "../../csv/stream.h"
+#include "../../csv/traits.h"
+#include "../../string/string.h"
+
+static void usage( bool verbose )
+{
+    std::cerr << std::endl;
+    std::cerr << "operations on strings" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    usage: cat input.csv | csv-strings <operation> [<options>] > output.csv" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations" << std::endl;
+    std::cerr << "    path-basename" << std::endl;
+    std::cerr << "    path-dirname" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    options" << std::endl;
+    std::cerr << "        --fields=[<fields>]; will perform operation on any non-empty fields" << std::endl;
+    std::cerr << "                             unless different semantics specified for operation" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "path-basename" << std::endl;
+    std::cerr << "    options" << std::endl;
+    std::cerr << "        --depth=<depth>; default=1; if path length less than depth, output empty string" << std::endl;
+    std::cerr << "        --emplace; perform operation emplace" << std::endl;
+    std::cerr << "        --path-delimiter,-p=<delimiter>; default=/" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "path-dirname" << std::endl;
+    std::cerr << "    options" << std::endl;
+    std::cerr << "        --depth=<depth>; default=1; if path length less than depth, output empty string" << std::endl;
+    std::cerr << "        --emplace; perform operation emplace" << std::endl;
+    std::cerr << "        --fixed-depth=[<depth>]; output paths of fixed depth starting from root" << std::endl;
+    std::cerr << "        --path-delimiter,-p=<delimiter>; default=/" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "csv options:" << std::endl;
+    std::cerr << comma::csv::options::usage( "", verbose ) << std::endl;
+    std::cerr << std::endl;
+    exit( 0 );
+}
+
+static comma::csv::options csv;
+
+namespace comma { namespace applications { namespace strings { namespace path {
+
+struct input
+{ 
+    std::vector< std::string > strings;
+    input( unsigned int n = 0 ): strings( n ) {}
+};
+
+} } } } // namespace comma { namespace applications { namespace strings { namespace path {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::applications::strings::path::input >
+{
+    template < typename K, typename V > static void visit( const K&, const comma::applications::strings::path::input& p, V& v ) { v.apply( "strings", p.strings ); }
+    template < typename K, typename V > static void visit( const K&, comma::applications::strings::path::input& p, V& v ) { v.apply( "strings", p.strings ); }
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace applications { namespace strings { namespace path {
+
+template < typename T >
+static int run( const comma::command_line_options& options )
+{
+    auto v = comma::split( ::csv.fields, ',' );
+    unsigned int n = 0;
+    for( unsigned int i = 0; i < v.size(); ++i )
+    {
+        if( v.empty() ) { continue; }
+        v[i] = "strings[" + boost::lexical_cast< std::string >( i ) + "]";
+        ++n;
+    }
+    if( n == 0 ) { std::cerr << "csv-strings: path-" << T::name() << ": please specify at least one non-empty field" << std::endl; exit( 1 ); }
+    ::csv.fields = comma::join( v, ',' );
+    comma::csv::input_stream< input > istream( std::cin, ::csv, input( n ) );
+    std::function< void( const input& p ) > write;
+    auto run_ = [&]()->int
+    {
+        while( istream.ready() || std::cin.good() )
+        {
+            const input* p = istream.read();
+            if( !p ) { break; }
+            input r( n );
+            for( unsigned int i = 0; i < p->strings.size(); ++i ) { r.strings[i] = T::convert( p->strings[i] ); }
+            write( r );
+            if( ::csv.flush ) { std::cout.flush(); }
+        }
+        return 0;
+    };
+    if( options.exists( "--emplace" ) )
+    {
+        comma::csv::passed< input > passed( istream, std::cout, ::csv.flush );
+        write = [&]( const input& p ) { passed.write( p ); };
+        return run_();
+    }
+    comma::csv::options output_csv = ::csv;
+    output_csv.fields = "strings";
+    if( ::csv.binary() ) { std::cerr << "csv-strings: path-" << T::name() << ": binary mode supported only for --emplace; todo, just ask" << std::endl; exit( 1 ); }
+    comma::csv::output_stream< input > ostream( std::cout, output_csv, input( n ) );
+    comma::csv::tied< input, input > tied( istream, ostream );
+    write = [&]( const input& p ) { tied.append( p ); };
+    return run_();
+}
+
+struct basename
+{
+    static const char* name() { return "basename"; }
+    static std::string convert( const std::string& s ) { return "basename: todo"; }
+};
+
+struct dirname
+{
+    static const char* name() { return "dirname"; }
+    static std::string convert( const std::string& s ) { return "dirname: todo"; }
+};
+
+} } } } // namespace comma { namespace applications { namespace strings { namespace path {
+
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        const auto& unnamed = options.unnamed( "--flush,--verbose,-v,--emplace", "-.*" );
+        if( unnamed.empty() ) { std::cerr << "csv-strings: please specify operation" << std::endl; return 1; }
+        std::string operation = unnamed[0];
+        csv = comma::csv::options( options );
+        if( operation == "path-basename" ) { return comma::applications::strings::path::run< comma::applications::strings::path::basename >( options ); }
+        if( operation == "path-dirname" ) { return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
+        std::cerr << "csv-strings: expection operation; got: '" << operation << "'" << std::endl;
+        return 1;
+    }
+    catch( std::exception& ex ) { std::cerr << "csv-strings: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-strings: unknown exception" << std::endl; }
+    return 1;
+}

From cf0fcc4afcb26ef068239781c13bcef14d9937c7 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Fri, 24 Jan 2020 13:01:05 +1100
Subject: [PATCH 0112/1056] csv-string: basename, dirname: implemented, tested

---
 csv/applications/csv-strings.cpp |  83 +++++++++++++++++----
 csv/test/csv-strings/expected    | 122 +++++++++++++++++++++++++++++++
 csv/test/csv-strings/input       |  48 ++++++++++++
 3 files changed, 239 insertions(+), 14 deletions(-)
 create mode 100644 csv/test/csv-strings/expected
 create mode 100644 csv/test/csv-strings/input

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index b42e5a86d..cc1318f1c 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -60,6 +60,7 @@
 #include <iostream>
 #include <boost/lexical_cast.hpp>
 #include "../../application/command_line_options.h"
+#include "../../base/exception.h"
 #include "../../csv/stream.h"
 #include "../../csv/traits.h"
 #include "../../string/string.h"
@@ -72,12 +73,14 @@ static void usage( bool verbose )
     std::cerr << "    usage: cat input.csv | csv-strings <operation> [<options>] > output.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
-    std::cerr << "    path-basename" << std::endl;
-    std::cerr << "    path-dirname" << std::endl;
+    std::cerr << "    path-basename,basename" << std::endl;
+    std::cerr << "    path-dirname,dirname" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    options" << std::endl;
-    std::cerr << "        --fields=[<fields>]; will perform operation on any non-empty fields" << std::endl;
-    std::cerr << "                             unless different semantics specified for operation" << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --fields=[<fields>]; will perform operation on any non-empty fields" << std::endl;
+    std::cerr << "                         unless different semantics specified for operation" << std::endl;
+    std::cerr << "                         default: perform operation on the first field" << std::endl;
+    std::cerr << "    --strict; exit on strings on which operation does not make sense" << std::endl;
     std::cerr << std::endl;
     std::cerr << "path-basename" << std::endl;
     std::cerr << "    options" << std::endl;
@@ -98,6 +101,7 @@ static void usage( bool verbose )
     exit( 0 );
 }
 
+static bool strict;
 static comma::csv::options csv;
 
 namespace comma { namespace applications { namespace strings { namespace path {
@@ -129,22 +133,24 @@ static int run( const comma::command_line_options& options )
     unsigned int n = 0;
     for( unsigned int i = 0; i < v.size(); ++i )
     {
-        if( v.empty() ) { continue; }
-        v[i] = "strings[" + boost::lexical_cast< std::string >( i ) + "]";
+        if( v[i].empty() ) { continue; }
+        v[i] = "strings[" + boost::lexical_cast< std::string >( n ) + "]";
         ++n;
     }
-    if( n == 0 ) { std::cerr << "csv-strings: path-" << T::name() << ": please specify at least one non-empty field" << std::endl; exit( 1 ); }
-    ::csv.fields = comma::join( v, ',' );
+    ::csv.fields = n == 0 ? std::string( "strings[0]" ) : comma::join( v, ',' );
+    if( n == 0 ) { ++n; }
+    char delimiter = options.value( "--path-delimiter,-p", '/' );
     comma::csv::input_stream< input > istream( std::cin, ::csv, input( n ) );
     std::function< void( const input& p ) > write;
     auto run_ = [&]()->int
     {
+        T t( options );
         while( istream.ready() || std::cin.good() )
         {
             const input* p = istream.read();
             if( !p ) { break; }
             input r( n );
-            for( unsigned int i = 0; i < p->strings.size(); ++i ) { r.strings[i] = T::convert( p->strings[i] ); }
+            for( unsigned int i = 0; i < p->strings.size(); ++i ) { r.strings[i] = t.convert( comma::split( p->strings[i], delimiter ) ); }
             write( r );
             if( ::csv.flush ) { std::cout.flush(); }
         }
@@ -167,14 +173,62 @@ static int run( const comma::command_line_options& options )
 
 struct basename
 {
+    unsigned int depth;
+    char delimiter;
+    
     static const char* name() { return "basename"; }
-    static std::string convert( const std::string& s ) { return "basename: todo"; }
+    
+    basename( const comma::command_line_options& options )
+        : depth( options.value( "--depth", 1 ) )
+        , delimiter( options.value( "--path-delimiter,-p", '/' ) )
+    {
+    }
+    
+    std::string convert( const std::vector< std::string >& s )
+    {
+        if( s.size() < depth )
+        {
+            if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << depth << "; got: '" << comma::join( s, delimiter ) << "'" ); }
+            return "";
+        }
+        return comma::join( s.end() - depth, s.end(), delimiter );
+    }
 };
 
 struct dirname
 {
+    unsigned int depth;
+    unsigned int fixed_depth;
+    char delimiter;
+    
     static const char* name() { return "dirname"; }
-    static std::string convert( const std::string& s ) { return "dirname: todo"; }
+    
+    dirname( const comma::command_line_options& options )
+        : depth( options.value( "--depth", 1 ) )
+        , fixed_depth( options.value( "--fixed-depth", 0 ) )
+        , delimiter( options.value( "--path-delimiter,-p", '/' ) )
+    {
+        options.assert_mutually_exclusive( "--depth,--fixed-depth" );
+    }
+    
+    std::string convert( const std::vector< std::string >& s )
+    {
+        if( fixed_depth > 0 )
+        {
+            if( s.size() < fixed_depth )
+            {
+                if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << fixed_depth << "; got: '" << comma::join( s, delimiter ) << "'" ); }
+                return "";
+            }
+            return comma::join( s, fixed_depth, delimiter );
+        }
+        if( s.size() < depth )
+        {
+            if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << depth << "; got: '" << comma::join( s, '/' ) << "'" ); }
+            return "";
+        }
+        return comma::join( s.begin(), s.end() - depth, delimiter );
+    }
 };
 
 } } } } // namespace comma { namespace applications { namespace strings { namespace path {
@@ -187,9 +241,10 @@ int main( int ac, char** av )
         const auto& unnamed = options.unnamed( "--flush,--verbose,-v,--emplace", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-strings: please specify operation" << std::endl; return 1; }
         std::string operation = unnamed[0];
+        strict = options.exists( "--strict" );
         csv = comma::csv::options( options );
-        if( operation == "path-basename" ) { return comma::applications::strings::path::run< comma::applications::strings::path::basename >( options ); }
-        if( operation == "path-dirname" ) { return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
+        if( operation == "path-basename" || operation == "basename" ) { return comma::applications::strings::path::run< comma::applications::strings::path::basename >( options ); }
+        if( operation == "path-dirname" || operation == "dirname" ) { return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
         std::cerr << "csv-strings: expection operation; got: '" << operation << "'" << std::endl;
         return 1;
     }
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
new file mode 100644
index 000000000..47409cc92
--- /dev/null
+++ b/csv/test/csv-strings/expected
@@ -0,0 +1,122 @@
+basename/append[0]/output/line[0]="a,a"
+basename/append[0]/output/line[1]="a/b,b"
+basename/append[0]/output/line[2]="a/b/c,c"
+basename/append[1]/output/line[0]="a,"
+basename/append[1]/output/line[1]="a/b,a/b"
+basename/append[1]/output/line[2]="a/b/c,b/c"
+basename/append[2]/output/line[0]="a,"
+basename/append[2]/output/line[1]="a/b,"
+basename/append[2]/output/line[2]="a/b/c,a/b/c"
+basename/append[3]/output/line[0]="a,"
+basename/append[3]/output/line[1]="a/b,"
+basename/append[3]/output/line[2]="a/b/c,"
+
+basename/emplace[0]/output/line[0]="a"
+basename/emplace[0]/output/line[1]="b"
+basename/emplace[0]/output/line[2]="c"
+basename/emplace[1]/output/line[0]=""
+basename/emplace[1]/output/line[1]="a/b"
+basename/emplace[1]/output/line[2]="b/c"
+basename/emplace[2]/output/line[0]=""
+basename/emplace[2]/output/line[1]=""
+basename/emplace[2]/output/line[2]="a/b/c"
+basename/emplace[3]/output/line[0]=","
+basename/emplace[3]/output/line[1]=","
+basename/emplace[3]/output/line[2]=","
+
+dirname/depth/append[0]/output/line[0]="a,"
+dirname/depth/append[0]/output/line[1]="a/b,a"
+dirname/depth/append[0]/output/line[2]="a/b/c,a/b"
+dirname/depth/append[1]/output/line[0]="a,"
+dirname/depth/append[1]/output/line[1]="a/b,"
+dirname/depth/append[1]/output/line[2]="a/b/c,a"
+dirname/depth/append[2]/output/line[0]="a,"
+dirname/depth/append[2]/output/line[1]="a/b,"
+dirname/depth/append[2]/output/line[2]="a/b/c,"
+dirname/depth/append[3]/output/line[0]="a,"
+dirname/depth/append[3]/output/line[1]="a/b,"
+dirname/depth/append[3]/output/line[2]="a/b/c,"
+
+dirname/depth/emplace[0]/output/line[0]=""
+dirname/depth/emplace[0]/output/line[1]="a"
+dirname/depth/emplace[0]/output/line[2]="a/b"
+dirname/depth/emplace[1]/output/line[0]=""
+dirname/depth/emplace[1]/output/line[1]=""
+dirname/depth/emplace[1]/output/line[2]="a"
+dirname/depth/emplace[2]/output/line[0]=","
+dirname/depth/emplace[2]/output/line[1]=","
+dirname/depth/emplace[2]/output/line[2]=","
+dirname/depth/emplace[3]/output/line[0]=","
+dirname/depth/emplace[3]/output/line[1]=","
+dirname/depth/emplace[3]/output/line[2]=","
+
+dirname/fixed_depth/append[0]/output/line[0]="a,"
+dirname/fixed_depth/append[0]/output/line[1]="a/b,a"
+dirname/fixed_depth/append[0]/output/line[2]="a/b/c,a/b"
+dirname/fixed_depth/append[1]/output/line[0]="a,"
+dirname/fixed_depth/append[1]/output/line[1]="a/b,a/b"
+dirname/fixed_depth/append[1]/output/line[2]="a/b/c,a/b"
+dirname/fixed_depth/append[2]/output/line[0]="a,"
+dirname/fixed_depth/append[2]/output/line[1]="a/b,"
+dirname/fixed_depth/append[2]/output/line[2]="a/b/c,a/b/c"
+dirname/fixed_depth/append[3]/output/line[0]="a,"
+dirname/fixed_depth/append[3]/output/line[1]="a/b,"
+dirname/fixed_depth/append[3]/output/line[2]="a/b/c,"
+
+dirname/fixed_depth/emplace[0]/output/line[0]=""
+dirname/fixed_depth/emplace[0]/output/line[1]="a"
+dirname/fixed_depth/emplace[0]/output/line[2]="a/b"
+dirname/fixed_depth/emplace[1]/output/line[0]=""
+dirname/fixed_depth/emplace[1]/output/line[1]="a/b"
+dirname/fixed_depth/emplace[1]/output/line[2]="a/b"
+dirname/fixed_depth/emplace[2]/output/line[0]=""
+dirname/fixed_depth/emplace[2]/output/line[1]=""
+dirname/fixed_depth/emplace[2]/output/line[2]="a/b/c"
+dirname/fixed_depth/emplace[3]/output/line[0]=","
+dirname/fixed_depth/emplace[3]/output/line[1]=","
+dirname/fixed_depth/emplace[3]/output/line[2]=","
+
+delimiter[0]/output/line[0]="a.a"
+delimiter[0]/output/line[1]="a.b.a"
+delimiter[0]/output/line[2]="a.b/c.d/e.a"
+delimiter[1]/output/line[0]="a"
+delimiter[1]/output/line[1]="a.b"
+delimiter[1]/output/line[2]="a.b/c.d/e"
+delimiter[2]/output/line[0]="a."
+delimiter[2]/output/line[1]="a.b."
+delimiter[2]/output/line[2]="a.b/c.d/e."
+delimiter[3]/output/line[0]=""
+delimiter[3]/output/line[1]=".b"
+delimiter[3]/output/line[2]=".b/c.d/e"
+
+strict[0]/output="a/b/c,a/b/c"
+strict[0]/status=1
+strict[1]/output="a/b/c"
+strict[1]/status=1
+strict[2]/output="a/b/c,"
+strict[2]/status=1
+strict[3]/output=""
+strict[3]/status=1
+strict[4]/output="a/b/c,a/b/c"
+strict[4]/status=1
+strict[5]/output="a/b/c"
+strict[5]/status=1
+
+fields[0]/output/line[0]="k,,a,,x,a,x"
+fields[0]/output/line[1]="l,,a/b,,x/y,b,y"
+fields[0]/output/line[2]="m,,a/b/c,,x/y/z,c,z"
+fields[1]/output/line[0]="k,,a,,x"
+fields[1]/output/line[1]="l,,b,,y"
+fields[1]/output/line[2]="m,,c,,z"
+fields[2]/output/line[0]="k,,,,"
+fields[2]/output/line[1]="l,,a/b,,x/y"
+fields[2]/output/line[2]="m,,b/c,,y/z"
+fields[3]/output/line[0]="k,,a,,x,,"
+fields[3]/output/line[1]="l,,a/b,,x/y,a,x"
+fields[3]/output/line[2]="m,,a/b/c,,x/y/z,a/b,x/y"
+fields[4]/output/line[0]="k,,,,"
+fields[4]/output/line[1]="l,,a,,x"
+fields[4]/output/line[2]="m,,a/b,,x/y"
+fields[5]/output/line[0]="k,,,,"
+fields[5]/output/line[1]="l,,,,"
+fields[5]/output/line[2]="m,,a,,x"
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
new file mode 100644
index 000000000..4c176c25f
--- /dev/null
+++ b/csv/test/csv-strings/input
@@ -0,0 +1,48 @@
+basename/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename"
+basename/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 2"
+basename/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 3"
+basename/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 4"
+
+basename/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --emplace"
+basename/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 2 --emplace"
+basename/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 3 --emplace"
+basename/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-basename --depth 4 --emplace"
+
+dirname/depth/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
+dirname/depth/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --depth 2"
+dirname/depth/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --depth 3"
+dirname/depth/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --depth 4"
+
+dirname/depth/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
+dirname/depth/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --depth 2 --emplace"
+dirname/depth/emplace[2]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --depth 3 --emplace"
+dirname/depth/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --depth 4 --emplace"
+
+dirname/fixed_depth/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
+dirname/fixed_depth/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 2"
+dirname/fixed_depth/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 3"
+dirname/fixed_depth/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 4"
+
+dirname/fixed_depth/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
+dirname/fixed_depth/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 2 --emplace"
+dirname/fixed_depth/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 3 --emplace"
+dirname/fixed_depth/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --fixed-depth 4 --emplace"
+
+delimiter[0]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=."
+delimiter[1]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=. --emplace"
+delimiter[2]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-dirname --delimiter=."
+delimiter[3]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-dirname --delimiter=. --emplace"
+
+strict[0]="( echo a/b/c; echo a/b ) | csv-strings path-basename --depth 3 --strict"
+strict[1]="( echo a/b/c; echo a/b ) | csv-strings path-basename --depth 3 --emplace --strict"
+strict[2]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --depth 3 --strict"
+strict[3]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --depth 3 --emplace --strict"
+strict[4]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --fixed-depth 3 --strict"
+strict[5]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --fixed-depth 3 --emplace --strict"
+
+fields[0]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n"
+fields[1]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n --emplace"
+fields[2]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n --emplace --depth 2"
+fields[3]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n"
+fields[4]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n --emplace"
+fields[5]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n --emplace --depth 2"

From 698259fddcdba67cd163de9c5f755cae54854aad Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Fri, 24 Jan 2020 14:54:39 +1100
Subject: [PATCH 0113/1056] csv-strings: path-canonical operation implemented

---
 csv/applications/csv-strings.cpp | 44 ++++++++++++++++++++++++++------
 1 file changed, 36 insertions(+), 8 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index cc1318f1c..1baa1741c 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -58,6 +58,7 @@
 
 #include <functional>
 #include <iostream>
+#include <boost/filesystem.hpp>
 #include <boost/lexical_cast.hpp>
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
@@ -75,26 +76,30 @@ static void usage( bool verbose )
     std::cerr << "operations" << std::endl;
     std::cerr << "    path-basename,basename" << std::endl;
     std::cerr << "    path-dirname,dirname" << std::endl;
+    std::cerr << "    path-realpath,path-canonical,canonical" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
+    std::cerr << "    --emplace; perform operation emplace" << std::endl;
     std::cerr << "    --fields=[<fields>]; will perform operation on any non-empty fields" << std::endl;
     std::cerr << "                         unless different semantics specified for operation" << std::endl;
     std::cerr << "                         default: perform operation on the first field" << std::endl;
     std::cerr << "    --strict; exit on strings on which operation does not make sense" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "path-basename" << std::endl;
+    std::cerr << "path-basename,basename" << std::endl;
     std::cerr << "    options" << std::endl;
     std::cerr << "        --depth=<depth>; default=1; if path length less than depth, output empty string" << std::endl;
-    std::cerr << "        --emplace; perform operation emplace" << std::endl;
     std::cerr << "        --path-delimiter,-p=<delimiter>; default=/" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "path-dirname" << std::endl;
+    std::cerr << "path-dirname,dirname" << std::endl;
     std::cerr << "    options" << std::endl;
     std::cerr << "        --depth=<depth>; default=1; if path length less than depth, output empty string" << std::endl;
-    std::cerr << "        --emplace; perform operation emplace" << std::endl;
     std::cerr << "        --fixed-depth=[<depth>]; output paths of fixed depth starting from root" << std::endl;
     std::cerr << "        --path-delimiter,-p=<delimiter>; default=/" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "path-realpath,path-canonical,canonical" << std::endl;
+    std::cerr << "    options" << std::endl;
+    std::cerr << "        --base=[<path>]; base path, default: current directory" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "csv options:" << std::endl;
     std::cerr << comma::csv::options::usage( "", verbose ) << std::endl;
     std::cerr << std::endl;
@@ -139,7 +144,6 @@ static int run( const comma::command_line_options& options )
     }
     ::csv.fields = n == 0 ? std::string( "strings[0]" ) : comma::join( v, ',' );
     if( n == 0 ) { ++n; }
-    char delimiter = options.value( "--path-delimiter,-p", '/' );
     comma::csv::input_stream< input > istream( std::cin, ::csv, input( n ) );
     std::function< void( const input& p ) > write;
     auto run_ = [&]()->int
@@ -150,7 +154,7 @@ static int run( const comma::command_line_options& options )
             const input* p = istream.read();
             if( !p ) { break; }
             input r( n );
-            for( unsigned int i = 0; i < p->strings.size(); ++i ) { r.strings[i] = t.convert( comma::split( p->strings[i], delimiter ) ); }
+            for( unsigned int i = 0; i < p->strings.size(); ++i ) { r.strings[i] = t.convert( p->strings[i] ); }
             write( r );
             if( ::csv.flush ) { std::cout.flush(); }
         }
@@ -184,8 +188,9 @@ struct basename
     {
     }
     
-    std::string convert( const std::vector< std::string >& s )
+    std::string convert( const std::string& t )
     {
+        const auto& s = comma::split( t, delimiter );
         if( s.size() < depth )
         {
             if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << depth << "; got: '" << comma::join( s, delimiter ) << "'" ); }
@@ -211,8 +216,9 @@ struct dirname
         options.assert_mutually_exclusive( "--depth,--fixed-depth" );
     }
     
-    std::string convert( const std::vector< std::string >& s )
+    std::string convert( const std::string& t )
     {
+        const auto& s = comma::split( t, delimiter );
         if( fixed_depth > 0 )
         {
             if( s.size() < fixed_depth )
@@ -231,6 +237,27 @@ struct dirname
     }
 };
 
+struct canonical
+{
+    boost::filesystem::path base;
+    
+    static const char* name() { return "canonical"; }
+    
+    canonical( const comma::command_line_options& options )
+        : base( options.exists( "--base" )
+        ? boost::filesystem::path( options.value< std::string >( "--base" ) )
+        : boost::filesystem::current_path() )
+    {
+        if( ( options.value( "--path-delimiter,-p", '/' ) ) != '/' ) { COMMA_THROW( comma::exception, "path-canonical: expected path delimiter '/'; got: '" << options.value( "--path-delimiter,-p", '/' ) << "'" ); }
+    }
+    
+    std::string convert( const std::string& s )
+    {
+        try { return boost::filesystem::canonical( boost::filesystem::path( s ), base ).string(); } catch( ... ) { if( strict ) { throw; } }
+        return s;
+    }
+};
+
 } } } } // namespace comma { namespace applications { namespace strings { namespace path {
 
 int main( int ac, char** av )
@@ -245,6 +272,7 @@ int main( int ac, char** av )
         csv = comma::csv::options( options );
         if( operation == "path-basename" || operation == "basename" ) { return comma::applications::strings::path::run< comma::applications::strings::path::basename >( options ); }
         if( operation == "path-dirname" || operation == "dirname" ) { return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
+        if( operation == "path-realpath" || operation == "path-canonical" || operation == "canonical" ) { return comma::applications::strings::path::run< comma::applications::strings::path::canonical >( options ); }
         std::cerr << "csv-strings: expection operation; got: '" << operation << "'" << std::endl;
         return 1;
     }

From 3f4288eeefae03ef050b61beef8d16da7183cd3c Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Fri, 24 Jan 2020 14:57:44 +1100
Subject: [PATCH 0114/1056] csv-strings: path-realpath renamed to path-real

---
 csv/applications/csv-strings.cpp | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index 1baa1741c..1f9d5cf36 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -76,7 +76,7 @@ static void usage( bool verbose )
     std::cerr << "operations" << std::endl;
     std::cerr << "    path-basename,basename" << std::endl;
     std::cerr << "    path-dirname,dirname" << std::endl;
-    std::cerr << "    path-realpath,path-canonical,canonical" << std::endl;
+    std::cerr << "    path-real,path-canonical,canonical" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --emplace; perform operation emplace" << std::endl;
@@ -96,7 +96,7 @@ static void usage( bool verbose )
     std::cerr << "        --fixed-depth=[<depth>]; output paths of fixed depth starting from root" << std::endl;
     std::cerr << "        --path-delimiter,-p=<delimiter>; default=/" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "path-realpath,path-canonical,canonical" << std::endl;
+    std::cerr << "path-real,path-canonical,canonical" << std::endl;
     std::cerr << "    options" << std::endl;
     std::cerr << "        --base=[<path>]; base path, default: current directory" << std::endl;
     std::cerr << std::endl;
@@ -272,7 +272,7 @@ int main( int ac, char** av )
         csv = comma::csv::options( options );
         if( operation == "path-basename" || operation == "basename" ) { return comma::applications::strings::path::run< comma::applications::strings::path::basename >( options ); }
         if( operation == "path-dirname" || operation == "dirname" ) { return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
-        if( operation == "path-realpath" || operation == "path-canonical" || operation == "canonical" ) { return comma::applications::strings::path::run< comma::applications::strings::path::canonical >( options ); }
+        if( operation == "path-real" || operation == "path-canonical" || operation == "canonical" ) { return comma::applications::strings::path::run< comma::applications::strings::path::canonical >( options ); }
         std::cerr << "csv-strings: expection operation; got: '" << operation << "'" << std::endl;
         return 1;
     }

From 77d22ff530945bd1a07e11efcdf6b0b5abef4125 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Fri, 24 Jan 2020 19:18:18 +1100
Subject: [PATCH 0115/1056] string: split_bracketed(): first cut implemented

---
 string/split.cpp            | 40 ++++++++++++++++++++++++++++++++++++-
 string/split.h              | 11 +++++-----
 string/test/string_test.cpp | 33 ++++++++++++++++++++++++++++++
 3 files changed, 78 insertions(+), 6 deletions(-)

diff --git a/string/split.cpp b/string/split.cpp
index fd09fe931..25b4d80ae 100644
--- a/string/split.cpp
+++ b/string/split.cpp
@@ -70,7 +70,7 @@ std::vector< std::string > split_escaped( const std::string & s, const char * se
     std::vector< std::string > v;
     const char* begin( &s[0] );
     const char* const end( begin + s.length() );
-    boost::optional<char> quoted;
+    boost::optional< char > quoted;
     v.push_back( std::string() );
     for( const char* p = begin; p < end; ++p )
     {
@@ -108,4 +108,42 @@ std::vector< std::string > split_escaped( const std::string & s, char separator,
     return split_escaped( s, separators, quotes, escape );
 }
 
+std::vector< std::string > split_bracketed( const std::string& s, const char* separators, char lbracket, char rbracket )
+{
+    std::vector< std::string > v;
+    const char* begin( &s[0] );
+    const char* const end( begin + s.length() );
+    unsigned int depth = 0;
+    v.push_back( std::string() );
+    for( const char* p = begin; p < end; ++p )
+    {
+        if( lbracket == *p )
+        {
+            ++depth;
+            v.back() += *p;
+        }
+        else if( rbracket == *p )
+        {
+            if( depth > 0 ) { --depth; }
+            v.back() += *p;
+        }
+        else if( depth == 0 && string::is_one_of( *p, separators ) )
+        {
+            v.push_back( std::string() );
+        }
+        else
+        {
+            v.back() += *p;
+        }
+    }
+    return v;
+}
+
+std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket, char rbracket )
+{
+    const char separators[] = { separator, 0 };
+    return split_bracketed( s, separators, lbracket, rbracket );
+}
+
+
 } // namespace comma {
diff --git a/string/split.h b/string/split.h
index ec8f176e3..8de556dbc 100644
--- a/string/split.h
+++ b/string/split.h
@@ -27,11 +27,9 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_STRING_SPLIT_H_
-#define COMMA_STRING_SPLIT_H_
+#pragma once
 
 #include <string>
 #include <vector>
@@ -59,7 +57,7 @@ std::vector< std::string > split( const std::string& s, char separator, bool emp
 /// An escape character will only escape a delimiter, quote or escape character;
 /// escaping any other character will result in both being kept;
 /// e.g. c:\windows\ will be kept as c:\windows\ with the trailing backslash
-/// e.g. fname;delimiter=\\;field=a,b will be kept as fname;delimiter=\;field=a,b 
+/// e.g. filename;delimiter=\\;fields=a,b will be kept as filename;delimiter=\;fields=a,b 
 ///
 /// A quote may be anywhere in a string. Quotes must be closed; i.e Each start
 /// quote must be paired with an end quote, or an exception is thrown.
@@ -69,7 +67,10 @@ std::vector< std::string > split_escaped( const std::string& s, const char * sep
 /// split string into tokens; always contains at least one element;
 /// skips backslash escaped seperator, handle boolean quotes 
 std::vector< std::string > split_escaped( const std::string& s, char separator, const char * quotes = "\"\'", char escape = '\\' );
+/// skips bracketed separators
+std::vector< std::string > split_bracketed( const std::string& s, const char * separators = " ", char lbracket = '(', char rbrackets = ')' );
+/// skips bracketed separators
+std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket = '(', char rbracket = ')' );
 
 } // namespace comma {
 
-#endif // COMMA_STRING_SPLIT_H_
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index 4fb612134..00a6775b3 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -282,6 +282,39 @@ TEST( string, split_escaped_quoted )
     }
 }
 
+TEST( string, split_bracketed )
+{
+    {
+        std::vector< std::string > v( split_bracketed( "" ) );
+        EXPECT_EQ( 1u, v.size() );
+        EXPECT_EQ( "", v[0] );
+    }
+    {
+        std::vector< std::string > v( split_bracketed( ")()" ) );
+        EXPECT_EQ( 1u, v.size() );
+        EXPECT_EQ( ")()", v[0] );
+    }
+    {
+        std::vector< std::string > v( split_bracketed( ")(,)" ) );
+        EXPECT_EQ( 1u, v.size() );
+        EXPECT_EQ( ")(,)", v[0] );
+    }
+    {
+        std::vector< std::string > v( split_bracketed( "a[,b,c],d", ',', '[', ']' ) );
+        EXPECT_EQ( 2u, v.size() );
+        EXPECT_EQ( "a[,b,c]", v[0] );
+        EXPECT_EQ( "d", v[1] );
+    }
+    {
+        std::vector< std::string > v( split_bracketed( "a,( b, c, d ),e( f ( g, h ) ), i", ',' ) );
+        EXPECT_EQ( 4u, v.size() );
+        EXPECT_EQ( "a", v[0] );
+        EXPECT_EQ( "( b, c, d )", v[1] );
+        EXPECT_EQ( "e( f ( g, h ) )", v[2] );
+        EXPECT_EQ( " i", v[3] );
+    }
+}
+
 TEST( string, strip )
 {
     EXPECT_EQ( strip( "", ";" ), "" );

From 4aff56b60f57d9aa43972b0985bc03d08c8f7f09 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Fri, 24 Jan 2020 19:50:22 +1100
Subject: [PATCH 0116/1056] string: split_bracketed(): strip_brackets parameter
 added, default set to true

---
 string/split.cpp            | 17 ++++++++++-----
 string/split.h              |  4 ++--
 string/test/string_test.cpp | 43 ++++++++++++++++++++++++++++---------
 3 files changed, 47 insertions(+), 17 deletions(-)

diff --git a/string/split.cpp b/string/split.cpp
index 25b4d80ae..8a4eb6888 100644
--- a/string/split.cpp
+++ b/string/split.cpp
@@ -108,7 +108,7 @@ std::vector< std::string > split_escaped( const std::string & s, char separator,
     return split_escaped( s, separators, quotes, escape );
 }
 
-std::vector< std::string > split_bracketed( const std::string& s, const char* separators, char lbracket, char rbracket )
+std::vector< std::string > split_bracketed( const std::string& s, const char* separators, char lbracket, char rbracket, bool strip_brackets )
 {
     std::vector< std::string > v;
     const char* begin( &s[0] );
@@ -119,13 +119,20 @@ std::vector< std::string > split_bracketed( const std::string& s, const char* se
     {
         if( lbracket == *p )
         {
+            if( strip_brackets && depth == 0 )
+            {
+                if( !v.back().empty() ) { COMMA_THROW( comma::exception, "asked to strip brackets; expected opening bracket immediately following separator, got'" << s << "'" ); }
+            }
+            else
+            {
+                v.back() += *p;
+            }
             ++depth;
-            v.back() += *p;
         }
         else if( rbracket == *p )
         {
+            if( !strip_brackets || depth > 1 ) { v.back() += *p; }
             if( depth > 0 ) { --depth; }
-            v.back() += *p;
         }
         else if( depth == 0 && string::is_one_of( *p, separators ) )
         {
@@ -139,10 +146,10 @@ std::vector< std::string > split_bracketed( const std::string& s, const char* se
     return v;
 }
 
-std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket, char rbracket )
+std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket, char rbracket, bool strip_brackets )
 {
     const char separators[] = { separator, 0 };
-    return split_bracketed( s, separators, lbracket, rbracket );
+    return split_bracketed( s, separators, lbracket, rbracket, strip_brackets );
 }
 
 
diff --git a/string/split.h b/string/split.h
index 8de556dbc..a12403aa1 100644
--- a/string/split.h
+++ b/string/split.h
@@ -68,9 +68,9 @@ std::vector< std::string > split_escaped( const std::string& s, const char * sep
 /// skips backslash escaped seperator, handle boolean quotes 
 std::vector< std::string > split_escaped( const std::string& s, char separator, const char * quotes = "\"\'", char escape = '\\' );
 /// skips bracketed separators
-std::vector< std::string > split_bracketed( const std::string& s, const char * separators = " ", char lbracket = '(', char rbrackets = ')' );
+std::vector< std::string > split_bracketed( const std::string& s, const char * separators = " ", char lbracket = '(', char rbrackets = ')', bool strip_brackets = true );
 /// skips bracketed separators
-std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket = '(', char rbracket = ')' );
+std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket = '(', char rbracket = ')', bool strip_brackets = true );
 
 } // namespace comma {
 
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index 00a6775b3..8b9e75059 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -290,27 +290,50 @@ TEST( string, split_bracketed )
         EXPECT_EQ( "", v[0] );
     }
     {
-        std::vector< std::string > v( split_bracketed( ")()" ) );
+        std::vector< std::string > v( split_bracketed( "()", ',' ) );
         EXPECT_EQ( 1u, v.size() );
-        EXPECT_EQ( ")()", v[0] );
+        EXPECT_EQ( "", v[0] );
+    }
+    {
+        std::vector< std::string > v( split_bracketed( "(),(),()", ',' ) );
+        EXPECT_EQ( 3u, v.size() );
+        EXPECT_EQ( "", v[0] );
+        EXPECT_EQ( "", v[1] );
+        EXPECT_EQ( "", v[2] );
     }
     {
-        std::vector< std::string > v( split_bracketed( ")(,)" ) );
+        std::vector< std::string > v( split_bracketed( ")()", ',', '(', ')', false ) );
         EXPECT_EQ( 1u, v.size() );
-        EXPECT_EQ( ")(,)", v[0] );
+        EXPECT_EQ( ")()", v[0] );
     }
     {
-        std::vector< std::string > v( split_bracketed( "a[,b,c],d", ',', '[', ']' ) );
-        EXPECT_EQ( 2u, v.size() );
-        EXPECT_EQ( "a[,b,c]", v[0] );
-        EXPECT_EQ( "d", v[1] );
+        std::vector< std::string > v( split_bracketed( "(),(,),(,)", ',' ) );
+        EXPECT_EQ( 3u, v.size() );
+        EXPECT_EQ( "", v[0] );
+        EXPECT_EQ( ",", v[1] );
+        EXPECT_EQ( ",", v[2] );
+    }
+    {
+        std::vector< std::string > v( split_bracketed( "a,[,b,[c]],d", ',', '[', ']' ) );
+        EXPECT_EQ( 3u, v.size() );
+        EXPECT_EQ( "a", v[0] );
+        EXPECT_EQ( ",b,[c]", v[1] );
+        EXPECT_EQ( "d", v[2] );
+    }
+    {
+        std::vector< std::string > v( split_bracketed( "a,( b, c, d ),( f ( g, h ) ), i", ',' ) );
+        EXPECT_EQ( 4u, v.size() );
+        EXPECT_EQ( "a", v[0] );
+        EXPECT_EQ( " b, c, d ", v[1] );
+        EXPECT_EQ( " f ( g, h ) ", v[2] );
+        EXPECT_EQ( " i", v[3] );
     }
     {
-        std::vector< std::string > v( split_bracketed( "a,( b, c, d ),e( f ( g, h ) ), i", ',' ) );
+        std::vector< std::string > v( split_bracketed( "a,( b, c, d ),( f ( g, h ) ), i", ',', '(', ')', false ) );
         EXPECT_EQ( 4u, v.size() );
         EXPECT_EQ( "a", v[0] );
         EXPECT_EQ( "( b, c, d )", v[1] );
-        EXPECT_EQ( "e( f ( g, h ) )", v[2] );
+        EXPECT_EQ( "( f ( g, h ) )", v[2] );
         EXPECT_EQ( " i", v[3] );
     }
 }

From d7a2dcddfba0124a3add3fe7d57a67d5cd1077df Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 28 Jan 2020 17:56:57 +1100
Subject: [PATCH 0117/1056] csv-string: minor refactoring

---
 csv/applications/csv-strings.cpp | 54 +++++++++++++++++++++++---------
 1 file changed, 40 insertions(+), 14 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index 1f9d5cf36..2f2ec04b8 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -111,20 +111,23 @@ static comma::csv::options csv;
 
 namespace comma { namespace applications { namespace strings { namespace path {
 
-struct input
+template < typename T >
+struct record
 { 
-    std::vector< std::string > strings;
-    input( unsigned int n = 0 ): strings( n ) {}
+    std::vector< T > values;
+    record( unsigned int n = 0 ): values( n ) {}
 };
 
+typedef record< std::string > input;
+
 } } } } // namespace comma { namespace applications { namespace strings { namespace path {
 
 namespace comma { namespace visiting {
 
-template <> struct traits< comma::applications::strings::path::input >
+template < typename T > struct traits< comma::applications::strings::path::record< T > >
 {
-    template < typename K, typename V > static void visit( const K&, const comma::applications::strings::path::input& p, V& v ) { v.apply( "strings", p.strings ); }
-    template < typename K, typename V > static void visit( const K&, comma::applications::strings::path::input& p, V& v ) { v.apply( "strings", p.strings ); }
+    template < typename K, typename V > static void visit( const K&, const comma::applications::strings::path::record< T >& p, V& v ) { v.apply( "values", p.values ); }
+    template < typename K, typename V > static void visit( const K&, comma::applications::strings::path::record< T >& p, V& v ) { v.apply( "values", p.values ); }
 };
 
 } } // namespace comma { namespace visiting {
@@ -139,10 +142,10 @@ static int run( const comma::command_line_options& options )
     for( unsigned int i = 0; i < v.size(); ++i )
     {
         if( v[i].empty() ) { continue; }
-        v[i] = "strings[" + boost::lexical_cast< std::string >( n ) + "]";
+        v[i] = "values[" + boost::lexical_cast< std::string >( n ) + "]";
         ++n;
     }
-    ::csv.fields = n == 0 ? std::string( "strings[0]" ) : comma::join( v, ',' );
+    ::csv.fields = n == 0 ? std::string( "values[0]" ) : comma::join( v, ',' );
     if( n == 0 ) { ++n; }
     comma::csv::input_stream< input > istream( std::cin, ::csv, input( n ) );
     std::function< void( const input& p ) > write;
@@ -153,8 +156,8 @@ static int run( const comma::command_line_options& options )
         {
             const input* p = istream.read();
             if( !p ) { break; }
-            input r( n );
-            for( unsigned int i = 0; i < p->strings.size(); ++i ) { r.strings[i] = t.convert( p->strings[i] ); }
+            typename T::output_t r( n );
+            for( unsigned int i = 0; i < p->values.size(); ++i ) { r.values[i] = t.convert( p->values[i] ); }
             write( r );
             if( ::csv.flush ) { std::cout.flush(); }
         }
@@ -167,16 +170,18 @@ static int run( const comma::command_line_options& options )
         return run_();
     }
     comma::csv::options output_csv = ::csv;
-    output_csv.fields = "strings";
+    output_csv.fields = "values";
     if( ::csv.binary() ) { std::cerr << "csv-strings: path-" << T::name() << ": binary mode supported only for --emplace; todo, just ask" << std::endl; exit( 1 ); }
-    comma::csv::output_stream< input > ostream( std::cout, output_csv, input( n ) );
-    comma::csv::tied< input, input > tied( istream, ostream );
-    write = [&]( const input& p ) { tied.append( p ); };
+    comma::csv::output_stream< typename T::output_t > ostream( std::cout, output_csv, input( n ) );
+    comma::csv::tied< input, typename T::output_t > tied( istream, ostream );
+    write = [&]( const typename T::output_t& p ) { tied.append( p ); };
     return run_();
 }
 
 struct basename
 {
+    typedef input output_t;
+    
     unsigned int depth;
     char delimiter;
     
@@ -202,6 +207,8 @@ struct basename
 
 struct dirname
 {
+    typedef input output_t;
+    
     unsigned int depth;
     unsigned int fixed_depth;
     char delimiter;
@@ -239,6 +246,8 @@ struct dirname
 
 struct canonical
 {
+    typedef input output_t;
+    
     boost::filesystem::path base;
     
     static const char* name() { return "canonical"; }
@@ -258,6 +267,22 @@ struct canonical
     }
 };
 
+// struct is_leaf // todo: refactor, reuse generic run
+// {
+//     typedef record< unsigned int > output_t;
+//     
+//     std::string last;
+//     
+//     static const char* name() { return "is-leaf"; }
+//     
+//     is_leaf( const comma::command_line_options& ) {}
+//     
+//     unsigned int convert( const std::string& s )
+//     {
+//         bool r = s 
+//     }
+// };
+
 } } } } // namespace comma { namespace applications { namespace strings { namespace path {
 
 int main( int ac, char** av )
@@ -272,6 +297,7 @@ int main( int ac, char** av )
         csv = comma::csv::options( options );
         if( operation == "path-basename" || operation == "basename" ) { return comma::applications::strings::path::run< comma::applications::strings::path::basename >( options ); }
         if( operation == "path-dirname" || operation == "dirname" ) { return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
+        if( operation == "path-is-leaf" || operation == "is-leaf" ) {} //{ return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
         if( operation == "path-real" || operation == "path-canonical" || operation == "canonical" ) { return comma::applications::strings::path::run< comma::applications::strings::path::canonical >( options ); }
         std::cerr << "csv-strings: expection operation; got: '" << operation << "'" << std::endl;
         return 1;

From 91fa88e4fb858f9f7d22c1b379474ea22b208bd5 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 28 Jan 2020 18:02:58 +1100
Subject: [PATCH 0118/1056] csv-string: commented code removed

---
 csv/applications/csv-strings.cpp | 17 -----------------
 1 file changed, 17 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index 2f2ec04b8..9acc1b6e1 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -267,22 +267,6 @@ struct canonical
     }
 };
 
-// struct is_leaf // todo: refactor, reuse generic run
-// {
-//     typedef record< unsigned int > output_t;
-//     
-//     std::string last;
-//     
-//     static const char* name() { return "is-leaf"; }
-//     
-//     is_leaf( const comma::command_line_options& ) {}
-//     
-//     unsigned int convert( const std::string& s )
-//     {
-//         bool r = s 
-//     }
-// };
-
 } } } } // namespace comma { namespace applications { namespace strings { namespace path {
 
 int main( int ac, char** av )
@@ -297,7 +281,6 @@ int main( int ac, char** av )
         csv = comma::csv::options( options );
         if( operation == "path-basename" || operation == "basename" ) { return comma::applications::strings::path::run< comma::applications::strings::path::basename >( options ); }
         if( operation == "path-dirname" || operation == "dirname" ) { return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
-        if( operation == "path-is-leaf" || operation == "is-leaf" ) {} //{ return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
         if( operation == "path-real" || operation == "path-canonical" || operation == "canonical" ) { return comma::applications::strings::path::run< comma::applications::strings::path::canonical >( options ); }
         std::cerr << "csv-strings: expection operation; got: '" << operation << "'" << std::endl;
         return 1;

From ce440fac972947173504d82f73f4313a6c7300c9 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 29 Jan 2020 14:48:39 +1100
Subject: [PATCH 0119/1056] csv-strings: --fixed-depth, --depth: replaced with
 --head and --tail

---
 csv/applications/csv-strings.cpp | 53 ++++++++++++++++----------------
 csv/test/csv-strings/input       | 52 +++++++++++++++----------------
 2 files changed, 53 insertions(+), 52 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index 9acc1b6e1..c1fa2feea 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -87,13 +87,14 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "path-basename,basename" << std::endl;
     std::cerr << "    options" << std::endl;
-    std::cerr << "        --depth=<depth>; default=1; if path length less than depth, output empty string" << std::endl;
+    std::cerr << "        --head=<depth>; default=0; number of path elements at the beginning of the path to remove" << std::endl;
+    std::cerr << "        --tail=<depth>; default=1; number of path elements at the end of the path to keep" << std::endl;
     std::cerr << "        --path-delimiter,-p=<delimiter>; default=/" << std::endl;
     std::cerr << std::endl;
     std::cerr << "path-dirname,dirname" << std::endl;
     std::cerr << "    options" << std::endl;
-    std::cerr << "        --depth=<depth>; default=1; if path length less than depth, output empty string" << std::endl;
-    std::cerr << "        --fixed-depth=[<depth>]; output paths of fixed depth starting from root" << std::endl;
+    std::cerr << "        --head=<depth>; default=0; number of path elements at the beginning of the path to keep" << std::endl;
+    std::cerr << "        --tail=<depth>; default=1; number of path elements at the end of the path to remove" << std::endl;
     std::cerr << "        --path-delimiter,-p=<delimiter>; default=/" << std::endl;
     std::cerr << std::endl;
     std::cerr << "path-real,path-canonical,canonical" << std::endl;
@@ -182,26 +183,32 @@ struct basename
 {
     typedef input output_t;
     
-    unsigned int depth;
+    unsigned int head;
+    unsigned int tail;
     char delimiter;
     
     static const char* name() { return "basename"; }
     
     basename( const comma::command_line_options& options )
-        : depth( options.value( "--depth", 1 ) )
+        : head( options.value( "--head", 0 ) )
+        , tail( options.value( "--tail", 1 ) )
         , delimiter( options.value( "--path-delimiter,-p", '/' ) )
     {
+        options.assert_mutually_exclusive( "--head,--tail" );
     }
     
     std::string convert( const std::string& t )
     {
         const auto& s = comma::split( t, delimiter );
-        if( s.size() < depth )
+        if( head > 0 )
         {
-            if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << depth << "; got: '" << comma::join( s, delimiter ) << "'" ); }
+            if( s.size() >= head ) { return comma::join( s.begin() + head, s.end(), delimiter ); }
+            if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
             return "";
         }
-        return comma::join( s.end() - depth, s.end(), delimiter );
+        if( s.size() >= tail ) { return comma::join( s.end() - tail, s.end(), delimiter ); }
+        if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
+        return "";
     }
 };
 
@@ -209,38 +216,32 @@ struct dirname
 {
     typedef input output_t;
     
-    unsigned int depth;
-    unsigned int fixed_depth;
+    unsigned int head;
+    unsigned int tail;
     char delimiter;
     
     static const char* name() { return "dirname"; }
     
     dirname( const comma::command_line_options& options )
-        : depth( options.value( "--depth", 1 ) )
-        , fixed_depth( options.value( "--fixed-depth", 0 ) )
+        : head( options.value( "--head", 0 ) )
+        , tail( options.value( "--tail", 1 ) )
         , delimiter( options.value( "--path-delimiter,-p", '/' ) )
     {
-        options.assert_mutually_exclusive( "--depth,--fixed-depth" );
+        options.assert_mutually_exclusive( "--head,--tail" );
     }
     
     std::string convert( const std::string& t )
     {
         const auto& s = comma::split( t, delimiter );
-        if( fixed_depth > 0 )
+        if( head > 0 )
         {
-            if( s.size() < fixed_depth )
-            {
-                if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << fixed_depth << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-                return "";
-            }
-            return comma::join( s, fixed_depth, delimiter );
-        }
-        if( s.size() < depth )
-        {
-            if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << depth << "; got: '" << comma::join( s, '/' ) << "'" ); }
+            if( s.size() >= head ) { return comma::join( s.begin(), s.begin() + head, delimiter ); }
+            if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
             return "";
         }
-        return comma::join( s.begin(), s.end() - depth, delimiter );
+        if( s.size() >= tail ) { return comma::join( s.begin(), s.end() - tail, delimiter ); }
+        if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
+        return "";
     }
 };
 
@@ -274,7 +275,7 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        const auto& unnamed = options.unnamed( "--flush,--verbose,-v,--emplace", "-.*" );
+        const auto& unnamed = options.unnamed( "--flush,--verbose,-v,--emplace,--strict", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-strings: please specify operation" << std::endl; return 1; }
         std::string operation = unnamed[0];
         strict = options.exists( "--strict" );
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
index 4c176c25f..3966a6308 100644
--- a/csv/test/csv-strings/input
+++ b/csv/test/csv-strings/input
@@ -1,48 +1,48 @@
 basename/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename"
-basename/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 2"
-basename/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 3"
-basename/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 4"
+basename/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 2"
+basename/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 3"
+basename/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 4"
 
 basename/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --emplace"
-basename/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 2 --emplace"
-basename/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --depth 3 --emplace"
-basename/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-basename --depth 4 --emplace"
+basename/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 2 --emplace"
+basename/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 3 --emplace"
+basename/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-basename --tail 4 --emplace"
 
 dirname/depth/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
-dirname/depth/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --depth 2"
-dirname/depth/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --depth 3"
-dirname/depth/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --depth 4"
+dirname/depth/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2"
+dirname/depth/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 3"
+dirname/depth/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 4"
 
 dirname/depth/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
-dirname/depth/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --depth 2 --emplace"
-dirname/depth/emplace[2]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --depth 3 --emplace"
-dirname/depth/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --depth 4 --emplace"
+dirname/depth/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2 --emplace"
+dirname/depth/emplace[2]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 3 --emplace"
+dirname/depth/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 4 --emplace"
 
 dirname/fixed_depth/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
-dirname/fixed_depth/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 2"
-dirname/fixed_depth/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 3"
-dirname/fixed_depth/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 4"
+dirname/fixed_depth/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2"
+dirname/fixed_depth/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3"
+dirname/fixed_depth/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 4"
 
 dirname/fixed_depth/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
-dirname/fixed_depth/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 2 --emplace"
-dirname/fixed_depth/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --fixed-depth 3 --emplace"
-dirname/fixed_depth/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --fixed-depth 4 --emplace"
+dirname/fixed_depth/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2 --emplace"
+dirname/fixed_depth/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3 --emplace"
+dirname/fixed_depth/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --head 4 --emplace"
 
 delimiter[0]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=."
 delimiter[1]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=. --emplace"
 delimiter[2]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-dirname --delimiter=."
 delimiter[3]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-dirname --delimiter=. --emplace"
 
-strict[0]="( echo a/b/c; echo a/b ) | csv-strings path-basename --depth 3 --strict"
-strict[1]="( echo a/b/c; echo a/b ) | csv-strings path-basename --depth 3 --emplace --strict"
-strict[2]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --depth 3 --strict"
-strict[3]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --depth 3 --emplace --strict"
-strict[4]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --fixed-depth 3 --strict"
-strict[5]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --fixed-depth 3 --emplace --strict"
+strict[0]="( echo a/b/c; echo a/b ) | csv-strings path-basename --tail 3 --strict"
+strict[1]="( echo a/b/c; echo a/b ) | csv-strings path-basename --tail 3 --emplace --strict"
+strict[2]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --tail 3 --strict"
+strict[3]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --tail 3 --emplace --strict"
+strict[4]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --head 3 --strict"
+strict[5]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --head 3 --emplace --strict"
 
 fields[0]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n"
 fields[1]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n --emplace"
-fields[2]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n --emplace --depth 2"
+fields[2]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n --emplace --tail 2"
 fields[3]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n"
 fields[4]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n --emplace"
-fields[5]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n --emplace --depth 2"
+fields[5]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n --emplace --tail 2"

From f9ca8f4e841142a912df3429499bd2f044536696 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 29 Jan 2020 14:58:19 +1100
Subject: [PATCH 0120/1056] csv-strings: basename --head: unit tests added

---
 csv/test/csv-strings/expected | 110 +++++++++++++++++++---------------
 csv/test/csv-strings/input    |  44 ++++++++------
 2 files changed, 87 insertions(+), 67 deletions(-)

diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
index 47409cc92..4432d8d83 100644
--- a/csv/test/csv-strings/expected
+++ b/csv/test/csv-strings/expected
@@ -24,57 +24,71 @@ basename/emplace[3]/output/line[0]=","
 basename/emplace[3]/output/line[1]=","
 basename/emplace[3]/output/line[2]=","
 
-dirname/depth/append[0]/output/line[0]="a,"
-dirname/depth/append[0]/output/line[1]="a/b,a"
-dirname/depth/append[0]/output/line[2]="a/b/c,a/b"
-dirname/depth/append[1]/output/line[0]="a,"
-dirname/depth/append[1]/output/line[1]="a/b,"
-dirname/depth/append[1]/output/line[2]="a/b/c,a"
-dirname/depth/append[2]/output/line[0]="a,"
-dirname/depth/append[2]/output/line[1]="a/b,"
-dirname/depth/append[2]/output/line[2]="a/b/c,"
-dirname/depth/append[3]/output/line[0]="a,"
-dirname/depth/append[3]/output/line[1]="a/b,"
-dirname/depth/append[3]/output/line[2]="a/b/c,"
+basename/head/append[0]/output/line[0]="a,"
+basename/head/append[0]/output/line[1]="a/b,b"
+basename/head/append[0]/output/line[2]="a/b/c,b/c"
+basename/head/append[1]/output/line[0]="a,"
+basename/head/append[1]/output/line[1]="a/b,"
+basename/head/append[1]/output/line[2]="a/b/c,c"
 
-dirname/depth/emplace[0]/output/line[0]=""
-dirname/depth/emplace[0]/output/line[1]="a"
-dirname/depth/emplace[0]/output/line[2]="a/b"
-dirname/depth/emplace[1]/output/line[0]=""
-dirname/depth/emplace[1]/output/line[1]=""
-dirname/depth/emplace[1]/output/line[2]="a"
-dirname/depth/emplace[2]/output/line[0]=","
-dirname/depth/emplace[2]/output/line[1]=","
-dirname/depth/emplace[2]/output/line[2]=","
-dirname/depth/emplace[3]/output/line[0]=","
-dirname/depth/emplace[3]/output/line[1]=","
-dirname/depth/emplace[3]/output/line[2]=","
+basename/head/emplace[0]/output/line[0]=""
+basename/head/emplace[0]/output/line[1]="b"
+basename/head/emplace[0]/output/line[2]="b/c"
+basename/head/emplace[1]/output/line[0]=""
+basename/head/emplace[1]/output/line[1]=""
+basename/head/emplace[1]/output/line[2]="c"
 
-dirname/fixed_depth/append[0]/output/line[0]="a,"
-dirname/fixed_depth/append[0]/output/line[1]="a/b,a"
-dirname/fixed_depth/append[0]/output/line[2]="a/b/c,a/b"
-dirname/fixed_depth/append[1]/output/line[0]="a,"
-dirname/fixed_depth/append[1]/output/line[1]="a/b,a/b"
-dirname/fixed_depth/append[1]/output/line[2]="a/b/c,a/b"
-dirname/fixed_depth/append[2]/output/line[0]="a,"
-dirname/fixed_depth/append[2]/output/line[1]="a/b,"
-dirname/fixed_depth/append[2]/output/line[2]="a/b/c,a/b/c"
-dirname/fixed_depth/append[3]/output/line[0]="a,"
-dirname/fixed_depth/append[3]/output/line[1]="a/b,"
-dirname/fixed_depth/append[3]/output/line[2]="a/b/c,"
+dirname/tail/append[0]/output/line[0]="a,"
+dirname/tail/append[0]/output/line[1]="a/b,a"
+dirname/tail/append[0]/output/line[2]="a/b/c,a/b"
+dirname/tail/append[1]/output/line[0]="a,"
+dirname/tail/append[1]/output/line[1]="a/b,"
+dirname/tail/append[1]/output/line[2]="a/b/c,a"
+dirname/tail/append[2]/output/line[0]="a,"
+dirname/tail/append[2]/output/line[1]="a/b,"
+dirname/tail/append[2]/output/line[2]="a/b/c,"
+dirname/tail/append[3]/output/line[0]="a,"
+dirname/tail/append[3]/output/line[1]="a/b,"
+dirname/tail/append[3]/output/line[2]="a/b/c,"
 
-dirname/fixed_depth/emplace[0]/output/line[0]=""
-dirname/fixed_depth/emplace[0]/output/line[1]="a"
-dirname/fixed_depth/emplace[0]/output/line[2]="a/b"
-dirname/fixed_depth/emplace[1]/output/line[0]=""
-dirname/fixed_depth/emplace[1]/output/line[1]="a/b"
-dirname/fixed_depth/emplace[1]/output/line[2]="a/b"
-dirname/fixed_depth/emplace[2]/output/line[0]=""
-dirname/fixed_depth/emplace[2]/output/line[1]=""
-dirname/fixed_depth/emplace[2]/output/line[2]="a/b/c"
-dirname/fixed_depth/emplace[3]/output/line[0]=","
-dirname/fixed_depth/emplace[3]/output/line[1]=","
-dirname/fixed_depth/emplace[3]/output/line[2]=","
+dirname/tail/emplace[0]/output/line[0]=""
+dirname/tail/emplace[0]/output/line[1]="a"
+dirname/tail/emplace[0]/output/line[2]="a/b"
+dirname/tail/emplace[1]/output/line[0]=""
+dirname/tail/emplace[1]/output/line[1]=""
+dirname/tail/emplace[1]/output/line[2]="a"
+dirname/tail/emplace[2]/output/line[0]=","
+dirname/tail/emplace[2]/output/line[1]=","
+dirname/tail/emplace[2]/output/line[2]=","
+dirname/tail/emplace[3]/output/line[0]=","
+dirname/tail/emplace[3]/output/line[1]=","
+dirname/tail/emplace[3]/output/line[2]=","
+
+dirname/head/append[0]/output/line[0]="a,"
+dirname/head/append[0]/output/line[1]="a/b,a"
+dirname/head/append[0]/output/line[2]="a/b/c,a/b"
+dirname/head/append[1]/output/line[0]="a,"
+dirname/head/append[1]/output/line[1]="a/b,a/b"
+dirname/head/append[1]/output/line[2]="a/b/c,a/b"
+dirname/head/append[2]/output/line[0]="a,"
+dirname/head/append[2]/output/line[1]="a/b,"
+dirname/head/append[2]/output/line[2]="a/b/c,a/b/c"
+dirname/head/append[3]/output/line[0]="a,"
+dirname/head/append[3]/output/line[1]="a/b,"
+dirname/head/append[3]/output/line[2]="a/b/c,"
+
+dirname/head/emplace[0]/output/line[0]=""
+dirname/head/emplace[0]/output/line[1]="a"
+dirname/head/emplace[0]/output/line[2]="a/b"
+dirname/head/emplace[1]/output/line[0]=""
+dirname/head/emplace[1]/output/line[1]="a/b"
+dirname/head/emplace[1]/output/line[2]="a/b"
+dirname/head/emplace[2]/output/line[0]=""
+dirname/head/emplace[2]/output/line[1]=""
+dirname/head/emplace[2]/output/line[2]="a/b/c"
+dirname/head/emplace[3]/output/line[0]=","
+dirname/head/emplace[3]/output/line[1]=","
+dirname/head/emplace[3]/output/line[2]=","
 
 delimiter[0]/output/line[0]="a.a"
 delimiter[0]/output/line[1]="a.b.a"
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
index 3966a6308..b02076f42 100644
--- a/csv/test/csv-strings/input
+++ b/csv/test/csv-strings/input
@@ -8,25 +8,31 @@ basename/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basenam
 basename/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 3 --emplace"
 basename/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-basename --tail 4 --emplace"
 
-dirname/depth/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
-dirname/depth/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2"
-dirname/depth/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 3"
-dirname/depth/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 4"
-
-dirname/depth/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
-dirname/depth/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2 --emplace"
-dirname/depth/emplace[2]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 3 --emplace"
-dirname/depth/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 4 --emplace"
-
-dirname/fixed_depth/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
-dirname/fixed_depth/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2"
-dirname/fixed_depth/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3"
-dirname/fixed_depth/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 4"
-
-dirname/fixed_depth/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
-dirname/fixed_depth/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2 --emplace"
-dirname/fixed_depth/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3 --emplace"
-dirname/fixed_depth/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --head 4 --emplace"
+basename/head/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 1"
+basename/head/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 2"
+
+basename/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 1 --emplace"
+basename/head/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 2 --emplace"
+
+dirname/tail/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
+dirname/tail/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2"
+dirname/tail/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 3"
+dirname/tail/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 4"
+
+dirname/tail/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
+dirname/tail/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2 --emplace"
+dirname/tail/emplace[2]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 3 --emplace"
+dirname/tail/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 4 --emplace"
+
+dirname/head/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
+dirname/head/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2"
+dirname/head/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3"
+dirname/head/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 4"
+
+dirname/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
+dirname/head/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2 --emplace"
+dirname/head/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3 --emplace"
+dirname/head/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --head 4 --emplace"
 
 delimiter[0]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=."
 delimiter[1]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=. --emplace"

From a36ed3bc3db3d22da85736b5068ba4a262a98b6c Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Fri, 31 Jan 2020 17:56:27 +1100
Subject: [PATCH 0121/1056] csv-shuffle: removed flushing in binary on every
 record; from now on, if flush required, --flush has to be given on command
 line

---
 csv/applications/csv-shuffle.cpp | 12 +++---------
 1 file changed, 3 insertions(+), 9 deletions(-)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index aecceed64..dbd2b1331 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -156,7 +156,7 @@ int main( int ac, char** av )
                 {
                     std::cout.write( &buf[ elements[k].offset ], elements[k].size );
                 }
-                std::cout.flush(); // todo: flushing too often?
+                if( csv.flush ) { std::cout.flush(); }
             }
         }
         else
@@ -192,13 +192,7 @@ int main( int ac, char** av )
         }
         return 0;
     }
-    catch( std::exception& ex )
-    {
-        std::cerr << "csv-shuffle: " << ex.what() << std::endl;
-    }
-    catch( ... )
-    {
-        std::cerr << "csv-shuffle: unknown exception" << std::endl;
-    }
+    catch( std::exception& ex ) { std::cerr << "csv-shuffle: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-shuffle: unknown exception" << std::endl; }
     return 1;
 }

From 7d58f161ffeb06c6f0929fa23fc39e02284e2453 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Mon, 3 Feb 2020 10:11:49 +1100
Subject: [PATCH 0122/1056] csv-split: --files: example added

---
 csv/applications/csv-split.cpp | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index c9df78092..0372668ff 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -148,7 +148,9 @@ int main( int argc, char** argv )
             std::cerr << "                local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket" << std::endl;
             std::cerr << "                <named pipe name>: named pipe, which will be re-opened, if client reconnects" << std::endl;
             std::cerr << "                <filename>: a regular file" << std::endl;
-            std::cerr << "        example: ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) | csv-split --fields id \"0,1;tcp:5999\" \"...;local:/tmp/named_fifo\"" << std::endl;
+            std::cerr << "        examples" << std::endl;
+            std::cerr << "            ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) | csv-split --fields id \"0,1;tcp:5999\" \"...;local:/tmp/named_fifo\"" << std::endl;
+            std::cerr << "            ( echo 0,a; echo 1,b ) | csv-split --fields id --files <( echo '1,one.csv'; echo '0,zero.csv' )';fields=id,filename'" << std::endl;
             std::cerr << std::endl;
             std::cerr << description << std::endl;
             std::cerr << std::endl;

From 2395f31ab9c1a18f752e1fa0e1907ffcd02b5ee4 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 4 Feb 2020 18:29:52 +1100
Subject: [PATCH 0123/1056] csv-shuffle: tried to improve performance, but
 commented it out, since it did not work

---
 csv/applications/csv-shuffle.cpp | 52 ++++++++++++++++++++++++++++++++
 1 file changed, 52 insertions(+)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index dbd2b1331..5b159a262 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -125,6 +125,58 @@ int main( int ac, char** av )
             if( !fields[i].input_index ) { std::cerr << "csv-shuffle: \"" << fields[i].name << "\" not found in input fields " << csv.fields << std::endl; return 1; }
         }
         if( csv.binary() )
+//         {
+//             #ifdef WIN32
+//             _setmode( _fileno( stdin ), _O_BINARY );
+//             _setmode( _fileno( stdout ), _O_BINARY );
+//             #endif
+//             std::vector< char > in( csv.format().size() );
+//             std::vector< comma::csv::format::element > elements;
+//             elements.reserve( csv.format().count() ); // quick and dirty, can be really wasteful on large things like images
+//             for( unsigned int i = 0; i < elements.capacity(); ++i )
+//             {
+//                 elements.push_back( csv.format().offset( i ) );
+//             }
+//             unsigned int previous_index = 0;
+//             unsigned int output_size = 0;
+//             for( unsigned int i = 0; i < fields.size(); ++i ) // quick and dirty
+//             {
+//                 for( unsigned int k = previous_index; k < fields[i].index && k < elements.size(); ++k ) { output_size += elements[k].size; }
+//                 output_size += fields[i].size;
+//                 previous_index = fields[i].index + 1;
+//             }
+//             for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k ) { output_size += elements[k].size; }
+//             std::vector< char > out( output_size );
+//             while( std::cin.good() && !std::cin.eof() )
+//             {
+//                 // todo: quick and dirty; if performance is an issue, you could read more than
+//                 // one record every time see comma::csv::binary_input_stream::read() for reference
+//                 std::cin.read( &in[0], csv.format().size() );
+//                 if( std::cin.gcount() == 0 ) { continue; }
+//                 if( std::cin.gcount() < int( csv.format().size() ) ) { std::cerr << "csv-shuffle: expected " << csv.format().size() << " bytes, got only " << std::cin.gcount() << std::endl; return 1; }
+//                 unsigned int offset = 0;
+//                 unsigned int previous_index = 0;
+//                 for( unsigned int i = 0; i < fields.size(); ++i ) // quick and dirty
+//                 {
+//                     for( unsigned int k = previous_index; k < fields[i].index && k < elements.size(); ++k )
+//                     {
+//                         std::memcpy( &out[offset], &in[ elements[k].offset ], elements[k].size ); // std::cout.write( &in[ elements[k].offset ], elements[k].size );
+//                         offset += elements[k].size;
+//                     }
+//                     std::memcpy( &out[offset], &in[ fields[i].input_offset ], fields[i].size ); // std::cout.write( &in[ fields[i].input_offset ], fields[i].size );
+//                     offset += fields[i].size;
+//                     previous_index = fields[i].index + 1;
+//                 }
+//                 //std::cerr << "--> previous_index: " << previous_index << " elements.size(): " << elements.size() << std::endl;
+//                 for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k )
+//                 {
+//                     std::memcpy( &out[offset], &in[ elements[k].offset ], elements[k].size ); // std::cout.write( &in[ elements[k].offset ], elements[k].size );
+//                     offset += elements[k].size;
+//                 }
+//                 std::cout.write( &out[0], out.size() );
+//                 if( csv.flush ) { std::cout.flush(); }
+//             }
+//         }
         {
             #ifdef WIN32
             _setmode( _fileno( stdin ), _O_BINARY );

From 34836b00e239a99f6d7d585a1d335236fc964f21 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 4 Feb 2020 18:47:50 +1100
Subject: [PATCH 0124/1056] csv-shuffle: output: flushing fixed, performance
 improved

---
 csv/applications/csv-shuffle.cpp | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 5b159a262..7e8f03368 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -147,6 +147,7 @@ int main( int ac, char** av )
 //             }
 //             for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k ) { output_size += elements[k].size; }
 //             std::vector< char > out( output_size );
+//             if( !csv.flush ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
 //             while( std::cin.good() && !std::cin.eof() )
 //             {
 //                 // todo: quick and dirty; if performance is an issue, you could read more than
@@ -186,6 +187,7 @@ int main( int ac, char** av )
             std::vector< comma::csv::format::element > elements;
             elements.reserve( csv.format().count() ); // quick and dirty, can be really wasteful on large things like images
             for( unsigned int i = 0; i < elements.capacity(); ++i ) { elements.push_back( csv.format().offset( i ) ); }
+            if( !csv.flush ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
             while( std::cin.good() && !std::cin.eof() )
             {
                 // todo: quick and dirty; if performance is an issue, you could read more than

From 6c591814f55e63ea0285dbce2a1f393ca4d3be9d Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 5 Feb 2020 18:29:28 +1100
Subject: [PATCH 0125/1056] csv-cast: --flush implemented; not flushing stdout
 by default now

---
 csv/applications/csv-cast.cpp | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-cast.cpp b/csv/applications/csv-cast.cpp
index a1b1a83ac..7370731bc 100644
--- a/csv/applications/csv-cast.cpp
+++ b/csv/applications/csv-cast.cpp
@@ -55,6 +55,7 @@ static void usage()
     std::cerr << std::endl;
     std::cerr << "    --binary,-b,--from: input binary format" << std::endl;
     std::cerr << "    --output-binary,--output,-o,--to: output binary format" << std::endl;
+    std::cerr << "    --flush: flush stdout after each record" << std::endl;
     std::cerr << "    --force: allow narrowing conversions" << std::endl;
     std::cerr << std::endl;
     std::cerr << comma::csv::format::usage() << std::endl;
@@ -262,15 +263,18 @@ int main( int ac, char** av )
         comma::csv::format iformat( options.value< std::string >( "--binary,-b,--from", av[1] ) );
         comma::csv::format oformat( options.value< std::string >( "--output-binary,--output,-o,--to", av[2] ) );
         check_conversions( iformat, oformat, options.exists( "--force" ) );
+        bool flush = options.exists( "--flush" );
         std::vector< char > in( iformat.size() );
         std::vector< char > out( oformat.size() );
+        if( !flush ) { std::cin.tie( NULL ); }
         while( std::cin.good() )
         {
             std::cin.read( &in[0], iformat.size() );
             if( std::cin.gcount() == 0 ) { break; }
             if( std::cin.gcount() < static_cast< int >( iformat.size() ) ) { COMMA_THROW( comma::exception, "expected " << iformat.size() << " bytes, got only " << std::cin.gcount() ); }
             cast( iformat, in, oformat, out );
-            std::cout.write( &out[0], oformat.size() ).flush();
+            std::cout.write( &out[0], oformat.size() );
+            if( flush ) { std::cout.flush(); }
         }
         return 0;
     }

From 1d16fd8c79f5de7e4f6e5d6af9060e693608dd69 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 5 Feb 2020 22:00:06 +1100
Subject: [PATCH 0126/1056] csv-shuffle, csv-calc, csv-to-bin: --flush: when
 absent, don't flush stdout on each input

---
 csv/applications/csv-calc.cpp    | 6 ++++--
 csv/applications/csv-shuffle.cpp | 4 ++--
 csv/applications/csv-to-bin.cpp  | 3 ++-
 3 files changed, 8 insertions(+), 5 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index eea012c5b..488802095 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -1181,7 +1181,7 @@ static void output( const comma::csv::options& csv, ResultsMap& results, boost::
         {
             if( has_id )  { std::cout.write( reinterpret_cast< const char* >( &it->first ), sizeof( comma::uint32 ) ); } // quick and dirty
             if( has_block ) { std::cout.write( reinterpret_cast< const char* >( &( *block ) ), sizeof( comma::uint32 ) ); } // quick and dirty
-            std::cout.flush();
+            if( csv.flush ) { std::cout.flush(); }
         }
         else
         {
@@ -1201,6 +1201,7 @@ static void append_and_output( const comma::csv::options& csv, Inputs& inputs, R
         if (!csv.binary()) { std::cout << csv.delimiter; }
         std::cout << results.find(inputs[i].first)->second;
         if (!csv.binary()) { std::cout << std::endl; }
+        if( csv.flush ) { std::cout.flush(); }
     }
     results.clear();
     inputs.clear();
@@ -1294,7 +1295,8 @@ int main( int ac, char** av )
             if (has_block && !append) { std::cout << csv.delimiter << "ui"; }
             std::cout << std::endl;
             return 0;
-        } 
+        }
+        if( !csv.flush && csv.binary() ) { std::cin.tie( NULL ); }
         while( std::cin.good() && !std::cin.eof() )
         {
             const Values* v = csv.binary() ? binary->read() : ascii->read();
diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 7e8f03368..f6d460289 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -147,7 +147,7 @@ int main( int ac, char** av )
 //             }
 //             for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k ) { output_size += elements[k].size; }
 //             std::vector< char > out( output_size );
-//             if( !csv.flush ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
+//             if( !csv.flush && csv.binary() ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
 //             while( std::cin.good() && !std::cin.eof() )
 //             {
 //                 // todo: quick and dirty; if performance is an issue, you could read more than
@@ -187,7 +187,7 @@ int main( int ac, char** av )
             std::vector< comma::csv::format::element > elements;
             elements.reserve( csv.format().count() ); // quick and dirty, can be really wasteful on large things like images
             for( unsigned int i = 0; i < elements.capacity(); ++i ) { elements.push_back( csv.format().offset( i ) ); }
-            if( !csv.flush ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
+            if( !csv.flush && csv.binary() ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
             while( std::cin.good() && !std::cin.eof() )
             {
                 // todo: quick and dirty; if performance is an issue, you could read more than
diff --git a/csv/applications/csv-to-bin.cpp b/csv/applications/csv-to-bin.cpp
index d3b029ca6..acf8ed667 100644
--- a/csv/applications/csv-to-bin.cpp
+++ b/csv/applications/csv-to-bin.cpp
@@ -76,7 +76,8 @@ int main( int ac, char** av )
         char delimiter = options.value( "--delimiter", ',' );
         bool flush = options.exists( "--flush" );
         comma::csv::format format( av[1] );
-        //{ ProfilerStart( "csv-to-bin.prof" );
+        if( !flush ) { std::cin.tie( NULL ); }
+        //{ ProfilerStart( "csvg-to-bin.prof" );
         while( std::cin.good() && !std::cin.eof() )
         {
             std::getline( std::cin, line );

From 3058abd99dd0bf8d0b3639a8a9669dc9e6fff869 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 6 Feb 2020 12:28:28 +1100
Subject: [PATCH 0127/1056] csv-calc: (unsuccessfully) tried to improve
 performance on large number of ids; minor refactoring in the process

---
 csv/applications/csv-calc.cpp | 124 ++++++++++++++++++++--------------
 1 file changed, 72 insertions(+), 52 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 488802095..044eb4136 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -309,7 +309,7 @@ class ascii_input
             return values_.get();
         }
 
-        const std::string line() { return line_; }
+        const std::string& line() const { return line_; }
         
     private:
         comma::csv::options csv_;
@@ -334,10 +334,15 @@ class binary_input
         {
             while( true )
             {
+                //std::cin.read( &buffer_[0], csv_.format().size() );
+                //if( std::cin.gcount() == 0 ) { return NULL; }
+                //if( std::cin.gcount() != int( csv_.format().size() ) ) { COMMA_THROW( comma::exception, "expected " << csv_.format().size() << " bytes; got " << std::cin.gcount() ); }
+                //values_.set( &buffer_[0] );
+                //return &values_;
                 if( offset_ >= csv_.format().size() )
                 {
                     values_.set( cur_ );
-                    line_ = std::string(cur_, csv_.format().size());
+                    line_ = std::string( cur_, csv_.format().size() );
                     cur_ += csv_.format().size();
                     offset_ -= csv_.format().size();
                     if( cur_ == end_ ) { cur_ = &buffer_[0]; offset_ = 0; }
@@ -348,7 +353,8 @@ class binary_input
                 offset_ += count;
             }
         }
-        const std::string line() { return line_; }
+        
+        const std::string& line() const { return line_; }
 
     private:
         comma::csv::options csv_;
@@ -1035,13 +1041,13 @@ namespace Operations
     template <> struct traits< Enum::kurtosis > { template < typename T, comma::csv::format::types_enum F > struct FromEnum { typedef Kurtosis< T, F > Type; }; };
 } // namespace Operations
 
-class Operationbase
+class operation_base
 {
     public:
-        virtual ~Operationbase() {}
+        virtual ~operation_base() {}
         virtual void push( const char* buf ) = 0;
         virtual void calculate() = 0;
-        virtual Operationbase* clone() const = 0;
+        virtual operation_base* clone() const = 0;
         const comma::csv::format& output_format() const { return output_format_; }
         const char* buffer() const { return &buffer_[0]; }
 
@@ -1053,7 +1059,7 @@ class Operationbase
         std::vector< comma::csv::format::element > output_elements_;
         std::vector< char > buffer_;
 
-        Operationbase* deep_copy_to_( Operationbase* lhs ) const
+        operation_base* deep_copy_to_( operation_base* lhs ) const
         {
             lhs->input_format_ = input_format_;
             lhs->input_elements_ = input_elements_;
@@ -1066,7 +1072,7 @@ class Operationbase
 };
 
 template < Operations::Enum::Values E >
-struct Operation : public Operationbase
+struct Operation : public operation_base
 {
     Operation() {}
     Operation( const comma::csv::format& format
@@ -1132,18 +1138,18 @@ struct Operation : public Operationbase
         for( std::size_t i = 0; i < operations_.size(); ++i ) { operations_[i].calculate( &buffer_[0] + output_elements_[i].offset ); }
     }
 
-    Operationbase* clone() const { Operation< E >* op = new Operation< E >; return deep_copy_to_( op ); }
+    operation_base* clone() const { Operation< E >* op = new Operation< E >; return deep_copy_to_( op ); }
 };
 
-typedef boost::unordered_map< comma::uint32, boost::ptr_vector< Operationbase >* > OperationsMap;
-typedef boost::unordered_map< comma::uint32, std::string > ResultsMap;
+typedef boost::unordered_map< comma::uint32, boost::ptr_vector< operation_base >* > operations_map_t;
+typedef boost::unordered_map< comma::uint32, std::string > results_map_t;
 typedef std::vector< std::pair < comma::uint32, std::string > > Inputs;
 
-static void init_operations( boost::ptr_vector< Operationbase >& operations
+static void init_operations( boost::ptr_vector< operation_base >& operations
                            , const std::vector< Operations::operation_parameters >& operations_parameters
                            , const comma::csv::format& format )
 {
-    static boost::ptr_vector< Operationbase > sample;
+    static boost::ptr_vector< operation_base > sample;
     if( sample.empty() )
     {
         sample.reserve( operations_parameters.size() );
@@ -1169,14 +1175,15 @@ static void init_operations( boost::ptr_vector< Operationbase >& operations
         }
     }
     operations.clear();
-    for( std::size_t i = 0; i < sample.size(); ++i ) { operations.push_back( sample[i].clone() ); }
+    operations.reserve( sample.size() );
+    for( auto& s: sample ) { operations.push_back( s.clone() ); } // todo! this is really slow, if there are many ids
 }
 
-static void output( const comma::csv::options& csv, ResultsMap& results, boost::optional< comma::uint32 > block, bool has_block, bool has_id )
+static void output( const comma::csv::options& csv, results_map_t& results, boost::optional< comma::uint32 > block, bool has_block, bool has_id )
 {
-    for( ResultsMap::iterator it = results.begin(); it != results.end(); ++it )
+    for( results_map_t::iterator it = results.begin(); it != results.end(); ++it )
     {
-        std::cout << it->second;
+        std::cout.write( &it->second[0], it->second.size() );
         if( csv.binary() )
         {
             if( has_id )  { std::cout.write( reinterpret_cast< const char* >( &it->first ), sizeof( comma::uint32 ) ); } // quick and dirty
@@ -1193,34 +1200,48 @@ static void output( const comma::csv::options& csv, ResultsMap& results, boost::
     results.clear();
 }
 
-static void append_and_output( const comma::csv::options& csv, Inputs& inputs, ResultsMap& results )
-{    
+static void append_and_output( const comma::csv::options& csv, Inputs& inputs, results_map_t& results )
+{
     for ( size_t i = 0; i < inputs.size(); ++i )
     {
         std::cout << inputs[i].second;
-        if (!csv.binary()) { std::cout << csv.delimiter; }
-        std::cout << results.find(inputs[i].first)->second;
-        if (!csv.binary()) { std::cout << std::endl; }
+        if( !csv.binary() ) { std::cout << csv.delimiter; }
+        const auto& r = results.find( inputs[i].first )->second;
+        std::cout.write( &r[0], r.size() );
+        if( !csv.binary() ) { std::cout << std::endl; }
         if( csv.flush ) { std::cout.flush(); }
     }
     results.clear();
     inputs.clear();
 }
 
-static void calculate( const comma::csv::options& csv, OperationsMap& operations, ResultsMap& results )
+static void calculate( const comma::csv::options& csv, operations_map_t& operations, results_map_t& results )
 {
-    for( OperationsMap::iterator it = operations.begin(); it != operations.end(); ++it )
+    for( operations_map_t::iterator it = operations.begin(); it != operations.end(); ++it )
     {
         std::string r;
+        if( csv.binary() )
+        {
+            unsigned int size = 0;
+            for( std::size_t i = 0; i < it->second->size(); ++i ) { size += ( *it->second )[i].output_format().size(); }
+            r.reserve( size );
+        }
         for( std::size_t i = 0; i < it->second->size(); ++i )
         {
             ( *it->second )[i].calculate();
-            if( csv.binary() ) { r.append( ( *it->second )[i].buffer(), ( *it->second )[i].output_format().size() ); }
-            else { if( i > 0 ) { r += csv.delimiter; } r.append(( *it->second )[i].output_format().bin_to_csv( ( *it->second )[i].buffer(), csv.delimiter, csv.precision )); }
+            if( csv.binary() )
+            { 
+                r.append( ( *it->second )[i].buffer(), ( *it->second )[i].output_format().size() );
+            }
+            else
+            {
+                if( i > 0 ) { r += csv.delimiter; }
+                r.append( ( *it->second )[i].output_format().bin_to_csv( ( *it->second )[i].buffer(), csv.delimiter, csv.precision ) );
+            }
         }
-        results[it->first] = r;
+        results[ it->first ] = r;
     }
-    for( OperationsMap::iterator it = operations.begin(); it != operations.end(); ++it ) { delete it->second; } // quick and dirty
+    for( operations_map_t::iterator it = operations.begin(); it != operations.end(); ++it ) { delete it->second; } // quick and dirty
     operations.clear();
 }
 
@@ -1230,13 +1251,14 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
-        std::vector< std::string > unnamed = options.unnamed( "", "--binary,-b,--delimiter,-d,--format,--fields,-f,--output-fields" );
+        std::vector< std::string > unnamed = options.unnamed( "--append,--flush,--output-fields,--output-format", "--binary,-b,--delimiter,-d,--format,--fields,-f,--output-fields" );
         comma::csv::options csv( options );
         csv.full_xpath = false;
         std::cout.precision( csv.precision );
         #ifdef WIN32
         if( csv.binary() ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
+        if( !csv.flush && csv.binary() ) { std::cin.tie( NULL ); std::ios_base::sync_with_stdio( false ); } // todo? quick and dirty, redesign binary_input instead?
         if( unnamed.empty() ) { std::cerr << comma::verbose.app_name() << ": please specify operations" << std::endl; exit( 1 ); }
         std::vector< std::string > v = comma::split( unnamed[0], ',' );
         std::vector< Operations::operation_parameters > operations_parameters( v.size() );
@@ -1253,14 +1275,13 @@ int main( int ac, char** av )
         boost::scoped_ptr< binary_input > binary;
         if( csv.binary() ) { binary.reset( new binary_input( csv ) ); }
         else { ascii.reset( new ascii_input( csv, format ) ); }
-        OperationsMap operations;
-        ResultsMap results;
+        operations_map_t operations;
+        results_map_t results;
         Inputs inputs;
         boost::optional< comma::uint32 > block = boost::make_optional< comma::uint32 >( false, 0 );
         bool has_block = csv.has_field( "block" );
         bool has_id = csv.has_field( "id" );
-        bool append = options.exists("--append");
-        
+        bool append = options.exists( "--append" );
         if( options.exists( "--output-fields" ) )
         {
             std::vector < std::string > fields = comma::split(csv.fields, ',');
@@ -1270,33 +1291,32 @@ int main( int ac, char** av )
                 std::replace(v[op].begin(), v[op].end(), '=', '_');
                 std::replace(v[op].begin(), v[op].end(), '.', '_');
                 std::replace(v[op].begin(), v[op].end(), ':', '_');
-                for (std::size_t f = 0; f < fields.size(); f++ )
+                for( std::size_t f = 0; f < fields.size(); f++ )
                 {
-                    if (fields[f] == "" || fields[f] == "id" || fields[f] == "block") { continue; }
-                    output_fields.push_back(fields[f] + "/" + v[op]);
+                    if( fields[f] == "" || fields[f] == "id" || fields[f] == "block" ) { continue; }
+                    output_fields.push_back( fields[f] + "/" + v[op] );
                 }
             }
-            if (has_id && !append) { output_fields.push_back("id"); }
-            if (has_block && !append ) { output_fields.push_back("block"); }
-            std::cout << comma::join(output_fields, ',') << std::endl;
+            if( has_id && !append ) { output_fields.push_back( "id" ); }
+            if( has_block && !append ) { output_fields.push_back( "block" ); }
+            std::cout << comma::join( output_fields, ',' ) << std::endl;
             return 0;
         }
-        if (options.exists("--output-format"))
+        if( options.exists( "--output-format" ) )
         {
             if ( !format ) { std::cerr << comma::verbose.app_name() << ": option --output-format requires input format to be specified, please use --format or --binary" << std::endl; return 1; }
-            boost::ptr_vector< Operationbase > ops;
-            init_operations(ops, operations_parameters, Values(csv, *format).format());
+            boost::ptr_vector< operation_base > ops;
+            init_operations( ops, operations_parameters, Values(csv, *format).format() );
             for ( std::size_t i = 0; i < ops.size(); ++i ) 
             { 
                 if ( i > 0 ) { std::cout << csv.delimiter; }
                 std::cout << ops[i].output_format().string();
             }
-            if (has_id && !append) { std::cout << csv.delimiter << "ui"; }
-            if (has_block && !append) { std::cout << csv.delimiter << "ui"; }
+            if( has_id && !append ) { std::cout << csv.delimiter << "ui"; }
+            if( has_block && !append ) { std::cout << csv.delimiter << "ui"; }
             std::cout << std::endl;
             return 0;
         }
-        if( !csv.flush && csv.binary() ) { std::cin.tie( NULL ); }
         while( std::cin.good() && !std::cin.eof() )
         {
             const Values* v = csv.binary() ? binary->read() : ascii->read();
@@ -1305,23 +1325,23 @@ int main( int ac, char** av )
             {
                 if( block && *block != v->block() ) 
                 { 
-                    calculate(csv, operations, results);
-                    if ( append ) { append_and_output(csv, inputs, results); inputs.clear(); }
+                    calculate( csv, operations, results );
+                    if ( append ) { append_and_output( csv, inputs, results ); inputs.clear(); }
                     else { output( csv, results, block, has_block, has_id ); }
                 }
                 block = v->block();
             }
-            OperationsMap::iterator it = operations.find( v->id() );
+            operations_map_t::iterator it = operations.find( v->id() );
             if( it == operations.end() )
             {
-                it = operations.insert( std::make_pair( v->id(), new boost::ptr_vector< Operationbase > ) ).first;
+                it = operations.insert( std::make_pair( v->id(), new boost::ptr_vector< operation_base > ) ).first;
                 init_operations( *it->second, operations_parameters, v->format() );
             }
-            if (append) { inputs.push_back( std::make_pair( v->id(), csv.binary() ? binary->line() : ascii->line() ) ); }
+            if( append ) { inputs.push_back( std::make_pair( v->id(), csv.binary() ? binary->line() : ascii->line() ) ); }
             for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i].push( v->buffer() ); }
         }
-        calculate(csv, operations, results);
-        if ( append ) { append_and_output(csv, inputs, results); }
+        calculate( csv, operations, results );
+        if ( append ) { append_and_output( csv, inputs, results ); }
         else { output( csv, results, block, has_block, has_id ); }
         return 0;
     }

From c84e16aeebb73498fba4332b1574d7b43ecfd71c Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 7 Feb 2020 12:25:32 +1100
Subject: [PATCH 0128/1056] csv-calc: trying to speed up for high number of ids
 vs polymorphic operations; performance improved by some 60%, but still is very
 slow

---
 csv/applications/csv-calc.cpp | 165 ++++++++++++++++++++++------------
 1 file changed, 106 insertions(+), 59 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 044eb4136..a145ef85a 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #ifdef WIN32
@@ -437,6 +436,7 @@ namespace Operations
     struct base
     {
         virtual ~base() {}
+        virtual void reset() = 0;
         virtual void push( const char* ) = 0;
         virtual void calculate( char* ) = 0;
         virtual base* clone() const = 0;
@@ -451,6 +451,7 @@ namespace Operations
     class Min : public base
     {
         public:
+            void reset() { min_ = boost::optional< T >(); }
             void push( const char* buf )
             {
                 const T& t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -469,6 +470,7 @@ namespace Operations
     class Max : public base
     {
         public:
+            void reset() { max_ = boost::optional< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -487,6 +489,7 @@ namespace Operations
     class Sum : public base
     {
         public:
+            void reset() { sum_ = boost::optional< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -501,6 +504,7 @@ namespace Operations
     template < comma::csv::format::types_enum F >
     class Sum< boost::posix_time::ptime, F > : public base
     {
+        void reset() { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         void push( const char* ) { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         void calculate( char* ) { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         base* clone() const { COMMA_THROW( comma::exception, "sum not defined for time" ); }
@@ -510,6 +514,7 @@ namespace Operations
     class Centre : public base
     {
         public:
+            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< T, F >::to_bin( *min_.min_ + ( *max_.max_ - *min_.min_ ) / 2, buf ); } }
             base* clone() const { return new Centre< T, F >( *this ); }
@@ -525,6 +530,7 @@ namespace Operations
     class Mode : public base
     {
         public:
+            void reset() { value_count_ = impl::value_count< T >(); }
             void push( const char* buf ) { value_count_.update( comma::csv::format::traits< T, F >::from_bin( buf ) ); }
             void calculate( char* buf ) { if( !value_count_.map().empty() ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( value_count_.mode().first ), buf ); } }
             base* clone() const { return new Mode< T, F >( *this ); }
@@ -537,6 +543,7 @@ namespace Operations
     {
         public:
             Mean() : count_( 0 ) {}
+            void reset() { mean_ = boost::none; count_ = 0; }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -641,6 +648,8 @@ namespace Operations
             }
 
             base* clone() const { return new Percentile< T, F >( *this ); }
+            
+            void reset() { values_.clear(); percentile_ = 0; }
 
         private:
             std::multiset< T > values_;
@@ -651,6 +660,7 @@ namespace Operations
     template < comma::csv::format::types_enum F >
     class Percentile< boost::posix_time::ptime, F > : public base
     {
+        void reset() { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         void push( const char* ) { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         void calculate( char* ) { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         base* clone() const { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
@@ -728,6 +738,8 @@ namespace Operations
             
             typename result_traits< T >::type mean() const { return previous_.mean(); }
             
+            void reset() { previous_.reset(); value_ = 0; count_ = 0; }
+            
         private:
             Moment< T, M - 1 > previous_;
             typename result_traits< T >::type value_;
@@ -739,6 +751,7 @@ namespace Operations
     {
         public:
             Moment() : value_( 0 ), count_( 0 ) {}
+            
             void update ( const T t )
             {   
                 ++count_;
@@ -747,6 +760,8 @@ namespace Operations
             
             typename result_traits< T >::type mean() const { return value_; }
             
+            void reset() { value_ = 0; count_ = 0; }
+            
         private:
             typename result_traits< T >::type value_;
             std::size_t count_;
@@ -768,6 +783,7 @@ namespace Operations
             void update( const T t ) { moments_.update(t); }
             void calculate( char* buf ) { if( moments_.count() > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( std::sqrt( static_cast< long double >( moments_.value() / ( sample_ ? moments_.count() - 1 : moments_.count() )  ) ) ), buf ); } }
             base* clone() const { return new Stddev< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
             boost::optional<T> first_;
@@ -788,6 +804,7 @@ namespace Operations
             }
             void calculate( char* buf ) { stddev_.calculate(buf); }
             base* clone() const { return new Stddev< boost::posix_time::ptime, F >( *this ); }
+            void reset() { stddev_.reset(); first_ = boost::none; }
         private:
             Stddev< double, F > stddev_;
             boost::optional<boost::posix_time::ptime> first_;
@@ -809,6 +826,7 @@ namespace Operations
             void update( const T t ) { moments_.update(t); }
             void calculate( char* buf ) { if( moments_.count() > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( moments_.value() / ( sample_ ? moments_.count() - 1 : moments_.count() ) ), buf ); } }
             base* clone() const { return new Variance< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
             boost::optional<T> first_;
@@ -829,9 +847,10 @@ namespace Operations
             }
             void calculate( char* buf ) { variance_.calculate(buf); }
             base* clone() const { return new Variance< boost::posix_time::ptime, F >( *this ); }
+            void reset() { variance_.reset(); first_ = boost::none; }
         private:
-            Variance< double, F> variance_;
-            boost::optional<boost::posix_time::ptime> first_;
+            Variance< double, F > variance_;
+            boost::optional< boost::posix_time::ptime > first_;
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -852,7 +871,6 @@ namespace Operations
                 if( moments_.count() > 0 ) 
                 { 
                     typename result_traits< T >::type n = moments_.count();
-                    
                     // corrected sample skew requires at least 3 samples
                     typename result_traits< T >::type correction = sample_ ? sqrt( n * ( n - 1 ) ) / ( n - 2 ) : 1 ;
                     typename result_traits< T >::type m2 = moments_.previous().value();
@@ -861,9 +879,10 @@ namespace Operations
                 } 
             }
             base* clone() const { return new Skew< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 3 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_;
             bool sample_;
     };
 
@@ -881,9 +900,10 @@ namespace Operations
             }
             void calculate( char* buf ) { skew_.calculate(buf); }
             base* clone() const { return new Skew< boost::posix_time::ptime, F >( *this ); }
+            void reset() { skew_.reset(); first_ = boost::none; }
         private:
-            Skew< double, F> skew_;
-            boost::optional<boost::posix_time::ptime> first_;
+            Skew< double, F > skew_;
+            boost::optional< boost::posix_time::ptime > first_;
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -895,8 +915,8 @@ namespace Operations
             { 
                 for (std::size_t i = 0; i < options.size(); i++) 
                 {
-                    if ( options[i] == "sample" ) { sample_ = true; }
-                    else if ( options[i] == "excess" ) { excess_ = true; }
+                    if( options[i] == "sample" ) { sample_ = true; }
+                    else if( options[i] == "excess" ) { excess_ = true; }
                 }
             }
             void push( const char* buf ) 
@@ -923,9 +943,10 @@ namespace Operations
                 } 
             }
             base* clone() const { return new Kurtosis< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 4 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_;
             bool sample_;
             bool excess_;
     };
@@ -944,9 +965,10 @@ namespace Operations
             }
             void calculate( char* buf ) { kurtosis_.calculate(buf); }
             base* clone() const { return new Kurtosis< boost::posix_time::ptime, F >( *this ); }
+            void reset() { kurtosis_.reset(); first_ = boost::none; }
         private:
-            Kurtosis< double, F> kurtosis_;
-            boost::optional<boost::posix_time::ptime> first_;
+            Kurtosis< double, F > kurtosis_;
+            boost::optional< boost::posix_time::ptime > first_;
     };
     
     template < typename T > struct Diff
@@ -968,6 +990,7 @@ namespace Operations
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< typename Diff< T >::Type >::to_bin( Diff< T >::subtract( *max_.max_, *min_.min_ ), buf ); } }
             base* clone() const { return new Diameter< T, F >( *this ); }
+            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
         private:
             Min< T, F > min_;
             Max< T, F > max_;
@@ -980,6 +1003,7 @@ namespace Operations
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< typename Diff< T >::Type >::to_bin( Diff< T >::subtract( *max_.max_, *min_.min_ ) / 2, buf ); } }
             base* clone() const { return new Radius< T, F >( *this ); }
+            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
         private:
             Min< T, F > min_;
             Max< T, F > max_;
@@ -993,6 +1017,7 @@ namespace Operations
             void push( const char* ) { ++count_; }
             void calculate( char* buf ) { comma::csv::format::traits< comma::uint32 >::to_bin( count_, buf ); }
             base* clone() const { return new Size< T, F >( *this ); }
+            void reset() { count_ = 0; }
         private:
             std::size_t count_;
     };
@@ -1048,6 +1073,7 @@ class operation_base
         virtual void push( const char* buf ) = 0;
         virtual void calculate() = 0;
         virtual operation_base* clone() const = 0;
+        virtual void reset() = 0;
         const comma::csv::format& output_format() const { return output_format_; }
         const char* buffer() const { return &buffer_[0]; }
 
@@ -1137,48 +1163,74 @@ struct Operation : public operation_base
     {
         for( std::size_t i = 0; i < operations_.size(); ++i ) { operations_[i].calculate( &buffer_[0] + output_elements_[i].offset ); }
     }
+    
+    void reset() { for( auto& o: operations_ ) { o.reset(); } }
 
     operation_base* clone() const { Operation< E >* op = new Operation< E >; return deep_copy_to_( op ); }
 };
 
-typedef boost::unordered_map< comma::uint32, boost::ptr_vector< operation_base >* > operations_map_t;
+typedef boost::unordered_map< comma::uint32, std::vector< operation_base* >* > operations_map_t;
 typedef boost::unordered_map< comma::uint32, std::string > results_map_t;
 typedef std::vector< std::pair < comma::uint32, std::string > > Inputs;
 
-static void init_operations( boost::ptr_vector< operation_base >& operations
-                           , const std::vector< Operations::operation_parameters >& operations_parameters
-                           , const comma::csv::format& format )
+class operations_battery_farm_t // all this pain is because operations polymorhism is too slow when there are a lot of ids
 {
-    static boost::ptr_vector< operation_base > sample;
-    if( sample.empty() )
-    {
-        sample.reserve( operations_parameters.size() );
-        for( std::size_t i = 0; i < operations_parameters.size(); ++i )
+    public:
+        typedef std::vector< operation_base* > operations_t;
+        
+        operations_battery_farm_t(): end_( 0 ) {}
+        
+        ~operations_battery_farm_t()
+        { 
+            for( auto& sample: operations_ ) { for( auto& s: sample ) { delete s; } } // quick and dirty; shame on me
+        }
+        
+        operations_t& make( const std::vector< Operations::operation_parameters >& operations_parameters, const comma::csv::format& format )
         {
-            switch( operations_parameters[i].type )
+            if( operations_.empty() )
             {
-                case Operations::Enum::min: sample.push_back( new Operation< Operations::Enum::min >( format ) ); break;
-                case Operations::Enum::max: sample.push_back( new Operation< Operations::Enum::max >( format ) ); break;
-                case Operations::Enum::centre: sample.push_back( new Operation< Operations::Enum::centre >( format ) ); break;
-                case Operations::Enum::mean: sample.push_back( new Operation< Operations::Enum::mean >( format ) ); break;
-                case Operations::Enum::mode: sample.push_back( new Operation< Operations::Enum::mode >( format ) ); break;
-                case Operations::Enum::percentile: sample.push_back( new Operation< Operations::Enum::percentile >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::radius: sample.push_back( new Operation< Operations::Enum::radius >( format ) ); break;
-                case Operations::Enum::diameter: sample.push_back( new Operation< Operations::Enum::diameter >( format ) ); break;
-                case Operations::Enum::variance: sample.push_back( new Operation< Operations::Enum::variance >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::stddev: sample.push_back( new Operation< Operations::Enum::stddev >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::skew: sample.push_back( new Operation< Operations::Enum::skew >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::kurtosis: sample.push_back( new Operation< Operations::Enum::kurtosis >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::sum: sample.push_back( new Operation< Operations::Enum::sum >( format ) ); break;
-                case Operations::Enum::size: sample.push_back( new Operation< Operations::Enum::size >( format ) ); break;
+                operations_.push_back( operations_t() );
+                operations_[0].reserve( operations_parameters.size() );
+                for( std::size_t i = 0; i < operations_parameters.size(); ++i )
+                {
+                    switch( operations_parameters[i].type )
+                    {
+                        case Operations::Enum::min: operations_[0].push_back( new Operation< Operations::Enum::min >( format ) ); break;
+                        case Operations::Enum::max: operations_[0].push_back( new Operation< Operations::Enum::max >( format ) ); break;
+                        case Operations::Enum::centre: operations_[0].push_back( new Operation< Operations::Enum::centre >( format ) ); break;
+                        case Operations::Enum::mean: operations_[0].push_back( new Operation< Operations::Enum::mean >( format ) ); break;
+                        case Operations::Enum::mode: operations_[0].push_back( new Operation< Operations::Enum::mode >( format ) ); break;
+                        case Operations::Enum::percentile: operations_[0].push_back( new Operation< Operations::Enum::percentile >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::radius: operations_[0].push_back( new Operation< Operations::Enum::radius >( format ) ); break;
+                        case Operations::Enum::diameter: operations_[0].push_back( new Operation< Operations::Enum::diameter >( format ) ); break;
+                        case Operations::Enum::variance: operations_[0].push_back( new Operation< Operations::Enum::variance >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::stddev: operations_[0].push_back( new Operation< Operations::Enum::stddev >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::skew: operations_[0].push_back( new Operation< Operations::Enum::skew >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::kurtosis: operations_[0].push_back( new Operation< Operations::Enum::kurtosis >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::sum: operations_[0].push_back( new Operation< Operations::Enum::sum >( format ) ); break;
+                        case Operations::Enum::size: operations_[0].push_back( new Operation< Operations::Enum::size >( format ) ); break;
+                    }
+                }
             }
+            if( end_ == operations_.size() )
+            {
+                operations_.push_back( operations_t() );
+                for( auto& s: operations_[0] ) { operations_.back().push_back( s->clone() ); }
+            }
+            for( auto& s: operations_[end_] ) { s->reset(); }
+            return operations_[ end_++ ];
         }
-    }
-    operations.clear();
-    operations.reserve( sample.size() );
-    for( auto& s: sample ) { operations.push_back( s.clone() ); } // todo! this is really slow, if there are many ids
-}
+        
+        void reset() { end_ = 0; }
+        
+    private:
+        typedef std::deque< operations_t > operations_t_;
+        operations_t_ operations_;
+        unsigned int end_;
+};
 
+static operations_battery_farm_t operations_battery_farm;
+        
 static void output( const comma::csv::options& csv, results_map_t& results, boost::optional< comma::uint32 > block, bool has_block, bool has_id )
 {
     for( results_map_t::iterator it = results.begin(); it != results.end(); ++it )
@@ -1223,26 +1275,26 @@ static void calculate( const comma::csv::options& csv, operations_map_t& operati
         if( csv.binary() )
         {
             unsigned int size = 0;
-            for( std::size_t i = 0; i < it->second->size(); ++i ) { size += ( *it->second )[i].output_format().size(); }
+            for( std::size_t i = 0; i < it->second->size(); ++i ) { size += ( *it->second )[i]->output_format().size(); }
             r.reserve( size );
         }
         for( std::size_t i = 0; i < it->second->size(); ++i )
         {
-            ( *it->second )[i].calculate();
+            ( *it->second )[i]->calculate();
             if( csv.binary() )
             { 
-                r.append( ( *it->second )[i].buffer(), ( *it->second )[i].output_format().size() );
+                r.append( ( *it->second )[i]->buffer(), ( *it->second )[i]->output_format().size() );
             }
             else
             {
                 if( i > 0 ) { r += csv.delimiter; }
-                r.append( ( *it->second )[i].output_format().bin_to_csv( ( *it->second )[i].buffer(), csv.delimiter, csv.precision ) );
+                r.append( ( *it->second )[i]->output_format().bin_to_csv( ( *it->second )[i]->buffer(), csv.delimiter, csv.precision ) );
             }
         }
         results[ it->first ] = r;
     }
-    for( operations_map_t::iterator it = operations.begin(); it != operations.end(); ++it ) { delete it->second; } // quick and dirty
     operations.clear();
+    operations_battery_farm.reset();
 }
 
 int main( int ac, char** av )
@@ -1305,15 +1357,11 @@ int main( int ac, char** av )
         if( options.exists( "--output-format" ) )
         {
             if ( !format ) { std::cerr << comma::verbose.app_name() << ": option --output-format requires input format to be specified, please use --format or --binary" << std::endl; return 1; }
-            boost::ptr_vector< operation_base > ops;
-            init_operations( ops, operations_parameters, Values(csv, *format).format() );
-            for ( std::size_t i = 0; i < ops.size(); ++i ) 
-            { 
-                if ( i > 0 ) { std::cout << csv.delimiter; }
-                std::cout << ops[i].output_format().string();
-            }
-            if( has_id && !append ) { std::cout << csv.delimiter << "ui"; }
-            if( has_block && !append ) { std::cout << csv.delimiter << "ui"; }
+            auto ops = operations_battery_farm.make( operations_parameters, Values( csv, *format ).format() );
+            std::cout << ops[0]->output_format().string();
+            for( std::size_t i = 1; i < ops.size(); ++i ) { std::cout << ',' << ops[i]->output_format().string(); }
+            if( has_id && !append ) { std::cout << ",ui"; }
+            if( has_block && !append ) { std::cout << ",ui"; }
             std::cout << std::endl;
             return 0;
         }
@@ -1324,7 +1372,7 @@ int main( int ac, char** av )
             if( has_block )
             {
                 if( block && *block != v->block() ) 
-                { 
+                {
                     calculate( csv, operations, results );
                     if ( append ) { append_and_output( csv, inputs, results ); inputs.clear(); }
                     else { output( csv, results, block, has_block, has_id ); }
@@ -1334,11 +1382,10 @@ int main( int ac, char** av )
             operations_map_t::iterator it = operations.find( v->id() );
             if( it == operations.end() )
             {
-                it = operations.insert( std::make_pair( v->id(), new boost::ptr_vector< operation_base > ) ).first;
-                init_operations( *it->second, operations_parameters, v->format() );
+                it = operations.insert( std::make_pair( v->id(), &operations_battery_farm.make( operations_parameters, v->format() ) ) ).first;
             }
             if( append ) { inputs.push_back( std::make_pair( v->id(), csv.binary() ? binary->line() : ascii->line() ) ); }
-            for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i].push( v->buffer() ); }
+            for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i]->push( v->buffer() ); }
         }
         calculate( csv, operations, results );
         if ( append ) { append_and_output( csv, inputs, results ); }

From facc5d549c2b96891035548ce378384144122580 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 7 Feb 2020 12:41:08 +1100
Subject: [PATCH 0129/1056] csv-calc: reverted to previous version due to the
 bugs

---
 csv/applications/csv-calc.cpp | 165 ++++++++++++----------------------
 1 file changed, 59 insertions(+), 106 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index a145ef85a..044eb4136 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -27,6 +27,7 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+
 /// @author vsevolod vlaskine
 
 #ifdef WIN32
@@ -436,7 +437,6 @@ namespace Operations
     struct base
     {
         virtual ~base() {}
-        virtual void reset() = 0;
         virtual void push( const char* ) = 0;
         virtual void calculate( char* ) = 0;
         virtual base* clone() const = 0;
@@ -451,7 +451,6 @@ namespace Operations
     class Min : public base
     {
         public:
-            void reset() { min_ = boost::optional< T >(); }
             void push( const char* buf )
             {
                 const T& t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -470,7 +469,6 @@ namespace Operations
     class Max : public base
     {
         public:
-            void reset() { max_ = boost::optional< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -489,7 +487,6 @@ namespace Operations
     class Sum : public base
     {
         public:
-            void reset() { sum_ = boost::optional< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -504,7 +501,6 @@ namespace Operations
     template < comma::csv::format::types_enum F >
     class Sum< boost::posix_time::ptime, F > : public base
     {
-        void reset() { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         void push( const char* ) { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         void calculate( char* ) { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         base* clone() const { COMMA_THROW( comma::exception, "sum not defined for time" ); }
@@ -514,7 +510,6 @@ namespace Operations
     class Centre : public base
     {
         public:
-            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< T, F >::to_bin( *min_.min_ + ( *max_.max_ - *min_.min_ ) / 2, buf ); } }
             base* clone() const { return new Centre< T, F >( *this ); }
@@ -530,7 +525,6 @@ namespace Operations
     class Mode : public base
     {
         public:
-            void reset() { value_count_ = impl::value_count< T >(); }
             void push( const char* buf ) { value_count_.update( comma::csv::format::traits< T, F >::from_bin( buf ) ); }
             void calculate( char* buf ) { if( !value_count_.map().empty() ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( value_count_.mode().first ), buf ); } }
             base* clone() const { return new Mode< T, F >( *this ); }
@@ -543,7 +537,6 @@ namespace Operations
     {
         public:
             Mean() : count_( 0 ) {}
-            void reset() { mean_ = boost::none; count_ = 0; }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -648,8 +641,6 @@ namespace Operations
             }
 
             base* clone() const { return new Percentile< T, F >( *this ); }
-            
-            void reset() { values_.clear(); percentile_ = 0; }
 
         private:
             std::multiset< T > values_;
@@ -660,7 +651,6 @@ namespace Operations
     template < comma::csv::format::types_enum F >
     class Percentile< boost::posix_time::ptime, F > : public base
     {
-        void reset() { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         void push( const char* ) { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         void calculate( char* ) { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         base* clone() const { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
@@ -738,8 +728,6 @@ namespace Operations
             
             typename result_traits< T >::type mean() const { return previous_.mean(); }
             
-            void reset() { previous_.reset(); value_ = 0; count_ = 0; }
-            
         private:
             Moment< T, M - 1 > previous_;
             typename result_traits< T >::type value_;
@@ -751,7 +739,6 @@ namespace Operations
     {
         public:
             Moment() : value_( 0 ), count_( 0 ) {}
-            
             void update ( const T t )
             {   
                 ++count_;
@@ -760,8 +747,6 @@ namespace Operations
             
             typename result_traits< T >::type mean() const { return value_; }
             
-            void reset() { value_ = 0; count_ = 0; }
-            
         private:
             typename result_traits< T >::type value_;
             std::size_t count_;
@@ -783,7 +768,6 @@ namespace Operations
             void update( const T t ) { moments_.update(t); }
             void calculate( char* buf ) { if( moments_.count() > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( std::sqrt( static_cast< long double >( moments_.value() / ( sample_ ? moments_.count() - 1 : moments_.count() )  ) ) ), buf ); } }
             base* clone() const { return new Stddev< T, F >( *this ); }
-            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
             boost::optional<T> first_;
@@ -804,7 +788,6 @@ namespace Operations
             }
             void calculate( char* buf ) { stddev_.calculate(buf); }
             base* clone() const { return new Stddev< boost::posix_time::ptime, F >( *this ); }
-            void reset() { stddev_.reset(); first_ = boost::none; }
         private:
             Stddev< double, F > stddev_;
             boost::optional<boost::posix_time::ptime> first_;
@@ -826,7 +809,6 @@ namespace Operations
             void update( const T t ) { moments_.update(t); }
             void calculate( char* buf ) { if( moments_.count() > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( moments_.value() / ( sample_ ? moments_.count() - 1 : moments_.count() ) ), buf ); } }
             base* clone() const { return new Variance< T, F >( *this ); }
-            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
             boost::optional<T> first_;
@@ -847,10 +829,9 @@ namespace Operations
             }
             void calculate( char* buf ) { variance_.calculate(buf); }
             base* clone() const { return new Variance< boost::posix_time::ptime, F >( *this ); }
-            void reset() { variance_.reset(); first_ = boost::none; }
         private:
-            Variance< double, F > variance_;
-            boost::optional< boost::posix_time::ptime > first_;
+            Variance< double, F> variance_;
+            boost::optional<boost::posix_time::ptime> first_;
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -871,6 +852,7 @@ namespace Operations
                 if( moments_.count() > 0 ) 
                 { 
                     typename result_traits< T >::type n = moments_.count();
+                    
                     // corrected sample skew requires at least 3 samples
                     typename result_traits< T >::type correction = sample_ ? sqrt( n * ( n - 1 ) ) / ( n - 2 ) : 1 ;
                     typename result_traits< T >::type m2 = moments_.previous().value();
@@ -879,10 +861,9 @@ namespace Operations
                 } 
             }
             base* clone() const { return new Skew< T, F >( *this ); }
-            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 3 > moments_;
-            boost::optional< T > first_;
+            boost::optional<T> first_;
             bool sample_;
     };
 
@@ -900,10 +881,9 @@ namespace Operations
             }
             void calculate( char* buf ) { skew_.calculate(buf); }
             base* clone() const { return new Skew< boost::posix_time::ptime, F >( *this ); }
-            void reset() { skew_.reset(); first_ = boost::none; }
         private:
-            Skew< double, F > skew_;
-            boost::optional< boost::posix_time::ptime > first_;
+            Skew< double, F> skew_;
+            boost::optional<boost::posix_time::ptime> first_;
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -915,8 +895,8 @@ namespace Operations
             { 
                 for (std::size_t i = 0; i < options.size(); i++) 
                 {
-                    if( options[i] == "sample" ) { sample_ = true; }
-                    else if( options[i] == "excess" ) { excess_ = true; }
+                    if ( options[i] == "sample" ) { sample_ = true; }
+                    else if ( options[i] == "excess" ) { excess_ = true; }
                 }
             }
             void push( const char* buf ) 
@@ -943,10 +923,9 @@ namespace Operations
                 } 
             }
             base* clone() const { return new Kurtosis< T, F >( *this ); }
-            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 4 > moments_;
-            boost::optional< T > first_;
+            boost::optional<T> first_;
             bool sample_;
             bool excess_;
     };
@@ -965,10 +944,9 @@ namespace Operations
             }
             void calculate( char* buf ) { kurtosis_.calculate(buf); }
             base* clone() const { return new Kurtosis< boost::posix_time::ptime, F >( *this ); }
-            void reset() { kurtosis_.reset(); first_ = boost::none; }
         private:
-            Kurtosis< double, F > kurtosis_;
-            boost::optional< boost::posix_time::ptime > first_;
+            Kurtosis< double, F> kurtosis_;
+            boost::optional<boost::posix_time::ptime> first_;
     };
     
     template < typename T > struct Diff
@@ -990,7 +968,6 @@ namespace Operations
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< typename Diff< T >::Type >::to_bin( Diff< T >::subtract( *max_.max_, *min_.min_ ), buf ); } }
             base* clone() const { return new Diameter< T, F >( *this ); }
-            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
         private:
             Min< T, F > min_;
             Max< T, F > max_;
@@ -1003,7 +980,6 @@ namespace Operations
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< typename Diff< T >::Type >::to_bin( Diff< T >::subtract( *max_.max_, *min_.min_ ) / 2, buf ); } }
             base* clone() const { return new Radius< T, F >( *this ); }
-            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
         private:
             Min< T, F > min_;
             Max< T, F > max_;
@@ -1017,7 +993,6 @@ namespace Operations
             void push( const char* ) { ++count_; }
             void calculate( char* buf ) { comma::csv::format::traits< comma::uint32 >::to_bin( count_, buf ); }
             base* clone() const { return new Size< T, F >( *this ); }
-            void reset() { count_ = 0; }
         private:
             std::size_t count_;
     };
@@ -1073,7 +1048,6 @@ class operation_base
         virtual void push( const char* buf ) = 0;
         virtual void calculate() = 0;
         virtual operation_base* clone() const = 0;
-        virtual void reset() = 0;
         const comma::csv::format& output_format() const { return output_format_; }
         const char* buffer() const { return &buffer_[0]; }
 
@@ -1163,74 +1137,48 @@ struct Operation : public operation_base
     {
         for( std::size_t i = 0; i < operations_.size(); ++i ) { operations_[i].calculate( &buffer_[0] + output_elements_[i].offset ); }
     }
-    
-    void reset() { for( auto& o: operations_ ) { o.reset(); } }
 
     operation_base* clone() const { Operation< E >* op = new Operation< E >; return deep_copy_to_( op ); }
 };
 
-typedef boost::unordered_map< comma::uint32, std::vector< operation_base* >* > operations_map_t;
+typedef boost::unordered_map< comma::uint32, boost::ptr_vector< operation_base >* > operations_map_t;
 typedef boost::unordered_map< comma::uint32, std::string > results_map_t;
 typedef std::vector< std::pair < comma::uint32, std::string > > Inputs;
 
-class operations_battery_farm_t // all this pain is because operations polymorhism is too slow when there are a lot of ids
+static void init_operations( boost::ptr_vector< operation_base >& operations
+                           , const std::vector< Operations::operation_parameters >& operations_parameters
+                           , const comma::csv::format& format )
 {
-    public:
-        typedef std::vector< operation_base* > operations_t;
-        
-        operations_battery_farm_t(): end_( 0 ) {}
-        
-        ~operations_battery_farm_t()
-        { 
-            for( auto& sample: operations_ ) { for( auto& s: sample ) { delete s; } } // quick and dirty; shame on me
-        }
-        
-        operations_t& make( const std::vector< Operations::operation_parameters >& operations_parameters, const comma::csv::format& format )
+    static boost::ptr_vector< operation_base > sample;
+    if( sample.empty() )
+    {
+        sample.reserve( operations_parameters.size() );
+        for( std::size_t i = 0; i < operations_parameters.size(); ++i )
         {
-            if( operations_.empty() )
+            switch( operations_parameters[i].type )
             {
-                operations_.push_back( operations_t() );
-                operations_[0].reserve( operations_parameters.size() );
-                for( std::size_t i = 0; i < operations_parameters.size(); ++i )
-                {
-                    switch( operations_parameters[i].type )
-                    {
-                        case Operations::Enum::min: operations_[0].push_back( new Operation< Operations::Enum::min >( format ) ); break;
-                        case Operations::Enum::max: operations_[0].push_back( new Operation< Operations::Enum::max >( format ) ); break;
-                        case Operations::Enum::centre: operations_[0].push_back( new Operation< Operations::Enum::centre >( format ) ); break;
-                        case Operations::Enum::mean: operations_[0].push_back( new Operation< Operations::Enum::mean >( format ) ); break;
-                        case Operations::Enum::mode: operations_[0].push_back( new Operation< Operations::Enum::mode >( format ) ); break;
-                        case Operations::Enum::percentile: operations_[0].push_back( new Operation< Operations::Enum::percentile >( format, operations_parameters[i].options ) ); break;
-                        case Operations::Enum::radius: operations_[0].push_back( new Operation< Operations::Enum::radius >( format ) ); break;
-                        case Operations::Enum::diameter: operations_[0].push_back( new Operation< Operations::Enum::diameter >( format ) ); break;
-                        case Operations::Enum::variance: operations_[0].push_back( new Operation< Operations::Enum::variance >( format, operations_parameters[i].options ) ); break;
-                        case Operations::Enum::stddev: operations_[0].push_back( new Operation< Operations::Enum::stddev >( format, operations_parameters[i].options ) ); break;
-                        case Operations::Enum::skew: operations_[0].push_back( new Operation< Operations::Enum::skew >( format, operations_parameters[i].options ) ); break;
-                        case Operations::Enum::kurtosis: operations_[0].push_back( new Operation< Operations::Enum::kurtosis >( format, operations_parameters[i].options ) ); break;
-                        case Operations::Enum::sum: operations_[0].push_back( new Operation< Operations::Enum::sum >( format ) ); break;
-                        case Operations::Enum::size: operations_[0].push_back( new Operation< Operations::Enum::size >( format ) ); break;
-                    }
-                }
+                case Operations::Enum::min: sample.push_back( new Operation< Operations::Enum::min >( format ) ); break;
+                case Operations::Enum::max: sample.push_back( new Operation< Operations::Enum::max >( format ) ); break;
+                case Operations::Enum::centre: sample.push_back( new Operation< Operations::Enum::centre >( format ) ); break;
+                case Operations::Enum::mean: sample.push_back( new Operation< Operations::Enum::mean >( format ) ); break;
+                case Operations::Enum::mode: sample.push_back( new Operation< Operations::Enum::mode >( format ) ); break;
+                case Operations::Enum::percentile: sample.push_back( new Operation< Operations::Enum::percentile >( format, operations_parameters[i].options ) ); break;
+                case Operations::Enum::radius: sample.push_back( new Operation< Operations::Enum::radius >( format ) ); break;
+                case Operations::Enum::diameter: sample.push_back( new Operation< Operations::Enum::diameter >( format ) ); break;
+                case Operations::Enum::variance: sample.push_back( new Operation< Operations::Enum::variance >( format, operations_parameters[i].options ) ); break;
+                case Operations::Enum::stddev: sample.push_back( new Operation< Operations::Enum::stddev >( format, operations_parameters[i].options ) ); break;
+                case Operations::Enum::skew: sample.push_back( new Operation< Operations::Enum::skew >( format, operations_parameters[i].options ) ); break;
+                case Operations::Enum::kurtosis: sample.push_back( new Operation< Operations::Enum::kurtosis >( format, operations_parameters[i].options ) ); break;
+                case Operations::Enum::sum: sample.push_back( new Operation< Operations::Enum::sum >( format ) ); break;
+                case Operations::Enum::size: sample.push_back( new Operation< Operations::Enum::size >( format ) ); break;
             }
-            if( end_ == operations_.size() )
-            {
-                operations_.push_back( operations_t() );
-                for( auto& s: operations_[0] ) { operations_.back().push_back( s->clone() ); }
-            }
-            for( auto& s: operations_[end_] ) { s->reset(); }
-            return operations_[ end_++ ];
         }
-        
-        void reset() { end_ = 0; }
-        
-    private:
-        typedef std::deque< operations_t > operations_t_;
-        operations_t_ operations_;
-        unsigned int end_;
-};
+    }
+    operations.clear();
+    operations.reserve( sample.size() );
+    for( auto& s: sample ) { operations.push_back( s.clone() ); } // todo! this is really slow, if there are many ids
+}
 
-static operations_battery_farm_t operations_battery_farm;
-        
 static void output( const comma::csv::options& csv, results_map_t& results, boost::optional< comma::uint32 > block, bool has_block, bool has_id )
 {
     for( results_map_t::iterator it = results.begin(); it != results.end(); ++it )
@@ -1275,26 +1223,26 @@ static void calculate( const comma::csv::options& csv, operations_map_t& operati
         if( csv.binary() )
         {
             unsigned int size = 0;
-            for( std::size_t i = 0; i < it->second->size(); ++i ) { size += ( *it->second )[i]->output_format().size(); }
+            for( std::size_t i = 0; i < it->second->size(); ++i ) { size += ( *it->second )[i].output_format().size(); }
             r.reserve( size );
         }
         for( std::size_t i = 0; i < it->second->size(); ++i )
         {
-            ( *it->second )[i]->calculate();
+            ( *it->second )[i].calculate();
             if( csv.binary() )
             { 
-                r.append( ( *it->second )[i]->buffer(), ( *it->second )[i]->output_format().size() );
+                r.append( ( *it->second )[i].buffer(), ( *it->second )[i].output_format().size() );
             }
             else
             {
                 if( i > 0 ) { r += csv.delimiter; }
-                r.append( ( *it->second )[i]->output_format().bin_to_csv( ( *it->second )[i]->buffer(), csv.delimiter, csv.precision ) );
+                r.append( ( *it->second )[i].output_format().bin_to_csv( ( *it->second )[i].buffer(), csv.delimiter, csv.precision ) );
             }
         }
         results[ it->first ] = r;
     }
+    for( operations_map_t::iterator it = operations.begin(); it != operations.end(); ++it ) { delete it->second; } // quick and dirty
     operations.clear();
-    operations_battery_farm.reset();
 }
 
 int main( int ac, char** av )
@@ -1357,11 +1305,15 @@ int main( int ac, char** av )
         if( options.exists( "--output-format" ) )
         {
             if ( !format ) { std::cerr << comma::verbose.app_name() << ": option --output-format requires input format to be specified, please use --format or --binary" << std::endl; return 1; }
-            auto ops = operations_battery_farm.make( operations_parameters, Values( csv, *format ).format() );
-            std::cout << ops[0]->output_format().string();
-            for( std::size_t i = 1; i < ops.size(); ++i ) { std::cout << ',' << ops[i]->output_format().string(); }
-            if( has_id && !append ) { std::cout << ",ui"; }
-            if( has_block && !append ) { std::cout << ",ui"; }
+            boost::ptr_vector< operation_base > ops;
+            init_operations( ops, operations_parameters, Values(csv, *format).format() );
+            for ( std::size_t i = 0; i < ops.size(); ++i ) 
+            { 
+                if ( i > 0 ) { std::cout << csv.delimiter; }
+                std::cout << ops[i].output_format().string();
+            }
+            if( has_id && !append ) { std::cout << csv.delimiter << "ui"; }
+            if( has_block && !append ) { std::cout << csv.delimiter << "ui"; }
             std::cout << std::endl;
             return 0;
         }
@@ -1372,7 +1324,7 @@ int main( int ac, char** av )
             if( has_block )
             {
                 if( block && *block != v->block() ) 
-                {
+                { 
                     calculate( csv, operations, results );
                     if ( append ) { append_and_output( csv, inputs, results ); inputs.clear(); }
                     else { output( csv, results, block, has_block, has_id ); }
@@ -1382,10 +1334,11 @@ int main( int ac, char** av )
             operations_map_t::iterator it = operations.find( v->id() );
             if( it == operations.end() )
             {
-                it = operations.insert( std::make_pair( v->id(), &operations_battery_farm.make( operations_parameters, v->format() ) ) ).first;
+                it = operations.insert( std::make_pair( v->id(), new boost::ptr_vector< operation_base > ) ).first;
+                init_operations( *it->second, operations_parameters, v->format() );
             }
             if( append ) { inputs.push_back( std::make_pair( v->id(), csv.binary() ? binary->line() : ascii->line() ) ); }
-            for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i]->push( v->buffer() ); }
+            for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i].push( v->buffer() ); }
         }
         calculate( csv, operations, results );
         if ( append ) { append_and_output( csv, inputs, results ); }

From 638e20b2f382ae3c3f5bd63d2fb37fab67fc766b Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 7 Feb 2020 13:11:38 +1100
Subject: [PATCH 0130/1056] csv-calc: performance on large number of ids
 somewhat improved...

---
 csv/applications/csv-calc.cpp | 171 +++++++++++++++++++++-------------
 1 file changed, 108 insertions(+), 63 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 044eb4136..18f2e94ce 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #ifdef WIN32
@@ -437,6 +436,7 @@ namespace Operations
     struct base
     {
         virtual ~base() {}
+        virtual void reset() = 0;
         virtual void push( const char* ) = 0;
         virtual void calculate( char* ) = 0;
         virtual base* clone() const = 0;
@@ -451,6 +451,7 @@ namespace Operations
     class Min : public base
     {
         public:
+            void reset() { min_ = boost::optional< T >(); }
             void push( const char* buf )
             {
                 const T& t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -469,6 +470,7 @@ namespace Operations
     class Max : public base
     {
         public:
+            void reset() { max_ = boost::optional< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -487,6 +489,7 @@ namespace Operations
     class Sum : public base
     {
         public:
+            void reset() { sum_ = boost::optional< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -501,6 +504,7 @@ namespace Operations
     template < comma::csv::format::types_enum F >
     class Sum< boost::posix_time::ptime, F > : public base
     {
+        void reset() { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         void push( const char* ) { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         void calculate( char* ) { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         base* clone() const { COMMA_THROW( comma::exception, "sum not defined for time" ); }
@@ -510,6 +514,7 @@ namespace Operations
     class Centre : public base
     {
         public:
+            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< T, F >::to_bin( *min_.min_ + ( *max_.max_ - *min_.min_ ) / 2, buf ); } }
             base* clone() const { return new Centre< T, F >( *this ); }
@@ -525,6 +530,7 @@ namespace Operations
     class Mode : public base
     {
         public:
+            void reset() { value_count_ = impl::value_count< T >(); }
             void push( const char* buf ) { value_count_.update( comma::csv::format::traits< T, F >::from_bin( buf ) ); }
             void calculate( char* buf ) { if( !value_count_.map().empty() ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( value_count_.mode().first ), buf ); } }
             base* clone() const { return new Mode< T, F >( *this ); }
@@ -537,6 +543,7 @@ namespace Operations
     {
         public:
             Mean() : count_( 0 ) {}
+            void reset() { mean_ = boost::none; count_ = 0; }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -615,8 +622,7 @@ namespace Operations
                             comma::verbose << "NIST linear interpolation method" << std::endl;
                             comma::verbose << "see http://www.itl.nist.gov/div898/handbook/prc/section2/prc262.htm" << std::endl;
                             double x = percentile_ * ( count + 1 );
-                            comma::verbose << "p = " << percentile_ << "; N = " << count
-                                           << "; p(N + 1) = " << x;
+                            comma::verbose << "p = " << percentile_ << "; N = " << count << "; p(N + 1) = " << x;
                             if( x <= 1.0 ) {
                                 comma::verbose << "; below 1 - choosing smallest value" << std::endl;
                                 value = *it;
@@ -631,8 +637,7 @@ namespace Operations
                                 double v1 = *it;
                                 double v2 = *++it;
                                 value = v1 + ( v2 - v1 ) * remainder;
-                                comma::verbose << "v1 = " << v1 << "; v2 = " << v2
-                                               << "; result = " << value << std::endl;
+                                comma::verbose << "v1 = " << v1 << "; v2 = " << v2 << "; result = " << value << std::endl;
                             }
                             break;
                     }
@@ -641,6 +646,8 @@ namespace Operations
             }
 
             base* clone() const { return new Percentile< T, F >( *this ); }
+            
+            void reset() { values_.clear(); }
 
         private:
             std::multiset< T > values_;
@@ -651,6 +658,7 @@ namespace Operations
     template < comma::csv::format::types_enum F >
     class Percentile< boost::posix_time::ptime, F > : public base
     {
+        void reset() { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         void push( const char* ) { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         void calculate( char* ) { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         base* clone() const { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
@@ -728,6 +736,8 @@ namespace Operations
             
             typename result_traits< T >::type mean() const { return previous_.mean(); }
             
+            void reset() { previous_.reset(); value_ = 0; count_ = 0; }
+            
         private:
             Moment< T, M - 1 > previous_;
             typename result_traits< T >::type value_;
@@ -739,6 +749,7 @@ namespace Operations
     {
         public:
             Moment() : value_( 0 ), count_( 0 ) {}
+            
             void update ( const T t )
             {   
                 ++count_;
@@ -747,6 +758,8 @@ namespace Operations
             
             typename result_traits< T >::type mean() const { return value_; }
             
+            void reset() { value_ = 0; count_ = 0; }
+            
         private:
             typename result_traits< T >::type value_;
             std::size_t count_;
@@ -768,6 +781,7 @@ namespace Operations
             void update( const T t ) { moments_.update(t); }
             void calculate( char* buf ) { if( moments_.count() > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( std::sqrt( static_cast< long double >( moments_.value() / ( sample_ ? moments_.count() - 1 : moments_.count() )  ) ) ), buf ); } }
             base* clone() const { return new Stddev< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
             boost::optional<T> first_;
@@ -788,6 +802,7 @@ namespace Operations
             }
             void calculate( char* buf ) { stddev_.calculate(buf); }
             base* clone() const { return new Stddev< boost::posix_time::ptime, F >( *this ); }
+            void reset() { stddev_.reset(); first_ = boost::none; }
         private:
             Stddev< double, F > stddev_;
             boost::optional<boost::posix_time::ptime> first_;
@@ -809,6 +824,7 @@ namespace Operations
             void update( const T t ) { moments_.update(t); }
             void calculate( char* buf ) { if( moments_.count() > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( moments_.value() / ( sample_ ? moments_.count() - 1 : moments_.count() ) ), buf ); } }
             base* clone() const { return new Variance< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
             boost::optional<T> first_;
@@ -829,9 +845,10 @@ namespace Operations
             }
             void calculate( char* buf ) { variance_.calculate(buf); }
             base* clone() const { return new Variance< boost::posix_time::ptime, F >( *this ); }
+            void reset() { variance_.reset(); first_ = boost::none; }
         private:
-            Variance< double, F> variance_;
-            boost::optional<boost::posix_time::ptime> first_;
+            Variance< double, F > variance_;
+            boost::optional< boost::posix_time::ptime > first_;
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -852,7 +869,6 @@ namespace Operations
                 if( moments_.count() > 0 ) 
                 { 
                     typename result_traits< T >::type n = moments_.count();
-                    
                     // corrected sample skew requires at least 3 samples
                     typename result_traits< T >::type correction = sample_ ? sqrt( n * ( n - 1 ) ) / ( n - 2 ) : 1 ;
                     typename result_traits< T >::type m2 = moments_.previous().value();
@@ -861,9 +877,10 @@ namespace Operations
                 } 
             }
             base* clone() const { return new Skew< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 3 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_;
             bool sample_;
     };
 
@@ -881,9 +898,10 @@ namespace Operations
             }
             void calculate( char* buf ) { skew_.calculate(buf); }
             base* clone() const { return new Skew< boost::posix_time::ptime, F >( *this ); }
+            void reset() { skew_.reset(); first_ = boost::none; }
         private:
-            Skew< double, F> skew_;
-            boost::optional<boost::posix_time::ptime> first_;
+            Skew< double, F > skew_;
+            boost::optional< boost::posix_time::ptime > first_;
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -895,8 +913,8 @@ namespace Operations
             { 
                 for (std::size_t i = 0; i < options.size(); i++) 
                 {
-                    if ( options[i] == "sample" ) { sample_ = true; }
-                    else if ( options[i] == "excess" ) { excess_ = true; }
+                    if( options[i] == "sample" ) { sample_ = true; }
+                    else if( options[i] == "excess" ) { excess_ = true; }
                 }
             }
             void push( const char* buf ) 
@@ -923,9 +941,10 @@ namespace Operations
                 } 
             }
             base* clone() const { return new Kurtosis< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 4 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_;
             bool sample_;
             bool excess_;
     };
@@ -944,9 +963,10 @@ namespace Operations
             }
             void calculate( char* buf ) { kurtosis_.calculate(buf); }
             base* clone() const { return new Kurtosis< boost::posix_time::ptime, F >( *this ); }
+            void reset() { kurtosis_.reset(); first_ = boost::none; }
         private:
-            Kurtosis< double, F> kurtosis_;
-            boost::optional<boost::posix_time::ptime> first_;
+            Kurtosis< double, F > kurtosis_;
+            boost::optional< boost::posix_time::ptime > first_;
     };
     
     template < typename T > struct Diff
@@ -968,6 +988,7 @@ namespace Operations
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< typename Diff< T >::Type >::to_bin( Diff< T >::subtract( *max_.max_, *min_.min_ ), buf ); } }
             base* clone() const { return new Diameter< T, F >( *this ); }
+            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
         private:
             Min< T, F > min_;
             Max< T, F > max_;
@@ -980,6 +1001,7 @@ namespace Operations
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< typename Diff< T >::Type >::to_bin( Diff< T >::subtract( *max_.max_, *min_.min_ ) / 2, buf ); } }
             base* clone() const { return new Radius< T, F >( *this ); }
+            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
         private:
             Min< T, F > min_;
             Max< T, F > max_;
@@ -993,6 +1015,7 @@ namespace Operations
             void push( const char* ) { ++count_; }
             void calculate( char* buf ) { comma::csv::format::traits< comma::uint32 >::to_bin( count_, buf ); }
             base* clone() const { return new Size< T, F >( *this ); }
+            void reset() { count_ = 0; }
         private:
             std::size_t count_;
     };
@@ -1048,6 +1071,7 @@ class operation_base
         virtual void push( const char* buf ) = 0;
         virtual void calculate() = 0;
         virtual operation_base* clone() const = 0;
+        virtual void reset() = 0;
         const comma::csv::format& output_format() const { return output_format_; }
         const char* buffer() const { return &buffer_[0]; }
 
@@ -1137,48 +1161,74 @@ struct Operation : public operation_base
     {
         for( std::size_t i = 0; i < operations_.size(); ++i ) { operations_[i].calculate( &buffer_[0] + output_elements_[i].offset ); }
     }
+    
+    void reset() { for( auto& o: operations_ ) { o.reset(); } }
 
     operation_base* clone() const { Operation< E >* op = new Operation< E >; return deep_copy_to_( op ); }
 };
 
-typedef boost::unordered_map< comma::uint32, boost::ptr_vector< operation_base >* > operations_map_t;
+typedef boost::unordered_map< comma::uint32, std::vector< operation_base* >* > operations_map_t;
 typedef boost::unordered_map< comma::uint32, std::string > results_map_t;
 typedef std::vector< std::pair < comma::uint32, std::string > > Inputs;
 
-static void init_operations( boost::ptr_vector< operation_base >& operations
-                           , const std::vector< Operations::operation_parameters >& operations_parameters
-                           , const comma::csv::format& format )
+class operations_battery_farm_t // all this pain is because operations polymorhism is too slow when there are a lot of ids
 {
-    static boost::ptr_vector< operation_base > sample;
-    if( sample.empty() )
-    {
-        sample.reserve( operations_parameters.size() );
-        for( std::size_t i = 0; i < operations_parameters.size(); ++i )
+    public:
+        typedef std::vector< operation_base* > operations_t;
+        
+        operations_battery_farm_t(): end_( 0 ) {}
+        
+        ~operations_battery_farm_t()
+        { 
+            for( auto& sample: operations_ ) { for( auto& s: sample ) { delete s; } } // quick and dirty; shame on me
+        }
+        
+        operations_t& make( const std::vector< Operations::operation_parameters >& operations_parameters, const comma::csv::format& format )
         {
-            switch( operations_parameters[i].type )
+            if( operations_.empty() )
             {
-                case Operations::Enum::min: sample.push_back( new Operation< Operations::Enum::min >( format ) ); break;
-                case Operations::Enum::max: sample.push_back( new Operation< Operations::Enum::max >( format ) ); break;
-                case Operations::Enum::centre: sample.push_back( new Operation< Operations::Enum::centre >( format ) ); break;
-                case Operations::Enum::mean: sample.push_back( new Operation< Operations::Enum::mean >( format ) ); break;
-                case Operations::Enum::mode: sample.push_back( new Operation< Operations::Enum::mode >( format ) ); break;
-                case Operations::Enum::percentile: sample.push_back( new Operation< Operations::Enum::percentile >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::radius: sample.push_back( new Operation< Operations::Enum::radius >( format ) ); break;
-                case Operations::Enum::diameter: sample.push_back( new Operation< Operations::Enum::diameter >( format ) ); break;
-                case Operations::Enum::variance: sample.push_back( new Operation< Operations::Enum::variance >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::stddev: sample.push_back( new Operation< Operations::Enum::stddev >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::skew: sample.push_back( new Operation< Operations::Enum::skew >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::kurtosis: sample.push_back( new Operation< Operations::Enum::kurtosis >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::sum: sample.push_back( new Operation< Operations::Enum::sum >( format ) ); break;
-                case Operations::Enum::size: sample.push_back( new Operation< Operations::Enum::size >( format ) ); break;
+                operations_.push_back( operations_t() );
+                operations_[0].reserve( operations_parameters.size() );
+                for( std::size_t i = 0; i < operations_parameters.size(); ++i )
+                {
+                    switch( operations_parameters[i].type )
+                    {
+                        case Operations::Enum::min: operations_[0].push_back( new Operation< Operations::Enum::min >( format ) ); break;
+                        case Operations::Enum::max: operations_[0].push_back( new Operation< Operations::Enum::max >( format ) ); break;
+                        case Operations::Enum::centre: operations_[0].push_back( new Operation< Operations::Enum::centre >( format ) ); break;
+                        case Operations::Enum::mean: operations_[0].push_back( new Operation< Operations::Enum::mean >( format ) ); break;
+                        case Operations::Enum::mode: operations_[0].push_back( new Operation< Operations::Enum::mode >( format ) ); break;
+                        case Operations::Enum::percentile: operations_[0].push_back( new Operation< Operations::Enum::percentile >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::radius: operations_[0].push_back( new Operation< Operations::Enum::radius >( format ) ); break;
+                        case Operations::Enum::diameter: operations_[0].push_back( new Operation< Operations::Enum::diameter >( format ) ); break;
+                        case Operations::Enum::variance: operations_[0].push_back( new Operation< Operations::Enum::variance >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::stddev: operations_[0].push_back( new Operation< Operations::Enum::stddev >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::skew: operations_[0].push_back( new Operation< Operations::Enum::skew >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::kurtosis: operations_[0].push_back( new Operation< Operations::Enum::kurtosis >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::sum: operations_[0].push_back( new Operation< Operations::Enum::sum >( format ) ); break;
+                        case Operations::Enum::size: operations_[0].push_back( new Operation< Operations::Enum::size >( format ) ); break;
+                    }
+                }
             }
+            if( end_ == operations_.size() )
+            {
+                operations_.push_back( operations_t() );
+                for( auto& s: operations_[0] ) { operations_.back().push_back( s->clone() ); }
+            }
+            for( auto& s: operations_[end_] ) { s->reset(); }
+            return operations_[ end_++ ];
         }
-    }
-    operations.clear();
-    operations.reserve( sample.size() );
-    for( auto& s: sample ) { operations.push_back( s.clone() ); } // todo! this is really slow, if there are many ids
-}
+        
+        void reset() { end_ = 0; }
+        
+    private:
+        typedef std::deque< operations_t > operations_t_;
+        operations_t_ operations_;
+        unsigned int end_;
+};
 
+static operations_battery_farm_t operations_battery_farm;
+        
 static void output( const comma::csv::options& csv, results_map_t& results, boost::optional< comma::uint32 > block, bool has_block, bool has_id )
 {
     for( results_map_t::iterator it = results.begin(); it != results.end(); ++it )
@@ -1223,26 +1273,26 @@ static void calculate( const comma::csv::options& csv, operations_map_t& operati
         if( csv.binary() )
         {
             unsigned int size = 0;
-            for( std::size_t i = 0; i < it->second->size(); ++i ) { size += ( *it->second )[i].output_format().size(); }
+            for( std::size_t i = 0; i < it->second->size(); ++i ) { size += ( *it->second )[i]->output_format().size(); }
             r.reserve( size );
         }
         for( std::size_t i = 0; i < it->second->size(); ++i )
         {
-            ( *it->second )[i].calculate();
+            ( *it->second )[i]->calculate();
             if( csv.binary() )
             { 
-                r.append( ( *it->second )[i].buffer(), ( *it->second )[i].output_format().size() );
+                r.append( ( *it->second )[i]->buffer(), ( *it->second )[i]->output_format().size() );
             }
             else
             {
                 if( i > 0 ) { r += csv.delimiter; }
-                r.append( ( *it->second )[i].output_format().bin_to_csv( ( *it->second )[i].buffer(), csv.delimiter, csv.precision ) );
+                r.append( ( *it->second )[i]->output_format().bin_to_csv( ( *it->second )[i]->buffer(), csv.delimiter, csv.precision ) );
             }
         }
         results[ it->first ] = r;
     }
-    for( operations_map_t::iterator it = operations.begin(); it != operations.end(); ++it ) { delete it->second; } // quick and dirty
     operations.clear();
+    operations_battery_farm.reset();
 }
 
 int main( int ac, char** av )
@@ -1305,15 +1355,11 @@ int main( int ac, char** av )
         if( options.exists( "--output-format" ) )
         {
             if ( !format ) { std::cerr << comma::verbose.app_name() << ": option --output-format requires input format to be specified, please use --format or --binary" << std::endl; return 1; }
-            boost::ptr_vector< operation_base > ops;
-            init_operations( ops, operations_parameters, Values(csv, *format).format() );
-            for ( std::size_t i = 0; i < ops.size(); ++i ) 
-            { 
-                if ( i > 0 ) { std::cout << csv.delimiter; }
-                std::cout << ops[i].output_format().string();
-            }
-            if( has_id && !append ) { std::cout << csv.delimiter << "ui"; }
-            if( has_block && !append ) { std::cout << csv.delimiter << "ui"; }
+            auto ops = operations_battery_farm.make( operations_parameters, Values( csv, *format ).format() );
+            std::cout << ops[0]->output_format().string();
+            for( std::size_t i = 1; i < ops.size(); ++i ) { std::cout << ',' << ops[i]->output_format().string(); }
+            if( has_id && !append ) { std::cout << ",ui"; }
+            if( has_block && !append ) { std::cout << ",ui"; }
             std::cout << std::endl;
             return 0;
         }
@@ -1324,7 +1370,7 @@ int main( int ac, char** av )
             if( has_block )
             {
                 if( block && *block != v->block() ) 
-                { 
+                {
                     calculate( csv, operations, results );
                     if ( append ) { append_and_output( csv, inputs, results ); inputs.clear(); }
                     else { output( csv, results, block, has_block, has_id ); }
@@ -1334,11 +1380,10 @@ int main( int ac, char** av )
             operations_map_t::iterator it = operations.find( v->id() );
             if( it == operations.end() )
             {
-                it = operations.insert( std::make_pair( v->id(), new boost::ptr_vector< operation_base > ) ).first;
-                init_operations( *it->second, operations_parameters, v->format() );
+                it = operations.insert( std::make_pair( v->id(), &operations_battery_farm.make( operations_parameters, v->format() ) ) ).first;
             }
             if( append ) { inputs.push_back( std::make_pair( v->id(), csv.binary() ? binary->line() : ascii->line() ) ); }
-            for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i].push( v->buffer() ); }
+            for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i]->push( v->buffer() ); }
         }
         calculate( csv, operations, results );
         if ( append ) { append_and_output( csv, inputs, results ); }

From 1b9c02e982dd5dd43d3c8aec058d0d4694d70000 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 7 Feb 2020 13:42:39 +1100
Subject: [PATCH 0131/1056] csv-calc: minor refactoring to improve
 performance...

---
 csv/applications/csv-calc.cpp | 7 +++----
 1 file changed, 3 insertions(+), 4 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 18f2e94ce..69b326619 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -596,7 +596,6 @@ namespace Operations
             void calculate( char* buf )
             {
                 std::size_t count = values_.size();
-
                 if( count > 0 )
                 {
                     comma::verbose << "calculating " << percentile_*100 << "th percentile using ";
@@ -1180,7 +1179,7 @@ class operations_battery_farm_t // all this pain is because operations polymorhi
         
         ~operations_battery_farm_t()
         { 
-            for( auto& sample: operations_ ) { for( auto& s: sample ) { delete s; } } // quick and dirty; shame on me
+            for( auto& operation: operations_ ) { for( auto& o: operation ) { delete o; } } // quick and dirty; shame on me
         }
         
         operations_t& make( const std::vector< Operations::operation_parameters >& operations_parameters, const comma::csv::format& format )
@@ -1212,8 +1211,8 @@ class operations_battery_farm_t // all this pain is because operations polymorhi
             }
             if( end_ == operations_.size() )
             {
-                operations_.push_back( operations_t() );
-                for( auto& s: operations_[0] ) { operations_.back().push_back( s->clone() ); }
+                operations_.push_back( operations_t( operations_[0].size() ) );
+                for( unsigned int i = 0; i < operations_[0].size(); ++i ) { operations_.back()[i] = operations_[0][i]->clone(); }
             }
             for( auto& s: operations_[end_] ) { s->reset(); }
             return operations_[ end_++ ];

From 33eba1b3dffae79421d1af845cf070d5aa74d7f2 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 7 Feb 2020 15:59:17 +1100
Subject: [PATCH 0132/1056] csv-calc: trivial refactoring

---
 csv/applications/csv-calc.cpp | 120 +++++++++++++++-------------------
 1 file changed, 54 insertions(+), 66 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 69b326619..7ca448927 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -543,7 +543,7 @@ namespace Operations
     {
         public:
             Mean() : count_( 0 ) {}
-            void reset() { mean_ = boost::none; count_ = 0; }
+            void reset() { mean_.reset(); count_ = 0; }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -565,83 +565,71 @@ namespace Operations
 
             Percentile() : percentile_( 0.0 ), method_( nearest ) {}
 
-            void push( const char* buf )
-            {
-                values_.insert( comma::csv::format::traits< T, F >::from_bin( buf ));
-            }
+            void push( const char* buf ) { values_.insert( comma::csv::format::traits< T, F >::from_bin( buf ) ); }
 
             void set_options( const std::vector< std::string >& options )
             {
-                if( options.size() == 0 ) {
-                    std::cerr << comma::verbose.app_name() << ": percentile operation requires a percentile" << std::endl;
-                    exit( 1 );
-                }
-
+                if( options.empty() ) { std::cerr << comma::verbose.app_name() << ": percentile operation requires a percentile" << std::endl; exit( 1 ); }
                 percentile_ = boost::lexical_cast< double >( options[0] );
-                if( percentile_ < 0.0 || percentile_ > 1.0 ) {
-                    std::cerr << comma::verbose.app_name() << ": percentile value should be between 0 and 1, got " << percentile_ << std::endl;
-                    exit( 1 );
-                }
-
-                if( options.size() == 2 ) {
-                    if( options[1] == "nearest" ) method_ = nearest;
-                    else if( options[1] == "interpolate" ) method_ = interpolate;
-                    else {
-                        std::cerr << comma::verbose.app_name() << ": expected percentile method, got " << options[1] << std::endl;
-                        exit( 1 );
-                    }
-                }
+                if( percentile_ < 0.0 || percentile_ > 1.0 ) { std::cerr << comma::verbose.app_name() << ": percentile value should be between 0 and 1, got " << percentile_ << std::endl; exit( 1 ); }
+                if( options.size() < 2 ) { return; }
+                if( options[1] == "nearest" ) { method_ = nearest; }
+                else if( options[1] == "interpolate" ) { method_ = interpolate; }
+                else { std::cerr << comma::verbose.app_name() << ": expected percentile method, got '" << options[1] << "'" << std::endl; exit( 1 ); }
             }
 
             void calculate( char* buf )
             {
+                if( values_.empty() ) { return; }
                 std::size_t count = values_.size();
-                if( count > 0 )
+                comma::verbose << "calculating " << percentile_*100 << "th percentile using ";
+                T value;
+                typename std::multiset< T >::iterator it = values_.begin();
+                switch( method_ )
                 {
-                    comma::verbose << "calculating " << percentile_*100 << "th percentile using ";
-                    T value;
-                    typename std::multiset< T >::iterator it = values_.begin();
-                    switch( method_ )
-                    {
-                        std::size_t rank;
-                        
-                        case nearest:
-                            // https://en.wikipedia.org/wiki/Percentile#The_Nearest_Rank_method
-                            comma::verbose << "nearest rank method" << std::endl;
-                            comma::verbose << "see https://en.wikipedia.org/wiki/Percentile#The_Nearest_Rank_method" << std::endl;
-                            rank = ( percentile_ == 0.0 ? 1 : std::ceil( count * percentile_ ));
-                            comma::verbose << "n = " << rank << std::endl;
-                            std::advance( it, rank - 1 );
+                    std::size_t rank;
+                    
+                    case nearest:
+                        // https://en.wikipedia.org/wiki/Percentile#The_Nearest_Rank_method
+                        comma::verbose << "nearest rank method" << std::endl;
+                        comma::verbose << "see https://en.wikipedia.org/wiki/Percentile#The_Nearest_Rank_method" << std::endl;
+                        rank = ( percentile_ == 0.0 ? 1 : std::ceil( count * percentile_ ));
+                        comma::verbose << "n = " << rank << std::endl;
+                        std::advance( it, rank - 1 );
+                        value = *it;
+                        break;
+
+                    case interpolate:
+                        // https://en.wikipedia.org/wiki/Percentile#The_Linear_Interpolation_Between_Closest_Ranks_method
+                        // (third method in that section)
+                        comma::verbose << "NIST linear interpolation method" << std::endl;
+                        comma::verbose << "see http://www.itl.nist.gov/div898/handbook/prc/section2/prc262.htm" << std::endl;
+                        double x = percentile_ * ( count + 1 );
+                        comma::verbose << "p = " << percentile_ << "; N = " << count << "; p(N + 1) = " << x;
+                        if( x <= 1.0 )
+                        {
+                            comma::verbose << "; below 1 - choosing smallest value" << std::endl;
                             value = *it;
-                            break;
-
-                        case interpolate:
-                            // https://en.wikipedia.org/wiki/Percentile#The_Linear_Interpolation_Between_Closest_Ranks_method
-                            // (third method in that section)
-                            comma::verbose << "NIST linear interpolation method" << std::endl;
-                            comma::verbose << "see http://www.itl.nist.gov/div898/handbook/prc/section2/prc262.htm" << std::endl;
-                            double x = percentile_ * ( count + 1 );
-                            comma::verbose << "p = " << percentile_ << "; N = " << count << "; p(N + 1) = " << x;
-                            if( x <= 1.0 ) {
-                                comma::verbose << "; below 1 - choosing smallest value" << std::endl;
-                                value = *it;
-                            } else if( x >= count ) {
-                                comma::verbose << "; above N - choosing largest value" << std::endl;
-                                value = *( values_.rbegin() );
-                            } else {
-                                rank = x;
-                                double remainder = x - rank;
-                                comma::verbose << "; k = " << rank << "; d = " << remainder << std::endl;
-                                std::advance( it, rank - 1 );
-                                double v1 = *it;
-                                double v2 = *++it;
-                                value = v1 + ( v2 - v1 ) * remainder;
-                                comma::verbose << "v1 = " << v1 << "; v2 = " << v2 << "; result = " << value << std::endl;
-                            }
-                            break;
-                    }
-                    comma::csv::format::traits< T, F >::to_bin( static_cast< T >( value ), buf );
+                        }
+                        else if( x >= count )
+                        {
+                            comma::verbose << "; above N - choosing largest value" << std::endl;
+                            value = *( values_.rbegin() );
+                        }
+                        else
+                        {
+                            rank = x;
+                            double remainder = x - rank;
+                            comma::verbose << "; k = " << rank << "; d = " << remainder << std::endl;
+                            std::advance( it, rank - 1 );
+                            double v1 = *it;
+                            double v2 = *++it;
+                            value = v1 + ( v2 - v1 ) * remainder;
+                            comma::verbose << "v1 = " << v1 << "; v2 = " << v2 << "; result = " << value << std::endl;
+                        }
+                        break;
                 }
+                comma::csv::format::traits< T, F >::to_bin( static_cast< T >( value ), buf );
             }
 
             base* clone() const { return new Percentile< T, F >( *this ); }

From 59ad3efdcb8cd3c14993d2aeb073b7e98ebfd874 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 7 Feb 2020 16:07:30 +1100
Subject: [PATCH 0133/1056] csv-calc: trivial refactoring

---
 csv/applications/csv-calc.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 7ca448927..181e6ab60 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -1077,7 +1077,7 @@ class operation_base
             lhs->output_format_ = output_format_;
             lhs->output_elements_ = output_elements_;
             lhs->buffer_ = buffer_;
-            for( std::size_t i = 0; i < operations_.size(); ++i ) { lhs->operations_.push_back( operations_[i].clone() ); }
+            for( auto& o: operations_ ) { lhs->operations_.push_back( o.clone() ); }
             return lhs;
         }
 };

From d888ccb61520adf05039898f35f65529b29f0ed1 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 11 Feb 2020 09:46:21 +1100
Subject: [PATCH 0134/1056] csv-strings: add operation implemented

---
 csv/applications/csv-strings.cpp | 41 ++++++++++++++++++++++++--------
 csv/test/csv-strings/expected    |  3 +++
 csv/test/csv-strings/input       |  3 +++
 3 files changed, 37 insertions(+), 10 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index c1fa2feea..f1140f820 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -74,6 +74,7 @@ static void usage( bool verbose )
     std::cerr << "    usage: cat input.csv | csv-strings <operation> [<options>] > output.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
+    std::cerr << "    add" << std::endl;
     std::cerr << "    path-basename,basename" << std::endl;
     std::cerr << "    path-dirname,dirname" << std::endl;
     std::cerr << "    path-real,path-canonical,canonical" << std::endl;
@@ -85,6 +86,11 @@ static void usage( bool verbose )
     std::cerr << "                         default: perform operation on the first field" << std::endl;
     std::cerr << "    --strict; exit on strings on which operation does not make sense" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "add" << std::endl;
+    std::cerr << "    options" << std::endl;
+    std::cerr << "        --prefix=[<prefix>]; add prefix" << std::endl;
+    std::cerr << "        --suffix=[<suffix>]; add suffix" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "path-basename,basename" << std::endl;
     std::cerr << "    options" << std::endl;
     std::cerr << "        --head=<depth>; default=0; number of path elements at the beginning of the path to remove" << std::endl;
@@ -110,7 +116,7 @@ static void usage( bool verbose )
 static bool strict;
 static comma::csv::options csv;
 
-namespace comma { namespace applications { namespace strings { namespace path {
+namespace comma { namespace applications { namespace strings {
 
 template < typename T >
 struct record
@@ -121,19 +127,19 @@ struct record
 
 typedef record< std::string > input;
 
-} } } } // namespace comma { namespace applications { namespace strings { namespace path {
+} } } // namespace comma { namespace applications { namespace strings {
 
 namespace comma { namespace visiting {
 
-template < typename T > struct traits< comma::applications::strings::path::record< T > >
+template < typename T > struct traits< comma::applications::strings::record< T > >
 {
-    template < typename K, typename V > static void visit( const K&, const comma::applications::strings::path::record< T >& p, V& v ) { v.apply( "values", p.values ); }
-    template < typename K, typename V > static void visit( const K&, comma::applications::strings::path::record< T >& p, V& v ) { v.apply( "values", p.values ); }
+    template < typename K, typename V > static void visit( const K&, const comma::applications::strings::record< T >& p, V& v ) { v.apply( "values", p.values ); }
+    template < typename K, typename V > static void visit( const K&, comma::applications::strings::record< T >& p, V& v ) { v.apply( "values", p.values ); }
 };
 
 } } // namespace comma { namespace visiting {
 
-namespace comma { namespace applications { namespace strings { namespace path {
+namespace comma { namespace applications { namespace strings {
 
 template < typename T >
 static int run( const comma::command_line_options& options )
@@ -179,6 +185,8 @@ static int run( const comma::command_line_options& options )
     return run_();
 }
 
+namespace path {
+
 struct basename
 {
     typedef input output_t;
@@ -268,7 +276,19 @@ struct canonical
     }
 };
 
-} } } } // namespace comma { namespace applications { namespace strings { namespace path {
+} // namespace path {
+
+struct add
+{
+    typedef input output_t;
+    std::string prefix;
+    std::string suffix;
+    static const char* name() { return "add"; }
+    add( const comma::command_line_options& options ): prefix( options.value( "--prefix", std::string() ) ), suffix( options.value( "--suffix", std::string() ) ) {}
+    std::string convert( const std::string& t ) { return prefix + t + suffix; }
+};
+    
+} } } // namespace comma { namespace applications { namespace strings {
 
 int main( int ac, char** av )
 {
@@ -280,9 +300,10 @@ int main( int ac, char** av )
         std::string operation = unnamed[0];
         strict = options.exists( "--strict" );
         csv = comma::csv::options( options );
-        if( operation == "path-basename" || operation == "basename" ) { return comma::applications::strings::path::run< comma::applications::strings::path::basename >( options ); }
-        if( operation == "path-dirname" || operation == "dirname" ) { return comma::applications::strings::path::run< comma::applications::strings::path::dirname >( options ); }
-        if( operation == "path-real" || operation == "path-canonical" || operation == "canonical" ) { return comma::applications::strings::path::run< comma::applications::strings::path::canonical >( options ); }
+        if( operation == "add" ) { return comma::applications::strings::run< comma::applications::strings::add >( options ); }
+        if( operation == "path-basename" || operation == "basename" ) { return comma::applications::strings::run< comma::applications::strings::path::basename >( options ); }
+        if( operation == "path-dirname" || operation == "dirname" ) { return comma::applications::strings::run< comma::applications::strings::path::dirname >( options ); }
+        if( operation == "path-real" || operation == "path-canonical" || operation == "canonical" ) { return comma::applications::strings::run< comma::applications::strings::path::canonical >( options ); }
         std::cerr << "csv-strings: expection operation; got: '" << operation << "'" << std::endl;
         return 1;
     }
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
index 4432d8d83..88e6f5b44 100644
--- a/csv/test/csv-strings/expected
+++ b/csv/test/csv-strings/expected
@@ -134,3 +134,6 @@ fields[4]/output/line[2]="m,,a/b,,x/y"
 fields[5]/output/line[0]="k,,,,"
 fields[5]/output/line[1]="l,,,,"
 fields[5]/output/line[2]="m,,a,,x"
+
+add[0]/output="a,b,xay,xby"
+add[1]/output="xay,xby"
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
index b02076f42..ae544b409 100644
--- a/csv/test/csv-strings/input
+++ b/csv/test/csv-strings/input
@@ -52,3 +52,6 @@ fields[2]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-string
 fields[3]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n"
 fields[4]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n --emplace"
 fields[5]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n --emplace --tail 2"
+
+add[0]="echo a,b | csv-strings add --prefix x --suffix y --fields a,b"
+add[1]="echo a,b | csv-strings add --prefix x --suffix y --fields a,b --emplace"

From f9d500354fef1c6e953ce98d9c13eb5ab3c8fa71 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 11 Feb 2020 12:59:46 +1100
Subject: [PATCH 0135/1056] csv-split: --files: if directory in output file
 path does not exist, create it

---
 csv/applications/split/split.cpp | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 31e93695e..056c82b0c 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -336,6 +336,11 @@ std::ofstream* split< T >::ofstream_by_id_()
         else { mode |= std::ofstream::app; }
         std::string name = filename_from_id_( current_.id );
         if( name.empty() ) { return nullptr; }
+        const auto& dirname = boost::filesystem::path( name ).parent_path();
+        if( !( dirname.empty() || boost::filesystem::is_directory( dirname ) || boost::filesystem::create_directories( dirname ) ) )
+        {
+            COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << name << "'" );
+        }
         std::shared_ptr< std::ofstream > stmp( new std::ofstream( &name[0], mode ) );
         it = files_.insert( std::make_pair( current_.id, stmp ) ).first;
     }

From dce6a8af2bd6ba9f5adca41d6ff01f942be0c960 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 13 Feb 2020 18:04:24 +1100
Subject: [PATCH 0136/1056] comma-call-graph: error message directed to stderr
 instead of stdout

---
 bash/applications/comma-call-graph | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/bash/applications/comma-call-graph b/bash/applications/comma-call-graph
index 3ebef826a..d9e916ace 100755
--- a/bash/applications/comma-call-graph
+++ b/bash/applications/comma-call-graph
@@ -108,10 +108,10 @@ load_options $@
 
 if [[ $dot_output && $dot_output != "dot" ]]; then
     type -p dot > /dev/null || {
-        echo "$basename requires graphviz"
-        echo "Install on Ubuntu with:"
-        echo "$ sudo apt-get install graphviz"
-        exit
+        echo "$basename: requires graphviz" >&2
+        echo "$basename: install on ubuntu with:" >&2
+        echo "$basename: sudo apt-get install graphviz" >&2
+        exit 1
     }
     output_fn="dot -T$dot_output"
 else

From 5b63bc4f0babb8d5aba111d3935b10f442ed5075 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Tue, 25 Feb 2020 19:35:56 +1100
Subject: [PATCH 0137/1056] comma.signal: disabling sigpipe signal commented
 out; csv-eval: sigpipe disabled by hand

---
 python/comma/csv/applications/csv_eval.py | 2 ++
 python/comma/signal/signal.py             | 2 +-
 2 files changed, 3 insertions(+), 1 deletion(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 7e2ad7a07..37b8d2927 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -34,6 +34,7 @@
 import numpy as np
 import os
 import re
+import signal
 import sys
 if sys.version_info.major < 3: from itertools import izip
 else: izip = zip # todo! watch performance! it's reported python3 zip is some 30% slower than izip
@@ -619,6 +620,7 @@ def exit_if(stream):
 
 def main():
     try:
+        signal.signal( signal.SIGPIPE, signal.SIG_DFL )
         comma.csv.time.zone('UTC')
         args = get_args()
         prepare_options(args)
diff --git a/python/comma/signal/signal.py b/python/comma/signal/signal.py
index 34ed994bb..9612127e6 100644
--- a/python/comma/signal/signal.py
+++ b/python/comma/signal/signal.py
@@ -49,4 +49,4 @@ def __bool__( self ): return self.state
 
     __nonzero__ = __bool__
 
-signal.signal( signal.SIGPIPE, signal.SIG_DFL )
+# signal.signal( signal.SIGPIPE, signal.SIG_DFL )

From d7f45ef9f9d728cf60e9ae0dee9e2f30a8cc8be0 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 24 Feb 2020 14:23:20 +1100
Subject: [PATCH 0138/1056] check.c++.standard.cmake: remove unnecessary loop

it looks like it was just there for early debugging
---
 CMakeFiles/check.c++.standard.cmake | 43 +++++++++++++----------------
 1 file changed, 19 insertions(+), 24 deletions(-)

diff --git a/CMakeFiles/check.c++.standard.cmake b/CMakeFiles/check.c++.standard.cmake
index fd1942322..1b188830e 100644
--- a/CMakeFiles/check.c++.standard.cmake
+++ b/CMakeFiles/check.c++.standard.cmake
@@ -28,27 +28,22 @@
  #########################################################################
 " )
     ENDIF()
-    FOREACH( STANDARD ${CXX_STANDARDS} )
-        # message( "Check if using C++${STANDARD}" )
-        IF( ${CXX_STANDARD_TO_USE} MATCHES "${STANDARD}" )
-            # message( "Yes, using C++${STANDARD}" )
-            IF( NOT ( ${CXX_STANDARD_TO_USE} MATCHES ${CXX_STANDARD_LAST} ) )
-                # message( "Have to check if ${CMAKE_CXX_COMPILER} supports C++${STANDARD}" )
-                message( "Attempt to use C++ standard ${STANDARD}" )
-		UNSET( compiler_supports_standard CACHE )
-		UNSET( compiler_flag_to_check CACHE )
-		SET( compiler_flag_to_check "-std=c++${STANDARD}" )
-		if ( CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND ${STANDARD} MATCHES "11" )
-		    set( compiler_flag_to_check "${compiler_flag_to_check} -Wc++11-narrowing" )
-		endif()
-		CHECK_CXX_COMPILER_FLAG( "${compiler_flag_to_check}" compiler_supports_standard )
-		if( NOT compiler_supports_standard )
-		    message( FATAL_ERROR "attempt to use C++ standard ${STANDARD} but ${CMAKE_CXX_COMPILER} does not support it" )
-		endif()
-                STRING( REPLACE " ${CXX_STANDARD_FLAGS}" "" CXX_FLAGS_NO_STANDARD "${CMAKE_CXX_FLAGS}" )
-		SET( CXX_STANDARD_FLAGS ${compiler_flag_to_check} CACHE STRING "updating compiler flags selecting C++ standard" FORCE )
-		SET( CXX_STANDARD_LAST ${CXX_STANDARD_TO_USE} CACHE STRING "updating C++ standard to use option" FORCE )
-                set( CMAKE_CXX_FLAGS "${CXX_FLAGS_NO_STANDARD} ${compiler_flag_to_check}" CACHE STRING "" FORCE )
-            ENDIF()
-        ENDIF()
-    ENDFOREACH()
+
+    IF( NOT ( ${CXX_STANDARD_TO_USE} MATCHES ${CXX_STANDARD_LAST} ) )
+        # message( "Have to check if ${CMAKE_CXX_COMPILER} supports C++${CXX_STANDARD_TO_USE}" )
+        message( "Attempt to use C++ standard ${CXX_STANDARD_TO_USE}" )
+        UNSET( compiler_supports_standard CACHE )
+        UNSET( compiler_flag_to_check CACHE )
+        SET( compiler_flag_to_check "-std=c++${CXX_STANDARD_TO_USE}" )
+        if ( CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND ${CXX_STANDARD_TO_USE} MATCHES "11" )
+            set( compiler_flag_to_check "${compiler_flag_to_check} -Wc++11-narrowing" )
+        endif()
+        CHECK_CXX_COMPILER_FLAG( "${compiler_flag_to_check}" compiler_supports_standard )
+        if( NOT compiler_supports_standard )
+            message( FATAL_ERROR "attempt to use C++ standard ${CXX_STANDARD_TO_USE} but ${CMAKE_CXX_COMPILER} does not support it" )
+        endif()
+        STRING( REPLACE " ${CXX_STANDARD_FLAGS}" "" CXX_FLAGS_NO_STANDARD "${CMAKE_CXX_FLAGS}" )
+        SET( CXX_STANDARD_FLAGS ${compiler_flag_to_check} CACHE STRING "updating compiler flags selecting C++ standard" FORCE )
+        SET( CXX_STANDARD_LAST ${CXX_STANDARD_TO_USE} CACHE STRING "updating C++ standard to use option" FORCE )
+        set( CMAKE_CXX_FLAGS "${CXX_FLAGS_NO_STANDARD} ${compiler_flag_to_check}" CACHE STRING "" FORCE )
+    ENDIF()

From 1dc6bb58f7c71d936bf8c8ad60b9e2a3a68693ce Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 24 Feb 2020 14:51:51 +1100
Subject: [PATCH 0139/1056] check.c++.standard.cmake: use CMAKE_CXX_STANDARD to
 set standard flag

rather than directly setting it through CMAKE_CXX_FLAGS.

Using CMAKE_CXX_FLAGS breaks when using Qt and a version later than C++11.
Qt will set -std=gnu++11 if CMAKE_CXX_STANDARD is not set, overriding the
desired setting.
---
 CMakeFiles/check.c++.standard.cmake | 11 +++++------
 CMakeLists.txt                      |  2 +-
 2 files changed, 6 insertions(+), 7 deletions(-)

diff --git a/CMakeFiles/check.c++.standard.cmake b/CMakeFiles/check.c++.standard.cmake
index 1b188830e..d734acf41 100644
--- a/CMakeFiles/check.c++.standard.cmake
+++ b/CMakeFiles/check.c++.standard.cmake
@@ -17,7 +17,6 @@
 	 MARK_AS_ADVANCED( FORCE CXX_STANDARD_FLAGS )
     ENDIF()
 
-    # A much better way to do this is with CXX_STANDARD but that requires CMake 3.1
     include( CheckCXXCompilerFlag )
     IF( ${CXX_STANDARD_TO_USE} MATCHES "0x" )
         message( WARNING "
@@ -36,14 +35,14 @@
         UNSET( compiler_flag_to_check CACHE )
         SET( compiler_flag_to_check "-std=c++${CXX_STANDARD_TO_USE}" )
         if ( CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND ${CXX_STANDARD_TO_USE} MATCHES "11" )
-            set( compiler_flag_to_check "${compiler_flag_to_check} -Wc++11-narrowing" )
+            set( extra_compiler_flags "${compiler_flag_to_check} -Wc++11-narrowing" )
         endif()
-        CHECK_CXX_COMPILER_FLAG( "${compiler_flag_to_check}" compiler_supports_standard )
+        CHECK_CXX_COMPILER_FLAG( "${compiler_flag_to_check} ${extra_compiler_flags}" compiler_supports_standard )
         if( NOT compiler_supports_standard )
             message( FATAL_ERROR "attempt to use C++ standard ${CXX_STANDARD_TO_USE} but ${CMAKE_CXX_COMPILER} does not support it" )
         endif()
-        STRING( REPLACE " ${CXX_STANDARD_FLAGS}" "" CXX_FLAGS_NO_STANDARD "${CMAKE_CXX_FLAGS}" )
-        SET( CXX_STANDARD_FLAGS ${compiler_flag_to_check} CACHE STRING "updating compiler flags selecting C++ standard" FORCE )
         SET( CXX_STANDARD_LAST ${CXX_STANDARD_TO_USE} CACHE STRING "updating C++ standard to use option" FORCE )
-        set( CMAKE_CXX_FLAGS "${CXX_FLAGS_NO_STANDARD} ${compiler_flag_to_check}" CACHE STRING "" FORCE )
+        set( CMAKE_CXX_FLAGS "${extra_compiler_flags}" CACHE STRING "" FORCE )
     ENDIF()
+
+    set( CMAKE_CXX_STANDARD ${CXX_STANDARD_TO_USE} )
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 980e1a74e..e21f8de81 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 PROJECT( "comma" )
 
-cmake_minimum_required(VERSION 2.6)
+cmake_minimum_required( VERSION 3.1 )
 
 # option( USE_ARM_TOOLCHAIN "Cross compile using arm toolchain" OFF )
 # if( USE_ARM_TOOLCHAIN )

From 201c05d55ff5bdaba8859abeee004e97fb7f97d7 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 27 Feb 2020 16:02:03 +1100
Subject: [PATCH 0140/1056] csv-random: make operation implemented

---
 csv/applications/csv-random.cpp | 112 ++++++++++++++++++++++++++++++--
 1 file changed, 108 insertions(+), 4 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index aa5e5b038..28ee82acc 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -83,6 +83,17 @@ static void usage( bool verbose )
     std::cerr << "    --seed=[<int>]; random seed" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
+    std::cerr << "    make: output pseudo-random numbers" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "        usage: csv-random make <options> > random.csv" << std::endl;
+    std::cerr << "               cat records.csv | csv-random make --append <options> > appended.csv" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --append; append random numbers to stdin input" << std::endl;
+    std::cerr << "            --distribution=<distribution>; default=uniform; values: uniform, more todo, just ask" << std::endl;
+    std::cerr << "            --range=[<min>,<max>]; desired value range, default: whatever stl defines (usually numeric limits)" << std::endl;
+    std::cerr << "            --type=<type>; default=i; supported values: i, ui, f, d" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "    shuffle: output input records in pseudo-random order" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        usage: cat records.csv | csv-random shuffle [<options>] > shuffled.csv" << std::endl;
@@ -121,7 +132,97 @@ template <> struct traits< comma::applications::random::shuffle::input >
 
 } } // namespace comma { namespace visiting {
 
-namespace comma { namespace applications { namespace random { namespace shuffle {
+namespace comma { namespace applications { namespace random {
+
+namespace make {
+
+template < typename T, typename Distribution >
+static int run_impl( Distribution& distribution, bool append )
+{
+    std::default_random_engine generator = seed ? std::default_random_engine( *seed ) : std::default_random_engine();
+    if( !::csv.flush ) { std::cin.tie( NULL ); }
+    if( append )
+    {
+        if( ::csv.binary() )
+        {
+            std::vector< char > buf( ::csv.format().size() );
+            while( std::cin.good() )
+            {
+                std::cin.read( &buf[0], buf.size() );
+                if( std::cin.gcount() == 0 ) { break; }
+                if( std::cin.gcount() != int( buf.size() ) ) { std::cerr << "csv-random: make: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
+                std::cout.write( &buf[0], buf.size() );
+                T r = distribution( generator );
+                std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
+                if( ::csv.flush ) { std::cout.flush(); }
+            }
+        }
+        else
+        {
+            while( std::cin.good() )
+            {
+                std::string s;
+                std::getline( std::cin, s );
+                if( s.empty() ) { continue; }
+                std::cout << s << ::csv.delimiter << distribution( generator ) << std::endl;
+                if( ::csv.flush ) { std::cout.flush(); }
+            }
+        }
+    }
+    else
+    {
+        while( std::cout.good() )
+        {
+            T r = distribution( generator );
+            if( ::csv.binary() ) { std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) ); }
+            else { std::cout << r << std::endl; }
+            if( ::csv.flush ) { std::cout.flush(); }
+        }
+    }
+    return 0;
+}
+
+template < typename T, template < typename > class Distribution >
+static int run_impl( const comma::command_line_options& options )
+{
+    bool append = options.exists( "--append" );
+    auto r = options.optional< std::string >( "--range" );
+    auto range = comma::csv::ascii< std::pair< T, T > >().get( *r );
+    auto distribution = r ? Distribution< T >( range.first, range.second ) : Distribution< T >();
+    return run_impl< T >( distribution, append );
+}
+    
+static int run( const comma::command_line_options& options ) // quick and dirty
+{
+    auto distribution = options.value< std::string >( "--distribution", "uniform" );
+    auto type = options.value< std::string >( "--type", "int" );
+    if( type == "i" )
+    {
+        if( distribution == "uniform" ) { return run_impl< comma::int32, std::uniform_int_distribution >( options ); }
+        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    }
+    if( type == "ui" )
+    {
+        if( distribution == "uniform" ) { return run_impl< comma::int32, std::uniform_int_distribution >( options ); }
+        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    }
+    if( type == "f" )
+    {
+        if( distribution == "uniform" ) { return run_impl< float, std::uniform_real_distribution >( options ); }
+        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    }
+    if( type == "d" )
+    {
+        if( distribution == "uniform" ) { return run_impl< double, std::uniform_real_distribution >( options ); }
+        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    }
+    std::cerr << "csv-random make: expected type; got: '" << type << "'" << std::endl;
+    return 1;
+}
+
+} // namespace make {
+
+namespace shuffle {
 
 static int run( const comma::command_line_options& options )
 {
@@ -194,7 +295,9 @@ static int run( const comma::command_line_options& options )
     return 0;
 }
 
-} } } } // namespace comma { namespace applications { namespace random { namespace shuffle {
+} // namespace shuffle {
+
+} } } // namespace comma { namespace applications { namespace random {
 
 int main( int ac, char** av )
 {
@@ -203,10 +306,11 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         const auto& unnamed = options.unnamed( "--flush,--verbose,-v", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-random: please specify operation" << std::endl; return 1; }
-        csv = comma::csv::options( options );
+        ::csv = comma::csv::options( options );
         seed = options.optional< int >( "--seed" );
-        verbose = options.exists( "--verbose,-v" );
+        ::verbose = options.exists( "--verbose,-v" );
         std::string operation = unnamed[0];
+        if( operation == "make" ) { return comma::applications::random::make::run( options ); }
         if( operation == "shuffle" ) { return comma::applications::random::shuffle::run( options ); }
         std::cerr << "csv-random: expection operation; got: '" << operation << "'" << std::endl;
         return 1;

From b05e0878306e83ace3803265abf1bf02fb69e8c2 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 27 Feb 2020 16:46:23 +1100
Subject: [PATCH 0141/1056] csv-random: make operation: a few bugs fixed; usage
 semantics fixed

---
 csv/applications/csv-random.cpp | 69 +++++++++++++++++++++++++++------
 1 file changed, 58 insertions(+), 11 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 28ee82acc..5ce089527 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -91,8 +91,9 @@ static void usage( bool verbose )
     std::cerr << "        options" << std::endl;
     std::cerr << "            --append; append random numbers to stdin input" << std::endl;
     std::cerr << "            --distribution=<distribution>; default=uniform; values: uniform, more todo, just ask" << std::endl;
+    std::cerr << "            --output-binary; output random numbers as binary, or specify --binary=<format> for stdin input" << std::endl;
     std::cerr << "            --range=[<min>,<max>]; desired value range, default: whatever stl defines (usually numeric limits)" << std::endl;
-    std::cerr << "            --type=<type>; default=i; supported values: i, ui, f, d" << std::endl;
+    std::cerr << "            --type=<type>; default=ui; supported values: b, ub, w, uw, i, ui, f, d" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    shuffle: output input records in pseudo-random order" << std::endl;
     std::cerr << std::endl;
@@ -108,10 +109,12 @@ static void usage( bool verbose )
     exit( 0 );
 }
 
+static bool output_binary;
 static bool verbose;
 static comma::csv::options csv;
 static boost::optional< int > seed;
 
+
 namespace comma { namespace applications { namespace random { namespace shuffle {
 
 struct input
@@ -136,8 +139,26 @@ namespace comma { namespace applications { namespace random {
 
 namespace make {
 
+template < typename T >
+struct type_traits // maps a generated value to the type it is streamed as in ascii output; identity by default
+{
+    static T cast( T t ) { return t; }
+};
+
+template <> // NOTE(review): run() instantiates std::uniform_int_distribution< char > and < unsigned char >; the C++ standard does not list character types as a permitted IntType - confirm on the target toolchains
+struct type_traits< char > // widened to int so that operator<< prints a number rather than a character
+{
+    static int cast( char t ) { return static_cast< int >( t ); }
+};
+
+template <>
+struct type_traits< unsigned char > // widened to unsigned int for the same reason
+{
+    static unsigned int cast( unsigned char t ) { return static_cast< unsigned int >( t ); }
+};
+    
 template < typename T, typename Distribution >
-static int run_impl( Distribution& distribution, bool append )
+static int run_impl( Distribution& distribution, bool append, bool binary )
 {
     std::default_random_engine generator = seed ? std::default_random_engine( *seed ) : std::default_random_engine();
     if( !::csv.flush ) { std::cin.tie( NULL ); }
@@ -164,7 +185,7 @@ static int run_impl( Distribution& distribution, bool append )
                 std::string s;
                 std::getline( std::cin, s );
                 if( s.empty() ) { continue; }
-                std::cout << s << ::csv.delimiter << distribution( generator ) << std::endl;
+                std::cout << s << ::csv.delimiter << type_traits< T >::cast( distribution( generator ) ) << std::endl;
                 if( ::csv.flush ) { std::cout.flush(); }
             }
         }
@@ -174,8 +195,8 @@ static int run_impl( Distribution& distribution, bool append )
         while( std::cout.good() )
         {
             T r = distribution( generator );
-            if( ::csv.binary() ) { std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) ); }
-            else { std::cout << r << std::endl; }
+            if( binary ) { std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) ); }
+            else { std::cout << type_traits< T >::cast( r ) << std::endl; }
             if( ::csv.flush ) { std::cout.flush(); }
         }
     }
@@ -186,16 +207,42 @@ template < typename T, template < typename > class Distribution >
 static int run_impl( const comma::command_line_options& options )
 {
     bool append = options.exists( "--append" );
-    auto r = options.optional< std::string >( "--range" );
-    auto range = comma::csv::ascii< std::pair< T, T > >().get( *r );
-    auto distribution = r ? Distribution< T >( range.first, range.second ) : Distribution< T >();
-    return run_impl< T >( distribution, append );
+    bool binary = options.exists( "--output-binary" ) || ::csv.binary();
+    auto r = options.optional< std::string >( "--range" ); // todo: parse distribution parameters
+    if( r )
+    {
+        auto range = comma::csv::ascii< std::pair< T, T > >().get( *r );
+        Distribution< T > distribution( range.first, range.second );
+        return run_impl< T >( distribution, append, binary );
+    }
+    Distribution< T > distribution;
+    return run_impl< T >( distribution, append, binary );
 }
     
 static int run( const comma::command_line_options& options ) // quick and dirty
 {
     auto distribution = options.value< std::string >( "--distribution", "uniform" );
-    auto type = options.value< std::string >( "--type", "int" );
+    auto type = options.value< std::string >( "--type", "ui" );
+    if( type == "b" )
+    {
+        if( distribution == "uniform" ) { return run_impl< char, std::uniform_int_distribution >( options ); }
+        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    }
+    if( type == "ub" )
+    {
+        if( distribution == "uniform" ) { return run_impl< unsigned char, std::uniform_int_distribution >( options ); }
+        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    }
+    if( type == "w" )
+    {
+        if( distribution == "uniform" ) { return run_impl< comma::int16, std::uniform_int_distribution >( options ); }
+        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    }
+    if( type == "uw" )
+    {
+        if( distribution == "uniform" ) { return run_impl< comma::uint16, std::uniform_int_distribution >( options ); }
+        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    }
     if( type == "i" )
     {
         if( distribution == "uniform" ) { return run_impl< comma::int32, std::uniform_int_distribution >( options ); }
@@ -304,7 +351,7 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        const auto& unnamed = options.unnamed( "--flush,--verbose,-v", "-.*" );
+        const auto& unnamed = options.unnamed( "--append,--flush,--verbose,-v", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-random: please specify operation" << std::endl; return 1; }
         ::csv = comma::csv::options( options );
         seed = options.optional< int >( "--seed" );

From 8735ed3846a6a1972dd918e31d8763e1d4c87b04 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 27 Feb 2020 17:34:41 +1100
Subject: [PATCH 0142/1056] examples.md added

---
 examples.md | 28 ++++++++++++++++++++++++++++
 1 file changed, 28 insertions(+)
 create mode 100644 examples.md

diff --git a/examples.md b/examples.md
new file mode 100644
index 000000000..b4802fc0d
--- /dev/null
+++ b/examples.md
@@ -0,0 +1,28 @@
+# csv
+
+## accumulate values
+
+### take velocities, calculate distance
+
+generate sample file with velocity a m/sec at each given time:
+
+```
+cat <<eof > velocities.csv
+20200101T000000,0.7
+20200101T000001,1.1
+20200101T000002,1.1
+20200101T000003,0.9
+20200101T000004,1.3
+eof
+
+```
+
+append distance travelled to each data point:
+
+```
+cat velocities.csv \
+    | csv-shuffle --fields t,v --output-fields t,t,v \
+    | csv-time --to seconds --fields ,t \
+    | csv-eval --init-values "prev=0;sum=0" --fields ,cur,v "sum+=(cur-prev)*(prev>0)*v;prev=cur" \
+    | csv-shuffle --fields t,,v,d --output-fields t,v,d
+```

From 5247fda668c035ffdf600a51230ce93593a33d81 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 27 Feb 2020 06:36:41 +0000
Subject: [PATCH 0143/1056] Update examples.md

---
 examples.md | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/examples.md b/examples.md
index b4802fc0d..e0c521e7b 100644
--- a/examples.md
+++ b/examples.md
@@ -6,7 +6,7 @@
 
 generate sample file with velocity a m/sec at each given time:
 
-```
+```bash
 cat <<eof > velocities.csv
 20200101T000000,0.7
 20200101T000001,1.1
@@ -19,7 +19,7 @@ eof
 
 append distance travelled to each data point:
 
-```
+```bash
 cat velocities.csv \
     | csv-shuffle --fields t,v --output-fields t,t,v \
     | csv-time --to seconds --fields ,t \

From 723bdf5e5af1a346df7e5a6d796b2bb6b9c04af8 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 28 Feb 2020 11:56:21 +1100
Subject: [PATCH 0144/1056] csv-calc: trivial change

---
 csv/applications/csv-calc.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 181e6ab60..25d4a10d5 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -1377,7 +1377,7 @@ int main( int ac, char** av )
         else { output( csv, results, block, has_block, has_id ); }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << comma::verbose.app_name() << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << comma::verbose.app_name() << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "csv-calc: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-calc: unknown exception" << std::endl; }
     return 1;
 }

From 30c202752d9b6e7287eae93befe3254feae8315f Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 4 Mar 2020 09:35:59 +1100
Subject: [PATCH 0145/1056] COPYING: updated

---
 AUTHORS | 8 ++++----
 COPYING | 1 +
 2 files changed, 5 insertions(+), 4 deletions(-)

diff --git a/AUTHORS b/AUTHORS
index 53aaa505a..b3ae456ea 100644
--- a/AUTHORS
+++ b/AUTHORS
@@ -1,4 +1,4 @@
-  Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
-  Cedric Wohlleber <c.wohlleber@acfr.usyd.edu.au>
-  Matthew Herrmann <matthewinrandwick@gmail.com>
-  James Underwood <j.underwood@acfr.usyd.edu.au>
+Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
+Cedric Wohlleber <c.wohlleber@acfr.usyd.edu.au>
+Matthew Herrmann <matthewinrandwick@gmail.com>
+James Underwood <j.underwood@acfr.usyd.edu.au>
diff --git a/COPYING b/COPYING
index 5702f519c..d880d7275 100644
--- a/COPYING
+++ b/COPYING
@@ -1,4 +1,5 @@
 Copyright (c) 2011 The University of Sydney
+Copyright (c) 2018 Vsevolod Vlaskine
 All rights reserved.
 
 Redistribution and use in source and binary forms, with or without

From a26920e36dab3684116d5b6d8b19c8ff0256b95f Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 12 Mar 2020 12:13:35 +1100
Subject: [PATCH 0146/1056] python: comma.csv.time: made permissive on
 nanoseconds present

---
 python/comma/csv/test/numpy_time/expected | 2 ++
 python/comma/csv/test/numpy_time/input    | 1 +
 python/comma/csv/time.py                  | 3 ++-
 3 files changed, 5 insertions(+), 1 deletion(-)

diff --git a/python/comma/csv/test/numpy_time/expected b/python/comma/csv/test/numpy_time/expected
index 4bb01817a..ef29ef5e3 100644
--- a/python/comma/csv/test/numpy_time/expected
+++ b/python/comma/csv/test/numpy_time/expected
@@ -6,6 +6,8 @@ incomplete/output="20150101T010203.123000"
 incomplete/status=0
 microseconds/output="20140101T010203.123456"
 microseconds/status=0
+nanoseconds/output="20140101T010203.123456"
+nanoseconds/status=0
 not_a_date_time/output="not-a-date-time"
 not_a_date_time/status=0
 invalid_month/output=""
diff --git a/python/comma/csv/test/numpy_time/input b/python/comma/csv/test/numpy_time/input
index 13c35aa3d..57b935473 100644
--- a/python/comma/csv/test/numpy_time/input
+++ b/python/comma/csv/test/numpy_time/input
@@ -2,6 +2,7 @@ basic 20150101T010203
 dot 20150101T010203.
 incomplete 20150101T010203.123
 microseconds 20140101T010203.123456
+nanoseconds 20140101T010203.123456789
 invalid_month 20150001T000000
 invalid_format 20150101T0000
 not_a_date_time not-a-date-time
diff --git a/python/comma/csv/time.py b/python/comma/csv/time.py
index 39c33ad3b..b1deaa33f 100644
--- a/python/comma/csv/time.py
+++ b/python/comma/csv/time.py
@@ -52,6 +52,7 @@ def is_negative_infinity(numpy_time): return numpy_time == NEGATIVE_INFINITY
 def to_numpy(t):
     """
     return numpy datetime64 scalar corresponding to the given comma time string
+    if t has nanoseconds, it will be truncated (rather than rounded) to microseconds
 
     >>> import numpy as np
     >>> from comma.csv.time import to_numpy
@@ -67,7 +68,7 @@ def to_numpy(t):
     if t in ['', 'not-a-date-time']: return NOT_A_DATE_TIME
     if t in ['+infinity', '+inf', 'infinity', 'inf']: return POSITIVE_INFINITY
     if t in ['-infinity', '-inf']: return NEGATIVE_INFINITY
-    if not (isinstance(t, BASESTRING) and re.match(r'^(\d{8}T\d{6}(\.\d{0,6})?)$', t)):
+    if not (isinstance(t, BASESTRING) and re.match(r'^(\d{8}T\d{6}(\.\d{0,12})?)$', t)):
         msg = "expected comma time, got '{}'".format(repr(t))
         raise TypeError(msg)
     v = list(t)

From 0defca981e09037ec4e883a03a35f07bcf7385cc Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Thu, 19 Mar 2020 19:02:34 +1100
Subject: [PATCH 0147/1056] csv-repeat: --timestamped: implemented; unit test:
 todo...

---
 csv/applications/csv-repeat.cpp | 103 ++++++++++++++++++++++++++------
 1 file changed, 86 insertions(+), 17 deletions(-)

diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index 460133a7e..81e2db55b 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -29,6 +29,7 @@
 
 /// @author dave jennings
 
+#include <functional>
 #include <iostream>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/thread/thread.hpp>
@@ -73,6 +74,11 @@ void usage( bool verbose = false )
     std::cerr << "            warning: currently is very simplistic; see todo comments in the code to make it more robust" << std::endl;
     std::cerr << "    --period=[<seconds>]: period of repeated record" << std::endl;
     std::cerr << "    --timeout,-t=[<seconds>]: timeout before repeating the last record; if not specified, timeout is set to --period" << std::endl;
+    std::cerr << "    --timestamped: use input timestamp for repeating; currently, would do blocking read" << std::endl;
+    std::cerr << "                   convenient for filling holes in data in offline processing" << std::endl;
+    std::cerr << "      --timestamped options" << std::endl;
+    std::cerr << "          --from=[<time>]; if first timestamp greater than <time>, fill the hole with the first record" << std::endl;
+    std::cerr << "          --to=[<time>]; if last timestamp less than <time>, fill the hole with the last record" << std::endl;
     std::cerr << "    --verbose,-v: more output" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    if --period is not set, --timeout acts as a watchdog. If no input is seen" << std::endl;
@@ -107,6 +113,11 @@ void usage( bool verbose = false )
     exit( 0 );
 }
 
+struct input_t // input record as read in --timestamped mode: only the timestamp is parsed
+{
+    boost::posix_time::ptime time;
+};
+
 struct output_t
 {
     boost::posix_time::ptime time;
@@ -117,6 +128,12 @@ struct output_t
 
 namespace comma { namespace visiting {
 
+template <> struct traits< input_t > // binds input_t::time to the csv field named "t"
+{
+    template < typename K, typename V > static void visit( const K&, input_t& p, V& v ) { v.apply( "t", p.time ); }
+    template < typename K, typename V > static void visit( const K&, const input_t& p, V& v ) { v.apply( "t", p.time ); }
+};
+
 template <> struct traits< output_t >
 {
     template < typename K, typename V > static void visit( const K&, const output_t& p, V& v )
@@ -142,16 +159,6 @@ int main( int ac, char** av )
         bool ignore_eof = options.exists( "--ignore-eof,--ignoreeof,--yes" );
         if( ignore_eof && !options.exists( "--period" ) ) { std::cerr << "csv-repeat: got --ignore-oef, thus please specify --period" << std::endl; return 1; }
         comma::csv::options csv = comma::csv::options( options );
-        std::size_t record_size = csv.binary() ? csv.format().size() : 0;
-        std::vector< char > buffer( csv.binary() ? ( 65536ul / record_size + 1 ) * record_size : 0 );
-        char* buffer_begin = &buffer[0];
-        const char* buffer_end = &buffer[0] + buffer.size();
-        char* read_position = buffer_begin;
-        char* write_position = buffer_begin;
-        char* last_record = NULL;
-        comma::io::select select;
-        select.read().add( comma::io::stdin_fd );
-        comma::io::istream is( "-", comma::io::mode::binary );
         boost::scoped_ptr< comma::csv::output_stream< output_t > > ostream;
         comma::csv::options output_csv;
         output_csv.full_xpath = false;
@@ -183,6 +190,12 @@ int main( int ac, char** av )
             output_csv.delimiter = csv.delimiter;
             ostream.reset( new comma::csv::output_stream< output_t >( std::cout, output_csv ) );
         }
+        boost::optional< boost::posix_time::time_duration > period;
+        if( options.exists( "--period" ) ) { period = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--period" ) * 1000000 )); }
+        boost::posix_time::time_duration timeout;
+        boost::optional< double > timeout_seconds = options.optional< double >( "--timeout,-t" );
+        if( !period && !timeout_seconds ) { std::cerr << "csv-repeat: please specify either --period, or --timeout, or both" << std::endl; return 1; }
+        timeout = timeout_seconds ? boost::posix_time::microseconds( static_cast<unsigned int>(*timeout_seconds * 1000000 )) : *period;
         if( options.exists( "--output-fields" ) )
         {
             if( !options.exists( "--fields,-f" ) ) { std::cerr << "csv-repeat: --output-fields option requires --fields" << std::endl; return 1; }
@@ -199,17 +212,73 @@ int main( int ac, char** av )
             std::cout << std::endl;
             return 0;
         }
-        boost::optional< boost::posix_time::time_duration > period;
-        if( options.exists( "--period" ) ) { period = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--period" ) * 1000000 )); }
-        boost::posix_time::time_duration timeout;
-        boost::optional< double > timeout_seconds = options.optional< double >( "--timeout,-t" );
-        if( !period && !timeout_seconds ) { std::cerr << "csv-repeat: please specify either --period, or --timeout, or both" << std::endl; return 1; }
-        timeout = timeout_seconds ? boost::posix_time::microseconds( static_cast<unsigned int>(*timeout_seconds * 1000000 )) : *period;
+        std::cin.tie( NULL );
+        if( options.exists( "--timestamped" ) )
+        {
+            if( !period ) { std::cerr << "csv-repeat: for --timestamped, please specify --period" << std::endl; return 1; }
+            if( options.exists( "--timeout,-t" ) ) { std::cerr << "csv-repeat: for --timestamped: --timeout not supported" << std::endl; return 1; }
+            comma::csv::input_stream< input_t > istream( std::cin, csv );
+            boost::posix_time::ptime last;
+            if( options.exists( "--from" ) ) { last = boost::posix_time::from_iso_string( options.value< std::string >( "--from" ) ); }
+            boost::posix_time::ptime to;
+            if( options.exists( "--to" ) ) { to = boost::posix_time::from_iso_string( options.value< std::string >( "--to" ) ); }
+            std::string last_record;
+            if( csv.binary() ) { last_record = std::string( csv.format().size(), 0 ); }
+            auto pass = [&]( const output_t& )
+            {
+                static comma::csv::passed< input_t > passed( istream, std::cout, csv.flush );
+                passed.write();
+            };
+            auto append = [&]( const output_t& o )
+            {
+                static comma::csv::tied< input_t, output_t > tied( istream, *ostream );
+                tied.append( o );
+            };
+            std::function< void( const output_t& p ) > write;
+            if( ostream ) { write = append; } else { write = pass; }
+            auto repeat = [&]( boost::posix_time::ptime now )
+            {
+                if( now.is_not_a_date_time() || last.is_not_a_date_time() ) { return; }
+                for( boost::posix_time::ptime t = last + *period; t < now; t += *period )
+                {
+                    std::cout.write( &last_record[0], last_record.size() );
+                    if( !csv.binary() ) { std::cout << csv.delimiter; }
+                    if( ostream ) { ostream->write( output_t( t, true ) ); }
+                }
+            };
+            auto set_last_record = [&]()
+            {
+                if( csv.binary() ) { std::memcpy( &last_record[0], istream.binary().last(), last_record.size() ); } // todo! quick and dirty, watch performance! we don't need to copy each record, but that would make the code more complex
+                else { last_record = comma::join( istream.ascii().last(), csv.delimiter ); }
+            };
+            while( istream.ready() || std::cin.good() )
+            {
+                const input_t* p = istream.read();
+                if( !p ) { break; }
+                if( p->time.is_not_a_date_time() ) { std::cerr << "csv-repeat: expected timestamp, got not a date/time" << std::endl; return 1; }
+                if( last_record.empty() && !last.is_not_a_date_time() ) { set_last_record(); } // quick and dirty
+                repeat( p->time );
+                write( output_t( p->time, false ) );
+                last = p->time;
+                set_last_record();
+            }
+            repeat( to );
+            return 0;
+        }
+        std::size_t record_size = csv.binary() ? csv.format().size() : 0;
+        std::vector< char > buffer( csv.binary() ? ( 65536ul / record_size + 1 ) * record_size : 0 );
+        char* buffer_begin = &buffer[0];
+        const char* buffer_end = &buffer[0] + buffer.size();
+        char* read_position = buffer_begin;
+        char* write_position = buffer_begin;
+        char* last_record = NULL;
+        comma::io::select select;
+        select.read().add( comma::io::stdin_fd );
+        comma::io::istream is( "-", comma::io::mode::binary );
         bool end_of_stream = false;
         std::string line;
         std::string last_line;
         std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
-        std::cin.tie( NULL ); // std::cin is tied to std::cout by default
         bool repeating = false;
         bool pace = options.exists( "--pace" );
         if( pace && !period ) { std::cerr << "csv-repeat: for --pace, please specify --period" << std::endl; return 1; }

From e614d48a9caf03057581ea2bc2256b8adafb1cc6 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Fri, 20 Mar 2020 19:14:32 +1100
Subject: [PATCH 0148/1056] csv-repeat: --timestamped: a few bugs fixed, unit
 test added

---
 csv/applications/csv-repeat.cpp          | 26 ++++++++----
 csv/test/csv-repeat/timestamped/expected | 53 ++++++++++++++++++++++++
 csv/test/csv-repeat/timestamped/input    |  5 +++
 csv/test/csv-repeat/timestamped/test     |  6 +++
 4 files changed, 81 insertions(+), 9 deletions(-)
 create mode 100644 csv/test/csv-repeat/timestamped/expected
 create mode 100644 csv/test/csv-repeat/timestamped/input
 create mode 100755 csv/test/csv-repeat/timestamped/test

diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index 81e2db55b..20bd972df 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -77,8 +77,8 @@ void usage( bool verbose = false )
     std::cerr << "    --timestamped: use input timestamp for repeating; currently, would do blocking read" << std::endl;
     std::cerr << "                   convenient for filling holes in data in offline processing" << std::endl;
     std::cerr << "      --timestamped options" << std::endl;
-    std::cerr << "          --from=[<time>]; if first timestamp greater than <time>, fill the hole with the first record" << std::endl;
-    std::cerr << "          --to=[<time>]; if last timestamp less than <time>, fill the hole with the last record" << std::endl;
+    std::cerr << "          --at-least-from,--from=[<time>]; if first timestamp greater than <time>, fill the hole with the first record" << std::endl;
+    std::cerr << "          --at-least-to,--to=[<time>]; if last timestamp less than <time>, fill the hole with the last record" << std::endl;
     std::cerr << "    --verbose,-v: more output" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    if --period is not set, --timeout acts as a watchdog. If no input is seen" << std::endl;
@@ -219,9 +219,9 @@ int main( int ac, char** av )
             if( options.exists( "--timeout,-t" ) ) { std::cerr << "csv-repeat: for --timestamped: --timeout not supported" << std::endl; return 1; }
             comma::csv::input_stream< input_t > istream( std::cin, csv );
             boost::posix_time::ptime last;
-            if( options.exists( "--from" ) ) { last = boost::posix_time::from_iso_string( options.value< std::string >( "--from" ) ); }
+            if( options.exists( "--at-least-from,--from" ) ) { last = boost::posix_time::from_iso_string( options.value< std::string >( "--at-least-from,--from" ) ); } // test both aliases, otherwise --at-least-from is silently ignored
             boost::posix_time::ptime to;
-            if( options.exists( "--to" ) ) { to = boost::posix_time::from_iso_string( options.value< std::string >( "--to" ) ); }
+            if( options.exists( "--at-least-to,--to" ) ) { to = boost::posix_time::from_iso_string( options.value< std::string >( "--at-least-to,--to" ) ); } // test both aliases, otherwise --at-least-to is silently ignored
             std::string last_record;
             if( csv.binary() ) { last_record = std::string( csv.format().size(), 0 ); }
             auto pass = [&]( const output_t& )
@@ -236,14 +236,22 @@ int main( int ac, char** av )
             };
             std::function< void( const output_t& p ) > write;
             if( ostream ) { write = append; } else { write = pass; }
+            auto write_last = [&]( boost::posix_time::ptime t )
+            {
+                std::cout.write( &last_record[0], last_record.size() );
+                if( !csv.binary() ) { std::cout << csv.delimiter; }
+                if( ostream ) { ostream->write( output_t( t, true ) ); }
+                else if( !csv.binary() ) { std::cout << std::endl; }
+            };
             auto repeat = [&]( boost::posix_time::ptime now )
             {
                 if( now.is_not_a_date_time() || last.is_not_a_date_time() ) { return; }
-                for( boost::posix_time::ptime t = last + *period; t < now; t += *period )
+                for( boost::posix_time::ptime t = last + *period; t <= now; )
                 {
-                    std::cout.write( &last_record[0], last_record.size() );
-                    if( !csv.binary() ) { std::cout << csv.delimiter; }
-                    if( ostream ) { ostream->write( output_t( t, true ) ); }
+                    write_last( t );
+                    if( t == now ) { break; }
+                    t += *period;
+                    if( t > now ) { t = now; }
                 }
             };
             auto set_last_record = [&]()
@@ -256,7 +264,7 @@ int main( int ac, char** av )
                 const input_t* p = istream.read();
                 if( !p ) { break; }
                 if( p->time.is_not_a_date_time() ) { std::cerr << "csv-repeat: expected timestamp, got not a date/time" << std::endl; return 1; }
-                if( last_record.empty() && !last.is_not_a_date_time() ) { set_last_record(); } // quick and dirty
+                if( last_record.empty() && !last.is_not_a_date_time() ) { set_last_record(); write_last( last ); } // quick and dirty
                 repeat( p->time );
                 write( output_t( p->time, false ) );
                 last = p->time;
diff --git a/csv/test/csv-repeat/timestamped/expected b/csv/test/csv-repeat/timestamped/expected
new file mode 100644
index 000000000..3e01a4129
--- /dev/null
+++ b/csv/test/csv-repeat/timestamped/expected
@@ -0,0 +1,53 @@
+timestamped[0]/output/line[0]="20200101T000010,a"
+timestamped[0]/output/line[1]="20200101T000010,a,"
+timestamped[0]/output/line[2]="20200101T000010,a,"
+timestamped[0]/output/line[3]="20200101T000010,a,"
+timestamped[0]/output/line[4]="20200101T000010,a,"
+timestamped[0]/output/line[5]="20200101T000020,b"
+timestamped[0]/status=0
+timestamped[1]/output/line[0]="20200101T000010,a,20200101T000010,0"
+timestamped[1]/output/line[1]="20200101T000010,a,20200101T000013,1"
+timestamped[1]/output/line[2]="20200101T000010,a,20200101T000016,1"
+timestamped[1]/output/line[3]="20200101T000010,a,20200101T000019,1"
+timestamped[1]/output/line[4]="20200101T000010,a,20200101T000020,1"
+timestamped[1]/output/line[5]="20200101T000020,b,20200101T000020,0"
+timestamped[1]/status=0
+timestamped[2]/output/line[0]="20200101T000010,a,20200101T000000,1"
+timestamped[2]/output/line[1]="20200101T000010,a,20200101T000003,1"
+timestamped[2]/output/line[2]="20200101T000010,a,20200101T000006,1"
+timestamped[2]/output/line[3]="20200101T000010,a,20200101T000009,1"
+timestamped[2]/output/line[4]="20200101T000010,a,20200101T000010,1"
+timestamped[2]/output/line[5]="20200101T000010,a,20200101T000010,0"
+timestamped[2]/output/line[6]="20200101T000010,a,20200101T000013,1"
+timestamped[2]/output/line[7]="20200101T000010,a,20200101T000016,1"
+timestamped[2]/output/line[8]="20200101T000010,a,20200101T000019,1"
+timestamped[2]/output/line[9]="20200101T000010,a,20200101T000020,1"
+timestamped[2]/output/line[10]="20200101T000020,b,20200101T000020,0"
+timestamped[2]/status=0
+timestamped[3]/output/line[0]="20200101T000010,a,20200101T000010,0"
+timestamped[3]/output/line[1]="20200101T000010,a,20200101T000013,1"
+timestamped[3]/output/line[2]="20200101T000010,a,20200101T000016,1"
+timestamped[3]/output/line[3]="20200101T000010,a,20200101T000019,1"
+timestamped[3]/output/line[4]="20200101T000010,a,20200101T000020,1"
+timestamped[3]/output/line[5]="20200101T000020,b,20200101T000020,0"
+timestamped[3]/output/line[6]="20200101T000020,b,20200101T000023,1"
+timestamped[3]/output/line[7]="20200101T000020,b,20200101T000026,1"
+timestamped[3]/output/line[8]="20200101T000020,b,20200101T000029,1"
+timestamped[3]/output/line[9]="20200101T000020,b,20200101T000030,1"
+timestamped[3]/status=0
+timestamped[4]/output/line[0]="20200101T000010,a,20200101T000000,1"
+timestamped[4]/output/line[1]="20200101T000010,a,20200101T000003,1"
+timestamped[4]/output/line[2]="20200101T000010,a,20200101T000006,1"
+timestamped[4]/output/line[3]="20200101T000010,a,20200101T000009,1"
+timestamped[4]/output/line[4]="20200101T000010,a,20200101T000010,1"
+timestamped[4]/output/line[5]="20200101T000010,a,20200101T000010,0"
+timestamped[4]/output/line[6]="20200101T000010,a,20200101T000013,1"
+timestamped[4]/output/line[7]="20200101T000010,a,20200101T000016,1"
+timestamped[4]/output/line[8]="20200101T000010,a,20200101T000019,1"
+timestamped[4]/output/line[9]="20200101T000010,a,20200101T000020,1"
+timestamped[4]/output/line[10]="20200101T000020,b,20200101T000020,0"
+timestamped[4]/output/line[11]="20200101T000020,b,20200101T000023,1"
+timestamped[4]/output/line[12]="20200101T000020,b,20200101T000026,1"
+timestamped[4]/output/line[13]="20200101T000020,b,20200101T000029,1"
+timestamped[4]/output/line[14]="20200101T000020,b,20200101T000030,1"
+timestamped[4]/status=0
diff --git a/csv/test/csv-repeat/timestamped/input b/csv/test/csv-repeat/timestamped/input
new file mode 100644
index 000000000..fcbfd69cc
--- /dev/null
+++ b/csv/test/csv-repeat/timestamped/input
@@ -0,0 +1,5 @@
+timestamped[0]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3"
+timestamped[1]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3 --append time,repeating"
+timestamped[2]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3 --append time,repeating --from 20200101T000000"
+timestamped[3]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3 --append time,repeating --to 20200101T000030"
+timestamped[4]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3 --append time,repeating --to 20200101T000030 --from 20200101T000000"
diff --git a/csv/test/csv-repeat/timestamped/test b/csv/test/csv-repeat/timestamped/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/csv/test/csv-repeat/timestamped/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands

From ac5416b421b55e3f14f7ffc219e8db4f344624c1 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 1 Apr 2020 13:16:45 +1100
Subject: [PATCH 0149/1056] csv-blocks: scalar field: --min/--max implemented;
 debugging...

---
 csv/applications/csv-blocks.cpp | 126 +++++++++++++++++++++-----------
 1 file changed, 83 insertions(+), 43 deletions(-)

diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index 42d09a96d..bab7b8d00 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -145,8 +145,14 @@ static void usage( bool more )
     std::cerr << "            --fields=<fields>" << std::endl;
     std::cerr << "                id: any number of id fields to group by" << std::endl;
     std::cerr << "                scalar: group by scalar, which can be integer, floating point number, or time" << std::endl;
-    std::cerr << "            --block-gap,--gap=<value>; minimum gap in values between blocks, double (for time: seconds as double), see examples" << std::endl;
-    std::cerr << "            --block-span,--span=<value>; maximum block span, double (for time: seconds as double), see examples" << std::endl;
+    std::cerr << "                        options" << std::endl;
+    std::cerr << "                            --block-gap,--gap=<value>; minimum gap in values between blocks" << std::endl;
+    std::cerr << "                                                       double (for time: seconds as double), see examples" << std::endl;
+    std::cerr << "                            --block-span,--span=<value>; maximum block span, double (for time: seconds as" << std::endl;
+    std::cerr << "                                                         double), see examples" << std::endl;
+    std::cerr << "                            --discard-out-of-range; discard input records with scalar out of range defined by --min and --max" << std::endl;
+    std::cerr << "                            --min=[<value>]; min value for the scalar range, see examples" << std::endl;
+    std::cerr << "                            --max=[<value>]; max value for the scalar range, see examples" << std::endl;
     std::cerr << "    head" << std::endl;
     std::cerr << "        reads records from first block to stdout, if --num-of-blocks=<num> specified, read more than one blocks" << std::endl;
     std::cerr << "        requires the index from 'index' mode in the inputs" << std::endl;
@@ -230,7 +236,6 @@ static comma::csv::options csv;
 static bool reverse_index = false;
 // All the data for this block
 static std::deque< std::string > block_records;
-static comma::uint32 current_block = 1;
 static comma::int32 increment_step = 1;
 
 static void output_record_and_index( const std::string& input, comma::uint32 index, bool is_binary, char delimiter )
@@ -266,12 +271,21 @@ static bool empty_( const std::string& s ) // quick and dirty
     return true;
 }
 
-static double diff( const input_t& from, const input_t& to ) // quick and dirty
+static double to_double( const input_t& lhs ) // quick and dirty
 {
-    if( from.key.longs.size() == 1 ) { return std::abs( double( from.key.longs[0] ) - to.key.longs[0] ); }
-    if( from.key.doubles.size() == 1 ) { return std::abs( from.key.doubles[0] - to.key.doubles[0] ); }
-    if( from.key.time.size() == 1 ) { return std::abs( double( ( from.key.time[0] - to.key.time[0] ).total_microseconds() ) / 1000000 ); }
-    if( from.key.strings.size() == 1 ) { COMMA_THROW( comma::exception, "difference for strings: not implemented" ); }
+    if( lhs.key.longs.size() == 1 ) { return lhs.key.longs[0]; }
+    if( lhs.key.doubles.size() == 1 ) { return lhs.key.doubles[0]; }
+    if( lhs.key.time.size() == 1 ) { COMMA_THROW( comma::exception, "cannot convert time to double" ); }
+    if( lhs.key.strings.size() == 1 ) { COMMA_THROW( comma::exception, "cannot convert strings to double" ); }
+    COMMA_THROW( comma::exception, "never here" );
+}
+
+static double diff( const input_t& lhs, const input_t& rhs ) // quick and dirty
+{
+    if( lhs.key.longs.size() == 1 ) { return std::abs( double( lhs.key.longs[0] ) - rhs.key.longs[0] ); }
+    if( lhs.key.doubles.size() == 1 ) { return std::abs( lhs.key.doubles[0] - rhs.key.doubles[0] ); }
+    if( lhs.key.time.size() == 1 ) { return std::abs( double( ( lhs.key.time[0] - rhs.key.time[0] ).total_microseconds() ) / 1000000 ); }
+    if( lhs.key.strings.size() == 1 ) { COMMA_THROW( comma::exception, "difference for strings: not implemented" ); }
     COMMA_THROW( comma::exception, "never here" );
 }
 
@@ -460,12 +474,10 @@ int main( int ac, char** av )
         comma::csv::options csv_out;
         csv_out.full_xpath = false;
         if( csv.binary() ) { csv_out.format( comma::csv::format("ui") ); }
-        std::vector< std::string > unnamed = options.unnamed( "--help,-h,--reverse,--verbose,-v", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--help,-h,--reverse,--verbose,-v,--discard-out-of-range", "-.*" );
         if( unnamed.empty() ) { std::cerr << name() << "please specify operation" << std::endl; return 1; }
         const std::string  operation = unnamed.front();
-        
         if( verbose ) { std::cerr << name() << "csv fields: " << csv.fields << std::endl; }
-        
         if( operation == "accumulate" )
         {
             std::string first_line;
@@ -514,55 +526,93 @@ int main( int ac, char** av )
         }
         if( operation == "group" || operation == "make-blocks" )
         {
-            current_block = options.value< comma::uint32 >( "--starting-block,--from", 0 );
+            comma::uint32 current_block = options.value< comma::uint32 >( "--starting-block,--from", 0 );
             std::string first_line;
             input_t default_input;
             auto how = set_fields( options, first_line, default_input );
             if( verbose ) { std::cerr << name() << "csv fields: " << csv.fields << "; making blocks by " << ( how == how_t::by_id ? "id" : "scalar" ) << std::endl; }
             boost::optional< double > gap;
             boost::optional< double > span;
+            boost::optional< double > min;
+            boost::optional< double > max;
             if( how == how_t::by_scalar )
-            { 
+            {
+                options.assert_mutually_exclusive( "--gap,--span", "--min,--max" ); // for now
                 gap = options.optional< double >( "--block-gap,--gap" );
                 span = options.optional< double >( "--block-span,--span" );
+                min = options.optional< double >( "--min" );
+                max = options.optional< double >( "--max" );
             }
             comma::csv::input_stream< input_t > istream( std::cin, csv, default_input );
             comma::csv::output_stream< appended_column > ostream( std::cout, csv_out );
             comma::csv::tied< input_t, appended_column > tied( istream, ostream );
-            auto update_block = [&]( const input_t& p )
+            auto update_block = [&]( const input_t& p )->bool
             {
-                static input_t first = p;
                 static input_t last = p;
                 switch( how )
                 {
                     case how_t::by_id:
                         if( !( last.key == p.key ) ) { ++current_block; }
-                        break;
+                        last = p;
+                        return true;
                     case how_t::by_scalar:
-                        if( ( gap && diff( last, p ) >= *gap ) || ( span && diff( first, p ) >= *span ) ) { ++current_block; first = p; }
-                        break;
+                    {
+                        static input_t first = p;
+                        if( gap || span )
+                        {
+                            if( ( gap && diff( last, p ) >= *gap ) || ( span && diff( first, p ) >= *span ) ) { ++current_block; first = p; }
+                            last = p;
+                            return true;
+                        }
+                        else
+                        {
+                            static bool last_in_range = false;
+                            static bool discard_output_out_of_range = !options.exists( "--discard-out-of-range" );
+                            double v = to_double( p );
+                            bool in_range = ( !min || !comma::math::less( v, *min ) ) && ( !max || !comma::math::less( *max, v ) );
+                            static bool first_record = true;
+                            if( !first_record ) // quick and dirty
+                            {
+                                if( discard_output_out_of_range )
+                                {
+                                    if( last_in_range && !in_range ) { ++current_block; }
+                                }
+                                else
+                                {
+                                    if( last_in_range != in_range ) { ++current_block; } // quick and dirty
+                                }
+                            }
+                            last = p;
+                            last_in_range = in_range;
+                            first_record = false;
+                            return in_range || !discard_output_out_of_range;
+                        }
+                    }
                     case how_t::none: // never here
-                        break;
+                        return true;
                 }
-                last = p;
-                    
+                return true; // never here
             };
             if( !first_line.empty() ) 
             { 
                 input_t p = comma::csv::ascii< input_t >( csv, default_input ).get( first_line ); 
-                update_block( p );
-                if( istream.is_binary() ) { std::cout.write( (char*)&p, istream.binary().size() ); }
-                else { std::cout << first_line << istream.ascii().ascii().delimiter(); }
-                ostream.write( appended_column( current_block ) );
-                if( csv.flush ) { std::cout.flush(); }
+                if( update_block( p ) )
+                {
+                    if( istream.is_binary() ) { std::cout.write( (char*)&p, istream.binary().size() ); }
+                    else { std::cout << first_line << istream.ascii().ascii().delimiter(); }
+                    ostream.write( appended_column( current_block ) );
+                    if( csv.flush ) { std::cout.flush(); }
+                }
             }
             while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
             {
                 const input_t* p = istream.read();
                 if( !p ) { break; }
-                update_block( *p );
-                tied.append( appended_column( current_block ) );
-                if( csv.flush ) { std::cout.flush(); }
+                if( update_block( *p ) )
+                {
+                    tied.append( appended_column( current_block ) );
+                    if( csv.flush ) { std::cout.flush(); }
+                }
             }            
             return 0;
         }
@@ -606,60 +656,51 @@ int main( int ac, char** av )
         else if( operation == "index" )
         {
             reverse_index = options.exists("--reverse");
-            
             comma::csv::input_stream< input_with_block > istream( std::cin, csv );
-            
             char delimiter = istream.is_binary() ? ',' : istream.ascii().ascii().delimiter();
             comma::uint32 block = 0;
             comma::uint32 index = 0;
             std::string buffer;
             if( istream.is_binary() ) { buffer.resize( istream.binary().size() ); }
-            
             while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
             {
                 const input_with_block* p = istream.read();
                 if( !p ) { break; }
-                
                 if( block != p->block ) 
                 { 
                     if ( reverse_index ) { output_reverse_indexing( block_records, istream.is_binary(), delimiter  ); }
                     else { index = 0; }
                 }
                 block = p->block;
-                
                 if ( reverse_index )
                 {
-                    // Reverse index mode - accumulate whole block before indexing
                     if( istream.is_binary() )  
                     { 
                         ::memcpy( &buffer[0], istream.binary().last(),  istream.binary().size() ); 
                         block_records.push_back( buffer );
                     }
-                    else { block_records.push_back( comma::join( istream.ascii().last(), delimiter ) ); }
+                    else
+                    {
+                        block_records.push_back( comma::join( istream.ascii().last(), delimiter ) );
+                    }
                 }
                 else
                 {
-                    // Forward index mode - append index to each record
                     if( istream.is_binary() ) { ::memcpy( &buffer[0], istream.binary().last(),  istream.binary().size() ); }
                     else { buffer = comma::join( istream.ascii().last(), delimiter ); }
                     output_record_and_index( buffer, index, istream.is_binary(), delimiter );
                     index++;
                 }
             }
-            
-            // flushes the last block
             if ( reverse_index ) { output_reverse_indexing( block_records, istream.is_binary(), delimiter  ); }
-            
             return 0;
         }
         else if( operation == "increment" )    // operation is head
         {
             increment_step = options.value< comma::int32 >( "--step", 1 );
-            
             comma::csv::input_stream< input_with_block > istream( std::cin, csv );
             comma::csv::output_stream< appended_column > ostream( std::cout, csv_out );
             comma::csv::tied< input_with_block, appended_column > tied( istream, ostream );
-            
             appended_column incremented;
             while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
             {
@@ -669,7 +710,6 @@ int main( int ac, char** av )
                 tied.append( incremented );
                 if( csv.flush ) { std::cout.flush(); }
             }
-            
             return 0;
         }
         else if( operation == "read-until" )

From e19bf5d4af615e9aaf53b66097ab99b52e6b7bd4 Mon Sep 17 00:00:00 2001
From: seva <seva>
Date: Wed, 1 Apr 2020 13:52:25 +1100
Subject: [PATCH 0150/1056] csv-blocks: scalar field: --min/--max: tests added

---
 csv/applications/csv-blocks.cpp    |  6 ++---
 csv/test/csv-blocks/group/expected | 42 ++++++++++++++++++++++++++++++
 csv/test/csv-blocks/group/input    |  9 +++++++
 3 files changed, 54 insertions(+), 3 deletions(-)

diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index bab7b8d00..a2be3c024 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -151,8 +151,8 @@ static void usage( bool more )
     std::cerr << "                            --block-span,--span=<value>; maximum block span, double (for time: seconds as" << std::endl;
     std::cerr << "                                                         double), see examples" << std::endl;
     std::cerr << "                            --discard-out-of-range; discard input records with scalar out of range defined by --min and --max" << std::endl;
-    std::cerr << "                            --min=[<value>]; min value for the scalar range, see examples" << std::endl;
-    std::cerr << "                            --max=[<value>]; max value for the scalar range, see examples" << std::endl;
+    std::cerr << "                            --min=[<value>]; convenience option: min value for the scalar range, see examples" << std::endl;
+    std::cerr << "                            --max=[<value>]; convenience option: max value for the scalar range, see examples" << std::endl;
     std::cerr << "    head" << std::endl;
     std::cerr << "        reads records from first block to stdout, if --num-of-blocks=<num> specified, read more than one blocks" << std::endl;
     std::cerr << "        requires the index from 'index' mode in the inputs" << std::endl;
@@ -567,7 +567,7 @@ int main( int ac, char** av )
                         else
                         {
                             static bool last_in_range = false;
-                            static bool discard_output_out_of_range = !options.exists( "--discard-out-of-range" );
+                            static bool discard_output_out_of_range = options.exists( "--discard-out-of-range" );
                             double v = to_double( p );
                             bool in_range = ( !min || !comma::math::less( v, *min ) ) && ( !max || !comma::math::less( *max, v ) );
                             static bool first_record = true;
diff --git a/csv/test/csv-blocks/group/expected b/csv/test/csv-blocks/group/expected
index 5c144db16..52255b96a 100644
--- a/csv/test/csv-blocks/group/expected
+++ b/csv/test/csv-blocks/group/expected
@@ -68,3 +68,45 @@ group/scalar/gap_and_span[0]/output/line[4]="7,1"
 group/scalar/gap_and_span[0]/output/line[5]="8,1"
 group/scalar/gap_and_span[0]/output/line[6]="9,2"
 group/scalar/gap_and_span[0]/status=0
+
+group/scalar/range[0]/output/line[0]="1,0"
+group/scalar/range[0]/output/line[1]="2,1"
+group/scalar/range[0]/output/line[2]="3,1"
+group/scalar/range[0]/output/line[3]="1,2"
+group/scalar/range[0]/output/line[4]="2,3"
+group/scalar/range[0]/output/line[5]="3,3"
+group/scalar/range[0]/status=0
+group/scalar/range[1]/output/line[0]="2,0"
+group/scalar/range[1]/output/line[1]="3,0"
+group/scalar/range[1]/output/line[2]="2,1"
+group/scalar/range[1]/output/line[3]="3,1"
+group/scalar/range[1]/status=0
+group/scalar/range[2]/output/line[0]="1,0"
+group/scalar/range[2]/output/line[1]="2,1"
+group/scalar/range[2]/output/line[2]="3,1"
+group/scalar/range[2]/output/line[3]="1,2"
+group/scalar/range[2]/output/line[4]="2,3"
+group/scalar/range[2]/output/line[5]="3,3"
+group/scalar/range[2]/status=0
+group/scalar/range[3]/output/line[0]="1,0"
+group/scalar/range[3]/output/line[1]="1,1"
+group/scalar/range[3]/status=0
+group/scalar/range[4]/output/line[0]="1,0"
+group/scalar/range[4]/output/line[1]="2,1"
+group/scalar/range[4]/output/line[2]="3,2"
+group/scalar/range[4]/output/line[3]="1,2"
+group/scalar/range[4]/output/line[4]="2,3"
+group/scalar/range[4]/output/line[5]="3,4"
+group/scalar/range[4]/status=0
+group/scalar/range[5]/output/line[0]="2,0"
+group/scalar/range[5]/output/line[1]="2,1"
+group/scalar/range[5]/status=0
+group/scalar/range[6]/output/line[0]="1,0"
+group/scalar/range[6]/output/line[1]="2,0"
+group/scalar/range[6]/output/line[2]="3,0"
+group/scalar/range[6]/output/line[3]="1,0"
+group/scalar/range[6]/output/line[4]="2,0"
+group/scalar/range[6]/output/line[5]="3,0"
+group/scalar/range[6]/status=0
+group/scalar/range[7]/output=""
+group/scalar/range[7]/status=0
diff --git a/csv/test/csv-blocks/group/input b/csv/test/csv-blocks/group/input
index f4bf3e794..79d9a03c2 100644
--- a/csv/test/csv-blocks/group/input
+++ b/csv/test/csv-blocks/group/input
@@ -13,3 +13,12 @@ group/scalar/span[4]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from s
 group/scalar/span[5]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --span 5"
 
 group/scalar/gap_and_span[0]="( echo 1; echo 2; echo 5; echo 6; echo 7; echo 8; echo 9 ) | csv-blocks group --fields scalar --gap 2 --span 4"
+
+group/scalar/range[0]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5
+group/scalar/range[1]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --discard-out-of-range
+group/scalar/range[2]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 1.5
+group/scalar/range[3]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 1.5 --discard-out-of-range
+group/scalar/range[4]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --max 2.5
+group/scalar/range[5]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --max 2.5 --discard-out-of-range
+group/scalar/range[6]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 0
+group/scalar/range[7]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 0 --discard-out-of-range

From 460a61fbc7f7663481ccff0ca3cb50437b781e73 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 18 Apr 2020 17:13:33 +1000
Subject: [PATCH 0151/1056] csv-repeat: a trivial regression bug fixed

---
 csv/applications/csv-repeat.cpp | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index 20bd972df..b622a6b4b 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -190,12 +190,6 @@ int main( int ac, char** av )
             output_csv.delimiter = csv.delimiter;
             ostream.reset( new comma::csv::output_stream< output_t >( std::cout, output_csv ) );
         }
-        boost::optional< boost::posix_time::time_duration > period;
-        if( options.exists( "--period" ) ) { period = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--period" ) * 1000000 )); }
-        boost::posix_time::time_duration timeout;
-        boost::optional< double > timeout_seconds = options.optional< double >( "--timeout,-t" );
-        if( !period && !timeout_seconds ) { std::cerr << "csv-repeat: please specify either --period, or --timeout, or both" << std::endl; return 1; }
-        timeout = timeout_seconds ? boost::posix_time::microseconds( static_cast<unsigned int>(*timeout_seconds * 1000000 )) : *period;
         if( options.exists( "--output-fields" ) )
         {
             if( !options.exists( "--fields,-f" ) ) { std::cerr << "csv-repeat: --output-fields option requires --fields" << std::endl; return 1; }
@@ -212,6 +206,12 @@ int main( int ac, char** av )
             std::cout << std::endl;
             return 0;
         }
+        boost::optional< boost::posix_time::time_duration > period;
+        if( options.exists( "--period" ) ) { period = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--period" ) * 1000000 )); }
+        boost::posix_time::time_duration timeout;
+        boost::optional< double > timeout_seconds = options.optional< double >( "--timeout,-t" );
+        if( !period && !timeout_seconds ) { std::cerr << "csv-repeat: please specify either --period, or --timeout, or both" << std::endl; return 1; }
+        timeout = timeout_seconds ? boost::posix_time::microseconds( static_cast<unsigned int>(*timeout_seconds * 1000000 )) : *period;
         std::cin.tie( NULL );
         if( options.exists( "--timestamped" ) )
         {

From 062fed947a8b3a02afa616ffe6c2ba5cefd43862 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 22 Apr 2020 10:15:59 +1000
Subject: [PATCH 0152/1056] comma-options-validate: support foo=bar style

---
 .../applications/test/comma-options-validate/expected      | 1 +
 application/applications/test/comma-options-validate/input | 1 +
 application/command_line_options.cpp                       | 7 ++++---
 3 files changed, 6 insertions(+), 3 deletions(-)

diff --git a/application/applications/test/comma-options-validate/expected b/application/applications/test/comma-options-validate/expected
index 5840f904e..8fe979a91 100644
--- a/application/applications/test/comma-options-validate/expected
+++ b/application/applications/test/comma-options-validate/expected
@@ -10,6 +10,7 @@ valid_options/valued[2]/status=0
 valid_options/valued[3]/status=0
 valid_options/valued[4]/status=0
 valid_options/valued[5]/status=0
+valid_options/equals_sign[0]/status=0
 invalid_options/valueless[0]/status=1
 invalid_options/valueless[1]/status=1
 invalid_options/valueless[2]/status=1
diff --git a/application/applications/test/comma-options-validate/input b/application/applications/test/comma-options-validate/input
index 4782830e9..7b3c6a6f9 100644
--- a/application/applications/test/comma-options-validate/input
+++ b/application/applications/test/comma-options-validate/input
@@ -10,6 +10,7 @@ valid_options/valued[2]="echo '--file,-f=<v>' | comma-options-validate 4 -f -5"
 valid_options/valued[3]="echo '--file,-f=<v>' | comma-options-validate 4 -f -5 6"
 valid_options/valued[4]="echo '--file,-f=<v>' | comma-options-validate -f -5 -"
 valid_options/valued[5]="echo '--file,-f=<v>' | comma-options-validate - -f -5"
+valid_options/equals_sign[0]="echo '--file,-f=<v>' | comma-options-validate -f=-5"
 
 invalid_options/valueless[0]="echo '--verbose,-v' | comma-options-validate -v -g"
 invalid_options/valueless[1]="echo '--verbose,-v' | comma-options-validate hello -g -v"
diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index ecbff9b45..42a406177 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -195,9 +195,10 @@ void command_line_options::assert_valid( const std::vector< description >& d, bo
     for( unsigned int i = 0; i < d.size(); ++i ) { for( unsigned int j = 0; j < d[i].names.size(); ++j ) { m[ d[i].names[j] ] = d[i].has_value; } }
     for( unsigned int i = 1; i < argv_.size(); ++i )
     {
-        if( !boost::regex_match( argv_[i], boost::regex( "-.+" ) ) ) { continue; }
-        auto it = m.find( argv_[i] );
-        if( it == m.end() ) { COMMA_THROW( comma::exception, "unknown option " << argv_[i] ); }
+        std::string option_name = comma::split( argv_[i], '=' )[0];
+        if( !boost::regex_match( option_name, boost::regex( "-.+" ) ) ) { continue; }
+        auto it = m.find( option_name );
+        if( it == m.end() ) { COMMA_THROW( comma::exception, "unknown option " << option_name ); }
         if( it->second ) { ++i; }
     }
 }

From 1da57fa1c504a3d9c4c84833d219693616096253 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 30 Apr 2020 19:09:22 +1000
Subject: [PATCH 0153/1056] csv-strings: path-common: first cut implemented;
 more unit tests: todo...

---
 csv/applications/csv-strings.cpp | 289 +++++++++++++++++++------------
 csv/test/csv-strings/expected    |  41 +++++
 csv/test/csv-strings/input       |  27 +++
 3 files changed, 248 insertions(+), 109 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index f1140f820..095c3b24a 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -1,5 +1,3 @@
-// This file is provided in addition to comma and is not an integral
-// part of comma library.
 // Copyright (c) 2018 Vsevolod Vlaskine
 // All rights reserved.
 //
@@ -25,41 +23,15 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-// comma is a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 /// @author vsevolod vlaskine
 
+#include <deque>
 #include <functional>
 #include <iostream>
+
 #include <boost/filesystem.hpp>
 #include <boost/lexical_cast.hpp>
+
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
@@ -68,49 +40,55 @@
 
 static void usage( bool verbose )
 {
-    std::cerr << std::endl;
-    std::cerr << "operations on strings" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    usage: cat input.csv | csv-strings <operation> [<options>] > output.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "operations" << std::endl;
-    std::cerr << "    add" << std::endl;
-    std::cerr << "    path-basename,basename" << std::endl;
-    std::cerr << "    path-dirname,dirname" << std::endl;
-    std::cerr << "    path-real,path-canonical,canonical" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --emplace; perform operation emplace" << std::endl;
-    std::cerr << "    --fields=[<fields>]; will perform operation on any non-empty fields" << std::endl;
-    std::cerr << "                         unless different semantics specified for operation" << std::endl;
-    std::cerr << "                         default: perform operation on the first field" << std::endl;
-    std::cerr << "    --strict; exit on strings on which operation does not make sense" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "add" << std::endl;
-    std::cerr << "    options" << std::endl;
-    std::cerr << "        --prefix=[<prefix>]; add prefix" << std::endl;
-    std::cerr << "        --suffix=[<suffix>]; add suffix" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "path-basename,basename" << std::endl;
-    std::cerr << "    options" << std::endl;
-    std::cerr << "        --head=<depth>; default=0; number of path elements at the beginning of the path to remove" << std::endl;
-    std::cerr << "        --tail=<depth>; default=1; number of path elements at the end of the path to keep" << std::endl;
-    std::cerr << "        --path-delimiter,-p=<delimiter>; default=/" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "path-dirname,dirname" << std::endl;
-    std::cerr << "    options" << std::endl;
-    std::cerr << "        --head=<depth>; default=0; number of path elements at the beginning of the path to keep" << std::endl;
-    std::cerr << "        --tail=<depth>; default=1; number of path elements at the end of the path to remove" << std::endl;
-    std::cerr << "        --path-delimiter,-p=<delimiter>; default=/" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "path-real,path-canonical,canonical" << std::endl;
-    std::cerr << "    options" << std::endl;
-    std::cerr << "        --base=[<path>]; base path, default: current directory" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "csv options:" << std::endl;
-    std::cerr << comma::csv::options::usage( "", verbose ) << std::endl;
-    std::cerr << std::endl;
-    exit( 0 );
+    std::cerr << '\n';
+    std::cerr << "operations on strings\n";
+    std::cerr << '\n';
+    std::cerr << "    usage: cat input.csv | csv-strings <operation> [<options>] > output.csv\n";
+    std::cerr << '\n';
+    std::cerr << "operations\n";
+    std::cerr << "    add\n";
+    std::cerr << "    path-basename,basename\n";
+    std::cerr << "    path-common\n";
+    std::cerr << "    path-dirname,dirname\n";
+    std::cerr << "    path-real,path-canonical\n";
+    std::cerr << '\n';
+    std::cerr << "options\n";
+    std::cerr << "    --emplace; perform operation emplace\n";
+    std::cerr << "    --fields=[<fields>]; will perform operation on any non-empty fields\n";
+    std::cerr << "                         unless different semantics specified for operation\n";
+    std::cerr << "                         default: perform operation on the first field\n";
+    std::cerr << "    --strict; exit on strings on which operation does not make sense\n";
+    std::cerr << '\n';
+    std::cerr << "add\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --prefix=[<prefix>]; add prefix\n";
+    std::cerr << "        --suffix=[<suffix>]; add suffix\n";
+    std::cerr << '\n';
+    std::cerr << "path-basename,basename\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --head=<depth>; default=0; number of path elements at the beginning of the path to remove\n";
+    std::cerr << "        --tail=<depth>; default=1; number of path elements at the end of the path to keep\n";
+    std::cerr << "        --path-delimiter,-p=<delimiter>; default: '/'\n";
+    std::cerr << '\n';
+    std::cerr << "path-common\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --once; output only the common path, do not append or emplace\n";
+    std::cerr << "        --path-delimiter,-p=<delimiter>; default: '/'\n";
+    std::cerr << '\n';
+    std::cerr << "path-dirname,dirname\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --head=<depth>; default=0; number of path elements at the beginning of the path to keep\n";
+    std::cerr << "        --tail=<depth>; default=1; number of path elements at the end of the path to remove\n";
+    std::cerr << "        --path-delimiter,-p=<delimiter>; default: '/'\n";
+    std::cerr << '\n';
+    std::cerr << "path-real,path-canonical\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --base=[<path>]; base path, default: current directory\n";
+    std::cerr << '\n';
+    std::cerr << "csv options\n";
+    std::cerr << comma::csv::options::usage( "", verbose ) << '\n';
+    std::cerr << '\n';
+    exit( EXIT_SUCCESS );
 }
 
 static bool strict;
@@ -122,7 +100,7 @@ template < typename T >
 struct record
 { 
     std::vector< T > values;
-    record( unsigned int n = 0 ): values( n ) {}
+    record( unsigned int n = 0 ) : values( n ) {}
 };
 
 typedef record< std::string > input;
@@ -144,7 +122,8 @@ namespace comma { namespace applications { namespace strings {
 template < typename T >
 static int run( const comma::command_line_options& options )
 {
-    auto v = comma::split( ::csv.fields, ',' );
+    if( ::csv.binary() && !options.exists( "--emplace") ) { std::cerr << "csv-strings: path-" << T::name() << ": binary mode supported only for --emplace; todo, just ask\n"; exit( 1 ); }
+    auto v = comma::split( ::csv.fields, options.value( "--delimiter", ',' ) );
     unsigned int n = 0;
     for( unsigned int i = 0; i < v.size(); ++i )
     {
@@ -155,8 +134,8 @@ static int run( const comma::command_line_options& options )
     ::csv.fields = n == 0 ? std::string( "values[0]" ) : comma::join( v, ',' );
     if( n == 0 ) { ++n; }
     comma::csv::input_stream< input > istream( std::cin, ::csv, input( n ) );
-    std::function< void( const input& p ) > write;
-    auto run_ = [&]()->int
+    std::function< void( const typename T::output_t& p ) > write;
+    auto run_ = [&]() -> int
     {
         T t( options );
         while( istream.ready() || std::cin.good() )
@@ -173,12 +152,11 @@ static int run( const comma::command_line_options& options )
     if( options.exists( "--emplace" ) )
     {
         comma::csv::passed< input > passed( istream, std::cout, ::csv.flush );
-        write = [&]( const input& p ) { passed.write( p ); };
+        write = [&]( const typename T::output_t& p ) { passed.write( p ); };
         return run_();
     }
     comma::csv::options output_csv = ::csv;
     output_csv.fields = "values";
-    if( ::csv.binary() ) { std::cerr << "csv-strings: path-" << T::name() << ": binary mode supported only for --emplace; todo, just ask" << std::endl; exit( 1 ); }
     comma::csv::output_stream< typename T::output_t > ostream( std::cout, output_csv, input( n ) );
     comma::csv::tied< input, typename T::output_t > tied( istream, ostream );
     write = [&]( const typename T::output_t& p ) { tied.append( p ); };
@@ -190,13 +168,13 @@ namespace path {
 struct basename
 {
     typedef input output_t;
-    
+
     unsigned int head;
     unsigned int tail;
     char delimiter;
-    
-    static const char* name() { return "basename"; }
-    
+
+    static constexpr char const* name() { return "basename"; }
+
     basename( const comma::command_line_options& options )
         : head( options.value( "--head", 0 ) )
         , tail( options.value( "--tail", 1 ) )
@@ -204,32 +182,31 @@ struct basename
     {
         options.assert_mutually_exclusive( "--head,--tail" );
     }
-    
-    std::string convert( const std::string& t )
+
+    std::string convert( const std::string& t ) const
     {
         const auto& s = comma::split( t, delimiter );
         if( head > 0 )
         {
             if( s.size() >= head ) { return comma::join( s.begin() + head, s.end(), delimiter ); }
             if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-            return "";
+            return {};
         }
         if( s.size() >= tail ) { return comma::join( s.end() - tail, s.end(), delimiter ); }
         if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-        return "";
+        return {};
     }
 };
 
 struct dirname
 {
     typedef input output_t;
-    
     unsigned int head;
     unsigned int tail;
     char delimiter;
-    
-    static const char* name() { return "dirname"; }
-    
+
+    static constexpr char const* name() { return "dirname"; }
+
     dirname( const comma::command_line_options& options )
         : head( options.value( "--head", 0 ) )
         , tail( options.value( "--tail", 1 ) )
@@ -237,19 +214,19 @@ struct dirname
     {
         options.assert_mutually_exclusive( "--head,--tail" );
     }
-    
-    std::string convert( const std::string& t )
+
+    std::string convert( const std::string& t ) const
     {
         const auto& s = comma::split( t, delimiter );
         if( head > 0 )
         {
             if( s.size() >= head ) { return comma::join( s.begin(), s.begin() + head, delimiter ); }
             if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-            return "";
+            return {};
         }
         if( s.size() >= tail ) { return comma::join( s.begin(), s.end() - tail, delimiter ); }
         if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-        return "";
+        return {};
     }
 };
 
@@ -258,8 +235,8 @@ struct canonical
     typedef input output_t;
     
     boost::filesystem::path base;
-    
-    static const char* name() { return "canonical"; }
+
+    static constexpr char const* name() { return "canonical"; }
     
     canonical( const comma::command_line_options& options )
         : base( options.exists( "--base" )
@@ -268,24 +245,117 @@ struct canonical
     {
         if( ( options.value( "--path-delimiter,-p", '/' ) ) != '/' ) { COMMA_THROW( comma::exception, "path-canonical: expected path delimiter '/'; got: '" << options.value( "--path-delimiter,-p", '/' ) << "'" ); }
     }
-    
-    std::string convert( const std::string& s )
+
+    std::string convert( const std::string& s ) const
     {
         try { return boost::filesystem::canonical( boost::filesystem::path( s ), base ).string(); } catch( ... ) { if( strict ) { throw; } }
         return s;
     }
 };
 
+namespace common {
+
+typedef input output_t;
+
+// todo
+// - fix code so that failing test pass
+// - add more tests, something like
+//   - echo abc; echo ab
+//   - echo ab; echo abc
+//   - echo /a; echo /a/b
+//   - echo /ab; echo /ac
+//   - echo /b; echo /c
+//   - echo /bb; echo /cc
+//   - echo /a; echo /
+//   - echo /; echo /a
+//   - etc
+
+static int run( const comma::command_line_options& options )
+{
+    if( ::csv.binary() ) { std::cerr << "csv-strings: path-common: binary mode: todo, just ask" << std::endl; exit( 1 ); }
+    if( options.exists( "--emplace" ) ) { std::cerr << "csv-strings: path-common: --emplace: todo, just ask" << std::endl; exit( 1 ); } // option name without trailing space, so that the unsupported --emplace is actually rejected
+    auto v = comma::split( ::csv.fields, options.value( "--delimiter", ',' ) );
+    unsigned int n = 0;
+    for( unsigned int i = 0; i < v.size(); ++i )
+    {
+        if( v[i].empty() ) { continue; }
+        v[i] = "values[" + boost::lexical_cast< std::string >( n ) + "]";
+        ++n;
+    }
+    ::csv.fields = n == 0 ? std::string( "values[0]" ) : comma::join( v, ',' );
+    if( n == 0 ) { ++n; }
+    comma::csv::input_stream< input > istream( std::cin, ::csv, input( n ) );
+    std::deque< std::string > inputs;
+    output_t output;
+    char delimiter = options.value( "--path-delimiter,-p", '/' );
+    bool once = options.exists( "--once" );
+    while( istream.ready() || std::cin.good() )
+    {
+        auto p = istream.read();
+        if( !p ) { break; }
+        if( !once ) { inputs.emplace_back( istream.last() ); }
+        for( const auto& s: p->values )
+        {
+            if( s.size() > 1 && s.back() == delimiter ) { std::cerr << "csv-strings: path-common: handling trailing path delimiter not implemented; got;'" << s << "'" << std::endl; exit( 1 ); }
+        }
+        if( output.values.empty() ) { output.values = p->values; continue; }
+        for( std::size_t i = 0; i < p->values.size(); ++i )
+        {
+            if( ( output.values[i][0] == delimiter ) != ( p->values[i][0] == delimiter ) ) { std::cerr << "csv-string: path-common: expected all paths absolute or all relative; got: '" << output.values[i][0] << "' and '" << p->values[i][0] << "'" << std::endl; exit( 1 ); }
+            unsigned int j = 0;
+            for( ; j < output.values[i].size() && j < p->values[i].size() && output.values[i][j] == p->values[i][j]; ++j );
+            if( ( j < output.values[i].size() && output.values[i][j] != delimiter ) || ( j < p->values[i].size() && p->values[i][j] != delimiter ) )
+            {
+                j = output.values[i].substr( 0, j ).find_last_of( delimiter );
+                if( j == std::string::npos ) { j = 0; }
+                else if( j == 0 ) { j = 1; } // root only
+            }
+            output.values[i] = output.values[i].substr( 0, j );
+        }
+    }
+    if( once )
+    {
+        std::string comma;
+        for( auto& value : output.values ) { std::cout << comma << value; comma = ::csv.delimiter; }
+        std::cout << std::endl;
+    }
+    else
+    {
+        for( const auto& input : inputs )
+        {
+            std::cout.write( &input[0], input.size() );
+            if( ::csv.binary() )
+            {
+                COMMA_THROW( comma::exception, "todo" );
+            }
+            else
+            {
+                for( const auto& value: output.values ) { std::cout << ::csv.delimiter << value; }
+                std::cout << std::endl;
+            }
+        }
+    }
+    return 0;
+}
+
+} // namespace common {
+
 } // namespace path {
 
 struct add
 {
     typedef input output_t;
+
     std::string prefix;
     std::string suffix;
-    static const char* name() { return "add"; }
-    add( const comma::command_line_options& options ): prefix( options.value( "--prefix", std::string() ) ), suffix( options.value( "--suffix", std::string() ) ) {}
-    std::string convert( const std::string& t ) { return prefix + t + suffix; }
+
+    static constexpr char const* name() { return "add"; }
+
+    explicit add( const comma::command_line_options& options )
+        : prefix( options.value( "--prefix", std::string() ) )
+        , suffix( options.value( "--suffix", std::string() ) ) {}
+
+    inline std::string convert( const std::string& t ) const { return prefix + t + suffix; }
 };
     
 } } } // namespace comma { namespace applications { namespace strings {
@@ -295,19 +365,20 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        const auto& unnamed = options.unnamed( "--flush,--verbose,-v,--emplace,--strict", "-.*" );
-        if( unnamed.empty() ) { std::cerr << "csv-strings: please specify operation" << std::endl; return 1; }
+        const auto& unnamed = options.unnamed( "--flush,--verbose,-v,--emplace,--strict,--once", "-.*" );
+        if( unnamed.empty() ) { std::cerr << "csv-strings: please specify operation\n"; return 1; }
         std::string operation = unnamed[0];
         strict = options.exists( "--strict" );
         csv = comma::csv::options( options );
         if( operation == "add" ) { return comma::applications::strings::run< comma::applications::strings::add >( options ); }
         if( operation == "path-basename" || operation == "basename" ) { return comma::applications::strings::run< comma::applications::strings::path::basename >( options ); }
         if( operation == "path-dirname" || operation == "dirname" ) { return comma::applications::strings::run< comma::applications::strings::path::dirname >( options ); }
-        if( operation == "path-real" || operation == "path-canonical" || operation == "canonical" ) { return comma::applications::strings::run< comma::applications::strings::path::canonical >( options ); }
-        std::cerr << "csv-strings: expection operation; got: '" << operation << "'" << std::endl;
+        if( operation == "path-real" || operation == "path-canonical" ) { return comma::applications::strings::run< comma::applications::strings::path::canonical >( options ); }
+        if( operation == "path-common" ) { return comma::applications::strings::path::common::run( options ); }
+        std::cerr << "csv-strings: expection operation; got: '" << operation << "'\n";
         return 1;
     }
-    catch( std::exception& ex ) { std::cerr << "csv-strings: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-strings: unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "csv-strings: " << ex.what() << '\n'; }
+    catch( ... ) { std::cerr << "csv-strings: unknown exception\n"; }
     return 1;
 }
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
index 88e6f5b44..f69d8f492 100644
--- a/csv/test/csv-strings/expected
+++ b/csv/test/csv-strings/expected
@@ -24,6 +24,10 @@ basename/emplace[3]/output/line[0]=","
 basename/emplace[3]/output/line[1]=","
 basename/emplace[3]/output/line[2]=","
 
+basename/binary/emplace[0]/output/line[0]="a"
+basename/binary/emplace[0]/output/line[1]="b"
+basename/binary/emplace[0]/output/line[2]="c"
+
 basename/head/append[0]/output/line[0]="a,"
 basename/head/append[0]/output/line[1]="a/b,b"
 basename/head/append[0]/output/line[2]="a/b/c,b/c"
@@ -38,6 +42,10 @@ basename/head/emplace[1]/output/line[0]=""
 basename/head/emplace[1]/output/line[1]=""
 basename/head/emplace[1]/output/line[2]="c"
 
+basename/binary/head/emplace[0]/output/line[0]=""
+basename/binary/head/emplace[0]/output/line[1]="b"
+basename/binary/head/emplace[0]/output/line[2]="b/c"
+
 dirname/tail/append[0]/output/line[0]="a,"
 dirname/tail/append[0]/output/line[1]="a/b,a"
 dirname/tail/append[0]/output/line[2]="a/b/c,a/b"
@@ -64,6 +72,10 @@ dirname/tail/emplace[3]/output/line[0]=","
 dirname/tail/emplace[3]/output/line[1]=","
 dirname/tail/emplace[3]/output/line[2]=","
 
+dirname/binary/tail/emplace[0]/output/line[0]=""
+dirname/binary/tail/emplace[0]/output/line[1]="a"
+dirname/binary/tail/emplace[0]/output/line[2]="a/b"
+
 dirname/head/append[0]/output/line[0]="a,"
 dirname/head/append[0]/output/line[1]="a/b,a"
 dirname/head/append[0]/output/line[2]="a/b/c,a/b"
@@ -90,6 +102,10 @@ dirname/head/emplace[3]/output/line[0]=","
 dirname/head/emplace[3]/output/line[1]=","
 dirname/head/emplace[3]/output/line[2]=","
 
+dirname/binary/head/emplace[0]/output/line[0]=""
+dirname/binary/head/emplace[0]/output/line[1]="a"
+dirname/binary/head/emplace[0]/output/line[2]="a/b"
+
 delimiter[0]/output/line[0]="a.a"
 delimiter[0]/output/line[1]="a.b.a"
 delimiter[0]/output/line[2]="a.b/c.d/e.a"
@@ -137,3 +153,28 @@ fields[5]/output/line[2]="m,,a,,x"
 
 add[0]/output="a,b,xay,xby"
 add[1]/output="xay,xby"
+
+path_common/once[0]/output="a/b"
+path_common/once[1]/output="/a/b"
+path_common/once[2]/output="a"
+path_common/once[3]/output="/a"
+path_common/once[4]/output="a/b"
+path_common/once[5]/output="a"
+path_common/once[6]/output="/a/b/c"
+path_common/once[7]/output="/"
+path_common/once[8]/output=""
+path_common/once[9]/output="a/b,d/e,g/h"
+path_common/once[10]/output="g/h"
+path_common/once[11]/output="a/b,g/h"
+
+path_common/delimiter[0]/output="a-b,g-h"
+
+path_common/fields[0]/output/line[0]="a/b/c,d/e/f,g/h/i,a/b,d/e,g/h"
+path_common/fields[0]/output/line[1]="a/b/d,d/e,g/h/k,a/b,d/e,g/h"
+path_common/fields[0]/output/line[2]="a/b/z,d/e/x,g/h/y,a/b,d/e,g/h"
+path_common/fields[1]/output/line[0]="a/b/c,d/e/f,g/h/i,a/b,g/h"
+path_common/fields[1]/output/line[1]="a/b/d,d/e,g/h/k,a/b,g/h"
+path_common/fields[1]/output/line[2]="a/b/z,d/e/x,g/h/y,a/b,g/h"
+path_common/fields[2]/output/line[0]="a/b/c,d/e/f,g/h/i,g/h"
+path_common/fields[2]/output/line[1]="a/b/d,d/e,g/h/k,g/h"
+path_common/fields[2]/output/line[2]="a/b/z,d/e/x,g/h/y,g/h"
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
index ae544b409..4f4f94ccd 100644
--- a/csv/test/csv-strings/input
+++ b/csv/test/csv-strings/input
@@ -8,12 +8,16 @@ basename/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basenam
 basename/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 3 --emplace"
 basename/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-basename --tail 4 --emplace"
 
+basename/binary/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-basename --emplace --binary s[6] | csv-from-bin s[6]"
+
 basename/head/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 1"
 basename/head/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 2"
 
 basename/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 1 --emplace"
 basename/head/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 2 --emplace"
 
+basename/binary/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-basename --head 1 --emplace --binary s[6] | csv-from-bin s[6]"
+
 dirname/tail/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
 dirname/tail/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2"
 dirname/tail/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 3"
@@ -24,6 +28,8 @@ dirname/tail/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dir
 dirname/tail/emplace[2]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 3 --emplace"
 dirname/tail/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 4 --emplace"
 
+dirname/binary/tail/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-dirname --emplace --binary s[6] | csv-from-bin s[6]"
+
 dirname/head/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
 dirname/head/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2"
 dirname/head/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3"
@@ -34,6 +40,8 @@ dirname/head/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dir
 dirname/head/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3 --emplace"
 dirname/head/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --head 4 --emplace"
 
+dirname/binary/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-dirname --emplace --binary s[6] | csv-from-bin s[6]"
+
 delimiter[0]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=."
 delimiter[1]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=. --emplace"
 delimiter[2]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-dirname --delimiter=."
@@ -55,3 +63,22 @@ fields[5]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-string
 
 add[0]="echo a,b | csv-strings add --prefix x --suffix y --fields a,b"
 add[1]="echo a,b | csv-strings add --prefix x --suffix y --fields a,b --emplace"
+
+path_common/once[0]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --once"
+path_common/once[1]="{ echo /a/b/c; echo /a/b/d; echo /a/b/e; } | csv-strings path-common --once"
+path_common/once[2]="{ echo a; echo a; echo a; } | csv-strings path-common --once"
+path_common/once[3]="{ echo /a; echo /a; echo /a; } | csv-strings path-common --once"
+path_common/once[4]="{ echo a/b; echo a/b; echo a/b; } | csv-strings path-common --once"
+path_common/once[5]="{ echo a; } | csv-strings path-common --once"
+path_common/once[6]="{ echo /a/b/c; } | csv-strings path-common --once"
+path_common/once[7]="{ echo /a/b; echo /c/d; } | csv-strings path-common --once"
+path_common/once[8]="{ echo; echo; } | csv-strings path-common --once"
+path_common/once[9]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c --once"
+path_common/once[10]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields ,,c --once"
+path_common/once[11]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,,c --once"
+
+path_common/delimiter[0]="{ echo a-b-c,d-e-f,g-h-i; echo a-b-d,d-e,g-h-k; echo a-b-z,d-e-x,g-h-y; } | csv-strings path-common --fields a,,c --once --path-delimiter -"
+
+path_common/fields[0]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c"
+path_common/fields[1]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,,c"
+path_common/fields[2]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields ,,c"

From 65ad8f34bae40aeb406189fd3d80d64896a1b701 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Fri, 1 May 2020 13:14:39 +1000
Subject: [PATCH 0154/1056] string: common_front() implemented, unit test
 added; csv-strings: common_front() used

---
 csv/applications/csv-strings.cpp | 18 +------------
 csv/test/csv-strings/expected    | 13 +++-------
 csv/test/csv-strings/input       | 17 +++++-------
 string/string.cpp                | 33 ++++++++++++++++++++++++
 string/string.h                  | 16 +++++++++---
 string/test/string_test.cpp      | 44 ++++++++++++++++++++++++++++++++
 6 files changed, 100 insertions(+), 41 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index 095c3b24a..c115df49d 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -294,24 +294,8 @@ static int run( const comma::command_line_options& options )
         auto p = istream.read();
         if( !p ) { break; }
         if( !once ) { inputs.emplace_back( istream.last() ); }
-        for( const auto& s: p->values )
-        {
-            if( s.size() > 1 && s.back() == delimiter ) { std::cerr << "csv-strings: path-common: handling trailing path delimiter not implemented; got;'" << s << "'" << std::endl; exit( 1 ); }
-        }
         if( output.values.empty() ) { output.values = p->values; continue; }
-        for( std::size_t i = 0; i < p->values.size(); ++i )
-        {
-            if( ( output.values[i][0] == delimiter ) != ( p->values[i][0] == delimiter ) ) { std::cerr << "csv-string: path-common: expected all paths absolute or all relative; got: '" << output.values[i][0] << "' and '" << p->values[i][0] << "'" << std::endl; exit( 1 ); }
-            unsigned int j = 0;
-            for( ; j < output.values[i].size() && j < p->values[i].size() && output.values[i][j] == p->values[i][j]; ++j );
-            if( ( j < output.values[i].size() && output.values[i][j] != delimiter ) || ( j < p->values[i].size() && p->values[i][j] != delimiter ) )
-            {
-                j = output.values[i].substr( 0, j ).find_last_of( delimiter );
-                if( j == std::string::npos ) { j = 0; }
-                else if( j == 0 ) { j = 1; } // root only
-            }
-            output.values[i] = output.values[i].substr( 0, j );
-        }
+        for( std::size_t i = 0; i < p->values.size(); ++i ) { output.values[i] = comma::common_front( output.values[i], p->values[i], delimiter ); }
     }
     if( once )
     {
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
index f69d8f492..ff4c541dc 100644
--- a/csv/test/csv-strings/expected
+++ b/csv/test/csv-strings/expected
@@ -155,17 +155,12 @@ add[0]/output="a,b,xay,xby"
 add[1]/output="xay,xby"
 
 path_common/once[0]/output="a/b"
-path_common/once[1]/output="/a/b"
+path_common/once[1]/output="/"
 path_common/once[2]/output="a"
 path_common/once[3]/output="/a"
-path_common/once[4]/output="a/b"
-path_common/once[5]/output="a"
-path_common/once[6]/output="/a/b/c"
-path_common/once[7]/output="/"
-path_common/once[8]/output=""
-path_common/once[9]/output="a/b,d/e,g/h"
-path_common/once[10]/output="g/h"
-path_common/once[11]/output="a/b,g/h"
+path_common/once[4]/output="a/b,d/e,g/h"
+path_common/once[5]/output="g/h"
+path_common/once[6]/output="a/b,g/h"
 
 path_common/delimiter[0]/output="a-b,g-h"
 
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
index 4f4f94ccd..85bb3e6f6 100644
--- a/csv/test/csv-strings/input
+++ b/csv/test/csv-strings/input
@@ -65,17 +65,12 @@ add[0]="echo a,b | csv-strings add --prefix x --suffix y --fields a,b"
 add[1]="echo a,b | csv-strings add --prefix x --suffix y --fields a,b --emplace"
 
 path_common/once[0]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --once"
-path_common/once[1]="{ echo /a/b/c; echo /a/b/d; echo /a/b/e; } | csv-strings path-common --once"
-path_common/once[2]="{ echo a; echo a; echo a; } | csv-strings path-common --once"
-path_common/once[3]="{ echo /a; echo /a; echo /a; } | csv-strings path-common --once"
-path_common/once[4]="{ echo a/b; echo a/b; echo a/b; } | csv-strings path-common --once"
-path_common/once[5]="{ echo a; } | csv-strings path-common --once"
-path_common/once[6]="{ echo /a/b/c; } | csv-strings path-common --once"
-path_common/once[7]="{ echo /a/b; echo /c/d; } | csv-strings path-common --once"
-path_common/once[8]="{ echo; echo; } | csv-strings path-common --once"
-path_common/once[9]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c --once"
-path_common/once[10]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields ,,c --once"
-path_common/once[11]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,,c --once"
+path_common/once[1]="{ echo /; } | csv-strings path-common --once"
+path_common/once[2]="{ echo a; } | csv-strings path-common --once"
+path_common/once[3]="{ echo /a; } | csv-strings path-common --once"
+path_common/once[4]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c --once"
+path_common/once[5]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields ,,c --once"
+path_common/once[6]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,,c --once"
 
 path_common/delimiter[0]="{ echo a-b-c,d-e-f,g-h-i; echo a-b-d,d-e,g-h-k; echo a-b-z,d-e-x,g-h-y; } | csv-strings path-common --fields a,,c --once --path-delimiter -"
 
diff --git a/string/string.cpp b/string/string.cpp
index c8229b4e4..c12187eec 100644
--- a/string/string.cpp
+++ b/string/string.cpp
@@ -37,6 +37,8 @@
 #include "../base/exception.h"
 #include "string.h"
 
+#include <iostream>
+
 namespace comma {
 
 std::string strip( const std::string& s, char character )
@@ -139,4 +141,35 @@ std::string unescape_and_unquote( const std::string & s, char esc, const char* q
     return v;
 }
 
+std::string common_front( const std::string& s, const std::string& t )
+{
+    std::string::size_type i = 0;
+    for( ; i < s.size() && i < t.size() && s[i] == t[i]; ++i );
+    return s.substr( 0, i );
+}
+
+std::string common_front( const std::string& s, const std::string& t, char delimiter )
+{
+    bool s_abs = !s.empty() && s[0] == delimiter;
+    bool t_abs = !t.empty() && t[0] == delimiter;
+    if( s_abs != t_abs ) { COMMA_THROW( comma::exception, "expected both paths absolute or both relative; got '" << s << "' and '" << t << "'" ); }
+    std::string::size_type i = 0;
+    std::string::size_type d = 0;
+    for( ; i < s.size() && i < t.size() && s[i] == t[i]; ++i );
+    if( i < s.size() && s[i] != delimiter )
+    {
+        i = s.find_last_of( delimiter, i );
+        if( i == 0 ) { i = 1; } // root only
+    }
+    else if( i < t.size() && t[i] != delimiter )
+    {
+        i = t.find_last_of( delimiter, i );
+        if( i == 0 ) { i = 1; } // root only
+    }
+    if( i == std::string::npos ) { i = 0; }
+    else if( i == s.size() && s.size() > 1 && s.back() == delimiter ) { --i; }
+    return s.substr( 0, i );
+}
+
+
 } // namespace comma {
diff --git a/string/string.h b/string/string.h
index 2d3e2efd1..a9b68392d 100644
--- a/string/string.h
+++ b/string/string.h
@@ -47,16 +47,24 @@ std::string strip( const std::string& s, const char* characters = " \t\r\n" );
 /// strip given character from the beginning and end
 std::string strip( const std::string& s, char character );
 
-// Escape given character and escape characters by preceding them with escape charcter.
+// escape given character and escape characters by preceding them with escape charcter.
 std::string escape( const std::string & s, char character = '\'', char esc = '\\' );
-// Escape any of the given characters and escape character by preceding them with escape character
+// escape any of the given characters and escape character by preceding them with escape character
 std::string escape( const std::string & s, const char* characters, char esc = '\\' );
 
-// Escape given character and escape characters by preceding them with escape charcter.
+// escape given character and escape characters by preceding them with escape charcter.
 std::string unescape( const std::string & s, char character = '\'', char esc = '\\' );
-// Escape any of the given characters and escape character by preceding them with escape character
+// escape any of the given characters and escape character by preceding them with escape character
 std::string unescape( const std::string & s, const char* characters, char esc = '\\' );
 
+/// return common initial part of two strings
+/// e.g. for abc and abd return ab; for abc and def return empty string
+std::string common_front( const std::string& s, const std::string& t );
+
+/// return common initial part of two strings as xpaths with a delimiter (probably should be in xpath)
+/// e.g. with delimiter '/': for a/b and a/c return a; for ab and abc return empty string
+std::string common_front( const std::string& s, const std::string& t, char delimiter ); 
+
 /// join array elements into a string with given delimiter
 template < typename A >
 std::string join( const A& a, std::size_t size, char delimiter );
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index 8b9e75059..fe58e918d 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -350,6 +350,50 @@ TEST( string, strip )
     EXPECT_EQ( strip( ";,;abc;;,", ";," ), "abc" );
 }
 
+TEST( string, common_head )
+{
+    EXPECT_EQ( "", common_front( "", "" ) );
+    EXPECT_EQ( "", common_front( "", "a" ) );
+    EXPECT_EQ( "", common_front( "", "ab" ) );
+    EXPECT_EQ( "", common_front( "", "abc" ) );
+    EXPECT_EQ( "", common_front( "a", "" ) );
+    EXPECT_EQ( "", common_front( "ab", "" ) );
+    EXPECT_EQ( "", common_front( "abc", "" ) );
+    EXPECT_EQ( "", common_front( "a", "b" ) );
+    EXPECT_EQ( "", common_front( "abc", "def" ) );
+    EXPECT_EQ( "a", common_front( "ab", "ac" ) );
+    EXPECT_EQ( "ab", common_front( "abc", "abd" ) );
+}
+
+TEST( string, common_head_delimiter )
+{
+    EXPECT_EQ( common_front( "", "", '/' ), "" );
+    EXPECT_EQ( common_front( "a", "b", '/' ), "" );
+    EXPECT_EQ( common_front( "ab", "cd", '/' ), "" );
+    EXPECT_EQ( common_front( "ab", "abc", '/' ), "" );
+    EXPECT_EQ( common_front( "/", "/", '/' ), "/" );
+    EXPECT_EQ( common_front( "/a", "/b", '/' ), "/" );
+    EXPECT_EQ( common_front( "/ab", "/cd", '/' ), "/" );
+    EXPECT_EQ( common_front( "/ab", "/abc", '/' ), "/" );
+    EXPECT_EQ( common_front( "/ab/", "/abc", '/' ), "/" );
+    EXPECT_EQ( common_front( "/ab/", "/abc/", '/' ), "/" );
+    EXPECT_EQ( common_front( "a/b", "a/c", '/' ), "a" );
+    EXPECT_EQ( common_front( "a/b/", "a/c", '/' ), "a" );
+    EXPECT_EQ( common_front( "a/b", "a/c/", '/' ), "a" );
+    EXPECT_EQ( common_front( "a/b/", "a/c/", '/' ), "a" );
+    EXPECT_EQ( common_front( "/a/b", "/a/c", '/' ), "/a" );
+    EXPECT_EQ( common_front( "ab/cd", "ab/cd", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/", "ab/cd/", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef", "ab/cd/xy", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/", "ab/cd", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd", "ab/cd/", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef", "ab/cd", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd", "ab/cd/ef", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef/", "ab/cd", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef/", "ab/cd/", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef", "ab/cd/", '/' ), "ab/cd" );
+}
+
 } // namespace comma {
 
 int main( int argc, char* argv[] )

From ccd7163ea85cb9146a8c6a206b716ae287360037 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Fri, 1 May 2020 13:23:58 +1000
Subject: [PATCH 0155/1056] csv-eval: installation moved from cmake to setup.py

---
 python/comma/CMakeLists.txt                  | 11 +++--------
 python/comma/application/CMakeLists.txt      |  0
 python/comma/csv/CMakeLists.txt              |  1 -
 python/comma/csv/applications/CMakeLists.txt |  1 -
 python/comma/io/CMakeLists.txt               |  0
 python/comma/util/CMakeLists.txt             |  0
 python/setup.py                              |  1 +
 7 files changed, 4 insertions(+), 10 deletions(-)
 delete mode 100644 python/comma/application/CMakeLists.txt
 delete mode 100644 python/comma/csv/CMakeLists.txt
 delete mode 100644 python/comma/csv/applications/CMakeLists.txt
 delete mode 100644 python/comma/io/CMakeLists.txt
 delete mode 100644 python/comma/util/CMakeLists.txt

diff --git a/python/comma/CMakeLists.txt b/python/comma/CMakeLists.txt
index 22a8a1305..5df8ec9cc 100644
--- a/python/comma/CMakeLists.txt
+++ b/python/comma/CMakeLists.txt
@@ -1,8 +1,3 @@
-ADD_SUBDIRECTORY( application )
-ADD_SUBDIRECTORY( csv )
-ADD_SUBDIRECTORY( io )
-ADD_SUBDIRECTORY( util )
-
-IF( BUILD_CPP_PYTHON_BINDINGS )
-    ADD_SUBDIRECTORY( cpp_bindings )
-ENDIF( BUILD_CPP_PYTHON_BINDINGS )
+if( BUILD_CPP_PYTHON_BINDINGS )
+    add_subdirectory( cpp_bindings )
+endif( BUILD_CPP_PYTHON_BINDINGS )
diff --git a/python/comma/application/CMakeLists.txt b/python/comma/application/CMakeLists.txt
deleted file mode 100644
index e69de29bb..000000000
diff --git a/python/comma/csv/CMakeLists.txt b/python/comma/csv/CMakeLists.txt
deleted file mode 100644
index de33d8faa..000000000
--- a/python/comma/csv/CMakeLists.txt
+++ /dev/null
@@ -1 +0,0 @@
-ADD_SUBDIRECTORY( applications )
diff --git a/python/comma/csv/applications/CMakeLists.txt b/python/comma/csv/applications/CMakeLists.txt
deleted file mode 100644
index ef8b8b8e9..000000000
--- a/python/comma/csv/applications/CMakeLists.txt
+++ /dev/null
@@ -1 +0,0 @@
-install( PROGRAMS csv-eval DESTINATION ${comma_INSTALL_BIN_DIR} )
diff --git a/python/comma/io/CMakeLists.txt b/python/comma/io/CMakeLists.txt
deleted file mode 100644
index e69de29bb..000000000
diff --git a/python/comma/util/CMakeLists.txt b/python/comma/util/CMakeLists.txt
deleted file mode 100644
index e69de29bb..000000000
diff --git a/python/setup.py b/python/setup.py
index 9f31132c5..05c56d2a5 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -8,6 +8,7 @@
         description         = 'comma python utilties',
         url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
+        scripts             =["comma/csv/applications/csv-eval"],
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma.cpp_bindings': 'comma/cpp_bindings' },
         package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] }

From 691ee0ee9d123426612bc150b3bef3cbc5560d56 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 6 May 2020 18:28:42 +1000
Subject: [PATCH 0156/1056] string: trivial compilation warning fixed

---
 string/string.cpp | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/string/string.cpp b/string/string.cpp
index c12187eec..1043d3265 100644
--- a/string/string.cpp
+++ b/string/string.cpp
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2019 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -32,8 +33,6 @@
 /// @author mathew hounsell
 
 #include <boost/optional.hpp>
-
-// Don't use <> foc comma as that requires the code to be installed first.
 #include "../base/exception.h"
 #include "string.h"
 
@@ -154,7 +153,6 @@ std::string common_front( const std::string& s, const std::string& t, char delim
     bool t_abs = !t.empty() && t[0] == delimiter;
     if( s_abs != t_abs ) { COMMA_THROW( comma::exception, "expected both paths absolute or both relative; got '" << s << "' and '" << t << "'" ); }
     std::string::size_type i = 0;
-    std::string::size_type d = 0;
     for( ; i < s.size() && i < t.size() && s[i] == t[i]; ++i );
     if( i < s.size() && s[i] != delimiter )
     {

From a81044b3ab58dbb9773157d7791920f823c1711e Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 7 May 2020 14:24:16 +1000
Subject: [PATCH 0157/1056] csv-strings: path-common: --dirname-on-...: in
 progress...

---
 csv/applications/csv-strings.cpp | 32 +++++++++++++++++---------------
 1 file changed, 17 insertions(+), 15 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index c115df49d..d2e1474eb 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -73,6 +73,10 @@ static void usage( bool verbose )
     std::cerr << "path-common\n";
     std::cerr << "    options\n";
     std::cerr << "        --once; output only the common path, do not append or emplace\n";
+    std::cerr << "        --dirname-on-single-record; if only one input record, output its 'dirname'; e.g: on a single\n";
+    std::cerr << "                                    input record 'a/b/c' output 'a/b'\n";
+    std::cerr << "        --dirname-on-full-match; if there is an input record that fully matches the common path\n";
+    std::cerr << "                                 output its 'dirname'; e.g: on 'a/b/c' and 'a/b/c/d' output 'a/b'\n";
     std::cerr << "        --path-delimiter,-p=<delimiter>; default: '/'\n";
     std::cerr << '\n';
     std::cerr << "path-dirname,dirname\n";
@@ -257,19 +261,6 @@ namespace common {
 
 typedef input output_t;
 
-// todo
-// - fix code so that failing test pass
-// - add more tests, something like
-//   - echo abc; echo ab
-//   - echo ab; echo abc
-//   - echo /a; echo /a/b
-//   - echo /ab; echo /ac
-//   - echo /b; echo /c
-//   - echo /bb; echo /cc
-//   - echo /a; echo /
-//   - echo /; echo /a
-//   - etc
-
 static int run( const comma::command_line_options& options )
 {
     if( ::csv.binary() ) { std::cerr << "csv-strings: path-common: binary mode: todo, just ask" << std::endl; exit( 1 ); }
@@ -289,13 +280,24 @@ static int run( const comma::command_line_options& options )
     output_t output;
     char delimiter = options.value( "--path-delimiter,-p", '/' );
     bool once = options.exists( "--once" );
+    bool dirname_on_single_record = options.exists( "--dirname-on-single-record" );
+    bool dirname_on_full_match = options.exists( "--dirname-on-full-match" );
+    if( dirname_on_full_match || dirname_on_single_record ) { std::cerr << "csv-strings: path-common: --dirname-on-...: todo" << std::endl; return 1; }
+    std::vector< char > full_match( output.values.size(), true );
+    unsigned int count = 0;
     while( istream.ready() || std::cin.good() )
     {
         auto p = istream.read();
         if( !p ) { break; }
         if( !once ) { inputs.emplace_back( istream.last() ); }
         if( output.values.empty() ) { output.values = p->values; continue; }
-        for( std::size_t i = 0; i < p->values.size(); ++i ) { output.values[i] = comma::common_front( output.values[i], p->values[i], delimiter ); }
+        for( std::size_t i = 0; i < p->values.size(); ++i )
+        {
+            const std::string& common = comma::common_front( output.values[i], p->values[i], delimiter );
+            if( dirname_on_single_record || dirname_on_full_match ) { full_match[i] = ( full_match[i] && output.values[i] == common ) || ( !full_match[i] && p->values[i] == common ); }
+            output.values[i] = common;
+        }
+        ++count;
     }
     if( once )
     {
@@ -349,7 +351,7 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        const auto& unnamed = options.unnamed( "--flush,--verbose,-v,--emplace,--strict,--once", "-.*" );
+        const auto& unnamed = options.unnamed( "--flush,--verbose,-v,--emplace,--strict,--once,--dirname-on-single-record,--dirname-on-full-match", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-strings: please specify operation\n"; return 1; }
         std::string operation = unnamed[0];
         strict = options.exists( "--strict" );

From 5532b2547fe0dab0caf030f166a06c9fd245110e Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Mon, 11 May 2020 16:54:24 +1000
Subject: [PATCH 0158/1056] csv-string: path-common: --dirname-on-* implemented
 (Kent Hu), reviewed and slightly refactored; todo: fix bug on root-only path
 in path-common and path-dirname, add regression tests

---
 csv/applications/csv-strings.cpp | 51 +++++++++++++++++++++-----------
 csv/test/csv-strings/expected    | 30 +++++++++++++++++++
 csv/test/csv-strings/input       | 20 +++++++++++++
 3 files changed, 83 insertions(+), 18 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index d2e1474eb..a76b63cdb 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -261,6 +261,14 @@ namespace common {
 
 typedef input output_t;
 
+// todo
+// - path-common --dirname-on-single-record
+//   - test case: expected / on ( echo /a ) | csv-strings path-common --dirname-on-single-record --field x
+//   - fix
+// - path-dirname
+//   - test case: expected / on ( echo /a ) | csv-strings path-common --dirname-on-single-record --field x
+//   - fix
+
 static int run( const comma::command_line_options& options )
 {
     if( ::csv.binary() ) { std::cerr << "csv-strings: path-common: binary mode: todo, just ask" << std::endl; exit( 1 ); }
@@ -282,8 +290,7 @@ static int run( const comma::command_line_options& options )
     bool once = options.exists( "--once" );
     bool dirname_on_single_record = options.exists( "--dirname-on-single-record" );
     bool dirname_on_full_match = options.exists( "--dirname-on-full-match" );
-    if( dirname_on_full_match || dirname_on_single_record ) { std::cerr << "csv-strings: path-common: --dirname-on-...: todo" << std::endl; return 1; }
-    std::vector< char > full_match( output.values.size(), true );
+    std::vector< char > full_match( n, true );
     unsigned int count = 0;
     while( istream.ready() || std::cin.good() )
     {
@@ -294,39 +301,47 @@ static int run( const comma::command_line_options& options )
         for( std::size_t i = 0; i < p->values.size(); ++i )
         {
             const std::string& common = comma::common_front( output.values[i], p->values[i], delimiter );
-            if( dirname_on_single_record || dirname_on_full_match ) { full_match[i] = ( full_match[i] && output.values[i] == common ) || ( !full_match[i] && p->values[i] == common ); }
+            if( dirname_on_full_match ) { full_match[i] = ( full_match[i] && output.values[i] == common ) || ( !full_match[i] && p->values[i] == common ); }
             output.values[i] = common;
         }
         ++count;
     }
+    if( dirname_on_full_match || ( dirname_on_single_record && count < 2 ) )
+    {
+        for( unsigned int i = 0; i < output.values.size(); ++i )
+        {
+            if( !full_match[i] ) { continue; }
+            const auto& s = comma::split( output.values[i], delimiter );
+            output.values[i] = comma::join( s.begin(), s.end() - 1, delimiter );
+        }
+    }
     if( once )
     {
-        std::string comma;
-        for( auto& value : output.values ) { std::cout << comma << value; comma = ::csv.delimiter; }
-        std::cout << std::endl;
+        if( ::csv.binary() ) { COMMA_THROW( comma::exception, "todo" ); }
+        else
+        {
+            std::string comma;
+            for( std::size_t i = 0; i < output.values.size(); ++i )
+            {
+                std::cout << comma << output.values[i];
+                comma = ::csv.delimiter;
+            }
+            std::cout << std::endl;
+        }
     }
     else
     {
         for( const auto& input : inputs )
         {
             std::cout.write( &input[0], input.size() );
-            if( ::csv.binary() )
-            {
-                COMMA_THROW( comma::exception, "todo" );
-            }
-            else
-            {
-                for( const auto& value: output.values ) { std::cout << ::csv.delimiter << value; }
-                std::cout << std::endl;
-            }
+            for( std::size_t i = 0; i < output.values.size(); ++i ) { std::cout << ::csv.delimiter << output.values[i]; }
+            std::cout << std::endl;
         }
     }
     return 0;
 }
 
-} // namespace common {
-
-} // namespace path {
+} } // namespace common { namespace path {
 
 struct add
 {
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
index ff4c541dc..60d56360a 100644
--- a/csv/test/csv-strings/expected
+++ b/csv/test/csv-strings/expected
@@ -161,6 +161,7 @@ path_common/once[3]/output="/a"
 path_common/once[4]/output="a/b,d/e,g/h"
 path_common/once[5]/output="g/h"
 path_common/once[6]/output="a/b,g/h"
+path_common/once[7]/output="abc"
 
 path_common/delimiter[0]/output="a-b,g-h"
 
@@ -173,3 +174,32 @@ path_common/fields[1]/output/line[2]="a/b/z,d/e/x,g/h/y,a/b,g/h"
 path_common/fields[2]/output/line[0]="a/b/c,d/e/f,g/h/i,g/h"
 path_common/fields[2]/output/line[1]="a/b/d,d/e,g/h/k,g/h"
 path_common/fields[2]/output/line[2]="a/b/z,d/e/x,g/h/y,g/h"
+
+path_common/dirname_on_single_record[0]/output="a/b"
+path_common/dirname_on_single_record[1]/output="abc/def"
+path_common/dirname_on_single_record[2]/output="a/b"
+path_common/dirname_on_single_record[3]/output="a/b,d/e,g/h"
+path_common/dirname_on_single_record[4]/output="a/b,d/e,g/h"
+path_common/dirname_on_single_record[5]/output="abc,abc/abc,abc"
+path_common/dirname_on_single_record[6]/output=""
+path_common/dirname_on_single_record[7]/output/line[0]="a/b/c,d/e/f,g/h/i,a/b,d/e,g/h"
+path_common/dirname_on_single_record[7]/output/line[1]="a/b/d,d/e,g/h/k,a/b,d/e,g/h"
+path_common/dirname_on_single_record[7]/output/line[2]="a/b/z,d/e/x,g/h/y,a/b,d/e,g/h"
+path_common/dirname_on_single_record[8]/output/line[0]="a/b/c,a/b"
+path_common/dirname_on_single_record[8]/output/line[1]="a/b/d,a/b"
+path_common/dirname_on_single_record[8]/output/line[2]="a/b/z,a/b"
+
+path_common/dirname_on_full_match[0]/output="a/b"
+path_common/dirname_on_full_match[1]/output="abc/def"
+path_common/dirname_on_full_match[2]/output="a"
+path_common/dirname_on_full_match[3]/output="a/b"
+path_common/dirname_on_full_match[4]/output="a/b,d/e,g/h"
+path_common/dirname_on_full_match[5]/output=",abc,"
+path_common/dirname_on_full_match[6]/output/line[0]="abc/def/ghi,"
+path_common/dirname_on_full_match[6]/output/line[1]="abc/deg/hij,"
+path_common/dirname_on_full_match[6]/output/line[2]="abc/dgh/ijk,"
+path_common/dirname_on_full_match[6]/output/line[3]="abc,"
+path_common/dirname_on_full_match[7]/output/line[0]="abc/def/ghi,abc/abc/abc,abc/def/abc,,abc,"
+path_common/dirname_on_full_match[7]/output/line[1]="abc/deg/hij,abc/abc/abb,abc/def/hij,,abc,"
+path_common/dirname_on_full_match[7]/output/line[2]="abc/dgh/ijk,abc/abc/xyz,abc/d/ijk,,abc,"
+path_common/dirname_on_full_match[7]/output/line[3]="abc,abc/abc,abc,,abc,"
\ No newline at end of file
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
index 85bb3e6f6..23d376064 100644
--- a/csv/test/csv-strings/input
+++ b/csv/test/csv-strings/input
@@ -71,9 +71,29 @@ path_common/once[3]="{ echo /a; } | csv-strings path-common --once"
 path_common/once[4]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c --once"
 path_common/once[5]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields ,,c --once"
 path_common/once[6]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,,c --once"
+path_common/once[7]="{ echo abc/def/ghi; echo abc/deg/hij; echo abc/dgh/ijk; } | csv-strings path-common --once"
 
 path_common/delimiter[0]="{ echo a-b-c,d-e-f,g-h-i; echo a-b-d,d-e,g-h-k; echo a-b-z,d-e-x,g-h-y; } | csv-strings path-common --fields a,,c --once --path-delimiter -"
 
 path_common/fields[0]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c"
 path_common/fields[1]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,,c"
 path_common/fields[2]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields ,,c"
+
+path_common/dirname_on_single_record[0]="{ echo a/b/c; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname_on_single_record[1]="{ echo abc/def/ghi; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname_on_single_record[2]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname_on_single_record[3]="{ echo a/b/c,d/e/f,g/h/i; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
+path_common/dirname_on_single_record[4]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e/g,g/h/j; echo a/b/x,d/e/y,g/h/z; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
+path_common/dirname_on_single_record[5]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
+path_common/dirname_on_single_record[6]="{ echo abc; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname_on_single_record[7]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c --dirname-on-single-record"
+path_common/dirname_on_single_record[8]="{ echo a/b/c; echo a/b/d; echo a/b/z; } | csv-strings path-common --dirname-on-single-record"
+
+path_common/dirname_on_full_match[0]="{ echo a/b/c; } | csv-strings path-common --dirname-on-full-match --once"
+path_common/dirname_on_full_match[1]="{ echo abc/def/ghi; } | csv-strings path-common --dirname-on-full-match --once"
+path_common/dirname_on_full_match[2]="{ echo a/b; echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-full-match --once"
+path_common/dirname_on_full_match[3]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-full-match --once"
+path_common/dirname_on_full_match[4]="{ echo a/b/c,d/e/f,g/h/i; } | csv-strings path-common --dirname-on-full-match --once --fields a,b,c"
+path_common/dirname_on_full_match[5]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; echo abc,abc/abc,abc; } | csv-strings path-common --dirname-on-full-match --once --fields a,b,c"
+path_common/dirname_on_full_match[6]="{ echo abc/def/ghi; echo abc/deg/hij; echo abc/dgh/ijk; echo abc; } | csv-strings path-common --dirname-on-full-match"
+path_common/dirname_on_full_match[7]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; echo abc,abc/abc,abc; } | csv-strings path-common --dirname-on-full-match --fields a,b,c"

From 0bc376ee47cf846b02acbebe4aa984675def9d8b Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 12 May 2020 12:49:15 +1000
Subject: [PATCH 0159/1056] csv-strings: dirname: absolute path handling added;
 --head, --tail, basename: to fix

---
 csv/applications/csv-strings.cpp | 36 ++++++++++-----
 csv/test/csv-strings/expected    | 75 +++++++++++++++++++++-----------
 csv/test/csv-strings/input       | 47 ++++++++++++--------
 3 files changed, 105 insertions(+), 53 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index a76b63cdb..abdb3359a 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -221,14 +221,25 @@ struct dirname
 
     std::string convert( const std::string& t ) const
     {
+        bool is_absolute = t[0] == delimiter;
         const auto& s = comma::split( t, delimiter );
         if( head > 0 )
         {
-            if( s.size() >= head ) { return comma::join( s.begin(), s.begin() + head, delimiter ); }
+            if( s.size() >= head )
+            {
+                auto o = comma::join( s.begin(), s.begin() + head, delimiter );
+                if( is_absolute && o.empty() ) { o = std::string( 1, delimiter ); }
+                return o;
+            }
             if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
             return {};
         }
-        if( s.size() >= tail ) { return comma::join( s.begin(), s.end() - tail, delimiter ); }
+        if( s.size() >= tail )
+        {
+            auto o = comma::join( s.begin(), s.end() - tail, delimiter );
+            if( is_absolute && o.empty() ) { o = std::string( 1, delimiter ); }
+            return o;
+        }
         if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
         return {};
     }
@@ -261,14 +272,6 @@ namespace common {
 
 typedef input output_t;
 
-// todo
-// - path-common --dirname-on-single-record
-//   - test case: expected / on ( echo /a ) | csv-strings path-common --dirname-on-single-record --field x
-//   - fix
-// - path-dirname
-//   - test case: expected / on ( echo /a ) | csv-strings path-common --dirname-on-single-record --field x
-//   - fix
-
 static int run( const comma::command_line_options& options )
 {
     if( ::csv.binary() ) { std::cerr << "csv-strings: path-common: binary mode: todo, just ask" << std::endl; exit( 1 ); }
@@ -311,8 +314,10 @@ static int run( const comma::command_line_options& options )
         for( unsigned int i = 0; i < output.values.size(); ++i )
         {
             if( !full_match[i] ) { continue; }
+            bool is_absolute = output.values[i][0] == delimiter;
             const auto& s = comma::split( output.values[i], delimiter );
             output.values[i] = comma::join( s.begin(), s.end() - 1, delimiter );
+            if ( is_absolute && output.values[i].empty() ) { output.values[i] = std::string( 1, delimiter ); }
         }
     }
     if( once )
@@ -356,11 +361,20 @@ struct add
         : prefix( options.value( "--prefix", std::string() ) )
         , suffix( options.value( "--suffix", std::string() ) ) {}
 
-    inline std::string convert( const std::string& t ) const { return prefix + t + suffix; }
+    std::string convert( const std::string& t ) const { return prefix + t + suffix; }
 };
     
 } } } // namespace comma { namespace applications { namespace strings {
 
+// todo
+// - basename
+//   - fix absolute path behaviour
+//   - fix --head; add tests
+//   - fix --tail; add tests
+// - dirname
+//   - fix --head; add tests
+//   - fix --tail; add tests
+
 int main( int ac, char** av )
 {
     try
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
index 60d56360a..2ae3fc800 100644
--- a/csv/test/csv-strings/expected
+++ b/csv/test/csv-strings/expected
@@ -46,6 +46,21 @@ basename/binary/head/emplace[0]/output/line[0]=""
 basename/binary/head/emplace[0]/output/line[1]="b"
 basename/binary/head/emplace[0]/output/line[2]="b/c"
 
+dirname/append[0]/output/line[0]="/,/"
+dirname/append[0]/output/line[1]="/a,/"
+dirname/append[0]/output/line[2]="/a/,/a"
+dirname/append[0]/output/line[3]="/a/b,/a"
+dirname/append[0]/output/line[4]="/a/b/c,/a/b"
+dirname/append[0]/output/line[5]="/aaa/bbb,/aaa"
+dirname/append[0]/output/line[6]="/aaa/bbb/ccc,/aaa/bbb"
+
+dirname/append[1]/output/line[0]="a,"
+dirname/append[1]/output/line[1]="a/,a"
+dirname/append[1]/output/line[2]="a/b,a"
+dirname/append[1]/output/line[3]="a/b/c,a/b"
+dirname/append[1]/output/line[4]="aaa/bbb,aaa"
+dirname/append[1]/output/line[5]="aaa/bbb/ccc,aaa/bbb"
+
 dirname/tail/append[0]/output/line[0]="a,"
 dirname/tail/append[0]/output/line[1]="a/b,a"
 dirname/tail/append[0]/output/line[2]="a/b/c,a/b"
@@ -175,31 +190,41 @@ path_common/fields[2]/output/line[0]="a/b/c,d/e/f,g/h/i,g/h"
 path_common/fields[2]/output/line[1]="a/b/d,d/e,g/h/k,g/h"
 path_common/fields[2]/output/line[2]="a/b/z,d/e/x,g/h/y,g/h"
 
+path_common/dirname[0]/output="/"
+path_common/dirname[1]/output="/"
+path_common/dirname[2]/output="/"
+path_common/dirname[3]/output="/aaa"
+path_common/dirname[4]/output="/aaa"
+path_common/dirname[5]/output="/aaa/bbb"
+path_common/dirname[6]/output=""
+path_common/dirname[7]/output=""
+path_common/dirname[8]/output="aaa"
+path_common/dirname[9]/output="aaa"
+path_common/dirname[10]/output="aaa/bbb"
+
 path_common/dirname_on_single_record[0]/output="a/b"
-path_common/dirname_on_single_record[1]/output="abc/def"
-path_common/dirname_on_single_record[2]/output="a/b"
-path_common/dirname_on_single_record[3]/output="a/b,d/e,g/h"
-path_common/dirname_on_single_record[4]/output="a/b,d/e,g/h"
-path_common/dirname_on_single_record[5]/output="abc,abc/abc,abc"
-path_common/dirname_on_single_record[6]/output=""
-path_common/dirname_on_single_record[7]/output/line[0]="a/b/c,d/e/f,g/h/i,a/b,d/e,g/h"
-path_common/dirname_on_single_record[7]/output/line[1]="a/b/d,d/e,g/h/k,a/b,d/e,g/h"
-path_common/dirname_on_single_record[7]/output/line[2]="a/b/z,d/e/x,g/h/y,a/b,d/e,g/h"
-path_common/dirname_on_single_record[8]/output/line[0]="a/b/c,a/b"
-path_common/dirname_on_single_record[8]/output/line[1]="a/b/d,a/b"
-path_common/dirname_on_single_record[8]/output/line[2]="a/b/z,a/b"
+path_common/dirname_on_single_record[1]/output="a/b"
+
+path_common/dirname_on_single_record[2]/fields[0]/output="a/b,d/e,g/h"
+path_common/dirname_on_single_record[2]/fields[1]/output="a/b,d/e,g/h"
+
+path_common/dirname_on_single_record[2]/append[0]/output/line[0]="a/b/c,a/b"
+path_common/dirname_on_single_record[2]/append[0]/output/line[1]="a/b/d,a/b"
+path_common/dirname_on_single_record[2]/append[0]/output/line[2]="a/b/z,a/b"
+path_common/dirname_on_single_record[2]/append[1]/output/line[0]="a/b/c,d/e/f,g/h/i,a/b,d/e,g/h"
+path_common/dirname_on_single_record[2]/append[1]/output/line[1]="a/b/d,d/e,g/h/k,a/b,d/e,g/h"
+path_common/dirname_on_single_record[2]/append[1]/output/line[2]="a/b/z,d/e/x,g/h/y,a/b,d/e,g/h"
 
 path_common/dirname_on_full_match[0]/output="a/b"
-path_common/dirname_on_full_match[1]/output="abc/def"
-path_common/dirname_on_full_match[2]/output="a"
-path_common/dirname_on_full_match[3]/output="a/b"
-path_common/dirname_on_full_match[4]/output="a/b,d/e,g/h"
-path_common/dirname_on_full_match[5]/output=",abc,"
-path_common/dirname_on_full_match[6]/output/line[0]="abc/def/ghi,"
-path_common/dirname_on_full_match[6]/output/line[1]="abc/deg/hij,"
-path_common/dirname_on_full_match[6]/output/line[2]="abc/dgh/ijk,"
-path_common/dirname_on_full_match[6]/output/line[3]="abc,"
-path_common/dirname_on_full_match[7]/output/line[0]="abc/def/ghi,abc/abc/abc,abc/def/abc,,abc,"
-path_common/dirname_on_full_match[7]/output/line[1]="abc/deg/hij,abc/abc/abb,abc/def/hij,,abc,"
-path_common/dirname_on_full_match[7]/output/line[2]="abc/dgh/ijk,abc/abc/xyz,abc/d/ijk,,abc,"
-path_common/dirname_on_full_match[7]/output/line[3]="abc,abc/abc,abc,,abc,"
\ No newline at end of file
+path_common/dirname_on_full_match[1]/output="a"
+
+path_common/dirname_on_full_match[2]/fields[0]/output=",abc,"
+
+path_common/dirname_on_full_match[3]/append[0]/output/line[0]="abc/def/ghi,"
+path_common/dirname_on_full_match[3]/append[0]/output/line[1]="abc/deg/hij,"
+path_common/dirname_on_full_match[3]/append[0]/output/line[2]="abc/dgh/ijk,"
+path_common/dirname_on_full_match[3]/append[0]/output/line[3]="abc,"
+path_common/dirname_on_full_match[3]/append[1]/output/line[0]="abc/def/ghi,abc/abc/abc,abc/def/abc,,abc,"
+path_common/dirname_on_full_match[3]/append[1]/output/line[1]="abc/deg/hij,abc/abc/abb,abc/def/hij,,abc,"
+path_common/dirname_on_full_match[3]/append[1]/output/line[2]="abc/dgh/ijk,abc/abc/xyz,abc/d/ijk,,abc,"
+path_common/dirname_on_full_match[3]/append[1]/output/line[3]="abc,abc/abc,abc,,abc,"
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
index 23d376064..851189f7d 100644
--- a/csv/test/csv-strings/input
+++ b/csv/test/csv-strings/input
@@ -18,6 +18,9 @@ basename/head/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-ba
 
 basename/binary/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-basename --head 1 --emplace --binary s[6] | csv-from-bin s[6]"
 
+dirname/append[0]="( echo /; echo /a; echo /a/; echo /a/b; echo /a/b/c; echo /aaa/bbb; echo /aaa/bbb/ccc; ) | csv-strings path-dirname"
+dirname/append[1]="( echo a; echo a/; echo a/b; echo a/b/c; echo aaa/bbb; echo aaa/bbb/ccc; ) | csv-strings path-dirname"
+
 dirname/tail/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
 dirname/tail/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2"
 dirname/tail/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 3"
@@ -79,21 +82,31 @@ path_common/fields[0]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/
 path_common/fields[1]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,,c"
 path_common/fields[2]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields ,,c"
 
+path_common/dirname[0]="{ echo /; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[1]="{ echo /a; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[2]="{ echo /aaa; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[3]="{ echo /aaa/; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[4]="{ echo /aaa/bbb; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[5]="{ echo /aaa/bbb/ccc; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[6]="{ echo a; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[7]="{ echo aaa; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[8]="{ echo aaa/; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[9]="{ echo aaa/bbb; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[10]="{ echo aaa/bbb/ccc; } | csv-strings path-common --dirname-on-single-record --once"
+
 path_common/dirname_on_single_record[0]="{ echo a/b/c; } | csv-strings path-common --dirname-on-single-record --once"
-path_common/dirname_on_single_record[1]="{ echo abc/def/ghi; } | csv-strings path-common --dirname-on-single-record --once"
-path_common/dirname_on_single_record[2]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-single-record --once"
-path_common/dirname_on_single_record[3]="{ echo a/b/c,d/e/f,g/h/i; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
-path_common/dirname_on_single_record[4]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e/g,g/h/j; echo a/b/x,d/e/y,g/h/z; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
-path_common/dirname_on_single_record[5]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
-path_common/dirname_on_single_record[6]="{ echo abc; } | csv-strings path-common --dirname-on-single-record --once"
-path_common/dirname_on_single_record[7]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c --dirname-on-single-record"
-path_common/dirname_on_single_record[8]="{ echo a/b/c; echo a/b/d; echo a/b/z; } | csv-strings path-common --dirname-on-single-record"
-
-path_common/dirname_on_full_match[0]="{ echo a/b/c; } | csv-strings path-common --dirname-on-full-match --once"
-path_common/dirname_on_full_match[1]="{ echo abc/def/ghi; } | csv-strings path-common --dirname-on-full-match --once"
-path_common/dirname_on_full_match[2]="{ echo a/b; echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-full-match --once"
-path_common/dirname_on_full_match[3]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-full-match --once"
-path_common/dirname_on_full_match[4]="{ echo a/b/c,d/e/f,g/h/i; } | csv-strings path-common --dirname-on-full-match --once --fields a,b,c"
-path_common/dirname_on_full_match[5]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; echo abc,abc/abc,abc; } | csv-strings path-common --dirname-on-full-match --once --fields a,b,c"
-path_common/dirname_on_full_match[6]="{ echo abc/def/ghi; echo abc/deg/hij; echo abc/dgh/ijk; echo abc; } | csv-strings path-common --dirname-on-full-match"
-path_common/dirname_on_full_match[7]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; echo abc,abc/abc,abc; } | csv-strings path-common --dirname-on-full-match --fields a,b,c"
+path_common/dirname_on_single_record[1]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-single-record --once"
+
+path_common/dirname_on_single_record[2]/fields[0]="{ echo a/b/c,d/e/f,g/h/i; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
+path_common/dirname_on_single_record[2]/fields[1]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e/g,g/h/j; echo a/b/x,d/e/y,g/h/z; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
+
+path_common/dirname_on_single_record[2]/append[0]="{ echo a/b/c; echo a/b/d; echo a/b/z; } | csv-strings path-common --dirname-on-single-record"
+path_common/dirname_on_single_record[2]/append[1]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c --dirname-on-single-record"
+
+path_common/dirname_on_full_match[0]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-full-match --once"
+path_common/dirname_on_full_match[1]="{ echo a/b/c; echo a/b/d; echo a/b/e; echo a/b; } | csv-strings path-common --dirname-on-full-match --once"
+
+path_common/dirname_on_full_match[2]/fields[0]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; echo abc,abc/abc,abc; } | csv-strings path-common --dirname-on-full-match --once --fields a,b,c"
+
+path_common/dirname_on_full_match[3]/append[0]="{ echo abc/def/ghi; echo abc/deg/hij; echo abc/dgh/ijk; echo abc; } | csv-strings path-common --dirname-on-full-match"
+path_common/dirname_on_full_match[3]/append[1]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; echo abc,abc/abc,abc; } | csv-strings path-common --dirname-on-full-match --fields a,b,c"

From 2895cdefdd733de2ec8714ba6446861e63c2b323 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 12 May 2020 16:30:38 +1000
Subject: [PATCH 0160/1056] csv-strings: basename, dirname: permissive
 behaviour on --head and --tail made more consistent

---
 csv/applications/csv-strings.cpp | 12 ++++++------
 csv/test/csv-strings/expected    | 28 ++++++++++++++--------------
 2 files changed, 20 insertions(+), 20 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index abdb3359a..35f687d6b 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -177,7 +177,7 @@ struct basename
     unsigned int tail;
     char delimiter;
 
-    static constexpr char const* name() { return "basename"; }
+    static const char* name() { return "basename"; }
 
     basename( const comma::command_line_options& options )
         : head( options.value( "--head", 0 ) )
@@ -194,11 +194,11 @@ struct basename
         {
             if( s.size() >= head ) { return comma::join( s.begin() + head, s.end(), delimiter ); }
             if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-            return {};
+            return t;
         }
         if( s.size() >= tail ) { return comma::join( s.end() - tail, s.end(), delimiter ); }
         if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-        return {};
+        return "";
     }
 };
 
@@ -209,7 +209,7 @@ struct dirname
     unsigned int tail;
     char delimiter;
 
-    static constexpr char const* name() { return "dirname"; }
+    static const char* name() { return "dirname"; }
 
     dirname( const comma::command_line_options& options )
         : head( options.value( "--head", 0 ) )
@@ -232,7 +232,7 @@ struct dirname
                 return o;
             }
             if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-            return {};
+            return t;
         }
         if( s.size() >= tail )
         {
@@ -241,7 +241,7 @@ struct dirname
             return o;
         }
         if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-        return {};
+        return "";
     }
 };
 
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
index 2ae3fc800..0ac7fea9f 100644
--- a/csv/test/csv-strings/expected
+++ b/csv/test/csv-strings/expected
@@ -31,14 +31,14 @@ basename/binary/emplace[0]/output/line[2]="c"
 basename/head/append[0]/output/line[0]="a,"
 basename/head/append[0]/output/line[1]="a/b,b"
 basename/head/append[0]/output/line[2]="a/b/c,b/c"
-basename/head/append[1]/output/line[0]="a,"
+basename/head/append[1]/output/line[0]="a,a"
 basename/head/append[1]/output/line[1]="a/b,"
 basename/head/append[1]/output/line[2]="a/b/c,c"
 
 basename/head/emplace[0]/output/line[0]=""
 basename/head/emplace[0]/output/line[1]="b"
 basename/head/emplace[0]/output/line[2]="b/c"
-basename/head/emplace[1]/output/line[0]=""
+basename/head/emplace[1]/output/line[0]="a"
 basename/head/emplace[1]/output/line[1]=""
 basename/head/emplace[1]/output/line[2]="c"
 
@@ -94,28 +94,28 @@ dirname/binary/tail/emplace[0]/output/line[2]="a/b"
 dirname/head/append[0]/output/line[0]="a,"
 dirname/head/append[0]/output/line[1]="a/b,a"
 dirname/head/append[0]/output/line[2]="a/b/c,a/b"
-dirname/head/append[1]/output/line[0]="a,"
+dirname/head/append[1]/output/line[0]="a,a"
 dirname/head/append[1]/output/line[1]="a/b,a/b"
 dirname/head/append[1]/output/line[2]="a/b/c,a/b"
-dirname/head/append[2]/output/line[0]="a,"
-dirname/head/append[2]/output/line[1]="a/b,"
+dirname/head/append[2]/output/line[0]="a,a"
+dirname/head/append[2]/output/line[1]="a/b,a/b"
 dirname/head/append[2]/output/line[2]="a/b/c,a/b/c"
-dirname/head/append[3]/output/line[0]="a,"
-dirname/head/append[3]/output/line[1]="a/b,"
-dirname/head/append[3]/output/line[2]="a/b/c,"
+dirname/head/append[3]/output/line[0]="a,a"
+dirname/head/append[3]/output/line[1]="a/b,a/b"
+dirname/head/append[3]/output/line[2]="a/b/c,a/b/c"
 
 dirname/head/emplace[0]/output/line[0]=""
 dirname/head/emplace[0]/output/line[1]="a"
 dirname/head/emplace[0]/output/line[2]="a/b"
-dirname/head/emplace[1]/output/line[0]=""
+dirname/head/emplace[1]/output/line[0]="a"
 dirname/head/emplace[1]/output/line[1]="a/b"
 dirname/head/emplace[1]/output/line[2]="a/b"
-dirname/head/emplace[2]/output/line[0]=""
-dirname/head/emplace[2]/output/line[1]=""
+dirname/head/emplace[2]/output/line[0]="a"
+dirname/head/emplace[2]/output/line[1]="a/b"
 dirname/head/emplace[2]/output/line[2]="a/b/c"
-dirname/head/emplace[3]/output/line[0]=","
-dirname/head/emplace[3]/output/line[1]=","
-dirname/head/emplace[3]/output/line[2]=","
+dirname/head/emplace[3]/output/line[0]="a,"
+dirname/head/emplace[3]/output/line[1]="a/b,"
+dirname/head/emplace[3]/output/line[2]="a/b/c,"
 
 dirname/binary/head/emplace[0]/output/line[0]=""
 dirname/binary/head/emplace[0]/output/line[1]="a"

From 06110c1cf099399b92402b19be71a9c1f8c1d371 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 12 May 2020 16:43:52 +1000
Subject: [PATCH 0161/1056] csv-strings: basename: bug fixed

---
 csv/applications/csv-strings.cpp |  4 ++--
 csv/test/csv-strings/expected    | 30 +++++++++++++++---------------
 2 files changed, 17 insertions(+), 17 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index 35f687d6b..fcd814dbe 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -194,11 +194,11 @@ struct basename
         {
             if( s.size() >= head ) { return comma::join( s.begin() + head, s.end(), delimiter ); }
             if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-            return t;
+            return "";
         }
         if( s.size() >= tail ) { return comma::join( s.end() - tail, s.end(), delimiter ); }
         if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-        return "";
+        return t;
     }
 };
 
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
index 0ac7fea9f..c100ca50a 100644
--- a/csv/test/csv-strings/expected
+++ b/csv/test/csv-strings/expected
@@ -1,28 +1,28 @@
 basename/append[0]/output/line[0]="a,a"
 basename/append[0]/output/line[1]="a/b,b"
 basename/append[0]/output/line[2]="a/b/c,c"
-basename/append[1]/output/line[0]="a,"
+basename/append[1]/output/line[0]="a,a"
 basename/append[1]/output/line[1]="a/b,a/b"
 basename/append[1]/output/line[2]="a/b/c,b/c"
-basename/append[2]/output/line[0]="a,"
-basename/append[2]/output/line[1]="a/b,"
+basename/append[2]/output/line[0]="a,a"
+basename/append[2]/output/line[1]="a/b,a/b"
 basename/append[2]/output/line[2]="a/b/c,a/b/c"
-basename/append[3]/output/line[0]="a,"
-basename/append[3]/output/line[1]="a/b,"
-basename/append[3]/output/line[2]="a/b/c,"
+basename/append[3]/output/line[0]="a,a"
+basename/append[3]/output/line[1]="a/b,a/b"
+basename/append[3]/output/line[2]="a/b/c,a/b/c"
 
 basename/emplace[0]/output/line[0]="a"
 basename/emplace[0]/output/line[1]="b"
 basename/emplace[0]/output/line[2]="c"
-basename/emplace[1]/output/line[0]=""
+basename/emplace[1]/output/line[0]="a"
 basename/emplace[1]/output/line[1]="a/b"
 basename/emplace[1]/output/line[2]="b/c"
-basename/emplace[2]/output/line[0]=""
-basename/emplace[2]/output/line[1]=""
+basename/emplace[2]/output/line[0]="a"
+basename/emplace[2]/output/line[1]="a/b"
 basename/emplace[2]/output/line[2]="a/b/c"
-basename/emplace[3]/output/line[0]=","
-basename/emplace[3]/output/line[1]=","
-basename/emplace[3]/output/line[2]=","
+basename/emplace[3]/output/line[0]="a,"
+basename/emplace[3]/output/line[1]="a/b,"
+basename/emplace[3]/output/line[2]="a/b/c,"
 
 basename/binary/emplace[0]/output/line[0]="a"
 basename/binary/emplace[0]/output/line[1]="b"
@@ -31,14 +31,14 @@ basename/binary/emplace[0]/output/line[2]="c"
 basename/head/append[0]/output/line[0]="a,"
 basename/head/append[0]/output/line[1]="a/b,b"
 basename/head/append[0]/output/line[2]="a/b/c,b/c"
-basename/head/append[1]/output/line[0]="a,a"
+basename/head/append[1]/output/line[0]="a,"
 basename/head/append[1]/output/line[1]="a/b,"
 basename/head/append[1]/output/line[2]="a/b/c,c"
 
 basename/head/emplace[0]/output/line[0]=""
 basename/head/emplace[0]/output/line[1]="b"
 basename/head/emplace[0]/output/line[2]="b/c"
-basename/head/emplace[1]/output/line[0]="a"
+basename/head/emplace[1]/output/line[0]=""
 basename/head/emplace[1]/output/line[1]=""
 basename/head/emplace[1]/output/line[2]="c"
 
@@ -153,7 +153,7 @@ fields[0]/output/line[2]="m,,a/b/c,,x/y/z,c,z"
 fields[1]/output/line[0]="k,,a,,x"
 fields[1]/output/line[1]="l,,b,,y"
 fields[1]/output/line[2]="m,,c,,z"
-fields[2]/output/line[0]="k,,,,"
+fields[2]/output/line[0]="k,,a,,x"
 fields[2]/output/line[1]="l,,a/b,,x/y"
 fields[2]/output/line[2]="m,,b/c,,y/z"
 fields[3]/output/line[0]="k,,a,,x,,"

From 46ace1e5252fb32ed8c84b3bb3824be3b58166d9 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 12 May 2020 16:49:32 +1000
Subject: [PATCH 0162/1056] csv-strings: todo comment added

---
 csv/applications/csv-strings.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index fcd814dbe..d1810b2d7 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -372,6 +372,7 @@ struct add
 //   - fix --head; add tests
 //   - fix --tail; add tests
 // - dirname
+//   - fix absolute path behaviour
 //   - fix --head; add tests
 //   - fix --tail; add tests
 

From e5c74747c9eaa5a545b81e02ad9eff7c304e5cde Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 13 May 2020 10:30:18 +1000
Subject: [PATCH 0163/1056] csv-strings: basename and dirname: absolute path
 support added and tested by Kent Hu

---
 csv/applications/csv-strings.cpp | 16 +++++++---
 csv/test/csv-strings/expected    | 54 ++++++++++++++++++++++++++++++--
 csv/test/csv-strings/input       | 18 ++++++++++-
 3 files changed, 79 insertions(+), 9 deletions(-)

diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index d1810b2d7..8ca0e9b50 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -189,6 +189,7 @@ struct basename
 
     std::string convert( const std::string& t ) const
     {
+        bool is_absolute = !t.empty() && t[0] == delimiter;
         const auto& s = comma::split( t, delimiter );
         if( head > 0 )
         {
@@ -196,7 +197,12 @@ struct basename
             if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
             return "";
         }
-        if( s.size() >= tail ) { return comma::join( s.end() - tail, s.end(), delimiter ); }
+        if( s.size() >= tail )
+        {
+            auto o = comma::join( s.end() - tail, s.end(), delimiter );
+            if ( is_absolute && o.empty() ) { o = delimiter; }
+            return o;
+        }
         if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
         return t;
     }
@@ -221,14 +227,14 @@ struct dirname
 
     std::string convert( const std::string& t ) const
     {
-        bool is_absolute = t[0] == delimiter;
+        bool is_absolute = !t.empty() && t[0] == delimiter;
         const auto& s = comma::split( t, delimiter );
         if( head > 0 )
         {
             if( s.size() >= head )
             {
                 auto o = comma::join( s.begin(), s.begin() + head, delimiter );
-                if( is_absolute && o.empty() ) { o = std::string( 1, delimiter ); }
+                if( is_absolute && o.empty() ) { o = delimiter; }
                 return o;
             }
             if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
@@ -237,11 +243,11 @@ struct dirname
         if( s.size() >= tail )
         {
             auto o = comma::join( s.begin(), s.end() - tail, delimiter );
-            if( is_absolute && o.empty() ) { o = std::string( 1, delimiter ); }
+            if( is_absolute && o.empty() ) { o = delimiter; }
             return o;
         }
         if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
-        return "";
+        return is_absolute ? std::string( 1, delimiter ) : "";
     }
 };
 
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
index c100ca50a..4c52e3e8b 100644
--- a/csv/test/csv-strings/expected
+++ b/csv/test/csv-strings/expected
@@ -10,6 +10,18 @@ basename/append[2]/output/line[2]="a/b/c,a/b/c"
 basename/append[3]/output/line[0]="a,a"
 basename/append[3]/output/line[1]="a/b,a/b"
 basename/append[3]/output/line[2]="a/b/c,a/b/c"
+basename/append[4]/output/line[0]="/,/"
+basename/append[4]/output/line[1]="/aaa,aaa"
+basename/append[4]/output/line[2]="/aaa/bbb,bbb"
+basename/append[5]/output/line[0]="/,/"
+basename/append[5]/output/line[1]="/aaa,/aaa"
+basename/append[5]/output/line[2]="/aaa/bbb,aaa/bbb"
+basename/append[6]/output/line[0]="/,/"
+basename/append[6]/output/line[1]="/aaa,/aaa"
+basename/append[6]/output/line[2]="/aaa/bbb,/aaa/bbb"
+basename/append[7]/output/line[0]="/,/"
+basename/append[7]/output/line[1]="/aaa,/aaa"
+basename/append[7]/output/line[2]="/aaa/bbb,/aaa/bbb"
 
 basename/emplace[0]/output/line[0]="a"
 basename/emplace[0]/output/line[1]="b"
@@ -20,9 +32,9 @@ basename/emplace[1]/output/line[2]="b/c"
 basename/emplace[2]/output/line[0]="a"
 basename/emplace[2]/output/line[1]="a/b"
 basename/emplace[2]/output/line[2]="a/b/c"
-basename/emplace[3]/output/line[0]="a,"
-basename/emplace[3]/output/line[1]="a/b,"
-basename/emplace[3]/output/line[2]="a/b/c,"
+basename/emplace[3]/output/line[0]="a"
+basename/emplace[3]/output/line[1]="a/b"
+basename/emplace[3]/output/line[2]="a/b/c"
 
 basename/binary/emplace[0]/output/line[0]="a"
 basename/binary/emplace[0]/output/line[1]="b"
@@ -34,6 +46,18 @@ basename/head/append[0]/output/line[2]="a/b/c,b/c"
 basename/head/append[1]/output/line[0]="a,"
 basename/head/append[1]/output/line[1]="a/b,"
 basename/head/append[1]/output/line[2]="a/b/c,c"
+basename/head/append[2]/output/line[0]="/,"
+basename/head/append[2]/output/line[1]="/aaa,aaa"
+basename/head/append[2]/output/line[2]="/aaa/bbb,aaa/bbb"
+basename/head/append[3]/output/line[0]="/,"
+basename/head/append[3]/output/line[1]="/aaa,"
+basename/head/append[3]/output/line[2]="/aaa/bbb,bbb"
+basename/head/append[4]/output/line[0]="/,"
+basename/head/append[4]/output/line[1]="/aaa,"
+basename/head/append[4]/output/line[2]="/aaa/bbb,"
+basename/head/append[5]/output/line[0]="/,"
+basename/head/append[5]/output/line[1]="/aaa,"
+basename/head/append[5]/output/line[2]="/aaa/bbb,"
 
 basename/head/emplace[0]/output/line[0]=""
 basename/head/emplace[0]/output/line[1]="b"
@@ -73,6 +97,18 @@ dirname/tail/append[2]/output/line[2]="a/b/c,"
 dirname/tail/append[3]/output/line[0]="a,"
 dirname/tail/append[3]/output/line[1]="a/b,"
 dirname/tail/append[3]/output/line[2]="a/b/c,"
+dirname/tail/append[4]/output/line[0]="/,/"
+dirname/tail/append[4]/output/line[1]="/aaa,/"
+dirname/tail/append[4]/output/line[2]="/aaa/bbb,/aaa"
+dirname/tail/append[5]/output/line[0]="/,/"
+dirname/tail/append[5]/output/line[1]="/aaa,/"
+dirname/tail/append[5]/output/line[2]="/aaa/bbb,/"
+dirname/tail/append[6]/output/line[0]="/,/"
+dirname/tail/append[6]/output/line[1]="/aaa,/"
+dirname/tail/append[6]/output/line[2]="/aaa/bbb,/"
+dirname/tail/append[7]/output/line[0]="/,/"
+dirname/tail/append[7]/output/line[1]="/aaa,/"
+dirname/tail/append[7]/output/line[2]="/aaa/bbb,/"
 
 dirname/tail/emplace[0]/output/line[0]=""
 dirname/tail/emplace[0]/output/line[1]="a"
@@ -103,6 +139,18 @@ dirname/head/append[2]/output/line[2]="a/b/c,a/b/c"
 dirname/head/append[3]/output/line[0]="a,a"
 dirname/head/append[3]/output/line[1]="a/b,a/b"
 dirname/head/append[3]/output/line[2]="a/b/c,a/b/c"
+dirname/head/append[4]/output/line[0]="/,/"
+dirname/head/append[4]/output/line[1]="/aaa,/"
+dirname/head/append[4]/output/line[2]="/aaa/bbb,/"
+dirname/head/append[5]/output/line[0]="/,/"
+dirname/head/append[5]/output/line[1]="/aaa,/aaa"
+dirname/head/append[5]/output/line[2]="/aaa/bbb,/aaa"
+dirname/head/append[6]/output/line[0]="/,/"
+dirname/head/append[6]/output/line[1]="/aaa,/aaa"
+dirname/head/append[6]/output/line[2]="/aaa/bbb,/aaa/bbb"
+dirname/head/append[7]/output/line[0]="/,/"
+dirname/head/append[7]/output/line[1]="/aaa,/aaa"
+dirname/head/append[7]/output/line[2]="/aaa/bbb,/aaa/bbb"
 
 dirname/head/emplace[0]/output/line[0]=""
 dirname/head/emplace[0]/output/line[1]="a"
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
index 851189f7d..f3b123240 100644
--- a/csv/test/csv-strings/input
+++ b/csv/test/csv-strings/input
@@ -2,16 +2,24 @@ basename/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename
 basename/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 2"
 basename/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 3"
 basename/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 4"
+basename/append[4]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --tail 1"
+basename/append[5]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --tail 2"
+basename/append[6]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --tail 3"
+basename/append[7]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --tail 100"
 
 basename/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --emplace"
 basename/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 2 --emplace"
 basename/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 3 --emplace"
-basename/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-basename --tail 4 --emplace"
+basename/emplace[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 4 --emplace"
 
 basename/binary/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-basename --emplace --binary s[6] | csv-from-bin s[6]"
 
 basename/head/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 1"
 basename/head/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 2"
+basename/head/append[2]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --head 1"
+basename/head/append[3]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --head 2"
+basename/head/append[4]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --head 3"
+basename/head/append[5]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --head 100"
 
 basename/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 1 --emplace"
 basename/head/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 2 --emplace"
@@ -25,6 +33,10 @@ dirname/tail/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirn
 dirname/tail/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2"
 dirname/tail/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 3"
 dirname/tail/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 4"
+dirname/tail/append[4]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --tail 1"
+dirname/tail/append[5]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --tail 2"
+dirname/tail/append[6]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --tail 3"
+dirname/tail/append[7]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --tail 100"
 
 dirname/tail/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
 dirname/tail/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2 --emplace"
@@ -37,6 +49,10 @@ dirname/head/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirn
 dirname/head/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2"
 dirname/head/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3"
 dirname/head/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 4"
+dirname/head/append[4]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --head 1"
+dirname/head/append[5]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --head 2"
+dirname/head/append[6]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --head 3"
+dirname/head/append[7]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --head 100"
 
 dirname/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
 dirname/head/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2 --emplace"

From e4636254ea453d0f474499ccca19f0e7d9252e9e Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 20 May 2020 18:36:25 +1000
Subject: [PATCH 0164/1056] csv-calc: --help: typo fixed

---
 csv/applications/csv-calc.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 25d4a10d5..0a20fc95c 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -89,7 +89,7 @@ static void usage( bool verbose )
     std::cerr << "        <n> is the desired percentile (e.g. 0.9)" << std::endl;
     std::cerr << "        <method> is one of 'nearest' or 'interpolate' (default: nearest)" << std::endl;
     std::cerr << "        see --help --verbose for more details" << std::endl;
-    std::cerr << "    radius: size / 2" << std::endl;
+    std::cerr << "    radius: diameter / 2" << std::endl;
     std::cerr << "    size: number of values" << std::endl;
     std::cerr << "    skew[=sample]: skew" << std::endl;
     std::cerr << "         sample: use sample skew (default: population stddev)" << std::endl;

From 56e22f404e494948edd1ac6fc964a04ba40c6893 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 21 May 2020 09:55:13 +1000
Subject: [PATCH 0165/1056] comma-name-value-util: fixed application name in
 error message

---
 bash/comma-name-value-util | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/bash/comma-name-value-util b/bash/comma-name-value-util
index 450445d90..4db89e62d 100644
--- a/bash/comma-name-value-util
+++ b/bash/comma-name-value-util
@@ -267,15 +267,15 @@ function comma_path_value_to_var()
         name=${name//-/$delimiter}
         # we are occasionally passed bad data in JSON etc
         # don't attempt to eval anything that is not a legal variable name
-        [[ "$name" =~ $regex ]] || { echo "comma-application-util: comma_path_value_to_var skipping invalid variable name '$name'" >&2 ; ret_code=1 ; continue ; }
+        [[ "$name" =~ $regex ]] || { echo "comma-name-value-util: comma_path_value_to_var skipping invalid variable name '$name'" >&2 ; ret_code=1 ; continue ; }
         # Strip quotes then add them back. This ensures consistent behaviour.
         value=${value#\"}
         value=\"${value%\"}\"
         eval "$export_variable $name=$value" \
-            || { echo "comma-application-util: comma_path_value_to_var failed '$export_variable $name=$value'" >&2 ; ret_code=1 ; }
+            || { echo "comma-name-value-util: comma_path_value_to_var failed '$export_variable $name=$value'" >&2 ; ret_code=1 ; }
     done
     if (( $ret_code != 0 )) ; then
-        echo "comma-application-util: comma_path_value_to_var encountered an error, callstack:" >&2
+        echo "comma-name-value-util: comma_path_value_to_var encountered an error, callstack:" >&2
         comma_stacktrace >&2
     fi
     return $ret_code

From 1f343f2436d886b79e5a347abd3d0b2c20c232de Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 21 May 2020 23:33:04 +1000
Subject: [PATCH 0166/1056] csv-eval: --output-fields: --help made slightly
 clearer

---
 python/comma/csv/applications/csv_eval.py | 91 ++++++-----------------
 1 file changed, 24 insertions(+), 67 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 37b8d2927..a1bee0385 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -44,7 +44,6 @@
 evaluate numerical expressions and append computed values to csv stream
 """
 
-
 notes_and_examples = """
 input fields:
     1) slashes are replaced by underscores if --full-xpath is given, otherwise basenames are used
@@ -164,14 +163,9 @@
     echo 20151231T000000,20160515T120000 | %(prog)s --fields=t1,t2 --format=2t "dt = (t2-t1)/timedelta64(1,'D')"
 """
 
+class csv_eval_error(Exception): pass
 
-class csv_eval_error(Exception):
-    pass
-
-
-def custom_formatwarning(msg, *args):
-    return __name__ + " warning: " + str(msg) + '\n'
-
+def custom_formatwarning(msg, *args): return __name__ + " warning: " + str(msg) + '\n'
 
 def add_csv_options(parser):
     comma.csv.add_options(parser) # comma.csv.add_options(parser, defaults={'fields': 'x,y,z'})
@@ -185,7 +179,7 @@ def add_csv_options(parser):
         '-o',
         default=None,
         metavar='<names>',
-        help="do not infer output fields from expressions; use specified fields instead")
+        help="do not infer output fields from expressions; output specified fields appended to input instead")
     parser.add_argument(
         '--output-format',
         default='',
@@ -259,10 +253,7 @@ def get_args():
         help='select and output records of input stream that satisfy the condition')
     args = parser.parse_args()
     if args.help:
-        if args.verbose:
-            parser.epilog += numpy_functions
-        else:
-            parser.epilog += "\nfor more help run '%(prog)s -h -v'"
+        parser.epilog += numpy_functions if args.verbose else "\nfor more help run '%(prog)s -h -v'"
         parser.print_help()
         parser.exit(0)
     if args.fields is None or args.fields == "": sys.exit( "csv-eval: please specify --fields" )
@@ -274,34 +265,22 @@ def ingest_deprecated_options(args):
         args.output_format = args.append_binary
         del args.append_binary
         if args.verbose:
-            with comma.util.warning(custom_formatwarning) as warn:
-                msg = "--append-binary is deprecated, consider using --output-format"
-                warn(msg)
+            with comma.util.warning(custom_formatwarning) as warn: warn( "--append-binary is deprecated, consider using --output-format" )
     if args.append_fields:
         args.output_fields = args.append_fields
         del args.append_fields
         if args.verbose:
-            with comma.util.warning(custom_formatwarning) as warn:
-                msg = "--append-fields is deprecated, consider using --output-fields"
-                warn(msg)
+            with comma.util.warning(custom_formatwarning) as warn: warn( "--append-fields is deprecated, consider using --output-fields" )
 
 def check_options(args):
-    if not (args.expressions or args.select or args.exit_if):
-        raise csv_eval_error("no expressions are given")
-    if args.binary and args.format:
-        raise csv_eval_error("--binary and --format are mutually exclusive")
+    if not (args.expressions or args.select or args.exit_if): raise csv_eval_error( "please specify expression" )
+    if args.binary and args.format: raise csv_eval_error("--binary and --format are mutually exclusive")
     if args.select or args.exit_if:
-        if args.expressions:
-            msg = "--select <condition> and --exit-if <condition> cannot be used with expressions"
-            raise csv_eval_error(msg)
-        if args.output_fields or args.output_format:
-            msg = "--select and --exit-if cannot be used with --output-fields or --output-format"
-            raise csv_eval_error(msg)
+        if args.expressions: raise csv_eval_error( "--select <condition> and --exit-if <condition> cannot be used with expressions" )
+        if args.output_fields: raise csv_eval_error( "--select and --exit-if cannot be used with --output-fields" )
+        if args.output_format: raise csv_eval_error( "--select and --exit-if cannot be used with --output-format" )
     if args.with_error:
-        if not args.exit_if:
-            msg = "--with-error is only used with --exit-if"
-            raise csv_eval_error(msg)
-
+        if not args.exit_if: raise csv_eval_error( "--with-error can only be used with --exit-if" )
 
 def format_without_blanks(format, fields=[], unnamed_fields=True):
     """
@@ -333,24 +312,17 @@ def format_without_blanks(format, fields=[], unnamed_fields=True):
      ...
     ValueError: format 'ui,t,d' is longer than fields 'a,b'
     """
-    def comma_type(maybe_type, field, default_type='d', type_of_unnamed_field='s[0]'):
-        return type_of_unnamed_field if not field else maybe_type or default_type
+    def comma_type(maybe_type, field, default_type='d', type_of_unnamed_field='s[0]'): return type_of_unnamed_field if not field else maybe_type or default_type
 
-    if not format and not fields:
-        return ''
+    if not format and not fields: return ''
     maybe_types = comma.csv.format.expand(format).split(',')
     if not unnamed_fields:
-        if '' in fields:
-            msg = "expected all fields to be named, got '{}'".format(','.join(fields))
-            raise ValueError(msg)
-        if len(maybe_types) > len(fields):
-            msg = "format '{}' is longer than fields '{}'".format(format, ','.join(fields))
-            raise ValueError(msg)
+        if '' in fields: raise ValueError( "expected all fields to be named, got '{}'".format(','.join(fields)) )
+        if len(maybe_types) > len(fields): raise ValueError( "format '{}' is longer than fields '{}'".format(format, ','.join(fields)) )
     maybe_typed_fields = itertools.zip_longest(maybe_types, fields) if sys.version_info.major > 2 else itertools.izip_longest(maybe_types, fields) # uber quick and dirty
     types = [comma_type(maybe_type, field) for maybe_type, field in maybe_typed_fields]
     return ','.join(types)
 
-
 def assignment_variable_names(expressions):
     """
     >>> from comma.csv.applications.csv_eval import assignment_variable_names
@@ -427,12 +399,10 @@ def prepare_options(args):
         args.binary = False
     else:
         args.first_line = comma.io.readlines_unbuffered(1, sys.stdin)
-        if not args.first_line:
-            raise csv_eval_error("first record is empty - could not guess format")
+        if not args.first_line: raise csv_eval_error("first record is empty - could not guess format")
         args.format = comma.csv.format.guess_format(args.first_line)
         args.binary = False
-        if args.verbose:
-            print( "{}: guessed format: {}".format(__name__, args.format), file = sys.stderr )
+        if args.verbose: print( "{}: guessed format: {}".format(__name__, args.format), file = sys.stderr )
     if args.select or args.exit_if:
         return
     var_names = assignment_variable_names(args.expressions)
@@ -441,10 +411,7 @@ def prepare_options(args):
         args.output_fields = [f for f in var_names if f not in args.fields]
     else:
         args.output_fields = split_fields(args.output_fields)
-    args.output_format = format_without_blanks(args.output_format,
-                                               args.output_fields,
-                                               unnamed_fields=False)
-
+    args.output_format = format_without_blanks( args.output_format, args.output_fields, unnamed_fields = False )
 
 def restricted_numpy_env():
     d = np.__dict__.copy()
@@ -452,13 +419,11 @@ def restricted_numpy_env():
     d.pop('sys', None)
     return d
 
-
 def update_buffer(stream, update_array):
     index = stream.fields.index
     if stream.binary:
         fields = stream._input_array.dtype.names
-        for f in update_array.dtype.names:
-            stream._input_array[fields[index(f)]] = update_array[f]
+        for f in update_array.dtype.names: stream._input_array[fields[index(f)]] = update_array[f]
     else:
         def updated_lines():
             for line, scalars in izip(stream._ascii_buffer, update_array):
@@ -468,7 +433,6 @@ def updated_lines():
                 yield stream.delimiter.join(values)
         stream._ascii_buffer = list(updated_lines())
 
-
 class stream(object):
     def __init__(self, args):
         self.args = args
@@ -515,8 +479,7 @@ def print_info(self, file=sys.stderr):
         print( "default values: '{}'".format(self.args.default_values), file = file )
         print( "input fields: '{}'".format(fields), file = file )
         print( "input format: '{}'".format(format), file = file )
-        if self.args.select or self.args.exit_if:
-            return
+        if self.args.select or self.args.exit_if: return
         update_fields = ','.join(self.update_t.fields) if self.args.update_fields else ''
         output_fields = ','.join(self.output_t.fields) if self.args.output_fields else ''
         output_format = self.output_t.format if self.args.output_fields else ''
@@ -524,7 +487,6 @@ def print_info(self, file=sys.stderr):
         print( "output fields: '{}'".format(output_fields), file = file )
         print( "output format: '{}'".format(output_format), file = file )
 
-
 def check_fields(fields, allow_numpy_names=True):
     for field in fields:
         if not re.match(r'^[a-z_]\w*$', field, re.I): raise csv_eval_error("'{}' is not a valid field name".format(field))
@@ -534,10 +496,7 @@ def check_fields(fields, allow_numpy_names=True):
 def check_output_fields(fields, input_fields):
     check_fields(fields)
     invalid_output_fields = set(fields).intersection(input_fields)
-    if invalid_output_fields:
-        msg = "output fields '{}' are present in input fields '{}'" \
-            .format(','.join(invalid_output_fields), ','.join(input_fields))
-        raise csv_eval_error(msg)
+    if invalid_output_fields: raise csv_eval_error( "output fields '{}' are present in input fields '{}'".format(','.join(invalid_output_fields), ','.join(input_fields)) )
 
 def evaluate(stream):
     def disperse( var, fields ): return '\n'.join("{f} = {v}['{f}']".format( v = var, f = f ) for f in fields )
@@ -615,8 +574,7 @@ def exit_if(stream):
                 sys.exit(1)
             stream.input.dump()
         input = stream.input.read()
-        if input is None:
-            break
+        if input is None: break
 
 def main():
     try:
@@ -639,5 +597,4 @@ def main():
         traceback.print_exc(file=sys.stderr)
         sys.exit(1)
 
-if __name__ == '__main__':
-    main()
+if __name__ == '__main__': main()

From bb717f0b4e6bd279baf98948ddc31256d687f38f Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Fri, 22 May 2020 07:22:18 +1000
Subject: [PATCH 0167/1056] csv-eval: --init-values, --default-values: --help
 improved

---
 python/comma/csv/applications/csv_eval.py | 9 +++------
 1 file changed, 3 insertions(+), 6 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index a1bee0385..3a37820e9 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -225,13 +225,13 @@ def get_args():
         '--default',
         default='',
         metavar='<assignments>',
-        help='default values for variables in expressions but not in input stream')
+        help='default values for variables in expressions but not in input stream, applied to every input record')
     parser.add_argument(
         '--init-values',
         '--init',
         default='',
         metavar='<assignments>',
-        help='init values, applied only once')
+        help='init values, applied only once on csv-eval start')
     parser.add_argument(
         '--with-error',
         default='',
@@ -407,10 +407,7 @@ def prepare_options(args):
         return
     var_names = assignment_variable_names(args.expressions)
     args.update_fields = [f for f in var_names if f in args.fields]
-    if args.output_fields is None:
-        args.output_fields = [f for f in var_names if f not in args.fields]
-    else:
-        args.output_fields = split_fields(args.output_fields)
+    args.output_fields = [f for f in var_names if f not in args.fields] if args.output_fields is None else split_fields(args.output_fields)
     args.output_format = format_without_blanks( args.output_format, args.output_fields, unnamed_fields = False )
 
 def restricted_numpy_env():

From 4a59ee4e0879960084b3ddc7ac4725be648eb090 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Fri, 22 May 2020 13:51:57 +1000
Subject: [PATCH 0168/1056] csv-eval: --init-values: bug fixed: inconsistent
 behaviour when values are simply assigned in the expression and thus are
 passed by reference; now, if --init-values present, np.copy() is used for
 deep copy

---
 python/comma/csv/applications/csv_eval.py     | 114 ++++++++----------
 .../test/csv-eval/init_values/expected        |  46 +++++--
 .../test/csv-eval/init_values/input           |   6 +-
 3 files changed, 93 insertions(+), 73 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 3a37820e9..1ae279fa0 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -1,31 +1,4 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import print_function
 import argparse
@@ -46,13 +19,13 @@
 
 notes_and_examples = """
 input fields:
-    1) slashes are replaced by underscores if --full-xpath is given, otherwise basenames are used
-    2) for ascii streams, input fields are treated as floating point numbers, unless --format is given
+    - slashes are replaced by underscores if --full-xpath is given, otherwise basenames are used
+    - for ascii streams, input fields are treated as floating point numbers, unless --format is given
 
 output fields:
-    1) inferred from expressions (by default) or specified by --output-fields
-    2) appended to possibly modified input
-    3) treated as floating point numbers, unless --output-format is given
+    - inferred from the names assigned in expression unless specified by --output-fields
+    - appended to input record (input field values can be modified by expression, too)
+    - treated as 64-bit floating point numbers, unless --output-format is given
 
 examples:
     # basic
@@ -80,18 +53,18 @@
     # update input stream values in place
     ( echo 1,2 ; echo 3,4 ) | %(prog)s --fields=x,y "x=x+y; y=y-1"
 
-    # using full xpaths
+    # full xpaths
     ( echo 1,2 ; echo 3,4 ) | %(prog)s --fields=one/x,two/y "x+=1; y-=1"
     ( echo 1,2 ; echo 3,4 ) | %(prog)s --fields=one/x,two/y "one_x+=1; two_y-=1" --full-xpath
 
-    # using default values
+    # default values
     ( echo 1,2 ; echo 3,4 ) | %(prog)s --fields=,y "a=x+y" --default-values="x=0;y=0"
     
-    # using init values: calculate triangular numbers
-    seq 0 10 | %(prog)s --fields=v "sum=sum+v" --init-values="sum=0"
+    # init values: calculate triangular numbers
+    seq 0 10 | csv-eval --fields=v "sum=sum+v" --init-values="sum=0"
     
-    # using init values: calculate fibonacci numbers
-    seq 0 10 | %(prog)s --fields=v "c=b;b=a+b;a=c" --output-fields a,b --init-values="a=0;b=1"
+    # init values: calculate fibonacci numbers
+    seq 0 10 | csv-eval --fields v "a,b=b,a+b" --init-values "a=0;b=1" --output-fields a
 
     # operating on time (internally represented in microseconds)
     echo 20171112T224515.5 | %(prog)s --format=t --fields=t1 "t2=t1+1000000" --output-format t
@@ -185,11 +158,8 @@ def add_csv_options(parser):
         default='',
         metavar='<format>',
         help="format of output fields (default: 'd' for each)")
-    # the options defined below are left for compatibility
-    # use --output-fields and --output-format instead
-    parser.add_argument('--append-fields', '-F', help=argparse.SUPPRESS)
-    parser.add_argument('--append-binary', '-B', help=argparse.SUPPRESS)
-
+    parser.add_argument('--append-fields', '-F', help=argparse.SUPPRESS) # backward compatibility; use --output-fields instead
+    parser.add_argument('--append-binary', '-B', help=argparse.SUPPRESS) # backward compatibility; use --output-format instead
 
 def get_args():
     parser = argparse.ArgumentParser(
@@ -232,6 +202,11 @@ def get_args():
         default='',
         metavar='<assignments>',
         help='init values, applied only once on csv-eval start')
+    parser.add_argument(
+        '--init-format',
+        default='',
+        metavar='<format>',
+        help='format of init non-output variables in the order of appearance in expression (default: "d" for each)')
     parser.add_argument(
         '--with-error',
         default='',
@@ -339,6 +314,7 @@ def assignment_variable_names(expressions):
     >>> assignment_variable_names("x=1; x=2; y+=1; y+=2; z=1; z+=2")
     ['x', 'y', 'z']
     """
+    if expressions is None: return []
     tree = ast.parse(expressions, '<string>', mode='exec')
     fields = []
     for child in ast.iter_child_nodes(tree):
@@ -380,9 +356,7 @@ def normalise_full_xpath(fields, full_xpath=True):
     ['', 'b', '', 'c', 'e', '']
     """
     full_xpath_fields = split_fields(fields)
-    if full_xpath:
-        return [f.replace('/', '_') for f in full_xpath_fields]
-    return [f.split('/')[-1] for f in full_xpath_fields]
+    return [f.replace('/', '_') for f in full_xpath_fields] if full_xpath else [f.split('/')[-1] for f in full_xpath_fields]
 
 def prepare_options(args):
     ingest_deprecated_options(args)
@@ -403,11 +377,15 @@ def prepare_options(args):
         args.format = comma.csv.format.guess_format(args.first_line)
         args.binary = False
         if args.verbose: print( "{}: guessed format: {}".format(__name__, args.format), file = sys.stderr )
-    if args.select or args.exit_if:
-        return
+    if args.select or args.exit_if: return
     var_names = assignment_variable_names(args.expressions)
     args.update_fields = [f for f in var_names if f in args.fields]
     args.output_fields = [f for f in var_names if f not in args.fields] if args.output_fields is None else split_fields(args.output_fields)
+    init_var_names = assignment_variable_names(args.init_values)
+    args.init_fields = [f for f in init_var_names if f not in args.output_fields]
+    if args.init_fields:
+        init_types = format_without_blanks( args.init_format, args.init_fields, unnamed_fields = False )
+        args.init_t = comma.csv.struct( ','.join( args.init_fields ), *comma.csv.format.to_numpy( init_types ) )
     args.output_format = format_without_blanks( args.output_format, args.output_fields, unnamed_fields = False )
 
 def restricted_numpy_env():
@@ -487,50 +465,60 @@ def print_info(self, file=sys.stderr):
 def check_fields(fields, allow_numpy_names=True):
     for field in fields:
         if not re.match(r'^[a-z_]\w*$', field, re.I): raise csv_eval_error("'{}' is not a valid field name".format(field))
-        if field in ['_input', '_update', '_output']: raise csv_eval_error("'{}' is a reserved name".format(field))
+        if field in ['_init', '_input', '_update', '_output']: raise csv_eval_error("'{}' is a reserved name".format(field))
         if not allow_numpy_names and field in np.__dict__: raise csv_eval_error("'{}' is a reserved numpy name".format(field))
 
 def check_output_fields(fields, input_fields):
     check_fields(fields)
     invalid_output_fields = set(fields).intersection(input_fields)
-    if invalid_output_fields: raise csv_eval_error( "output fields '{}' are present in input fields '{}'".format(','.join(invalid_output_fields), ','.join(input_fields)) )
+    if invalid_output_fields: raise csv_eval_error( "output field(s) '{}' should not contain input fields '{}'".format(','.join(invalid_output_fields), ','.join(input_fields)) )
 
 def evaluate(stream):
-    def disperse( var, fields ): return '\n'.join("{f} = {v}['{f}']".format( v = var, f = f ) for f in fields )
+    def disperse( var, fields, do_copy = False ):
+        if do_copy: return '\n'.join( "{f} = copy( {v}['{f}'] )".format( v = var, f = f ) for f in fields )
+        else: return '\n'.join( "{f} = {v}['{f}']".format( v = var, f = f ) for f in fields )
     def collect( var, fields ): return '\n'.join("{v}['{f}'] = {f}".format( v = var, f = f ) for f in fields )
     if stream.args.init_values == '':
         read_size = None
         init_code_string = ''
     else:
         read_size = 1
-        init_code_string = '\n'.join( [ stream.args.default_values,
+        init_code_string = '\n'.join( [ disperse( '_input', stream.nonblank_input_fields, stream.args.init_values ),
+                                        disperse( '_output', stream.args.output_fields, stream.args.init_values ),
+                                        stream.args.default_values,
                                         stream.args.init_values,
-                                        disperse( '_input', stream.nonblank_input_fields ),
+                                        collect( '_init', stream.args.init_fields ),
                                         collect( '_update', stream.args.update_fields ),
                                         collect( '_output', stream.args.output_fields ) ] )
     code_string = '\n'.join( [ stream.args.default_values,
+                               disperse( '_init', stream.args.init_fields, stream.args.init_values ),
                                disperse( '_input', stream.nonblank_input_fields ),
-                               disperse( '_output', stream.args.output_fields ),
+                               disperse( '_output', stream.args.output_fields, stream.args.init_values ),
                                stream.args.expressions,
+                               collect( '_init', stream.args.init_fields ),
                                collect( '_update', stream.args.update_fields ),
                                collect( '_output', stream.args.output_fields ) ] )
+    #print( "-------- init_code_string --------\n" + init_code_string + "\n--------\n", file=sys.stderr )
+    #print( "-------- code_string --------\n" + code_string + "\n--------\n", file=sys.stderr )
     init_code = compile( init_code_string, '<string>', 'exec' )
     code = compile( code_string, '<string>', 'exec' )
     env = np.__dict__ if stream.args.permissive else restricted_numpy_env()    
     size = None
+    init = None
+    input = None
     update = None
     output = None
-    input = None
     is_shutdown = comma.signal.is_shutdown( verbose = stream.args.verbose )
     if stream.args.first_line: input = stream.input.read_from_line( stream.args.first_line )
     while not is_shutdown:
         if input is not None:
             if size != input.size:
                 size = input.size
+                if stream.args.init_fields: init = stream.args.init_t(size)
                 if stream.args.update_fields: update = stream.update_t(size)
                 if stream.args.output_fields: output = stream.output_t(size)
-                exec( init_code, env, { '_input': input, '_update': update, '_output': output } )
-            exec( code, env, { '_input': input, '_update': update, '_output': output } )
+                exec( init_code, env, { '_init': init, '_input': input, '_update': update, '_output': output } )
+            exec( code, env, { '_init': init, '_input': input, '_update': update, '_output': output } )
             if stream.args.update_fields: update_buffer(stream.input, update)
             if stream.args.output_fields: stream.output.write(output)
             else: stream.input.dump()
@@ -544,8 +532,7 @@ def select(stream):
     fields = stream.input.fields
     code = compile(stream.args.select, '<string>', 'eval')
     is_shutdown = comma.signal.is_shutdown()
-    if stream.args.first_line:
-        input = stream.input.read_from_line(stream.args.first_line)
+    if stream.args.first_line: input = stream.input.read_from_line(stream.args.first_line)
     while not is_shutdown:
         if input is not None: 
             mask = eval(code, env, {f: input[f] for f in fields})
@@ -579,12 +566,9 @@ def main():
         comma.csv.time.zone('UTC')
         args = get_args()
         prepare_options(args)
-        if args.select:
-            select(stream(args))
-        elif args.exit_if:
-            exit_if(stream(args))
-        else:
-            evaluate(stream(args))
+        if args.select: select(stream(args))
+        elif args.exit_if: exit_if(stream(args))
+        else: evaluate(stream(args))
     except csv_eval_error as e:
         name = os.path.basename(sys.argv[0])
         print( "{} error: {}".format(name, e), file = sys.stderr )
diff --git a/python/comma/csv/applications/test/csv-eval/init_values/expected b/python/comma/csv/applications/test/csv-eval/init_values/expected
index d0dcb868b..44bb4bfd9 100644
--- a/python/comma/csv/applications/test/csv-eval/init_values/expected
+++ b/python/comma/csv/applications/test/csv-eval/init_values/expected
@@ -1,7 +1,39 @@
-fibonacci/output/line[0]="0,1,1"
-fibonacci/output/line[1]="1,1,2"
-fibonacci/output/line[2]="2,2,3"
-fibonacci/output/line[3]="3,3,5"
-fibonacci/output/line[4]="4,5,8"
-fibonacci/output/line[5]="5,8,13"
-fibonacci/status=0
+fibonacci[0]/output/line[0]="0,1,1"
+fibonacci[0]/output/line[1]="1,1,2"
+fibonacci[0]/output/line[2]="2,2,3"
+fibonacci[0]/output/line[3]="3,3,5"
+fibonacci[0]/output/line[4]="4,5,8"
+fibonacci[0]/output/line[5]="5,8,13"
+fibonacci[0]/status=0
+
+fibonacci[1]/output/line[0]="0,1,1"
+fibonacci[1]/output/line[1]="1,1,2"
+fibonacci[1]/output/line[2]="2,2,3"
+fibonacci[1]/output/line[3]="3,3,5"
+fibonacci[1]/output/line[4]="4,5,8"
+fibonacci[1]/output/line[5]="5,8,13"
+fibonacci[1]/status=0
+
+fibonacci[2]/output/line[0]="0,1,1"
+fibonacci[2]/output/line[1]="1,2,1"
+fibonacci[2]/output/line[2]="2,3,2"
+fibonacci[2]/output/line[3]="3,5,3"
+fibonacci[2]/output/line[4]="4,8,5"
+fibonacci[2]/output/line[5]="5,13,8"
+fibonacci[2]/status=0
+
+fibonacci[3]/output/line[0]="0,1"
+fibonacci[3]/output/line[1]="1,1"
+fibonacci[3]/output/line[2]="2,2"
+fibonacci[3]/output/line[3]="3,3"
+fibonacci[3]/output/line[4]="4,5"
+fibonacci[3]/output/line[5]="5,8"
+fibonacci[3]/status=0
+
+fibonacci[4]/output/line[0]="0,1"
+fibonacci[4]/output/line[1]="1,2"
+fibonacci[4]/output/line[2]="2,3"
+fibonacci[4]/output/line[3]="3,5"
+fibonacci[4]/output/line[4]="4,8"
+fibonacci[4]/output/line[5]="5,13"
+fibonacci[4]/status=0
diff --git a/python/comma/csv/applications/test/csv-eval/init_values/input b/python/comma/csv/applications/test/csv-eval/init_values/input
index 5448c0ca9..501984b70 100644
--- a/python/comma/csv/applications/test/csv-eval/init_values/input
+++ b/python/comma/csv/applications/test/csv-eval/init_values/input
@@ -1 +1,5 @@
-fibonacci="seq 0 5 | csv-eval --fields=v 'c=b;b=a+b;a=c' --output-fields a,b --init-values='a=0;b=1'"
+fibonacci[0]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --init-values='a=0;b=1'"
+fibonacci[1]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --output-fields a,b --init-values='a=0;b=1'"
+fibonacci[2]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --output-fields b,a --init-values='a=0;b=1'"
+fibonacci[3]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --output-fields a --init-values='a=0;b=1'"
+fibonacci[4]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --output-fields b --init-values='a=0;b=1'"

From b4891ed58fc5f75b8a6779cff079f76e69ca32d3 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 24 May 2020 22:19:08 +1000
Subject: [PATCH 0169/1056] packed/field: boost static assert replaced with stl
 static assert

---
 packed/field.h | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/packed/field.h b/packed/field.h
index c532d7786..7ed6323ca 100644
--- a/packed/field.h
+++ b/packed/field.h
@@ -35,7 +35,7 @@
 #define COMMA_PACKED_FIELD_H_
 
 #include <string.h>
-#include <boost/static_assert.hpp>
+#include <type_traits> // #include <boost/static_assert.hpp>
 
 namespace comma { namespace packed {
 
@@ -46,25 +46,25 @@ class field
     public:
         enum { size = S };
 
-        BOOST_STATIC_ASSERT( size > 0 );
+        static_assert( size > 0, "expected positive size" );
 
         typedef T type;
 
         field()
         {
-            BOOST_STATIC_ASSERT( sizeof( field ) == size );
+            static_assert( sizeof( field ) == size, "field size does not match stated size" );
             Derived::pack( storage_, Derived::default_value() );
         }
 
         field( const type& t )
         {
-            BOOST_STATIC_ASSERT( sizeof( field ) == size );
+            static_assert( sizeof( field ) == size, "field size does not match stated size" );
             Derived::pack( storage_, t );
         }
 
         field( const field& rhs )
         {
-            BOOST_STATIC_ASSERT( sizeof( field ) == size );
+            static_assert( sizeof( field ) == size, "field size does not match stated size" );
             operator=( rhs );
         }
 

From b794a6b789a103333f1f1cc35da44c79d395653c Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 24 May 2020 22:38:05 +1000
Subject: [PATCH 0170/1056] BOOST_STATIC_ASSERT replaced with STL static_assert

---
 base/types.h                   | 14 +++++++-------
 csv/applications/csv-calc.cpp  |  3 ++-
 csv/applications/csv-join.cpp  |  4 ++--
 csv/applications/split/split.h |  4 ++--
 csv/impl/unstructured.h        |  4 ++--
 io/applications/udp-client.cpp |  4 ++--
 packed/bits.h                  |  6 +++---
 packed/byte.h                  |  6 +++---
 packed/detail/endian.h         | 10 +++++-----
 packed/string.h                |  3 ++-
 packed/struct.h                |  4 ++--
 11 files changed, 32 insertions(+), 30 deletions(-)

diff --git a/base/types.h b/base/types.h
index 065547899..fecd5afa9 100644
--- a/base/types.h
+++ b/base/types.h
@@ -45,7 +45,7 @@
 
 #include <cmath>
 #include <limits>
-#include <boost/static_assert.hpp>
+#include <type_traits>
 
 namespace comma {
 
@@ -70,12 +70,12 @@ typedef __int32 int32;
 typedef __int64 int64;
 
 // Windows, you know...
-BOOST_STATIC_ASSERT( sizeof( uint16 ) == 2 );
-BOOST_STATIC_ASSERT( sizeof( uint32 ) == 4 );
-BOOST_STATIC_ASSERT( sizeof( uint64 ) == 8 );
-BOOST_STATIC_ASSERT( sizeof( int16 ) == 2 );
-BOOST_STATIC_ASSERT( sizeof( int32 ) == 4 );
-BOOST_STATIC_ASSERT( sizeof( int64 ) == 8 );
+static_assert( sizeof( uint16 ) == 2, "expected uint16 of size 2" );
+static_assert( sizeof( uint32 ) == 4, "expected uint32 of size 4" );
+static_assert( sizeof( uint64 ) == 8, "expected uint64 of size 8" );
+static_assert( sizeof( int16 ) == 2, "expected int16 of size 2" );
+static_assert( sizeof( int32 ) == 4, "expected int32 of size 4" );
+static_assert( sizeof( int64 ) == 8, "expected int64 of size 8" );
 
 #endif
 
diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 0a20fc95c..d1791dad3 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -36,6 +36,7 @@
 #endif
 
 #include <iostream>
+#include <type_traits>
 #include <boost/bind.hpp>
 #include <boost/function.hpp>
 #include <boost/optional.hpp>
@@ -378,7 +379,7 @@ template < typename V > struct map_traits< boost::posix_time::ptime, V >
     {
         std::size_t operator()( const boost::posix_time::ptime& t ) const
         {
-            BOOST_STATIC_ASSERT( sizeof( t ) == sizeof( comma::uint64 ) );
+            static_assert( sizeof( t ) == sizeof( comma::uint64 ), "expected 8-byte time" );
             std::size_t seed = 0;
             boost::hash_combine( seed, reinterpret_cast< const comma::uint64& >( t ) ); // quick and dirty
             return seed;
diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index f3b6456b5..cf094c7eb 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -34,13 +34,13 @@
 #include <map>
 #include <sstream>
 #include <string>
+#include <type_traits>
 #include <vector>
 #include <boost/array.hpp>
 #include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/functional/hash.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
-#include <boost/static_assert.hpp>
 #include <boost/unordered_map.hpp>
 #include "../../application/command_line_options.h"
 #include "../../application/contact_info.h"
@@ -159,7 +159,7 @@ static boost::optional< double > radius;
 
 static void hash_combine_( std::size_t& seed, boost::posix_time::ptime key )
 {
-    BOOST_STATIC_ASSERT( sizeof( boost::posix_time::ptime ) == 8 );
+    static_assert( sizeof( boost::posix_time::ptime ) == 8, "expected time of size 8" );
     boost::hash_combine( seed, *reinterpret_cast< const long long* >( &key ) );
 }
 
diff --git a/csv/applications/split/split.h b/csv/applications/split/split.h
index 7fb36b57d..50b0e5c99 100644
--- a/csv/applications/split/split.h
+++ b/csv/applications/split/split.h
@@ -36,12 +36,12 @@
 #include <fstream>
 #include <functional>
 #include <memory>
+#include <type_traits>
 #include <unordered_map>
 #include <unordered_set>
 #include <thread>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/optional.hpp>
-#include <boost/static_assert.hpp>
 #include "../../../base/types.h"
 #include "../../../csv/ascii.h"
 #include "../../../csv/binary.h"
@@ -99,7 +99,7 @@ template <> struct traits< boost::posix_time::ptime >
     {
         std::size_t operator()( const boost::posix_time::ptime& t ) const
         {
-            BOOST_STATIC_ASSERT( sizeof( t ) == sizeof( comma::uint64 ) );
+            static_assert( sizeof( t ) == sizeof( comma::uint64 ), "expected time of size 8" );
             std::size_t seed = 0;
             boost::hash_combine( seed, reinterpret_cast< const comma::uint64& >( t ) ); // quick and dirty
             return seed;
diff --git a/csv/impl/unstructured.h b/csv/impl/unstructured.h
index 21d0426d8..c724d7122 100644
--- a/csv/impl/unstructured.h
+++ b/csv/impl/unstructured.h
@@ -33,8 +33,8 @@
 #pragma once
 
 #include <string>
+#include <type_traits>
 #include <vector>
-#include <boost/static_assert.hpp>
 #include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/functional/hash.hpp>
 #include <boost/lexical_cast.hpp>
@@ -80,7 +80,7 @@ struct unstructured
         private:
             static void hash_combine_impl_( std::size_t& s, const boost::posix_time::ptime& t ) // quick and dirty
             {
-                BOOST_STATIC_ASSERT( sizeof( boost::posix_time::ptime ) == 8 ); // quick and dirty
+                static_assert( sizeof( boost::posix_time::ptime ) == 8, "expected time of size 8" ); // quick and dirty
                 boost::hash_combine( s, reinterpret_cast< const comma::uint64& >( t ) );
             }
             
diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index a72ea7b23..232079a86 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -34,11 +34,11 @@
 #include <stdlib.h>
 #endif
 #include <iostream>
+#include <type_traits>
 #include <boost/array.hpp>
 #include <boost/asio/ip/udp.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/noncopyable.hpp>
-#include <boost/static_assert.hpp>
 #include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../base/types.h"
@@ -109,7 +109,7 @@ int main( int argc, char** argv )
         if( timestamped )
         {
             boost::posix_time::ptime timestamp = boost::posix_time::microsec_clock::universal_time();
-            BOOST_STATIC_ASSERT( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ) );
+            static_assert( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ), "expected time of size 8" );
             if( binary )
             { 
                 static char buf[ sizeof( comma::int64 ) ];
diff --git a/packed/bits.h b/packed/bits.h
index cab9bfaad..177c84968 100644
--- a/packed/bits.h
+++ b/packed/bits.h
@@ -36,10 +36,10 @@
 
 #include <limits>
 #include <string.h>
-#include <boost/static_assert.hpp>
+#include <type_traits>
+#include <boost/type_traits.hpp>
 #include "../packed/field.h"
 #include "../base/types.h"
-#include <boost/type_traits.hpp>
 
 namespace comma { namespace packed {
 
@@ -81,7 +81,7 @@ struct bits : public packed::field< bits< B, Default >, B, sizeof( typename comm
 
 template< typename T > inline void reverse_bits( T& v )
 {
-    BOOST_STATIC_ASSERT( boost::is_unsigned< T >::value );
+    static_assert( boost::is_unsigned< T >::value, "expected unsigned value" );
     unsigned int s = std::numeric_limits< T >::digits - 1;
     T r = v;
     for( v >>= 1; v; v >>= 1 )
diff --git a/packed/byte.h b/packed/byte.h
index 24ef1864e..c3259b616 100644
--- a/packed/byte.h
+++ b/packed/byte.h
@@ -43,7 +43,7 @@
 #endif
 #endif
 
-#include <boost/static_assert.hpp>
+#include <type_traits>
 #include "field.h"
 
 namespace comma { namespace packed {
@@ -53,7 +53,7 @@ struct byte : public packed::field< byte, unsigned char, sizeof( unsigned char )
 {
     enum { size = sizeof( unsigned char ) };
 
-    BOOST_STATIC_ASSERT( size == 1 );
+    static_assert( size == 1, "expected size 1" );
 
     typedef unsigned char type;
 
@@ -76,7 +76,7 @@ struct const_byte : public packed::field< const_byte< C >, unsigned char, sizeof
 {
     enum { size = sizeof( unsigned char ) };
 
-    BOOST_STATIC_ASSERT( size == 1 );
+    static_assert( size == 1, "expected size 1" );
 
     typedef unsigned char type;
 
diff --git a/packed/detail/endian.h b/packed/detail/endian.h
index b27ac37e0..11c52363c 100644
--- a/packed/detail/endian.h
+++ b/packed/detail/endian.h
@@ -60,15 +60,15 @@
 
 #include <endian.h>
 #include <algorithm>
-#include <boost/static_assert.hpp>
+#include <type_traits>
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../field.h"
 
 namespace comma { namespace packed { namespace detail {
 
-BOOST_STATIC_ASSERT( sizeof( float ) == 4 );
-BOOST_STATIC_ASSERT( sizeof( double ) == 8 );
+static_assert( sizeof( float ) == 4, "expected float of 4 bytes" );
+static_assert( sizeof( double ) == 8, "expected double of 8 bytes" );
 
 enum endiannes { little = 0, big = 1 };
     
@@ -128,9 +128,9 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
 
     typedef typename endian_traits< Endianness, Size, Signed, Floating >::type type;
     
-    BOOST_STATIC_ASSERT( size <= sizeof( type ) );
+    static_assert( size <= sizeof( type ), "expected size less than size of type" );
     
-    BOOST_STATIC_ASSERT( Signed || !Floating ); // unsigned floats don't make sense
+    static_assert( Signed || !Floating, "expected signed or non-floating point type" ); // unsigned floats don't make sense
 
     typedef packed::field< endian< Endianness, Size, Signed, Floating >, typename endian_traits< Endianness, Size, Signed, Floating >::type, Size > base_type;
 
diff --git a/packed/string.h b/packed/string.h
index 155200c65..56106579e 100644
--- a/packed/string.h
+++ b/packed/string.h
@@ -37,6 +37,7 @@
 #include <cmath>
 #include <iomanip>
 #include <string>
+#include <type_traits>
 #include <boost/lexical_cast.hpp>
 #include "../base/exception.h"
 #include "../string/string.h"
@@ -150,7 +151,7 @@ template < typename T, std::size_t S, char Padding = ' ' >
 class ascii_hex : public packed::field< ascii_hex< T, S, Padding >, T, S >
 {
 public:
-    BOOST_STATIC_ASSERT( boost::is_unsigned< T >::value );
+    static_assert( boost::is_unsigned< T >::value, "expected unsigned type" );
     enum { size = S };
     
     typedef T Type;
diff --git a/packed/struct.h b/packed/struct.h
index f5bc8c5f6..2bee4948d 100644
--- a/packed/struct.h
+++ b/packed/struct.h
@@ -35,7 +35,7 @@
 #define COMMA_PACKED_STRUCT_HPP_
 
 #include <cstring>
-#include <boost/static_assert.hpp>
+#include <type_traits>
 
 namespace comma { namespace packed {
 
@@ -46,7 +46,7 @@ class packed_struct
     public:
         enum { size = S };
 
-        packed_struct() throw() { BOOST_STATIC_ASSERT( sizeof( Derived ) == size ); }
+        packed_struct() throw() { static_assert( sizeof( Derived ) == size, "expected derived of provided size" ); }
 
         const char* data() const throw() { return reinterpret_cast< const char* >( this ); }
 

From 382d5515670bfd7b9cead08f99d90745a052c6dc Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 24 Jun 2020 15:12:22 +1000
Subject: [PATCH 0171/1056] string/split: split_as<T>() implemented

---
 string/split.h | 24 ++++++++++++++++++++++++
 1 file changed, 24 insertions(+)

diff --git a/string/split.h b/string/split.h
index a12403aa1..3e293a0e6 100644
--- a/string/split.h
+++ b/string/split.h
@@ -33,6 +33,7 @@
 
 #include <string>
 #include <vector>
+#include <boost/lexical_cast.hpp>
 
 namespace comma {
 
@@ -48,6 +49,14 @@ std::vector< std::string > split( const std::string& s, const char* separators =
 /// split string into tokens (a quick implementation); always contains at least one element
 std::vector< std::string > split( const std::string& s, char separator, bool empty_if_empty_input = false );
 
+/// split string into tokens (a quick implementation) and cast to a given type; always contains at least one element
+template < typename T >
+std::vector< T > split_as( const std::string& s, const char* separators );
+
+/// split string into tokens (a quick implementation) and cast to a given type; always contains at least one element
+template < typename T >
+std::vector< T > split_as( const std::string& s, char separator );
+
 /// Split string into tokens; always contains at least one element;
 /// skips backslash escaped separator, handle non-nested quotes;
 /// exceptions thrown on errors.
@@ -72,5 +81,20 @@ std::vector< std::string > split_bracketed( const std::string& s, const char * s
 /// skips bracketed separators
 std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket = '(', char rbracket = ')', bool strip_brackets = true );
 
+template < typename T >
+inline std::vector< T > split_as( const std::string& s, const char* separators )
+{
+    const auto& v = split( s, separators, true );
+    std::vector< T > t( v.size() );
+    for( unsigned int i = 0; i < v.size(); ++i ) { t[i] = boost::lexical_cast< T >( v[i] ); }
+    return t;
+}
+
+template < typename T > inline std::vector< T > split_as( const std::string& s, char separator )
+{
+    const char separators[] = { separator, 0 };
+    return split_as< T >( s, separators );
+}
+
 } // namespace comma {
 

From dfcb0f98bf519b9dbd046de71949bc0ea8c8f36e Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 2 Jul 2020 11:31:06 +1000
Subject: [PATCH 0172/1056] name-value-to-csv: include typo fixed

---
 name_value/applications/name-value-to-csv.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index 92c38ed19..d52114b4f 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -36,7 +36,7 @@
 #include <unordered_set>
 #include <boost/optional.hpp>
 #include "../../application/command_line_options.h"
-#include "../../string.h"
+#include "../../string/string.h"
 #include "../../xpath/xpath.h"
 
 static void usage( bool )

From 9e73dbbba18ca18836c22bbfc33ed6cc842e418c Mon Sep 17 00:00:00 2001
From: Kent Hu <khu.1998@icloud.com>
Date: Wed, 8 Jul 2020 18:00:58 +1000
Subject: [PATCH 0173/1056] csv-random: make: --engine implemented;
 true-random; shuffle: --engine: todo

---
 csv/applications/csv-random.cpp | 50 ++++++++++++++++++++++-----------
 1 file changed, 33 insertions(+), 17 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 5ce089527..d99a74133 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -90,11 +90,17 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --append; append random numbers to stdin input" << std::endl;
-    std::cerr << "            --distribution=<distribution>; default=uniform; values: uniform, more todo, just ask" << std::endl;
+    std::cerr << "            --distribution=<distribution>; default=uniform; todo: more distributions to plug in, just ask" << std::endl;
+    std::cerr << "            --engine=<engine>; default=mt19937_64; values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
     std::cerr << "            --output-binary; output random numbers as binary, or specify --binary=<format> for stdin input" << std::endl;
     std::cerr << "            --range=[<min>,<max>]; desired value range, default: whatever stl defines (usually numeric limits)" << std::endl;
     std::cerr << "            --type=<type>; default=ui; supported values: b, ub, w, uw, i, ui, f, d" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "    true-random" << std::endl;
+    std::cerr << "        todo" << std::endl;
+    std::cerr << "        example" << std::endl;
+    std::cerr << "            > csv-random make --seed=$( csv-random true-random --once )" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "    shuffle: output input records in pseudo-random order" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        usage: cat records.csv | csv-random shuffle [<options>] > shuffled.csv" << std::endl;
@@ -109,7 +115,7 @@ static void usage( bool verbose )
     exit( 0 );
 }
 
-static bool output_binary;
+//static bool output_binary;
 static bool verbose;
 static comma::csv::options csv;
 static boost::optional< int > seed;
@@ -157,10 +163,9 @@ struct type_traits< unsigned char >
     static unsigned int cast( unsigned char t ) { return static_cast< int >( t ); }
 };
     
-template < typename T, typename Distribution >
-static int run_impl( Distribution& distribution, bool append, bool binary )
-{
-    std::default_random_engine generator = seed ? std::default_random_engine( *seed ) : std::default_random_engine();
+template < typename T, typename Distribution, typename Engine >
+static int run_impl( Distribution& distribution, Engine engine, bool append, bool binary )
+{;
     if( !::csv.flush ) { std::cin.tie( NULL ); }
     if( append )
     {
@@ -173,7 +178,7 @@ static int run_impl( Distribution& distribution, bool append, bool binary )
                 if( std::cin.gcount() == 0 ) { break; }
                 if( std::cin.gcount() != int( buf.size() ) ) { std::cerr << "csv-random: make: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
                 std::cout.write( &buf[0], buf.size() );
-                T r = distribution( generator );
+                T r = distribution( engine );
                 std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
                 if( ::csv.flush ) { std::cout.flush(); }
             }
@@ -185,7 +190,7 @@ static int run_impl( Distribution& distribution, bool append, bool binary )
                 std::string s;
                 std::getline( std::cin, s );
                 if( s.empty() ) { continue; }
-                std::cout << s << ::csv.delimiter << type_traits< T >::cast( distribution( generator ) ) << std::endl;
+                std::cout << s << ::csv.delimiter << type_traits< T >::cast( distribution( engine ) ) << std::endl;
                 if( ::csv.flush ) { std::cout.flush(); }
             }
         }
@@ -194,7 +199,7 @@ static int run_impl( Distribution& distribution, bool append, bool binary )
     {
         while( std::cout.good() )
         {
-            T r = distribution( generator );
+            T r = distribution( engine );
             if( binary ) { std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) ); }
             else { std::cout << type_traits< T >::cast( r ) << std::endl; }
             if( ::csv.flush ) { std::cout.flush(); }
@@ -208,17 +213,28 @@ static int run_impl( const comma::command_line_options& options )
 {
     bool append = options.exists( "--append" );
     bool binary = options.exists( "--output-binary" ) || ::csv.binary();
+    auto engine = options.value< std::string >( "--engine", "mt19937_64" );
     auto r = options.optional< std::string >( "--range" ); // todo: parse distribution parameters
+    Distribution< T > distribution;
     if( r )
     {
         auto range = comma::csv::ascii< std::pair< T, T > >().get( *r );
-        Distribution< T > distribution( range.first, range.second );
-        return run_impl< T >( distribution, append, binary );
+        distribution = Distribution< T >( range.first, range.second );
     }
-    Distribution< T > distribution;
-    return run_impl< T >( distribution, append, binary );
+    if( engine == "minstd_rand0" ) { return run_impl< T >( distribution, seed ? std::minstd_rand0( *seed ) : std::minstd_rand0() , append, binary ); }
+    if( engine == "minstd_rand" ) { return run_impl< T >( distribution, seed ? std::minstd_rand( *seed ) : std::minstd_rand() , append, binary ); }
+    if( engine == "mt19937" ) { return run_impl< T >( distribution, seed ? std::mt19937( *seed ) : std::mt19937(), append, binary ); }
+    if( engine == "mt19937_64" ) { return run_impl< T >( distribution, seed ? std::mt19937_64( *seed ) : std::mt19937_64(), append, binary ); }
+    if( engine == "ranlux24_base" ) { return run_impl< T >( distribution, seed ? std::ranlux24_base( *seed ) : std::ranlux24_base() , append, binary ); }
+    if( engine == "ranlux48_base" ) { return run_impl< T >( distribution, seed ? std::ranlux48_base( *seed ) : std::ranlux48_base() , append, binary ); }
+    if( engine == "ranlux24" ) { return run_impl< T >( distribution, seed ? std::ranlux24( *seed ) : std::ranlux24() , append, binary ); }
+    if( engine == "ranlux48" ) { return run_impl< T >( distribution, seed ? std::ranlux48( *seed ) : std::ranlux48() , append, binary ); }
+    if( engine == "knuth_b" ) { return run_impl< T >( distribution, seed ? std::knuth_b( *seed ) : std::knuth_b() , append, binary ); }
+    if( engine == "default_random_engine" ) { return run_impl< T >( distribution, seed ? std::default_random_engine( *seed ) : std::default_random_engine() , append, binary ); }
+    std::cerr << "csv-random make: expected engine; got: '" << engine << "'" << std::endl;
+    return 1;
 }
-    
+
 static int run( const comma::command_line_options& options ) // quick and dirty
 {
     auto distribution = options.value< std::string >( "--distribution", "uniform" );
@@ -273,7 +289,7 @@ namespace shuffle {
 
 static int run( const comma::command_line_options& options )
 {
-    std::default_random_engine generator = seed ? std::default_random_engine( *seed ) : std::default_random_engine();
+    auto engine = seed ? std::default_random_engine( *seed ) : std::default_random_engine();
     std::deque< std::string > records;
     auto output = []( std::deque< std::string >& records )
     { 
@@ -293,7 +309,7 @@ static int run( const comma::command_line_options& options )
             if( !p || p->block != block )
             {
                 std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
-                std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( generator ); } ); // quick and dirty, watch performance
+                std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( engine ); } ); // quick and dirty, watch performance
                 output( records );
                 if( p ) { block = p->block; }
             }
@@ -336,7 +352,7 @@ static int run( const comma::command_line_options& options )
             }
         }
         std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
-        std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( generator ); } ); // quick and dirty, watch performance
+        std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( engine ); } ); // quick and dirty, watch performance
         output( records );
     }
     return 0;

From c664f538d3080588445847ca3aac95d3f39ccd5a Mon Sep 17 00:00:00 2001
From: Kent Hu <khu.1998@icloud.com>
Date: Fri, 10 Jul 2020 13:40:49 +1000
Subject: [PATCH 0174/1056] csv-random: implemented true-random, shuffle
 --engine and --type can now take more than one value of the same type

---
 csv/applications/csv-random.cpp | 285 +++++++++++++++++++++-----------
 1 file changed, 192 insertions(+), 93 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index d99a74133..0b6341fcd 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -57,22 +57,16 @@
 /// @author vsevolod vlaskine
 
 #include <algorithm>
-#include <string.h>
+#include <cstring>
 #include <deque>
 #include <iostream>
-#include <map>
-#include <memory>
 #include <random>
-#include <sstream>
 #include <string>
 #include <vector>
+
 #include "../../application/command_line_options.h"
-#include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
-#include "../../csv/traits.h"
-#include "../../string/string.h"
-#include "../../visiting/traits.h"
 
 static void usage( bool verbose )
 {
@@ -91,13 +85,19 @@ static void usage( bool verbose )
     std::cerr << "        options" << std::endl;
     std::cerr << "            --append; append random numbers to stdin input" << std::endl;
     std::cerr << "            --distribution=<distribution>; default=uniform; todo: more distributions to plug in, just ask" << std::endl;
-    std::cerr << "            --engine=<engine>; default=mt19937_64; values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
+    std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
     std::cerr << "            --output-binary; output random numbers as binary, or specify --binary=<format> for stdin input" << std::endl;
     std::cerr << "            --range=[<min>,<max>]; desired value range, default: whatever stl defines (usually numeric limits)" << std::endl;
-    std::cerr << "            --type=<type>; default=ui; supported values: b, ub, w, uw, i, ui, f, d" << std::endl;
+    std::cerr << "            --type=<type>; default=ui; supported values: b, ub, w, uw, i, ui, l, ul, f, d" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    true-random: produces non-deterministic random numbers (if non-deterministic source is not available, may be pseudo-random)" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "        usage: csv-random true-random [<options>]" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --append; append random unsigned longs to stdin input" << std::endl;
+    std::cerr << "            --once; output random number only once" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    true-random" << std::endl;
-    std::cerr << "        todo" << std::endl;
     std::cerr << "        example" << std::endl;
     std::cerr << "            > csv-random make --seed=$( csv-random true-random --once )" << std::endl;
     std::cerr << std::endl;
@@ -106,6 +106,7 @@ static void usage( bool verbose )
     std::cerr << "        usage: cat records.csv | csv-random shuffle [<options>] > shuffled.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        options" << std::endl;
+    std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
     std::cerr << "            --fields=[<fields>]; if 'block' field present shuffle each block, otherwise read whole input and then shuffle" << std::endl;
     std::cerr << "            --sliding-window,--window=[<size>]; todo: shuffle on sliding window of <size> records" << std::endl;
     std::cerr << std::endl;
@@ -115,18 +116,16 @@ static void usage( bool verbose )
     exit( 0 );
 }
 
-//static bool output_binary;
 static bool verbose;
 static comma::csv::options csv;
 static boost::optional< int > seed;
 
-
 namespace comma { namespace applications { namespace random { namespace shuffle {
 
 struct input
 {
     comma::uint32 block;
-    input(): block( 0 ) {}
+    input() : block( 0 ) {}
 };
 
 } } } } // namespace comma { namespace applications { namespace random { namespace shuffle {
@@ -143,7 +142,6 @@ template <> struct traits< comma::applications::random::shuffle::input >
 
 namespace comma { namespace applications { namespace random {
 
-namespace make {
 
 template < typename T >
 struct type_traits
@@ -162,11 +160,13 @@ struct type_traits< unsigned char >
 {
     static unsigned int cast( unsigned char t ) { return static_cast< int >( t ); }
 };
-    
-template < typename T, typename Distribution, typename Engine >
-static int run_impl( Distribution& distribution, Engine engine, bool append, bool binary )
-{;
-    if( !::csv.flush ) { std::cin.tie( NULL ); }
+
+namespace make {
+template < typename T, template < typename > class Distribution, typename Engine >
+static int run_impl( Distribution< T >& distribution, bool append, bool binary, std::size_t count )
+{
+    Engine engine = ::seed ? Engine( *::seed ) : Engine();
+    if( !::csv.flush ) { std::cin.tie( nullptr ); }
     if( append )
     {
         if( ::csv.binary() )
@@ -176,10 +176,17 @@ static int run_impl( Distribution& distribution, Engine engine, bool append, boo
             {
                 std::cin.read( &buf[0], buf.size() );
                 if( std::cin.gcount() == 0 ) { break; }
-                if( std::cin.gcount() != int( buf.size() ) ) { std::cerr << "csv-random: make: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
+                if( std::cin.gcount() != static_cast< int >( buf.size() ) )
+                {
+                    std::cerr << "csv-random make: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl;
+                    return 1;
+                }
                 std::cout.write( &buf[0], buf.size() );
-                T r = distribution( engine );
-                std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
+                for( std::size_t i = 0; i < count; ++i )
+                {
+                    T r = distribution( engine );
+                    std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
+                }
                 if( ::csv.flush ) { std::cout.flush(); }
             }
         }
@@ -190,7 +197,9 @@ static int run_impl( Distribution& distribution, Engine engine, bool append, boo
                 std::string s;
                 std::getline( std::cin, s );
                 if( s.empty() ) { continue; }
-                std::cout << s << ::csv.delimiter << type_traits< T >::cast( distribution( engine ) ) << std::endl;
+                std::cout << s;
+                for( std::size_t i = 0; i < count; ++i ) { std::cout << ::csv.delimiter << type_traits< T >::cast( distribution( engine ) ); }
+                std::cout << std::endl;
                 if( ::csv.flush ) { std::cout.flush(); }
             }
         }
@@ -199,9 +208,24 @@ static int run_impl( Distribution& distribution, Engine engine, bool append, boo
     {
         while( std::cout.good() )
         {
-            T r = distribution( engine );
-            if( binary ) { std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) ); }
-            else { std::cout << type_traits< T >::cast( r ) << std::endl; }
+            if( binary )
+            {
+                for( std::size_t i = 0; i < count; ++i )
+                {
+                    T r = distribution( engine );
+                    std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
+                }
+            }
+            else
+            {
+                std::string comma;
+                for( std::size_t i = 0; i < count; ++i )
+                {
+                    std::cout << comma << type_traits< T >::cast( distribution( engine ) );
+                    comma = ::csv.delimiter;
+                }
+                std::cout << std::endl;
+            }
             if( ::csv.flush ) { std::cout.flush(); }
         }
     }
@@ -211,75 +235,76 @@ static int run_impl( Distribution& distribution, Engine engine, bool append, boo
 template < typename T, template < typename > class Distribution >
 static int run_impl( const comma::command_line_options& options )
 {
-    bool append = options.exists( "--append" );
-    bool binary = options.exists( "--output-binary" ) || ::csv.binary();
-    auto engine = options.value< std::string >( "--engine", "mt19937_64" );
-    auto r = options.optional< std::string >( "--range" ); // todo: parse distribution parameters
+    const auto& append = options.exists( "--append" );
+    const auto& binary = options.exists( "--output-binary" ) || ::csv.binary();
+    const auto& engine = options.value< std::string >( "--engine", "mt19937_64" );
+    const auto& count = comma::csv::format( options.value< std::string >( "--type", "ui" ) ).count();
+    const auto& r = options.optional< std::string >( "--range" ); // todo: parse distribution parameters
     Distribution< T > distribution;
     if( r )
     {
-        auto range = comma::csv::ascii< std::pair< T, T > >().get( *r );
+        const auto& range = comma::csv::ascii< std::pair< T, T > >().get( *r );
         distribution = Distribution< T >( range.first, range.second );
     }
-    if( engine == "minstd_rand0" ) { return run_impl< T >( distribution, seed ? std::minstd_rand0( *seed ) : std::minstd_rand0() , append, binary ); }
-    if( engine == "minstd_rand" ) { return run_impl< T >( distribution, seed ? std::minstd_rand( *seed ) : std::minstd_rand() , append, binary ); }
-    if( engine == "mt19937" ) { return run_impl< T >( distribution, seed ? std::mt19937( *seed ) : std::mt19937(), append, binary ); }
-    if( engine == "mt19937_64" ) { return run_impl< T >( distribution, seed ? std::mt19937_64( *seed ) : std::mt19937_64(), append, binary ); }
-    if( engine == "ranlux24_base" ) { return run_impl< T >( distribution, seed ? std::ranlux24_base( *seed ) : std::ranlux24_base() , append, binary ); }
-    if( engine == "ranlux48_base" ) { return run_impl< T >( distribution, seed ? std::ranlux48_base( *seed ) : std::ranlux48_base() , append, binary ); }
-    if( engine == "ranlux24" ) { return run_impl< T >( distribution, seed ? std::ranlux24( *seed ) : std::ranlux24() , append, binary ); }
-    if( engine == "ranlux48" ) { return run_impl< T >( distribution, seed ? std::ranlux48( *seed ) : std::ranlux48() , append, binary ); }
-    if( engine == "knuth_b" ) { return run_impl< T >( distribution, seed ? std::knuth_b( *seed ) : std::knuth_b() , append, binary ); }
-    if( engine == "default_random_engine" ) { return run_impl< T >( distribution, seed ? std::default_random_engine( *seed ) : std::default_random_engine() , append, binary ); }
+    if( engine == "minstd_rand0" ) { return run_impl< T, Distribution, std::minstd_rand0 >( distribution, append, binary, count ); }
+    if( engine == "minstd_rand" ) { return run_impl< T, Distribution, std::minstd_rand >( distribution, append, binary, count ); }
+    if( engine == "mt19937" ) { return run_impl< T, Distribution, std::mt19937 >( distribution, append, binary, count ); }
+    if( engine == "mt19937_64" ) { return run_impl< T, Distribution, std::mt19937_64 >( distribution, append, binary, count ); }
+    if( engine == "ranlux24_base" ) { return run_impl< T, Distribution, std::ranlux24_base >( distribution, append, binary, count ); }
+    if( engine == "ranlux48_base" ) { return run_impl< T, Distribution, std::ranlux48_base >( distribution, append, binary, count ); }
+    if( engine == "ranlux24" ) { return run_impl< T, Distribution, std::ranlux24 >( distribution, append, binary, count ); }
+    if( engine == "ranlux48" ) { return run_impl< T, Distribution, std::ranlux48 >( distribution, append, binary, count ); }
+    if( engine == "knuth_b" ) { return run_impl< T, Distribution, std::knuth_b >( distribution, append, binary, count ); }
+    if( engine == "default_random_engine" ) { return run_impl< T, Distribution, std::default_random_engine >( distribution, append, binary, count ); }
     std::cerr << "csv-random make: expected engine; got: '" << engine << "'" << std::endl;
     return 1;
 }
 
 static int run( const comma::command_line_options& options ) // quick and dirty
 {
-    auto distribution = options.value< std::string >( "--distribution", "uniform" );
-    auto type = options.value< std::string >( "--type", "ui" );
-    if( type == "b" )
-    {
-        if( distribution == "uniform" ) { return run_impl< char, std::uniform_int_distribution >( options ); }
-        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
-    }
-    if( type == "ub" )
-    {
-        if( distribution == "uniform" ) { return run_impl< unsigned char, std::uniform_int_distribution >( options ); }
-        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
-    }
-    if( type == "w" )
+    const auto& distribution = options.value< std::string >( "--distribution", "uniform" );
+    const auto& format = comma::csv::format( options.value< std::string >( "--type", "ui" ) );
+    if ( format.collapsed_string().find( ',' ) != std::string::npos )
     {
-        if( distribution == "uniform" ) { return run_impl< comma::int16, std::uniform_int_distribution >( options ); }
-        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
-    }
-    if( type == "uw" )
-    {
-        if( distribution == "uniform" ) { return run_impl< comma::uint16, std::uniform_int_distribution >( options ); }
-        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
-    }
-    if( type == "i" )
-    {
-        if( distribution == "uniform" ) { return run_impl< comma::int32, std::uniform_int_distribution >( options ); }
-        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
-    }
-    if( type == "ui" )
-    {
-        if( distribution == "uniform" ) { return run_impl< comma::int32, std::uniform_int_distribution >( options ); }
-        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
-    }
-    if( type == "f" )
-    {
-        if( distribution == "uniform" ) { return run_impl< float, std::uniform_real_distribution >( options ); }
-        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+        std::cerr << "csv-random make: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl;
+        return 1;
     }
-    if( type == "d" )
-    {
-        if( distribution == "uniform" ) { return run_impl< double, std::uniform_real_distribution >( options ); }
-        std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    switch ( format.offset( 0 ).type ) {
+        case csv::format::int8:
+            if( distribution == "uniform" ) { return run_impl< char, std::uniform_int_distribution >( options ); }
+            break;
+        case csv::format::uint8:
+            if( distribution == "uniform" ) { return run_impl< unsigned char, std::uniform_int_distribution >( options ); }
+            break;
+        case csv::format::int16:
+            if( distribution == "uniform" ) { return run_impl< comma::int16, std::uniform_int_distribution >( options ); }
+            break;
+        case csv::format::uint16:
+            if( distribution == "uniform" ) { return run_impl< comma::uint16, std::uniform_int_distribution >( options ); }
+            break;
+        case csv::format::int32:
+            if( distribution == "uniform" ) { return run_impl< comma::int32, std::uniform_int_distribution >( options ); }
+            break;
+        case csv::format::uint32:
+            if( distribution == "uniform" ) { return run_impl< comma::uint32, std::uniform_int_distribution >( options ); }
+            break;
+        case csv::format::int64:
+            if( distribution == "uniform" ) { return run_impl< comma::int64, std::uniform_int_distribution >( options ); }
+            break;
+        case csv::format::uint64:
+            if( distribution == "uniform" ) { return run_impl< comma::uint64, std::uniform_int_distribution >( options ); }
+            break;
+        case csv::format::float_t:
+            if( distribution == "uniform" ) { return run_impl< float, std::uniform_real_distribution >( options ); }
+            break;
+        case csv::format::double_t:
+            if( distribution == "uniform" ) { return run_impl< double, std::uniform_real_distribution >( options ); }
+            break;
+        default:
+            std::cerr << "csv-random make: expected type; got: '" << format.string() << "'" << std::endl;
+            return 1;
     }
-    std::cerr << "csv-random make: expected type; got: '" << type << "'" << std::endl;
+    std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
     return 1;
 }
 
@@ -287,12 +312,13 @@ static int run( const comma::command_line_options& options ) // quick and dirty
 
 namespace shuffle {
 
-static int run( const comma::command_line_options& options )
+template < typename Engine >
+static int run_impl( const comma::command_line_options& options )
 {
-    auto engine = seed ? std::default_random_engine( *seed ) : std::default_random_engine();
+    auto engine = ::seed ? Engine( *::seed ) : Engine();
     std::deque< std::string > records;
     auto output = []( std::deque< std::string >& records )
-    { 
+    {
         for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
         records.clear();
         if( ::csv.flush ) { std::cout.flush(); }
@@ -300,7 +326,7 @@ static int run( const comma::command_line_options& options )
     auto sliding_window = options.optional< unsigned int >( "--sliding-window,--window" );
     if( ::csv.has_field( "block" ) )
     {
-        if( sliding_window ) { std::cerr << "csv-random: shuffle: expected either block field or --sliding-window; got both" << std::endl; return 1; }
+        if( sliding_window ) { std::cerr << "csv-random shuffle: expected either block field or --sliding-window; got both" << std::endl; return 1; }
         comma::csv::input_stream< input > is( std::cin, ::csv );
         comma::uint32 block = 0;
         while( is.ready() || std::cin.good() )
@@ -316,7 +342,7 @@ static int run( const comma::command_line_options& options )
             if( !p ) { break; }
             if( ::csv.binary() )
             {
-                records.push_back( std::string() );
+                records.emplace_back();
                 records.back().resize( ::csv.format().size() );
                 std::memcpy( &records.back()[0], is.binary().last(), ::csv.format().size() );
             }
@@ -328,7 +354,7 @@ static int run( const comma::command_line_options& options )
     }
     else // quick and dirty
     {
-        if( sliding_window ) { std::cerr << "csv-random: shuffle: --sliding-window: todo" << std::endl; return 1; }
+        if( sliding_window ) { std::cerr << "csv-random shuffle: --sliding-window: todo" << std::endl; return 1; }
         if( ::csv.binary() )
         {
             std::string s( ::csv.format().size(), 0 );
@@ -336,8 +362,8 @@ static int run( const comma::command_line_options& options )
             {
                 std::cin.read( &s[0], s.size() );
                 if( std::cin.gcount() == 0 ) { break; }
-                if( std::cin.gcount() != int( s.size() ) ) { std::cerr << "csv-random: random: expected " << s.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
-                records.push_back( std::string() );
+                if( std::cin.gcount() != int( s.size() ) ) { std::cerr << "csv-random shuffle: expected " << s.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
+                records.emplace_back();
                 records.back().resize( ::csv.format().size() );
                 std::memcpy( &records.back()[0], &s[0], ::csv.format().size() );
             }
@@ -358,8 +384,79 @@ static int run( const comma::command_line_options& options )
     return 0;
 }
 
+static int run( const comma::command_line_options& options )
+{
+    const auto& engine = options.value< std::string >( "--engine", "mt19937_64" );
+    if( engine == "minstd_rand0" ) { return run_impl< std::minstd_rand0 >( options ); }
+    if( engine == "minstd_rand" ) { return run_impl< std::minstd_rand >( options ); }
+    if( engine == "mt19937" ) { return run_impl< std::mt19937>( options ); }
+    if( engine == "mt19937_64" ) { return run_impl< std::mt19937_64 >( options ); }
+    if( engine == "ranlux24_base" ) { return run_impl< std::ranlux24_base >( options ); }
+    if( engine == "ranlux48_base" ) { return run_impl< std::ranlux48_base >( options ); }
+    if( engine == "ranlux24" ) { return run_impl< std::ranlux24 >( options ); }
+    if( engine == "ranlux48" ) { return run_impl< std::ranlux48 >( options ); }
+    if( engine == "knuth_b" ) { return run_impl< std::knuth_b >( options ); }
+    if( engine == "default_random_engine" ) { return run_impl< std::default_random_engine >( options ); }
+    std::cerr << "csv-random shuffle: expected engine; got: '" << engine << "'" << std::endl;
+    return 1;
+}
+
 } // namespace shuffle {
 
+namespace true_random {
+
+static int run( const comma::command_line_options& options )
+{
+    std::random_device rd;
+    bool binary = options.exists( "--output-binary" ) || ::csv.binary();
+    if( options.exists( "--once" ) )
+    {
+        std::cout << rd() << std::endl;
+        return 0;
+    }
+    if( options.exists( "--append" ) )
+    {
+        if( ::csv.binary() )
+        {
+            std::vector< char > buf( ::csv.format().size() );
+            while( std::cin.good() )
+            {
+                std::cin.read( &buf[0], buf.size() );
+                if( std::cin.gcount() == 0 ) { break; }
+                if( std::cin.gcount() != static_cast< int >( buf.size() ) ) { std::cerr << "csv-random true-random: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
+                std::cout.write( &buf[0], buf.size() );
+                auto r = rd();
+                std::cout.write( reinterpret_cast< char* >( &r ), sizeof( decltype( r ) ) );
+                if( ::csv.flush ) { std::cout.flush(); }
+            }
+        }
+        else
+        {
+            while( std::cin.good() )
+            {
+                std::string s;
+                std::getline( std::cin, s );
+                if( s.empty() ) { continue; }
+                std::cout << s << ::csv.delimiter << rd() << std::endl;
+                if( ::csv.flush ) { std::cout.flush(); }
+            }
+        }
+    }
+    else
+    {
+        while( std::cout.good() )
+        {
+            auto r = rd();
+            if( binary ) { std::cout.write( reinterpret_cast< char* >( &r ), sizeof( decltype ( r ) ) ); }
+            else { std::cout << r << std::endl; }
+            if( ::csv.flush ) { std::cout.flush(); }
+        }
+    }
+    return 0;
+}
+
+} // namespace true_random {
+
 } } } // namespace comma { namespace applications { namespace random {
 
 int main( int ac, char** av )
@@ -370,12 +467,14 @@ int main( int ac, char** av )
         const auto& unnamed = options.unnamed( "--append,--flush,--verbose,-v", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-random: please specify operation" << std::endl; return 1; }
         ::csv = comma::csv::options( options );
-        seed = options.optional< int >( "--seed" );
+        std::cout.precision(::csv.precision);
+        ::seed = options.optional< int >( "--seed" );
         ::verbose = options.exists( "--verbose,-v" );
         std::string operation = unnamed[0];
         if( operation == "make" ) { return comma::applications::random::make::run( options ); }
         if( operation == "shuffle" ) { return comma::applications::random::shuffle::run( options ); }
-        std::cerr << "csv-random: expection operation; got: '" << operation << "'" << std::endl;
+        if( operation == "true-random" ) { return comma::applications::random::true_random::run( options ); }
+        std::cerr << "csv-random: expected operation; got: '" << operation << "'" << std::endl;
         return 1;
     }
     catch( std::exception& ex ) { std::cerr << "csv-random: " << ex.what() << std::endl; }

From 9f5441841bfdef4b94630c997d5df16a56bc1ec4 Mon Sep 17 00:00:00 2001
From: Kent Hu <khu.1998@icloud.com>
Date: Fri, 10 Jul 2020 14:26:06 +1000
Subject: [PATCH 0175/1056] csv-random: small changes to usage

---
 csv/applications/csv-random.cpp | 16 +++++++++-------
 1 file changed, 9 insertions(+), 7 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 0b6341fcd..8ba5024b4 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -88,14 +88,14 @@ static void usage( bool verbose )
     std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
     std::cerr << "            --output-binary; output random numbers as binary, or specify --binary=<format> for stdin input" << std::endl;
     std::cerr << "            --range=[<min>,<max>]; desired value range, default: whatever stl defines (usually numeric limits)" << std::endl;
-    std::cerr << "            --type=<type>; default=ui; supported values: b, ub, w, uw, i, ui, l, ul, f, d" << std::endl;
+    std::cerr << "            --type=<type>; default=ui; supported values: b, ub, w, uw, i, ui, l, ul, f, d; can have more than one <type> i.e. 3ui" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    true-random: produces non-deterministic random numbers (if non-deterministic source is not available, may be pseudo-random)" << std::endl;
+    std::cerr << "    true-random: output non-deterministic random numbers (if non-deterministic source is not available, e.g. a hardware device, output will be pseudo-random). output is unsigned int" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        usage: csv-random true-random [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        options" << std::endl;
-    std::cerr << "            --append; append random unsigned longs to stdin input" << std::endl;
+    std::cerr << "            --append; append random number to stdin input" << std::endl;
     std::cerr << "            --once; output random number only once" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        example" << std::endl;
@@ -411,7 +411,9 @@ static int run( const comma::command_line_options& options )
     bool binary = options.exists( "--output-binary" ) || ::csv.binary();
     if( options.exists( "--once" ) )
     {
-        std::cout << rd() << std::endl;
+        auto r = rd();
+        if ( binary ) { std::cout.write( reinterpret_cast< char * >( &r ), sizeof( r ) ); }
+        else { std::cout << r << std::endl; }
         return 0;
     }
     if( options.exists( "--append" ) )
@@ -426,7 +428,7 @@ static int run( const comma::command_line_options& options )
                 if( std::cin.gcount() != static_cast< int >( buf.size() ) ) { std::cerr << "csv-random true-random: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
                 std::cout.write( &buf[0], buf.size() );
                 auto r = rd();
-                std::cout.write( reinterpret_cast< char* >( &r ), sizeof( decltype( r ) ) );
+                std::cout.write( reinterpret_cast< char* >( &r ), sizeof( r ) );
                 if( ::csv.flush ) { std::cout.flush(); }
             }
         }
@@ -447,7 +449,7 @@ static int run( const comma::command_line_options& options )
         while( std::cout.good() )
         {
             auto r = rd();
-            if( binary ) { std::cout.write( reinterpret_cast< char* >( &r ), sizeof( decltype ( r ) ) ); }
+            if( binary ) { std::cout.write( reinterpret_cast< char* >( &r ), sizeof( r ) ); }
             else { std::cout << r << std::endl; }
             if( ::csv.flush ) { std::cout.flush(); }
         }
@@ -467,7 +469,7 @@ int main( int ac, char** av )
         const auto& unnamed = options.unnamed( "--append,--flush,--verbose,-v", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-random: please specify operation" << std::endl; return 1; }
         ::csv = comma::csv::options( options );
-        std::cout.precision(::csv.precision);
+        std::cout.precision( ::csv.precision );
         ::seed = options.optional< int >( "--seed" );
         ::verbose = options.exists( "--verbose,-v" );
         std::string operation = unnamed[0];

From 2100ba137922ef8f66c173db0d139bf12bcba2b8 Mon Sep 17 00:00:00 2001
From: Kent Hu <khu.1998@icloud.com>
Date: Wed, 15 Jul 2020 15:36:57 +1000
Subject: [PATCH 0176/1056] csv-random: true-random operation; --type=3f;
 shuffle --engine

---
 csv/applications/csv-random.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 8ba5024b4..277d84d1f 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -90,13 +90,15 @@ static void usage( bool verbose )
     std::cerr << "            --range=[<min>,<max>]; desired value range, default: whatever stl defines (usually numeric limits)" << std::endl;
     std::cerr << "            --type=<type>; default=ui; supported values: b, ub, w, uw, i, ui, l, ul, f, d; can have more than one <type> i.e. 3ui" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    true-random: output non-deterministic random numbers (if non-deterministic source is not available, e.g. a hardware device, output will be pseudo-random). output is unsigned int" << std::endl;
+    std::cerr << "    true-random: output non-deterministic uniformly distributed unsigned int random numbers (if non-deterministic source is not available" << std::endl;
+    std::cerr << "                 e.g. a hardware device, output will be pseudo-random" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        usage: csv-random true-random [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --append; append random number to stdin input" << std::endl;
     std::cerr << "            --once; output random number only once" << std::endl;
+    std::cerr << "            --type=<type>; default=ui; todo: supported values: ui; e.g: --type=3ui; --type=ui,ui,ui; etc" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        example" << std::endl;
     std::cerr << "            > csv-random make --seed=$( csv-random true-random --once )" << std::endl;
@@ -142,7 +144,6 @@ template <> struct traits< comma::applications::random::shuffle::input >
 
 namespace comma { namespace applications { namespace random {
 
-
 template < typename T >
 struct type_traits
 {

From e60202283ec8d3727ffbb0b1b3fc04034b126f0b Mon Sep 17 00:00:00 2001
From: Kent Hu <khu.1998@icloud.com>
Date: Thu, 16 Jul 2020 09:46:53 +1000
Subject: [PATCH 0177/1056] system/ansible: added install.python3.yml to
 support python3 installation

---
 system/ansible/install.python3.yml | 62 ++++++++++++++++++++++++++++++
 1 file changed, 62 insertions(+)
 create mode 100644 system/ansible/install.python3.yml

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
new file mode 100644
index 000000000..2189aefd5
--- /dev/null
+++ b/system/ansible/install.python3.yml
@@ -0,0 +1,62 @@
+---
+# sample ansible-playbook script to install comma dependencies and build comma from source; include it as it is or copy to your playbook
+
+- hosts: localhost
+  connection: local
+  vars:
+    - base: "{{ ansible_env.HOME }}"
+    - make_j: 6
+    - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
+
+  tasks:
+  - name: "install comma dependencies"
+    become: true
+    apt: pkg={{ item }} state=present update_cache=yes
+    with_items:
+      - build-essential 
+      - git
+      - cmake-curses-gui
+      - cmake
+      - perl
+      - python
+      - libboost-all-dev
+      - socat
+      - libzmq3-dev
+      - libgtest-dev
+      - python3-dev
+      - python3-numpy
+      - libprocps-dev
+      - recode
+      
+  - name: "comma: make source directory at {{ base }}"
+    file: path={{ base }}/{{ item }} state=directory
+    with_items:
+        - src
+        - build
+    
+  - name: "comma: clone"
+    git:
+        repo: "https://gitlab.com/orthographic/comma.git"
+        dest: "{{ base }}/src/comma"
+        clone: yes
+        update: yes
+        
+  - name: "comma: make build directory at {{ base }}"
+    file: dest="{{ base }}/build/comma" state=directory
+
+  - name: "comma: cmake"
+    vars:
+        - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
+    shell: "/usr/bin/cmake {{ comma_cmake_options }} {{ base }}/src/comma chdir={{ base }}/build/comma"
+
+  - name: "comma: make"
+    make:
+        chdir: "{{ base }}/build/comma"
+        params:
+            MAKEFLAGS: "-j {{ make_j }}"
+
+  - name: "comma: install"
+    become: true
+    make:
+        chdir: "{{ base }}/build/comma"
+        target: "install"

From 0d34801502bbc472f36d85d88e2e10fd68277866 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 1 Aug 2020 11:43:06 +1000
Subject: [PATCH 0178/1056] csv/examples: moved examples to csv/examples/matlab

---
 csv/examples/{bin_load.m => load-binary-file.m}       | 0
 csv/examples/{bin_save.m => save-binary-file.m}       | 0
 csv/examples/{iso2seconds.m => time-iso-to-seconds.m} | 0
 csv/examples/{seconds2iso.m => time-seconds-to-iso.m} | 0
 4 files changed, 0 insertions(+), 0 deletions(-)
 rename csv/examples/{bin_load.m => load-binary-file.m} (100%)
 rename csv/examples/{bin_save.m => save-binary-file.m} (100%)
 rename csv/examples/{iso2seconds.m => time-iso-to-seconds.m} (100%)
 rename csv/examples/{seconds2iso.m => time-seconds-to-iso.m} (100%)

diff --git a/csv/examples/bin_load.m b/csv/examples/load-binary-file.m
similarity index 100%
rename from csv/examples/bin_load.m
rename to csv/examples/load-binary-file.m
diff --git a/csv/examples/bin_save.m b/csv/examples/save-binary-file.m
similarity index 100%
rename from csv/examples/bin_save.m
rename to csv/examples/save-binary-file.m
diff --git a/csv/examples/iso2seconds.m b/csv/examples/time-iso-to-seconds.m
similarity index 100%
rename from csv/examples/iso2seconds.m
rename to csv/examples/time-iso-to-seconds.m
diff --git a/csv/examples/seconds2iso.m b/csv/examples/time-seconds-to-iso.m
similarity index 100%
rename from csv/examples/seconds2iso.m
rename to csv/examples/time-seconds-to-iso.m

From 378cd0b5b43080ac8f00b5cfe40829e0fd87ac78 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 1 Aug 2020 11:45:55 +1000
Subject: [PATCH 0179/1056] csv/examples: moved examples to csv/examples/matlab

---
 csv/examples/{ => matlab}/load-binary-file.m    | 0
 csv/examples/{ => matlab}/save-binary-file.m    | 0
 csv/examples/{ => matlab}/time-iso-to-seconds.m | 0
 csv/examples/{ => matlab}/time-seconds-to-iso.m | 0
 4 files changed, 0 insertions(+), 0 deletions(-)
 rename csv/examples/{ => matlab}/load-binary-file.m (100%)
 rename csv/examples/{ => matlab}/save-binary-file.m (100%)
 rename csv/examples/{ => matlab}/time-iso-to-seconds.m (100%)
 rename csv/examples/{ => matlab}/time-seconds-to-iso.m (100%)

diff --git a/csv/examples/load-binary-file.m b/csv/examples/matlab/load-binary-file.m
similarity index 100%
rename from csv/examples/load-binary-file.m
rename to csv/examples/matlab/load-binary-file.m
diff --git a/csv/examples/save-binary-file.m b/csv/examples/matlab/save-binary-file.m
similarity index 100%
rename from csv/examples/save-binary-file.m
rename to csv/examples/matlab/save-binary-file.m
diff --git a/csv/examples/time-iso-to-seconds.m b/csv/examples/matlab/time-iso-to-seconds.m
similarity index 100%
rename from csv/examples/time-iso-to-seconds.m
rename to csv/examples/matlab/time-iso-to-seconds.m
diff --git a/csv/examples/time-seconds-to-iso.m b/csv/examples/matlab/time-seconds-to-iso.m
similarity index 100%
rename from csv/examples/time-seconds-to-iso.m
rename to csv/examples/matlab/time-seconds-to-iso.m

From 89d83e3c55d824db0308fb6d439fe55da8138811 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 1 Aug 2020 12:02:16 +1000
Subject: [PATCH 0180/1056] csv/examples/bash/irregular-stream-to-csv added

---
 csv/examples/bash/irregular-stream-to-csv | 40 +++++++++++++++++++++++
 1 file changed, 40 insertions(+)
 create mode 100755 csv/examples/bash/irregular-stream-to-csv

diff --git a/csv/examples/bash/irregular-stream-to-csv b/csv/examples/bash/irregular-stream-to-csv
new file mode 100755
index 000000000..55bfb2ce9
--- /dev/null
+++ b/csv/examples/bash/irregular-stream-to-csv
@@ -0,0 +1,40 @@
+#!/bin/bash
+
+# suppose we have an ascii stream (e.g. produced by a sensor) that mixes several
+# values appearing in the stream at various times and we can distinguish different
+# input record types by some keywords
+#
+# we want to convert it into a csv stream with each record containing
+# the latest values
+#
+# notes
+# - the same is possible with a bit more effort with binary data
+# - --unbuffered in sed is required, if your stream has to be realtime
+
+function test-input()
+{
+    cat <<eof
+greeting: hello
+which: holy
+who: cow
+greeting: bye
+which: wicked
+greeting: hi
+which: lazy
+who: fox
+greeting: jump
+which: brown
+eof
+}
+
+test-input \
+    | sed -e 's#\(greeting: .*\)#\1,,#' \
+          -e 's#\(which: .*\)#,\1,#' \
+          -e 's#\(who: .*\)#,,\1#' \
+          --unbuffered \
+    | csv-update --update-non-empty \
+    | sed -e 's#greeting: ##' \
+          -e 's#which: ##' \
+          -e 's#who: ##' \
+          --unbuffered \
+    | tr ',' ' '
\ No newline at end of file

From c2ce0098bf775a8adf89bef45f0a28d601b0ec4a Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 5 Aug 2020 09:25:18 +1000
Subject: [PATCH 0181/1056] csv-shuffle: refactoring to allow optimisation

---
 csv/applications/csv-shuffle.cpp | 73 ++++++++++----------------------
 1 file changed, 23 insertions(+), 50 deletions(-)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index f6d460289..75da77ce7 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -1,31 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2020 Vsevolod Vlaskine
 
 #ifdef WIN32
 #include <fcntl.h>
@@ -71,7 +45,7 @@ static void usage( bool verbose )
     std::cerr << "        output trailing fields: swap x and y, output z" << std::endl;
     std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y --output-fields=y,x,..." << std::endl;
     std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 struct field
@@ -89,13 +63,9 @@ int main( int ac, char** av )
 {
     try
     {
-        comma::command_line_options options( ac, av );
-        bool verbose = options.exists( "--verbose,-v" );
-        if( options.exists( "--help,-h" ) ) { usage( verbose ); }
+        comma::command_line_options options( ac, av, usage );
         comma::csv::options csv( options );
-        csv.full_xpath = false;
-        std::string f = options.value< std::string >( "--input-fields", "" );
-        if( !f.empty() ) { csv.fields = f; }
+        csv.fields = options.value< std::string >( "--input-fields,--fields,-f", "" );
         std::vector< std::string > input_fields = comma::split( csv.fields, ',' );
         std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o" ), ',' );
         bool output_trailing_fields = output_fields.back() == "...";
@@ -103,23 +73,32 @@ int main( int ac, char** av )
         std::vector< field > fields;
         for( unsigned int i = 0; i < output_fields.size(); ++i )
         {
-            if( output_fields[i].empty() ) { continue; }
-            fields.push_back( field( output_fields[i], i ) );
+            if( !output_fields[i].empty() ) { fields.push_back( field( output_fields[i], i ) ); }
         }
-        if( fields.empty() ) { std::cerr << "csv-shuffle: please define at least one output field" << std::endl; return 1; }
-        for( unsigned int i = 0; i < input_fields.size(); ++i )
+        if( csv.binary() )
         {
-            for( unsigned int j = 0; j < fields.size(); ++j )
+            for( unsigned int i = 0; i < input_fields.size(); ++i )
             {
-                if( fields[j].name != input_fields[i] ) { continue; }
-                fields[j].input_index = i;
-                if( csv.binary() )
+                for( unsigned int j = 0; j < fields.size(); ++j )
                 {
+                    if( fields[j].name != input_fields[i] ) { continue; }
+                    fields[j].input_index = i;
                     fields[j].input_offset = csv.format().offset( i ).offset;
                     fields[j].size = csv.format().offset( i ).size;
                 }
             }
         }
+        else
+        {
+            for( unsigned int i = 0; i < input_fields.size(); ++i )
+            {
+                for( unsigned int j = 0; j < fields.size(); ++j )
+                {
+                    if( fields[j].name == input_fields[i] ) { fields[j].input_index = i; }
+                }
+            }
+        }
+        if( fields.empty() ) { std::cerr << "csv-shuffle: please define at least one output field" << std::endl; return 1; }
         for( unsigned int i = 0; i < fields.size(); ++i )
         {
             if( !fields[i].input_index ) { std::cerr << "csv-shuffle: \"" << fields[i].name << "\" not found in input fields " << csv.fields << std::endl; return 1; }
@@ -198,18 +177,12 @@ int main( int ac, char** av )
                 unsigned int previous_index = 0;
                 for( unsigned int i = 0; i < fields.size(); ++i ) // quick and dirty
                 {
-                    for( unsigned int k = previous_index; k < fields[i].index && k < elements.size(); ++k )
-                    {
-                        std::cout.write( &buf[ elements[k].offset ], elements[k].size );
-                    }
+                    for( unsigned int k = previous_index; k < fields[i].index && k < elements.size(); ++k ) { std::cout.write( &buf[ elements[k].offset ], elements[k].size ); }
                     std::cout.write( &buf[ fields[i].input_offset ], fields[i].size );
                     previous_index = fields[i].index + 1;
                 }
                 //std::cerr << "--> previous_index: " << previous_index << " elements.size(): " << elements.size() << std::endl;
-                for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k )
-                {
-                    std::cout.write( &buf[ elements[k].offset ], elements[k].size );
-                }
+                for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k ) { std::cout.write( &buf[ elements[k].offset ], elements[k].size ); }
                 if( csv.flush ) { std::cout.flush(); }
             }
         }

From 7fdc12ec52118bfbbc59d30c25d9ec9532d7648f Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 5 Aug 2020 13:00:02 +1000
Subject: [PATCH 0182/1056] csv-shuffle: --binary: optimisation added that
 speeds it up 2-3 times for some types of input

---
 csv/applications/csv-shuffle.cpp | 146 ++++++-------------------------
 csv/test/csv-shuffle/expected    |  19 ++++
 csv/test/csv-shuffle/input       |  10 +++
 3 files changed, 58 insertions(+), 117 deletions(-)
 create mode 100644 csv/test/csv-shuffle/expected
 create mode 100644 csv/test/csv-shuffle/input

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 75da77ce7..cbb599753 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -22,10 +22,6 @@ static void usage( bool verbose )
     std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
     std::cerr << "    --fields,-f,--input-fields <fields>: input fields" << std::endl;
     std::cerr << "    --output-fields,--output,-o <fields>: output fields" << std::endl;
-    std::cerr << "        semantics of outputting trailing fields:" << std::endl;
-    std::cerr << "            \"--output-fields=x,y\": do not output trailing fields" << std::endl;
-    std::cerr << "            \"--output-fields=x,y...\": output trailing fields" << std::endl;
-    std::cerr << "            see example below" << std::endl;
     std::cerr << "    --verbose,-v: more output" << std::endl;
     if( verbose ) { std::cerr << std::endl << comma::csv::options::usage() << std::endl; }
     std::cerr << std::endl;
@@ -40,10 +36,6 @@ static void usage( bool verbose )
     std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=y,z,x" << std::endl;
     std::cerr << "        remove x, swap y,z, append z two times:" << std::endl;
     std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=z,y,z,z" << std::endl;
-    std::cerr << "        do not output trailing fields: swap x and y, do not output z" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y --output-fields=y,x" << std::endl;
-    std::cerr << "        output trailing fields: swap x and y, output z" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y --output-fields=y,x,..." << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
@@ -52,11 +44,10 @@ struct field
 {
     std::string name;
     unsigned int index;
-    unsigned int offset;
     boost::optional< unsigned int > input_index;
     unsigned int input_offset;
     unsigned int size;
-    field( const std::string& name, unsigned int index ) : name( name ), index( index ) {}
+    field( const std::string& name, unsigned int index ) : name( name ), index( index ), input_offset( 0 ), size( 0 ) {}
 };
 
 int main( int ac, char** av )
@@ -66,128 +57,54 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         comma::csv::options csv( options );
         csv.fields = options.value< std::string >( "--input-fields,--fields,-f", "" );
-        std::vector< std::string > input_fields = comma::split( csv.fields, ',' );
-        std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o" ), ',' );
-        bool output_trailing_fields = output_fields.back() == "...";
-        if( output_fields.back() == "..." ) { output_fields.erase( output_fields.end() - 1 ); }
+        std::vector< std::string > input_fields = comma::split( csv.fields, ',', true );
+        std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o" ), ',', true );
+        if( output_fields.empty() ) { std::cerr << "csv-shuffle: please specify at least one output field" << std::endl; return 1; }
+        if( output_fields.back() == "..." ) { std::cerr << "csv-shuffle: support for trailing fields has been removed; please specify input/output fields explicitly" << std::endl; return 1; }
         std::vector< field > fields;
-        for( unsigned int i = 0; i < output_fields.size(); ++i )
-        {
-            if( !output_fields[i].empty() ) { fields.push_back( field( output_fields[i], i ) ); }
-        }
+        unsigned size = 0;
         if( csv.binary() )
         {
-            for( unsigned int i = 0; i < input_fields.size(); ++i )
+            for( unsigned int i = 0; i < output_fields.size(); )
             {
-                for( unsigned int j = 0; j < fields.size(); ++j )
-                {
-                    if( fields[j].name != input_fields[i] ) { continue; }
-                    fields[j].input_index = i;
-                    fields[j].input_offset = csv.format().offset( i ).offset;
-                    fields[j].size = csv.format().offset( i ).size;
-                }
+                fields.push_back( field( output_fields[i], i ) );
+                unsigned int j = 0;
+                for( ; j < input_fields.size() && input_fields[j] != output_fields[i]; ++j );
+                if( j >= input_fields.size() ) { std::cerr << "csv-shuffle: output field '" << output_fields[i] << "' not found in input fields '" << csv.fields << "'" << std::endl; return 1; }
+                fields.back().input_offset = csv.format().offset( j ).offset;
+                for( ; i < output_fields.size() && j < input_fields.size() && input_fields[j] == output_fields[i]; ++i, ++j ) { fields.back().size += csv.format().offset( j ).size; }
+                size += fields.back().size;
             }
-        }
-        else
-        {
-            for( unsigned int i = 0; i < input_fields.size(); ++i )
-            {
-                for( unsigned int j = 0; j < fields.size(); ++j )
-                {
-                    if( fields[j].name == input_fields[i] ) { fields[j].input_index = i; }
-                }
-            }
-        }
-        if( fields.empty() ) { std::cerr << "csv-shuffle: please define at least one output field" << std::endl; return 1; }
-        for( unsigned int i = 0; i < fields.size(); ++i )
-        {
-            if( !fields[i].input_index ) { std::cerr << "csv-shuffle: \"" << fields[i].name << "\" not found in input fields " << csv.fields << std::endl; return 1; }
-        }
-        if( csv.binary() )
-//         {
-//             #ifdef WIN32
-//             _setmode( _fileno( stdin ), _O_BINARY );
-//             _setmode( _fileno( stdout ), _O_BINARY );
-//             #endif
-//             std::vector< char > in( csv.format().size() );
-//             std::vector< comma::csv::format::element > elements;
-//             elements.reserve( csv.format().count() ); // quick and dirty, can be really wasteful on large things like images
-//             for( unsigned int i = 0; i < elements.capacity(); ++i )
-//             {
-//                 elements.push_back( csv.format().offset( i ) );
-//             }
-//             unsigned int previous_index = 0;
-//             unsigned int output_size = 0;
-//             for( unsigned int i = 0; i < fields.size(); ++i ) // quick and dirty
-//             {
-//                 for( unsigned int k = previous_index; k < fields[i].index && k < elements.size(); ++k ) { output_size += elements[k].size; }
-//                 output_size += fields[i].size;
-//                 previous_index = fields[i].index + 1;
-//             }
-//             for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k ) { output_size += elements[k].size; }
-//             std::vector< char > out( output_size );
-//             if( !csv.flush && csv.binary() ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
-//             while( std::cin.good() && !std::cin.eof() )
-//             {
-//                 // todo: quick and dirty; if performance is an issue, you could read more than
-//                 // one record every time see comma::csv::binary_input_stream::read() for reference
-//                 std::cin.read( &in[0], csv.format().size() );
-//                 if( std::cin.gcount() == 0 ) { continue; }
-//                 if( std::cin.gcount() < int( csv.format().size() ) ) { std::cerr << "csv-shuffle: expected " << csv.format().size() << " bytes, got only " << std::cin.gcount() << std::endl; return 1; }
-//                 unsigned int offset = 0;
-//                 unsigned int previous_index = 0;
-//                 for( unsigned int i = 0; i < fields.size(); ++i ) // quick and dirty
-//                 {
-//                     for( unsigned int k = previous_index; k < fields[i].index && k < elements.size(); ++k )
-//                     {
-//                         std::memcpy( &out[offset], &in[ elements[k].offset ], elements[k].size ); // std::cout.write( &in[ elements[k].offset ], elements[k].size );
-//                         offset += elements[k].size;
-//                     }
-//                     std::memcpy( &out[offset], &in[ fields[i].input_offset ], fields[i].size ); // std::cout.write( &in[ fields[i].input_offset ], fields[i].size );
-//                     offset += fields[i].size;
-//                     previous_index = fields[i].index + 1;
-//                 }
-//                 //std::cerr << "--> previous_index: " << previous_index << " elements.size(): " << elements.size() << std::endl;
-//                 for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k )
-//                 {
-//                     std::memcpy( &out[offset], &in[ elements[k].offset ], elements[k].size ); // std::cout.write( &in[ elements[k].offset ], elements[k].size );
-//                     offset += elements[k].size;
-//                 }
-//                 std::cout.write( &out[0], out.size() );
-//                 if( csv.flush ) { std::cout.flush(); }
-//             }
-//         }
-        {
+            //for( unsigned int i = 0; i < fields.size(); ++i ) { std::cerr << "--> i: " << i << " fields[i].name: " << fields[i].name << " fields[i].input_offset: " << fields[i].input_offset << " fields[i].size: " << fields[i].size << std::endl; }
             #ifdef WIN32
             _setmode( _fileno( stdin ), _O_BINARY );
             _setmode( _fileno( stdout ), _O_BINARY );
             #endif
             std::vector< char > buf( csv.format().size() );
-            std::vector< comma::csv::format::element > elements;
-            elements.reserve( csv.format().count() ); // quick and dirty, can be really wasteful on large things like images
-            for( unsigned int i = 0; i < elements.capacity(); ++i ) { elements.push_back( csv.format().offset( i ) ); }
-            if( !csv.flush && csv.binary() ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
+            if( !csv.flush ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
             while( std::cin.good() && !std::cin.eof() )
             {
-                // todo: quick and dirty; if performance is an issue, you could read more than
-                // one record every time see comma::csv::binary_input_stream::read() for reference
                 std::cin.read( &buf[0], csv.format().size() );
                 if( std::cin.gcount() == 0 ) { continue; }
                 if( std::cin.gcount() < int( csv.format().size() ) ) { std::cerr << "csv-shuffle: expected " << csv.format().size() << " bytes, got only " << std::cin.gcount() << std::endl; return 1; }
-                unsigned int previous_index = 0;
-                for( unsigned int i = 0; i < fields.size(); ++i ) // quick and dirty
-                {
-                    for( unsigned int k = previous_index; k < fields[i].index && k < elements.size(); ++k ) { std::cout.write( &buf[ elements[k].offset ], elements[k].size ); }
-                    std::cout.write( &buf[ fields[i].input_offset ], fields[i].size );
-                    previous_index = fields[i].index + 1;
-                }
-                //std::cerr << "--> previous_index: " << previous_index << " elements.size(): " << elements.size() << std::endl;
-                for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k ) { std::cout.write( &buf[ elements[k].offset ], elements[k].size ); }
+                for( unsigned int i = 0; i < fields.size(); ++i ) { std::cout.write( &buf[ fields[i].input_offset ], fields[i].size ); }
                 if( csv.flush ) { std::cout.flush(); }
             }
         }
         else
         {
+            for( unsigned int i = 0; i < output_fields.size(); ++i ) { fields.push_back( field( output_fields[i], i ) ); }
+            for( unsigned int i = 0; i < input_fields.size(); ++i )
+            {
+                for( unsigned int j = 0; j < fields.size(); ++j )
+                {
+                    if( fields[j].name == input_fields[i] ) { fields[j].input_index = i; }
+                }
+            }
+            for( unsigned int i = 0; i < fields.size(); ++i )
+            {
+                if( !fields[i].input_index ) { std::cerr << "csv-shuffle: \"" << fields[i].name << "\" not found in input fields " << csv.fields << std::endl; return 1; }
+            }
             while( std::cin.good() && !std::cin.eof() )
             {
                 std::string line;
@@ -209,11 +126,6 @@ int main( int ac, char** av )
                     if ( *fields[i].input_index < v.size() ) { std::cout << v[ *fields[i].input_index ]; }
                     delimiter = csv.delimiter;
                 }
-                for( unsigned int k = previous_index; output_trailing_fields && k < v.size(); ++k )
-                {
-                    std::cout << delimiter << v[k];
-                    delimiter = csv.delimiter;
-                }
                 std::cout << std::endl;
             }
         }
diff --git a/csv/test/csv-shuffle/expected b/csv/test/csv-shuffle/expected
new file mode 100644
index 000000000..7c2252bd5
--- /dev/null
+++ b/csv/test/csv-shuffle/expected
@@ -0,0 +1,19 @@
+ascii[0]/output="0"
+ascii[0]/status=0
+ascii[1]/output="0,0"
+ascii[1]/status=0
+ascii[2]/output="5"
+ascii[2]/status=0
+ascii[3]/output="5,4"
+ascii[3]/status=0
+ascii[4]/output="1,3,1,3"
+ascii[4]/status=0
+
+binary[0]/output="0"
+binary[0]/status=0
+binary[1]/output="3,4,5,0,1,2"
+binary[1]/status=0
+binary[2]/output="4,5,2,3,0,1"
+binary[2]/status=0
+binary[3]/output="1,2,1,2,1,2"
+binary[3]/status=0
diff --git a/csv/test/csv-shuffle/input b/csv/test/csv-shuffle/input
new file mode 100644
index 000000000..27d66470b
--- /dev/null
+++ b/csv/test/csv-shuffle/input
@@ -0,0 +1,10 @@
+ascii[0]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 0"
+ascii[1]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 0,0"
+ascii[2]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 5"
+ascii[3]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 5,4"
+ascii[4]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 1,3,1,3"
+
+binary[0]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 0 | csv-from-bin ui"
+binary[1]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 3,4,5,0,1,2 | csv-from-bin 3uw,3ui"
+binary[2]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 4,5,2,3,0,1 | csv-from-bin 2uw,ui,uw,2ui"
+binary[3]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 1,2,1,2,1,2 | csv-from-bin 6ui"

From fac9cb57934724917f97d8e6af248b7ff6119637 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 5 Aug 2020 15:17:39 +1000
Subject: [PATCH 0183/1056] csv-shuffle: default --output-fields implemented

---
 csv/applications/csv-shuffle.cpp | 20 +++++++++-----------
 csv/test/csv-shuffle/expected    |  4 ++++
 csv/test/csv-shuffle/input       |  2 ++
 3 files changed, 15 insertions(+), 11 deletions(-)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index cbb599753..08f291294 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -20,8 +20,9 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
-    std::cerr << "    --fields,-f,--input-fields <fields>: input fields" << std::endl;
-    std::cerr << "    --output-fields,--output,-o <fields>: output fields" << std::endl;
+    std::cerr << "    --fields,-f,--input-fields=<fields>; input fields" << std::endl;
+    std::cerr << "    --output-fields,--output,-o=<fields>; output fields, if not specified, will be set" << std::endl;
+    std::cerr << "                                          to --input-fields, which would chops off trailing input fields" << std::endl;
     std::cerr << "    --verbose,-v: more output" << std::endl;
     if( verbose ) { std::cerr << std::endl << comma::csv::options::usage() << std::endl; }
     std::cerr << std::endl;
@@ -29,13 +30,13 @@ static void usage( bool verbose )
     std::cerr << "    operations (for now): append, remove, swap" << std::endl;
     std::cerr << "    semantics:" << std::endl;
     std::cerr << "        remove:" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=x,z" << std::endl;
+    std::cerr << "            echo 0,1,2 | csv-shuffle --fields=x,y,z" << std::endl;
     std::cerr << "        append:" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=x,y,z,x" << std::endl;
+    std::cerr << "            echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=x,y,z,x" << std::endl;
     std::cerr << "        swap:" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=y,z,x" << std::endl;
+    std::cerr << "            echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=y,z,x" << std::endl;
     std::cerr << "        remove x, swap y,z, append z two times:" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=z,y,z,z" << std::endl;
+    std::cerr << "            echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=z,y,z,z" << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
@@ -58,11 +59,9 @@ int main( int ac, char** av )
         comma::csv::options csv( options );
         csv.fields = options.value< std::string >( "--input-fields,--fields,-f", "" );
         std::vector< std::string > input_fields = comma::split( csv.fields, ',', true );
-        std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o" ), ',', true );
-        if( output_fields.empty() ) { std::cerr << "csv-shuffle: please specify at least one output field" << std::endl; return 1; }
-        if( output_fields.back() == "..." ) { std::cerr << "csv-shuffle: support for trailing fields has been removed; please specify input/output fields explicitly" << std::endl; return 1; }
+        std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o", csv.fields ), ',', true );
+        if( output_fields.back() == "..." ) { std::cerr << "csv-shuffle: support for trailing fields has been removed for now; please specify input/output fields explicitly" << std::endl; return 1; }
         std::vector< field > fields;
-        unsigned size = 0;
         if( csv.binary() )
         {
             for( unsigned int i = 0; i < output_fields.size(); )
@@ -73,7 +72,6 @@ int main( int ac, char** av )
                 if( j >= input_fields.size() ) { std::cerr << "csv-shuffle: output field '" << output_fields[i] << "' not found in input fields '" << csv.fields << "'" << std::endl; return 1; }
                 fields.back().input_offset = csv.format().offset( j ).offset;
                 for( ; i < output_fields.size() && j < input_fields.size() && input_fields[j] == output_fields[i]; ++i, ++j ) { fields.back().size += csv.format().offset( j ).size; }
-                size += fields.back().size;
             }
             //for( unsigned int i = 0; i < fields.size(); ++i ) { std::cerr << "--> i: " << i << " fields[i].name: " << fields[i].name << " fields[i].input_offset: " << fields[i].input_offset << " fields[i].size: " << fields[i].size << std::endl; }
             #ifdef WIN32
diff --git a/csv/test/csv-shuffle/expected b/csv/test/csv-shuffle/expected
index 7c2252bd5..ac8eaab3b 100644
--- a/csv/test/csv-shuffle/expected
+++ b/csv/test/csv-shuffle/expected
@@ -8,6 +8,8 @@ ascii[3]/output="5,4"
 ascii[3]/status=0
 ascii[4]/output="1,3,1,3"
 ascii[4]/status=0
+ascii[5]/output="0,1,2"
+ascii[5]/status=0
 
 binary[0]/output="0"
 binary[0]/status=0
@@ -17,3 +19,5 @@ binary[2]/output="4,5,2,3,0,1"
 binary[2]/status=0
 binary[3]/output="1,2,1,2,1,2"
 binary[3]/status=0
+binary[4]/output="0,1,2"
+binary[4]/status=0
diff --git a/csv/test/csv-shuffle/input b/csv/test/csv-shuffle/input
index 27d66470b..444bc6b59 100644
--- a/csv/test/csv-shuffle/input
+++ b/csv/test/csv-shuffle/input
@@ -3,8 +3,10 @@ ascii[1]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 0,
 ascii[2]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 5"
 ascii[3]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 5,4"
 ascii[4]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 1,3,1,3"
+ascii[5]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2"
 
 binary[0]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 0 | csv-from-bin ui"
 binary[1]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 3,4,5,0,1,2 | csv-from-bin 3uw,3ui"
 binary[2]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 4,5,2,3,0,1 | csv-from-bin 2uw,ui,uw,2ui"
 binary[3]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 1,2,1,2,1,2 | csv-from-bin 6ui"
+binary[4]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2 | csv-from-bin 3ui"

From 68bd1a650a6bcc1e4659c2154e6fb41913956fe1 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 5 Aug 2020 16:47:48 +1000
Subject: [PATCH 0184/1056] csv-shuffle: brushed up

---
 csv/applications/csv-shuffle.cpp | 61 +++++++++-----------------------
 1 file changed, 16 insertions(+), 45 deletions(-)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 08f291294..50b16ae6c 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -9,6 +9,7 @@
 #include <iostream>
 #include <vector>
 #include "../../application/command_line_options.h"
+#include "../../base/exception.h"
 #include "../../csv/options.h"
 #include "../../string/string.h"
 
@@ -41,39 +42,31 @@ static void usage( bool verbose )
     exit( 0 );
 }
 
-struct field
+static unsigned int find_( const std::string& n, const std::vector< std::string >& v )
 {
-    std::string name;
-    unsigned int index;
-    boost::optional< unsigned int > input_index;
-    unsigned int input_offset;
-    unsigned int size;
-    field( const std::string& name, unsigned int index ) : name( name ), index( index ), input_offset( 0 ), size( 0 ) {}
-};
+    unsigned int j = 0;
+    for( ; j < v.size(); ++j ) { if( v[j] == n ) { return j; } }
+    COMMA_THROW( comma::exception, "output field '" << n << "' not found in input fields '" << comma::join( v, ',' ) << "'" );
+}
 
 int main( int ac, char** av )
 {
     try
     {
         comma::command_line_options options( ac, av, usage );
-        comma::csv::options csv( options );
-        csv.fields = options.value< std::string >( "--input-fields,--fields,-f", "" );
+        comma::csv::options csv( options, options.value< std::string >( "--input-fields,--fields,-f", "" ) );
         std::vector< std::string > input_fields = comma::split( csv.fields, ',', true );
         std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o", csv.fields ), ',', true );
         if( output_fields.back() == "..." ) { std::cerr << "csv-shuffle: support for trailing fields has been removed for now; please specify input/output fields explicitly" << std::endl; return 1; }
-        std::vector< field > fields;
         if( csv.binary() )
         {
+            std::vector< std::pair< unsigned int, unsigned int > > offsets;
             for( unsigned int i = 0; i < output_fields.size(); )
             {
-                fields.push_back( field( output_fields[i], i ) );
-                unsigned int j = 0;
-                for( ; j < input_fields.size() && input_fields[j] != output_fields[i]; ++j );
-                if( j >= input_fields.size() ) { std::cerr << "csv-shuffle: output field '" << output_fields[i] << "' not found in input fields '" << csv.fields << "'" << std::endl; return 1; }
-                fields.back().input_offset = csv.format().offset( j ).offset;
-                for( ; i < output_fields.size() && j < input_fields.size() && input_fields[j] == output_fields[i]; ++i, ++j ) { fields.back().size += csv.format().offset( j ).size; }
+                unsigned int j = find_( output_fields[i], input_fields );
+                offsets.push_back( std::make_pair( csv.format().offset( j ).offset, 0 ) );
+                for( ; i < output_fields.size() && j < input_fields.size() && input_fields[j] == output_fields[i]; ++i, ++j ) { offsets.back().second += csv.format().offset( j ).size; }
             }
-            //for( unsigned int i = 0; i < fields.size(); ++i ) { std::cerr << "--> i: " << i << " fields[i].name: " << fields[i].name << " fields[i].input_offset: " << fields[i].input_offset << " fields[i].size: " << fields[i].size << std::endl; }
             #ifdef WIN32
             _setmode( _fileno( stdin ), _O_BINARY );
             _setmode( _fileno( stdout ), _O_BINARY );
@@ -85,45 +78,23 @@ int main( int ac, char** av )
                 std::cin.read( &buf[0], csv.format().size() );
                 if( std::cin.gcount() == 0 ) { continue; }
                 if( std::cin.gcount() < int( csv.format().size() ) ) { std::cerr << "csv-shuffle: expected " << csv.format().size() << " bytes, got only " << std::cin.gcount() << std::endl; return 1; }
-                for( unsigned int i = 0; i < fields.size(); ++i ) { std::cout.write( &buf[ fields[i].input_offset ], fields[i].size ); }
+                for( const auto& offset: offsets ) { std::cout.write( &buf[ offset.first ], offset.second ); }
                 if( csv.flush ) { std::cout.flush(); }
             }
         }
         else
         {
-            for( unsigned int i = 0; i < output_fields.size(); ++i ) { fields.push_back( field( output_fields[i], i ) ); }
-            for( unsigned int i = 0; i < input_fields.size(); ++i )
-            {
-                for( unsigned int j = 0; j < fields.size(); ++j )
-                {
-                    if( fields[j].name == input_fields[i] ) { fields[j].input_index = i; }
-                }
-            }
-            for( unsigned int i = 0; i < fields.size(); ++i )
-            {
-                if( !fields[i].input_index ) { std::cerr << "csv-shuffle: \"" << fields[i].name << "\" not found in input fields " << csv.fields << std::endl; return 1; }
-            }
+            std::vector< unsigned int > indices;
+            for( const auto& field: output_fields ) { indices.push_back( find_( field, input_fields ) ); }
             while( std::cin.good() && !std::cin.eof() )
             {
                 std::string line;
                 std::getline( std::cin, line );
                 if( !line.empty() && *line.rbegin() == '\r' ) { line = line.substr( 0, line.length() - 1 ); } // windows... sigh...
                 if( line.empty() ) { continue; }
-                std::vector< std::string > v = comma::split( line, csv.delimiter );
+                const auto& v = comma::split( line, csv.delimiter );
                 std::string delimiter;
-                unsigned int previous_index = 0;
-                for( unsigned int i = 0; i < fields.size(); ++i ) // quick and dirty
-                {
-                    for( unsigned int k = previous_index; k < fields[i].index && k < v.size(); ++k )
-                    {
-                        std::cout << delimiter << v[k];
-                        delimiter = csv.delimiter;
-                    }
-                    previous_index = fields[i].index + 1;
-                    std::cout << delimiter;
-                    if ( *fields[i].input_index < v.size() ) { std::cout << v[ *fields[i].input_index ]; }
-                    delimiter = csv.delimiter;
-                }
+                for( auto index: indices ) { std::cout << delimiter << v[index]; delimiter = csv.delimiter; }
                 std::cout << std::endl;
             }
         }

From c6e2045899b76128aaec8eeb69a5dccc7bfd8ac3 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 5 Aug 2020 16:57:01 +1000
Subject: [PATCH 0185/1056] csv-shuffle: further minor brush-up

---
 csv/applications/csv-shuffle.cpp | 20 ++++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 50b16ae6c..197e0af12 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -42,28 +42,28 @@ static void usage( bool verbose )
     exit( 0 );
 }
 
-static unsigned int find_( const std::string& n, const std::vector< std::string >& v )
-{
-    unsigned int j = 0;
-    for( ; j < v.size(); ++j ) { if( v[j] == n ) { return j; } }
-    COMMA_THROW( comma::exception, "output field '" << n << "' not found in input fields '" << comma::join( v, ',' ) << "'" );
-}
-
 int main( int ac, char** av )
 {
     try
     {
         comma::command_line_options options( ac, av, usage );
-        comma::csv::options csv( options, options.value< std::string >( "--input-fields,--fields,-f", "" ) );
+        comma::csv::options csv( options, options.value< std::string >( "--fields,-f,--input-fields" ) );
         std::vector< std::string > input_fields = comma::split( csv.fields, ',', true );
         std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o", csv.fields ), ',', true );
         if( output_fields.back() == "..." ) { std::cerr << "csv-shuffle: support for trailing fields has been removed for now; please specify input/output fields explicitly" << std::endl; return 1; }
+        auto find_ = [&]( const std::string& n )->unsigned int
+        {
+            if( n.empty() ) { COMMA_THROW( comma::exception, "got empty fields in output fields '" << comma::join( output_fields, ',' ) << "'" ); }
+            unsigned int j = 0;
+            for( ; j < input_fields.size(); ++j ) { if( input_fields[j] == n ) { return j; } }
+            COMMA_THROW( comma::exception, "output field '" << n << "' not found in input fields '" << csv.fields << "'" );
+        };
         if( csv.binary() )
         {
             std::vector< std::pair< unsigned int, unsigned int > > offsets;
             for( unsigned int i = 0; i < output_fields.size(); )
             {
-                unsigned int j = find_( output_fields[i], input_fields );
+                unsigned int j = find_( output_fields[i] );
                 offsets.push_back( std::make_pair( csv.format().offset( j ).offset, 0 ) );
                 for( ; i < output_fields.size() && j < input_fields.size() && input_fields[j] == output_fields[i]; ++i, ++j ) { offsets.back().second += csv.format().offset( j ).size; }
             }
@@ -85,7 +85,7 @@ int main( int ac, char** av )
         else
         {
             std::vector< unsigned int > indices;
-            for( const auto& field: output_fields ) { indices.push_back( find_( field, input_fields ) ); }
+            for( const auto& field: output_fields ) { indices.push_back( find_( field ) ); }
             while( std::cin.good() && !std::cin.eof() )
             {
                 std::string line;

From af5db2164276e354d166826285ca187618be3794 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 19 Aug 2020 10:43:18 +1000
Subject: [PATCH 0186/1056] csv-eval: inconsistency fixed: now exits with
 success on empty input

---
 python/comma/csv/applications/csv_eval.py | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 1ae279fa0..a6abff2af 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -373,11 +373,11 @@ def prepare_options(args):
         args.binary = False
     else:
         args.first_line = comma.io.readlines_unbuffered(1, sys.stdin)
-        if not args.first_line: raise csv_eval_error("first record is empty - could not guess format")
+        if not args.first_line: return False
         args.format = comma.csv.format.guess_format(args.first_line)
         args.binary = False
         if args.verbose: print( "{}: guessed format: {}".format(__name__, args.format), file = sys.stderr )
-    if args.select or args.exit_if: return
+    if args.select or args.exit_if: return True
     var_names = assignment_variable_names(args.expressions)
     args.update_fields = [f for f in var_names if f in args.fields]
     args.output_fields = [f for f in var_names if f not in args.fields] if args.output_fields is None else split_fields(args.output_fields)
@@ -387,6 +387,7 @@ def prepare_options(args):
         init_types = format_without_blanks( args.init_format, args.init_fields, unnamed_fields = False )
         args.init_t = comma.csv.struct( ','.join( args.init_fields ), *comma.csv.format.to_numpy( init_types ) )
     args.output_format = format_without_blanks( args.output_format, args.output_fields, unnamed_fields = False )
+    return True
 
 def restricted_numpy_env():
     d = np.__dict__.copy()
@@ -565,7 +566,7 @@ def main():
         signal.signal( signal.SIGPIPE, signal.SIG_DFL )
         comma.csv.time.zone('UTC')
         args = get_args()
-        prepare_options(args)
+        if not prepare_options( args ): sys.exit( 0 ) # no data on stdin
         if args.select: select(stream(args))
         elif args.exit_if: exit_if(stream(args))
         else: evaluate(stream(args))

From b7ec85bdb0f12344aa0f9e67db7245f5e5e812a1 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Mon, 24 Aug 2020 06:02:04 +1000
Subject: [PATCH 0187/1056] csv-join: minor bug fixed

---
 csv/applications/csv-join.cpp | 37 +++++------------------------------
 1 file changed, 5 insertions(+), 32 deletions(-)

diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index cf094c7eb..ae996957a 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -73,9 +46,9 @@ static void usage( bool more )
     std::cerr << "    --matching: output only matching records from stdin" << std::endl;
     std::cerr << "    --nearest: if --radius specified, output only nearest record" << std::endl;
     std::cerr << "    --not-matching: not matching records as read from stdin, no join performed" << std::endl;
-    std::cerr << "    --strict: fail, if id on stdin is not found, or there are multiple filter keys on --unique, etc" << std::endl;
+    std::cerr << "    --output-swap,--swap-output,--swap; output filter records first with the stdin record appended, a convenience option" << std::endl;
     std::cerr << "    --radius,--epsilon=<value>; compare keys in given radius; the keys will be interpreted as floating point numbers" << std::endl;
-    std::cerr << "    --swap-output,--swap; output filter records first with the stdin record appended, a convenience option" << std::endl;
+    std::cerr << "    --strict: fail, if id on stdin is not found, or there are multiple filter keys on --unique, etc" << std::endl;
     std::cerr << "    --unique,--unique-matches: expect only unique matches, exit with error otherwise" << std::endl;
     std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
     std::cerr << std::endl;
@@ -501,13 +474,13 @@ int main( int ac, char** av )
         flag_matching = options.exists( "--flag-matching" );
         radius = options.optional< double >( "--radius,--epsilon" );
         nearest = options.exists( "--nearest" );
-        swap_output = options.exists( "--swap-output,--swap" );
+        swap_output = options.exists( "--output-swap,--swap-output,--swap" );
         if( nearest && !radius ) { std::cerr << "csv-join: if using --nearest, please specify --radius" << std::endl; return 1; }
-        options.assert_mutually_exclusive( "--matching,--not-matching,--flag-matching,--swap-output,--swap" );
+        options.assert_mutually_exclusive( "--matching,--not-matching,--flag-matching,--swap-output,--swap,--output-swap" );
         options.assert_mutually_exclusive( "--radius,--epsilon,--first-matching" );
         options.assert_mutually_exclusive( "--radius,--epsilon,--string,-s,--double,--time" );
         stdin_csv = comma::csv::options( options );
-        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap,--output-swap,--nearest", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-join: please specify the second source" << std::endl; return 1; }
         if( unnamed.size() > 1 ) { std::cerr << "csv-join: expected one file or stream to join, got " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
         comma::name_value::parser parser( "filename", ';', '=', false );

From b928be8ea7dbecbc5f861143fac40505cbd4dbd0 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Mon, 24 Aug 2020 08:53:59 +1000
Subject: [PATCH 0188/1056] python/comma/csv/stream: bug fixed: for python3, if
 size is -1, read the whole stream till eof

---
 python/comma/csv/stream.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index afa5c7e64..4cb5015bc 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -162,7 +162,7 @@ def _read(self, size):
         if self.binary:
             if sys.version_info.major > 2: #if np.__version__ >= '1.16.0': # sigh...
                 if self.source == sys.stdin:
-                    b = sys.stdin.buffer.read( self.input_dtype.itemsize * ( size if size >= 0 else self.size ) )
+                    b = sys.stdin.buffer.read( ( size * self.input_dtype.itemsize ) if size >= 0 else -1 ) # b = sys.stdin.buffer.read( self.input_dtype.itemsize * ( size if size >= 0 else self.size ) )
                     # todo! test on streams where bytes come with irregular delays!
                     if len(b) % self.input_dtype.itemsize != 0: raise ValueError( "expected records of size {}, got {} bytes, which is not divisible by record size".format( self.input_dtype.itemsize, len( b ) ) )
                     return np.frombuffer( b, dtype = self.input_dtype, count = len( b ) // self.input_dtype.itemsize )

From 7e10280f7ac6bf6e2308c19d6dd94e929539f760 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 25 Aug 2020 19:26:13 +1000
Subject: [PATCH 0189/1056] csv-calc: --append-once implemented

---
 csv/applications/csv-calc.cpp | 59 ++++++++++++-----------------------
 1 file changed, 20 insertions(+), 39 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index d1791dad3..69e0cd6a2 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -1,31 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2020 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
@@ -35,8 +9,11 @@
 #include <io.h>
 #endif
 
+#include <deque>
 #include <iostream>
+#include <map>
 #include <type_traits>
+#include <unordered_set>
 #include <boost/bind.hpp>
 #include <boost/function.hpp>
 #include <boost/optional.hpp>
@@ -102,6 +79,7 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "<options>" << std::endl;
     std::cerr << "    --append: append statistics to each input line" << std::endl;
+    std::cerr << "    --append-once,--append-to-first: append statistics to first input line for each block and/or each id" << std::endl;
     std::cerr << "    --delimiter,-d <delimiter> : default ','" << std::endl;
     std::cerr << "    --fields,-f: field names for which the extents should be computed, default: all fields" << std::endl;
     std::cerr << "                 if 'block' field present, calculate block-wise" << std::endl;
@@ -1157,7 +1135,7 @@ struct Operation : public operation_base
 
 typedef boost::unordered_map< comma::uint32, std::vector< operation_base* >* > operations_map_t;
 typedef boost::unordered_map< comma::uint32, std::string > results_map_t;
-typedef std::vector< std::pair < comma::uint32, std::string > > Inputs;
+typedef std::deque< std::pair < comma::uint32, std::string > > inputs_t;
 
 class operations_battery_farm_t // all this pain is because operations polymorhism is too slow when there are a lot of ids
 {
@@ -1238,7 +1216,7 @@ static void output( const comma::csv::options& csv, results_map_t& results, boos
     results.clear();
 }
 
-static void append_and_output( const comma::csv::options& csv, Inputs& inputs, results_map_t& results )
+static void append_and_output( const comma::csv::options& csv, inputs_t& inputs, results_map_t& results, std::unordered_set< comma::uint32 >& ids )
 {
     for ( size_t i = 0; i < inputs.size(); ++i )
     {
@@ -1247,10 +1225,11 @@ static void append_and_output( const comma::csv::options& csv, Inputs& inputs, r
         const auto& r = results.find( inputs[i].first )->second;
         std::cout.write( &r[0], r.size() );
         if( !csv.binary() ) { std::cout << std::endl; }
-        if( csv.flush ) { std::cout.flush(); }
     }
+    if( csv.flush ) { std::cout.flush(); }
     results.clear();
     inputs.clear();
+    ids.clear();
 }
 
 static void calculate( const comma::csv::options& csv, operations_map_t& operations, results_map_t& results )
@@ -1289,7 +1268,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
-        std::vector< std::string > unnamed = options.unnamed( "--append,--flush,--output-fields,--output-format", "--binary,-b,--delimiter,-d,--format,--fields,-f,--output-fields" );
+        std::vector< std::string > unnamed = options.unnamed( "--append,--append-once,--append-to-first,--flush,--output-fields,--output-format", "--binary,-b,--delimiter,-d,--format,--fields,-f,--output-fields" );
         comma::csv::options csv( options );
         csv.full_xpath = false;
         std::cout.precision( csv.precision );
@@ -1315,11 +1294,13 @@ int main( int ac, char** av )
         else { ascii.reset( new ascii_input( csv, format ) ); }
         operations_map_t operations;
         results_map_t results;
-        Inputs inputs;
+        inputs_t inputs;
+        std::unordered_set< comma::uint32 > ids; // quick and dirty
         boost::optional< comma::uint32 > block = boost::make_optional< comma::uint32 >( false, 0 );
         bool has_block = csv.has_field( "block" );
         bool has_id = csv.has_field( "id" );
-        bool append = options.exists( "--append" );
+        bool append_once = options.exists( "--append-once,--append-to-first" );
+        bool append = options.exists( "--append" ) || append_once;
         if( options.exists( "--output-fields" ) )
         {
             std::vector < std::string > fields = comma::split(csv.fields, ',');
@@ -1360,21 +1341,21 @@ int main( int ac, char** av )
                 if( block && *block != v->block() ) 
                 {
                     calculate( csv, operations, results );
-                    if ( append ) { append_and_output( csv, inputs, results ); inputs.clear(); }
-                    else { output( csv, results, block, has_block, has_id ); }
+                    if ( append ) { append_and_output( csv, inputs, results, ids ); } else { output( csv, results, block, has_block, has_id ); }
                 }
                 block = v->block();
             }
             operations_map_t::iterator it = operations.find( v->id() );
-            if( it == operations.end() )
+            if( it == operations.end() ) { it = operations.insert( std::make_pair( v->id(), &operations_battery_farm.make( operations_parameters, v->format() ) ) ).first; }
+            if( append )
             {
-                it = operations.insert( std::make_pair( v->id(), &operations_battery_farm.make( operations_parameters, v->format() ) ) ).first;
+                if( !append_once || ids.find( v->id() ) == ids.end() ) { inputs.push_back( std::make_pair( v->id(), csv.binary() ? binary->line() : ascii->line() ) ); }
+                ids.insert( v->id() ); // quick and dirty
             }
-            if( append ) { inputs.push_back( std::make_pair( v->id(), csv.binary() ? binary->line() : ascii->line() ) ); }
             for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i]->push( v->buffer() ); }
         }
         calculate( csv, operations, results );
-        if ( append ) { append_and_output( csv, inputs, results ); }
+        if ( append ) { append_and_output( csv, inputs, results, ids ); }
         else { output( csv, results, block, has_block, has_id ); }
         return 0;
     }

From 1a43475c2e3632b4c3ff51b1573c51ca1928adab Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Sat, 29 Aug 2020 17:59:48 +1000
Subject: [PATCH 0190/1056] csv-time-join: in help, indicate that --bound is
 optional and --buffer has a value

---
 csv/applications/csv-time-join.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-time-join.cpp b/csv/applications/csv-time-join.cpp
index d22c054eb..12754c3d1 100644
--- a/csv/applications/csv-time-join.cpp
+++ b/csv/applications/csv-time-join.cpp
@@ -92,10 +92,10 @@ static void usage( bool verbose )
     std::cerr << "    --binary,-b <format>:       binary format" << std::endl;
     std::cerr << "    --delimiter,-d <delimiter>: ascii only; default ','" << std::endl;
     std::cerr << "    --fields,-f <fields>:       input fields; default: t" << std::endl;
-    std::cerr << "    --bound=<seconds>:          output only points within given bound" << std::endl;
+    std::cerr << "    --bound=[<seconds>]:        output only points within given bound" << std::endl;
     std::cerr << "    --do-not-append,--select:   do not append any field from the second input" << std::endl;
     std::cerr << "    --timestamp-only:           append only timestamp from the second input" << std::endl;
-    std::cerr << "    --buffer:                   bounding data buffer size; default: infinite" << std::endl;
+    std::cerr << "    --buffer=[<records>]:       bounding data buffer size; default: infinite" << std::endl;
     std::cerr << "    --discard-bounding:         discard bounding data if buffer size reached;" << std::endl;
     std::cerr << "                                default is to block until stdin catches up" << std::endl;
     std::cerr << std::endl;

From 6964c7ce87511e2beb57e1f1bc6a084669d0eb03 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 3 Sep 2020 20:51:01 +1000
Subject: [PATCH 0191/1056] csv-sort: --last: todo comments added

---
 csv/applications/csv-sort.cpp | 76 +++++++++++++++--------------------
 1 file changed, 32 insertions(+), 44 deletions(-)

diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index c2665e071..c29d5f1ef 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @authors matthew imhoff, dewey nguyen, vsevolod vlaskine
 
@@ -69,7 +42,8 @@ static void usage( bool more )
     std::cerr << "           fields" << std::endl;
     std::cerr << "               id: if present, multiple id fields accepted; output first record for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;
     std::cerr << "               block: if present; output minimum for each contiguous block" << std::endl;
-    std::cerr << "    --min: output only record(s) with minimum value for a given field." << std::endl;
+    std::cerr << "    --last: last line matching given keys; last line in the block, if block field present; no sorting will be done; if sorting required, use unique instead" << std::endl;
+    std::cerr << "    --min: output only record(s) with minimum value for a given field" << std::endl;
     std::cerr << "           fields" << std::endl;
     std::cerr << "               id: if present, multiple id fields accepted; output minimum for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;
     std::cerr << "               block: if present; output minimum for each contiguous block" << std::endl;
@@ -313,6 +287,30 @@ static int handle_first( comma::csv::input_stream< input_with_ids_t >& istream,
     return 0;
 }
 
+// todo?
+// static int handle_last( comma::csv::input_stream< input_with_ids_t >& istream, const std::string& first_line, const input_with_ids_t& default_input )
+// {
+//     typedef boost::unordered_set< comma::csv::impl::unstructured, comma::csv::impl::unstructured::hash > set_t;
+//     typedef boost::unordered_map< comma::csv::impl::unstructured, set_t, comma::csv::impl::unstructured::hash > map_t;
+//     map_t keys;
+//     comma::uint32 block = 0;
+//     if( !first_line.empty() )
+//     { 
+//         input_with_ids_t input = comma::csv::ascii< input_with_ids_t >( csv, default_input ).get( first_line );
+//         block = input.block;
+//         keys[ input.ids ].insert( input.keys );
+//         //std::cout << first_line << std::endl;
+//     }
+//     while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
+//     {
+//         const input_with_ids_t* p = istream.read();
+//         if( !p ) { break; }
+//         if( p->block != block ) { block = p->block; keys.clear(); }
+//         if( keys[ p->ids ].insert( p->keys ).second ) { output_last_( istream ); }
+//     }
+//     return 0;
+// }
+
 static int handle_sliding_window( comma::csv::input_stream< input_with_block >& istream, const std::string& first_line, const input_with_block& default_input, bool reverse, unsigned int sliding_window )
 {
     if( sliding_window < 2 ) { std::cerr << "csv-sort: expected sliding window greater than 1, got: " << sliding_window << std::endl; return 1; }
@@ -396,28 +394,20 @@ std::vector< comma::csv::impl::unstructured > input_order;
 
 void output_current_block( const limit_map_t& min, const limit_map_t& max )
 {
-    for( std::size_t i=0; i<input_order.size(); ++i )
+    for( std::size_t i = 0; i < input_order.size(); ++i )
     {
         const comma::csv::impl::unstructured& ids = input_order[i];
-        
         if( is_min )
         {
-            const limit_data_t& data = min.at(ids);
-            for ( std::size_t i=0; i<data.records.size(); ++i) {
-                std::cout.write( &( data.records[i][0] ), csv.binary() ? csv.format().size() : data.records[i].length() );
-            }
+            const limit_data_t& data = min.at( ids );
+            for( std::size_t i = 0; i < data.records.size(); ++i ) { std::cout.write( &( data.records[i][0] ), csv.binary() ? csv.format().size() : data.records[i].length() ); }
         }
-        
-        if( is_min && is_max && is_same_map[ ids ] ) { continue; }
-        
+        if( is_min && is_max && is_same_map[ids] ) { continue; }
         if( is_max )
         {
-            const limit_data_t& data = max.at(ids);
-            for ( std::size_t i=0; i<data.records.size(); ++i) {
-                std::cout.write( &( data.records[i][0] ), csv.binary() ? csv.format().size() : data.records[i].length() );
-            }
+            const limit_data_t& data = max.at( ids );
+            for( std::size_t i = 0; i < data.records.size(); ++i ) { std::cout.write( &( data.records[i][0] ), csv.binary() ? csv.format().size() : data.records[i].length() ); }
         }
-        
         if( csv.flush ) { std::cout.flush(); }
     }
 }
@@ -565,13 +555,11 @@ int handle_operations_with_ids( const comma::command_line_options& options )
                 }
                 else
                 {
-//                     std::cerr  << "found ids: " << p->ids.strings[0] << std::endl;
                     limit_data_t& data = iter->second;
                     if( *p < data.keys ) {}
                     else if( data.keys == *p ) { data.add_current_record( stdin_stream ); } //  std::cerr  << "equals " << std::endl; } // Else If equals then append
                     else
                     {
-//                         std::cerr  << "new max: " << p->ids.strings[0] << " " << p->keys.longs[0] << " " << data.keys.keys.longs[0] << std::endl;
                         data.keys = *p;
                         data.records.clear();
                         data.add_current_record( stdin_stream );

From 6d665621f7c19bd89a069180618ed5482f6fe678 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 3 Sep 2020 21:54:14 +1000
Subject: [PATCH 0192/1056] csv-update: minor refactoring

---
 csv/applications/csv-update.cpp | 53 +++------------------------------
 1 file changed, 4 insertions(+), 49 deletions(-)

diff --git a/csv/applications/csv-update.cpp b/csv/applications/csv-update.cpp
index 4778f02f2..decefba96 100644
--- a/csv/applications/csv-update.cpp
+++ b/csv/applications/csv-update.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -41,7 +14,6 @@
 #include <boost/unordered_map.hpp>
 #include <boost/graph/graph_concepts.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../csv/impl/unstructured.h"
@@ -59,25 +31,11 @@ static void usage( bool more )
     std::cerr << std::endl;
     std::cerr << "       if update input specified (update.csv above), update" << std::endl;
     std::cerr << "       records from stdin by the ones in the update file" << std::endl;
-    if( more )
-    {
-        std::cerr << "       todo" << std::endl;
-    }
-    else
-    {
-        std::cerr << "       ... use --help --verbose for more" << std::endl;
-    }
+    if( more ) { std::cerr << "       todo" << std::endl; } else { std::cerr << "       ... use --help --verbose for more" << std::endl; }
     std::cerr << std::endl;
     std::cerr << "       if update input not specified, apply updates received" << std::endl;
     std::cerr << "       on stdin itself" << std::endl;
-    if( more )
-    {
-        std::cerr << "       todo" << std::endl;
-    }
-    else
-    {
-        std::cerr << "       ... use --help --verbose for more" << std::endl;
-    }
+    if( more ) { std::cerr << "       todo" << std::endl; } else { std::cerr << "       ... use --help --verbose for more" << std::endl; }
     std::cerr << std::endl;
     std::cerr << "    fields:" << std::endl;
     std::cerr << "        block: block number" << std::endl;
@@ -109,7 +67,7 @@ static void usage( bool more )
     std::cerr << "    --update-non-empty-fields,--update-non-empty,-u:" << std::endl;
     std::cerr << "        if update has empty fields, use the field value from stdin (for binary, empty fields must be defined with --empty)" << std::endl;
     std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
-    if( more ) { std::cerr << std::endl << "csv options:" << std::endl << comma::csv::options::usage() << std::endl; }
+    if( more ) { std::cerr << std::endl << "csv options:" << std::endl << comma::csv::options::usage() << std::endl; } else { std::cerr << std::endl << "csv options ... use --help --verbose for more" << std::endl; }
     std::cerr << std::endl;
     if( more )
     {
@@ -154,8 +112,6 @@ static void usage( bool more )
         std::cerr << "examples ... use --help --verbose" << std::endl;
     }
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
     exit( 0 );
 }
 
@@ -244,8 +200,7 @@ static void output_and_clear( map_t::type& map, bool do_output, comma::csv::outp
         }
         for( output_map_t::const_iterator it = m.begin(); it != m.end(); ++it )
         {   
-            if( ostream ) { ostream->write( it->second->value, it->second->string ); }
-            else { std::cout << it->second->string; }
+            if( ostream ) { ostream->write( it->second->value, it->second->string ); } else { std::cout << it->second->string; }
         }
     }
     map.clear();

From e3504245fc066535653a3fedb5e01dd155a2fa36 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 1 Oct 2020 18:17:33 +1000
Subject: [PATCH 0193/1056] check.c++.standard.cmake: don't overwrite initial
 compiler flags when switching c++ standard

---
 CMakeFiles/check.c++.standard.cmake | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CMakeFiles/check.c++.standard.cmake b/CMakeFiles/check.c++.standard.cmake
index d734acf41..5e42f46d0 100644
--- a/CMakeFiles/check.c++.standard.cmake
+++ b/CMakeFiles/check.c++.standard.cmake
@@ -42,7 +42,7 @@
             message( FATAL_ERROR "attempt to use C++ standard ${CXX_STANDARD_TO_USE} but ${CMAKE_CXX_COMPILER} does not support it" )
         endif()
         SET( CXX_STANDARD_LAST ${CXX_STANDARD_TO_USE} CACHE STRING "updating C++ standard to use option" FORCE )
-        set( CMAKE_CXX_FLAGS "${extra_compiler_flags}" CACHE STRING "" FORCE )
+        set( CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${extra_compiler_flags}" CACHE STRING "" FORCE )
     ENDIF()
 
     set( CMAKE_CXX_STANDARD ${CXX_STANDARD_TO_USE} )

From 33c2efae5870507483ad1c2e5fe1fdd6632448c6 Mon Sep 17 00:00:00 2001
From: Kent Hu <khu.1998@icloud.com>
Date: Tue, 13 Oct 2020 16:31:32 +1100
Subject: [PATCH 0194/1056] csv-enumerate: --output-map binary output now
 complies with --help

---
 csv/applications/csv-enumerate.cpp | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-enumerate.cpp b/csv/applications/csv-enumerate.cpp
index 82a3e89c9..74bde27a5 100644
--- a/csv/applications/csv-enumerate.cpp
+++ b/csv/applications/csv-enumerate.cpp
@@ -49,7 +49,7 @@ static void usage( bool verbose )
     std::cerr << "options" << std::endl;
     std::cerr << "    --fields,-f=<fields>; fields of interest, actual field names do not matter; e.g: --fields ,,,a,,b,,,c" << std::endl;
     std::cerr << "    --format=<binary format>; if input is ascii and deducing data types may be ambiguous, define field types explicitly, value as in --binary" << std::endl;
-    std::cerr << "    --output-map,--map: do not output input records, only an unsorted records" << std::endl;
+    std::cerr << "    --output-map,--map: do not output input records, only an unsorted list of keys" << std::endl;
     std::cerr << "                        output fields" << std::endl;
     std::cerr << "                            - list of input key values; in same binary as input" << std::endl;
     std::cerr << "                            - corresponding enumeration index as ui" << std::endl;
@@ -104,11 +104,16 @@ int main( int ac, char** av )
         }
         input_t default_input;
         std::vector< std::string > v = comma::split( csv.fields, ',' );
+        std::vector< std::string > format; // quick and dirty
+        std::vector< std::string > s;
+        if( csv.binary() ) { format = comma::split( csv.format().expanded_string(), ',' ); }
         for( unsigned int i = 0; i < v.size(); ++i )
         {
             if( v[i].empty() ) { continue; }
             v[i] = default_input.append( f.offset( i ).type );
+            s.push_back( format[i] );
         }
+        std::string map_output_binary_format = comma::join( s, ',' );
         if( verbose ) { std::cerr << "csv-enumerate: fields " << csv.fields << " interpreted as: " << comma::join( v, ',' ) << std::endl; }
         csv.fields = comma::join( v, ',' );
         static map_t map;
@@ -140,7 +145,11 @@ int main( int ac, char** av )
         if( !output_map ) { return 0; }
         comma::csv::options output_map_csv;
         output_map_csv.delimiter = csv.delimiter;
-        if( csv.binary() ) { output_map_csv.format( comma::csv::format::value< input_t >( default_input ) + ",2ui" ); }
+        if( csv.binary() )
+        { 
+            output_map_csv.format( map_output_binary_format + ",2ui" ); //output_map_csv.format( comma::csv::format::value< input_t >( default_input ) + ",2ui" );
+            std::cerr << "csv-enumerate: binary output format for map: \"" << output_map_csv.format().string() << "\"" << std::endl;
+        }
         comma::csv::output_stream< map_t::value_type > omstream( std::cout, output_map_csv, std::make_pair( default_input, std::make_pair( 0, 0 ) ) );
         for( map_t::const_iterator it = map.begin(); it != map.end(); ++it ) { omstream.write( *it ); }
         return 0;

From fbb80bb138d6be11029ab8482cb6ff6e1cba9a53 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 16 Oct 2020 18:33:58 +1100
Subject: [PATCH 0195/1056] csv-paste: --head implemented

---
 csv/applications/csv-paste.cpp | 13 +++++++++----
 csv/test/csv-paste/expected    |  8 ++++++++
 csv/test/csv-paste/input       |  4 ++++
 3 files changed, 21 insertions(+), 4 deletions(-)

diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index 75c736079..04217cd92 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -71,6 +71,9 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --delimiter,-d <delimiter> : default ','" << std::endl;
+    std::cerr << "    --flush; flush stdout on every record" << std::endl;
+    std::cerr << "    --head=[<n>]; output first <n> records and exit; convenience option, e.g. try:" << std::endl;
+    std::cerr << "        csv-paste 'line-number;size=4' 'line-number;size=4;index' --head=16" << std::endl;
     std::cerr << "    --help,-h : help, --help --verbose for more help" << std::endl;
     std::cerr << "    --verbose,-v; more debug output" << std::endl;
     std::cerr << std::endl;
@@ -287,9 +290,11 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         char delimiter = options.value( "--delimiter,-d", ',' );
-        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--step,--block-size" );
+        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--step,--block-size,--head" );
+        bool flush = options.exists( "--flush" );
         boost::ptr_vector< source > sources;
         bool is_binary = false;
+        boost::optional< comma::uint32 > head = options.optional< comma::uint32 >( "--head" );
         for( unsigned int i = 0; i < unnamed.size(); ++i ) // quick and dirty; really lousy code duplication
         {
             if( unnamed[i].substr( 0, 6 ) == "value=" ) { if( value( unnamed[i] ).binary() ) { is_binary = true; } }
@@ -324,7 +329,7 @@ int main( int ac, char** av )
             std::size_t size = 0;
             for( unsigned int i = 0; i < sources.size(); ++i ) { size += sources[i].size(); }
             std::vector< char > buffer( size );
-            while( true )
+            while( !head || ( *head )-- )
             {
                 unsigned int streams = 0;
                 char* p = &buffer[0];
@@ -339,12 +344,12 @@ int main( int ac, char** av )
                     if( sources[i].is_stream() ) { ++streams; }
                 }
                 std::cout.write( &buffer[0], buffer.size() );
-                std::cout.flush();
+                if( flush ) { std::cout.flush(); }
             }
         }
         else
         {
-            while( true )
+            while( !head || ( *head )-- )
             {
                 std::ostringstream oss;
                 unsigned int streams = 0;
diff --git a/csv/test/csv-paste/expected b/csv/test/csv-paste/expected
index ae81fcb6c..2b8f54240 100644
--- a/csv/test/csv-paste/expected
+++ b/csv/test/csv-paste/expected
@@ -134,3 +134,11 @@ line_number/step[6]/output/line[8]="14"
 line_number/step[6]/output/line[9]="12"
 line_number/step[6]/status=0
 line_number/step[7]/status=1
+
+head[0]/output=""
+head[0]/status=0
+head[1]/output="0"
+head[1]/status=0
+head[2]/output/line[0]="0"
+head[2]/output/line[1]="1"
+head[2]/status=0
diff --git a/csv/test/csv-paste/input b/csv/test/csv-paste/input
index 331ba378d..de0b2313b 100644
--- a/csv/test/csv-paste/input
+++ b/csv/test/csv-paste/input
@@ -38,3 +38,7 @@ line_number/step[4]="csv-paste "line-number;block-size=5;index;step=2" | head; c
 line_number/step[5]="csv-paste "line-number;block-size=5;index;reverse;step=2" | head; comma_status_ok && exit 0 || exit 1"
 line_number/step[6]="csv-paste "line-number;block-size=5;index;reverse;begin=20;step=2" | head; comma_status_ok && exit 0 || exit 1"
 line_number/step[7]="csv-paste "line-number;block-size=5;index;reverse;begin=4;step=2" | head; comma_status_ok && exit 0 || exit 1"
+
+head[0]="csv-paste 'line-number;size=10;index' --head=0"
+head[1]="csv-paste 'line-number;size=10;index' --head=1"
+head[2]="csv-paste 'line-number;size=10;index' --head=2"

From 139a91091d23e97bd3720104d74d316427de3c31 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 20 Oct 2020 13:22:43 +1100
Subject: [PATCH 0196/1056] csv-fields: minor refactoring

---
 csv/applications/csv-fields.cpp | 89 +++++++++++++--------------------
 1 file changed, 35 insertions(+), 54 deletions(-)

diff --git a/csv/applications/csv-fields.cpp b/csv/applications/csv-fields.cpp
index e56d89efb..d8e46c66a 100644
--- a/csv/applications/csv-fields.cpp
+++ b/csv/applications/csv-fields.cpp
@@ -1,44 +1,16 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
+#include <functional>
 #include <iostream>
 #include <string>
 #include <set>
 #include <map>
-#include "../../application/contact_info.h"
+#include <unordered_map>
 #include "../../application/command_line_options.h"
 #include "../../string/string.h"
 
-using namespace comma;
-
 static void usage( bool )
 {
     std::cerr << std::endl;
@@ -95,9 +67,9 @@ static void usage( bool )
     std::cerr << std::endl;
     std::cerr << "    make-fixed: normalise input to a fixed number of fields" << std::endl;
     std::cerr << "        --count,--size=<n>: number of output fields" << std::endl;
+    std::cerr << "        --force: chop input to <n> fields if larger" << std::endl;
     std::cerr << "        --values=[<values>]: fill missing fields with given values" << std::endl;
     std::cerr << "                             if --count not specified, use number of <values> as desired number of fields" << std::endl;
-    std::cerr << "        --force: chop input to <n> fields if larger" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    numbers" << std::endl;
@@ -167,21 +139,19 @@ static void usage( bool )
     std::cerr << "        a,b,c" << std::endl;
     std::cerr << "        x,y,z" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 int main( int ac, char** av )
 {
     try
     {
-        command_line_options options( ac, av, usage );
+        comma::command_line_options options( ac, av, usage );
         std::string operation = "numbers";
         const std::vector< std::string > unnamed = options.unnamed( "--help,-h", "-.*" );
         char delimiter = options.value( "--delimiter,-d", ',' );
         if( !unnamed.empty() ) { operation = unnamed[0]; }
-        if( operation == "numbers" )
+        auto numbers = [&]()->int
         {
             int from = options.value( "--from", 1 );
             bool fill = options.exists( "--fill" );
@@ -207,8 +177,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "clear" )
+        };
+        auto clear = [&]()->int
         {
             options.assert_mutually_exclusive( "--except,--keep,--mask,--remove,--inverted-mask,--complement-mask,--unmask,--unmasked" );
             std::string keep = options.value< std::string >( "--keep,--except", "" );
@@ -261,8 +231,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "default" )
+        };
+        auto default_operation = [&]()->int
         {
             options.assert_mutually_exclusive( "--value,--values" );
             std::vector< std::string > defaults;
@@ -288,8 +258,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "prefix" )
+        };
+        auto prefix = [&]()->int
         {
             options.assert_mutually_exclusive( "--fields,--except" );
             const std::string& e = options.value< std::string >( "--except", "" );
@@ -321,8 +291,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "rename" )
+        };
+        auto rename = [&]()->int
         {
             const std::vector< std::string >& fields = comma::split( options.value< std::string >( "--fields" ), ',' );
             const std::vector< std::string >& to = comma::split( options.value< std::string >( "--to" ), ',' );
@@ -346,8 +316,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "strip" )
+        };
+        auto strip = [&]()->int
         {
             options.assert_mutually_exclusive( "--fields,--except" );
             const std::string& e = options.value< std::string >( "--except", "" );
@@ -376,8 +346,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "cut" )
+        };
+        auto cut = [&]()->int
         {
             options.assert_mutually_exclusive( "--except,--fields", "--empty" );
             bool except = options.exists( "--except" );
@@ -406,8 +376,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "has" )
+        };
+        auto has = [&]()->int
         {
             const std::string& f = options.value< std::string >( "--fields" );
             const std::vector< std::string >& v = comma::split( f, delimiter );
@@ -423,8 +393,8 @@ int main( int ac, char** av )
             if( !matches ) { return 1; }
             if( any ) { return 0; }
             return matches == fields.size() ? 0 : 1;
-        }
-        if( operation == "make-fixed" )
+        };
+        auto make_fixed = [&]()->int
         {
             const std::vector< std::string >& values = comma::split( options.value< std::string >( "--values", "" ), ',', true );
             const unsigned int count = options.value< unsigned int >( "--count,--size", values.size() );
@@ -450,8 +420,19 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        std::cerr << "csv-fields: expected operation, got: \"" << operation << "\"" << std::endl;
+        };
+        std::unordered_map< std::string, std::function< int() > > operations = { { "clear", clear }
+                                                                               , { "cut", cut }
+                                                                               , { "default", default_operation }
+                                                                               , { "has", has }
+                                                                               , { "make-fixed", make_fixed }
+                                                                               , { "numbers", numbers }
+                                                                               , { "prefix", prefix }
+                                                                               , { "rename", rename }
+                                                                               , { "strip", strip } };
+        auto o = operations.find( operation );
+        if( o != operations.end() ) { return o->second(); }
+        std::cerr << "csv-fields: expected operation, got '" << operation << "'" << std::endl;
         return 1;
     }
     catch( std::exception& ex ) { std::cerr << "csv-fields: " << ex.what() << std::endl; }

From 3015f021fee5732c20b7ba34afa8d273ed1b5113 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 20 Oct 2020 13:40:39 +1100
Subject: [PATCH 0197/1056] csv-enumerate: a trivial bug fixed

---
 csv/applications/csv-enumerate.cpp | 29 +----------------------------
 1 file changed, 1 insertion(+), 28 deletions(-)

diff --git a/csv/applications/csv-enumerate.cpp b/csv/applications/csv-enumerate.cpp
index 74bde27a5..31f6f0226 100644
--- a/csv/applications/csv-enumerate.cpp
+++ b/csv/applications/csv-enumerate.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -111,7 +84,7 @@ int main( int ac, char** av )
         {
             if( v[i].empty() ) { continue; }
             v[i] = default_input.append( f.offset( i ).type );
-            s.push_back( format[i] );
+            if( csv.binary() ) { s.push_back( format[i] ); }
         }
         std::string map_output_binary_format = comma::join( s, ',' );
         if( verbose ) { std::cerr << "csv-enumerate: fields " << csv.fields << " interpreted as: " << comma::join( v, ',' ) << std::endl; }

From 113e66d862ad1332ac6d00530c06283fd85a7c3f Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 20 Oct 2020 13:51:50 +1100
Subject: [PATCH 0198/1056] csv-enumerate: a basic unit test implemented

---
 csv/test/csv-enumerate/expected | 22 ++++++++++++++++++++++
 csv/test/csv-enumerate/input    | 10 ++++++++++
 2 files changed, 32 insertions(+)
 create mode 100644 csv/test/csv-enumerate/expected
 create mode 100644 csv/test/csv-enumerate/input

diff --git a/csv/test/csv-enumerate/expected b/csv/test/csv-enumerate/expected
new file mode 100644
index 000000000..5ef5ab006
--- /dev/null
+++ b/csv/test/csv-enumerate/expected
@@ -0,0 +1,22 @@
+ascii[0]/output=""
+ascii[0]/status=1
+ascii[1]/output/line[0]="0,x,a,0"
+ascii[1]/output/line[1]="1,y,b,1"
+ascii[1]/output/line[2]="0,x,c,0"
+ascii[1]/status=0
+ascii[2]/output/line[0]="0,1,a,0"
+ascii[2]/output/line[1]="1,y,b,1"
+ascii[2]/output/line[2]="0,1,c,0"
+ascii[2]/status=0
+
+binary[0]/output/line[0]="0,1,a,0"
+binary[0]/output/line[1]="1,y,b,1"
+binary[0]/output/line[2]="0,1,c,0"
+binary[0]/status=0
+
+map[0]/output/line[0]="1,y,1,1"
+map[0]/output/line[1]="0,x,0,2"
+map[0]/status=0
+map[1]/output/line[0]="1,y,1,1"
+map[1]/output/line[1]="0,x,0,2"
+map[1]/status=0
diff --git a/csv/test/csv-enumerate/input b/csv/test/csv-enumerate/input
new file mode 100644
index 000000000..bf136d6bd
--- /dev/null
+++ b/csv/test/csv-enumerate/input
@@ -0,0 +1,10 @@
+ascii[0]="( echo 0,x,a ; echo 1,y,b; echo 0,x,c ) | csv-enumerate"
+ascii[1]="( echo 0,x,a ; echo 1,y,b; echo 0,x,c ) | csv-enumerate --fields a,b"
+ascii[2]="( echo 0,1,a ; echo 1,y,b; echo 0,1,c ) | csv-enumerate --fields a,b --format ui,s[16],s[16]"
+
+binary[0]="( echo 0,1,a ; echo 1,y,b; echo 0,1,c ) | csv-to-bin ui,s[16],s[16] | csv-enumerate --fields a,b --binary ui,s[16],s[16] | csv-from-bin ui,s[16],s[16],ui"
+
+map[0]="( echo 0,x,a ; echo 1,y,b; echo 0,x,c ) | csv-enumerate --fields a,b --map | sed 's#\"##g' "
+map[1]="( echo 0,x,a ; echo 1,y,b; echo 0,x,c ) | csv-to-bin ui,s[16],s[16] | csv-enumerate --fields a,b --map --binary ui,s[16],s[16] | csv-from-bin ui,s[16],2ui | sed 's#\"##g' "
+
+

From 804ad47e1615905820e42b8371fdd2de157f713f Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 22 Oct 2020 20:38:22 +1100
Subject: [PATCH 0199/1056] csv-format: size operation implemented; csv-size:
 marked as deprecated

---
 csv/applications/csv-format.cpp | 44 +++++----------------------------
 csv/applications/csv-size.cpp   | 43 ++++++--------------------------
 2 files changed, 13 insertions(+), 74 deletions(-)

diff --git a/csv/applications/csv-format.cpp b/csv/applications/csv-format.cpp
index ab0b7bff6..26da4f331 100644
--- a/csv/applications/csv-format.cpp
+++ b/csv/applications/csv-format.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -33,9 +6,7 @@
 #include <iostream>
 #include <sstream>
 #include <string>
-#include <set>
 #include <boost/lexical_cast.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../csv/format.h"
 #include "../../string/string.h"
@@ -43,7 +14,7 @@
 using namespace comma;
 static const char *app_name = "csv-format";
 
-static void usage()
+static void usage( bool verbose = false )
 {
     std::cerr << std::endl;
     std::cerr << "usage: echo \"3f,2f,d\" | " << app_name << " [options] (expand|collapse|count|repeat)" << std::endl;
@@ -64,8 +35,6 @@ static void usage()
     std::cerr << "    repeat:" << std::endl;
     std::cerr << "        --count=n: replicate the format n times" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
     exit( 1 );
 }
 
@@ -116,19 +85,18 @@ int main( int ac, char** av )
 {
     try
     {
-        command_line_options options( ac, av );
-        if( options.exists( "--help,-h" ) ) { usage(); }
+        command_line_options options( ac, av, usage );
         const std::vector< std::string > unnamed = options.unnamed( "--help,-h", "-.*" );
-        if( unnamed.empty() )
-        { std::cerr << app_name << ": expected an operation (e.g. \"expand\")" << std::endl; return 1; }
-        if( unnamed.size() != 1 ) { usage(); }
+        if( unnamed.empty() ) { std::cerr << "csv-format: please specify operation" << std::endl; return 1; }
+        if( unnamed.size() > 1 ) { std::cerr << "csv-format: please only one operation" << std::endl; return 1; }
         std::string operation = unnamed[0];
         std::string line;
         std::function< void( const std::string& ) > handle;
         if( operation == "expand" ) { handle = [&]( const std::string& s ) { std::cout << comma::csv::format( s ).expanded_string() << std::endl; }; }
         else if( operation == "collapse" ) { handle = [&]( const std::string& s ) { std::cout << comma::csv::format( s ).collapsed_string() << std::endl; }; }
         else if( operation == "count" ) { handle = [&]( const std::string& s ) { std::cout << comma::csv::format( s ).count() << std::endl; }; }
-        else if( operation == "guess" ) { handle = [&]( const std::string& s )  {
+        else if( operation == "size" ) { handle = [&]( const std::string& s ) { std::cout << comma::csv::format( s ).size() << std::endl; }; }
+        else if( operation == "guess" ) { handle = [&]( const std::string& s ) {
                                                                                     static const std::vector< std::string >& e = comma::split( incomplete_expanded( options.value< std::string >( "--format", "" ) ), ',' );
                                                                                     static char delimiter = options.value( "--delimiter,-d", ',' );
                                                                                     const std::vector< std::string >& v = comma::split( s, delimiter );
diff --git a/csv/applications/csv-size.cpp b/csv/applications/csv-size.cpp
index 13ef66590..49592e31c 100644
--- a/csv/applications/csv-size.cpp
+++ b/csv/applications/csv-size.cpp
@@ -1,47 +1,20 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
 #include <iostream>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../csv/format.h"
 
 using namespace comma;
 
-static void usage()
+static void usage( bool verbose = false )
 {
     std::cerr << std::endl;
     std::cerr << "a convenience utility: output to stdout size of given binary format" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "DEPRECATED: use csv-format size" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "Usage: csv-size <format> [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
@@ -52,22 +25,20 @@ static void usage()
     std::cerr << "      csv-size 2d will output 16" << std::endl;
     std::cerr << "      csv-size 2d --count will output 2" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( -1 );
+    exit( 0 );
 }
 
 int main( int ac, char** av )
 {
     try
     {
-        command_line_options options( ac, av );
-        if( ac < 2 || options.exists( "--help" ) || options.exists( "-h" ) ) { usage(); }
+        command_line_options options( ac, av, usage );
+        if( ac < 2 ) { usage(); }
         comma::csv::format format( options.unnamed( "--count,-c", "" )[0] );
         std::cout << ( options.exists( "--count,-c" ) ? format.count() : format.size() ) << std::endl;
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << "csv-size: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-size: unknown exception" << std::endl; }
-    usage();
+    return 1;
 }

From ec3dbc7ea06daf80d1c04276d110f3ff589214f8 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 22 Oct 2020 20:57:18 +1100
Subject: [PATCH 0200/1056] csv-size: deprecated message added; csv-format
 size: documented in --help

---
 csv/applications/csv-format.cpp | 16 +++++++---------
 csv/applications/csv-size.cpp   |  1 +
 2 files changed, 8 insertions(+), 9 deletions(-)

diff --git a/csv/applications/csv-format.cpp b/csv/applications/csv-format.cpp
index 26da4f331..2f1812d8b 100644
--- a/csv/applications/csv-format.cpp
+++ b/csv/applications/csv-format.cpp
@@ -11,13 +11,10 @@
 #include "../../csv/format.h"
 #include "../../string/string.h"
 
-using namespace comma;
-static const char *app_name = "csv-format";
-
 static void usage( bool verbose = false )
 {
     std::cerr << std::endl;
-    std::cerr << "usage: echo \"3f,2f,d\" | " << app_name << " [options] (expand|collapse|count|repeat)" << std::endl;
+    std::cerr << "usage: echo \"3f,2f,d\" | csv-format [options] (expand|collapse|count|repeat)" << std::endl;
     std::cerr << std::endl;
     std::cerr << "perform various operations on format strings" << std::endl;
     std::cerr << std::endl;
@@ -27,6 +24,7 @@ static void usage( bool verbose = false )
     std::cerr << "    guess: take a csv string, output (roughly) guessed format; e.g: echo 20170101T000000,1,2,3 | csv-format guess --format ,,ui" << std::endl;
     std::cerr << "    expand: output fully expand format, e.g. 2i,3f -> i,i,f,f,f" << std::endl;
     std::cerr << "    repeat: replicate the format n times, e.g. 2i,3f --count 2 -> 2i,3f,2i,3f" << std::endl;
+    std::cerr << "    size: output format size in bytes, e.g: echo 2i,3f | csv-format size would output 20" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    guess:" << std::endl;
@@ -35,7 +33,7 @@ static void usage( bool verbose = false )
     std::cerr << "    repeat:" << std::endl;
     std::cerr << "        --count=n: replicate the format n times" << std::endl;
     std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 static std::string incomplete_expanded( const std::string& s ) // quick and dirty
@@ -85,7 +83,7 @@ int main( int ac, char** av )
 {
     try
     {
-        command_line_options options( ac, av, usage );
+        comma::command_line_options options( ac, av, usage );
         const std::vector< std::string > unnamed = options.unnamed( "--help,-h", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-format: please specify operation" << std::endl; return 1; }
         if( unnamed.size() > 1 ) { std::cerr << "csv-format: please only one operation" << std::endl; return 1; }
@@ -118,7 +116,7 @@ int main( int ac, char** av )
                                                                                         std::cout << std::endl;
                                                                                     }
                                                                                 }; }
-        else { std::cerr << app_name << ": expected operation; got: \"" << operation << "\"" << std::endl; return 1; }
+        else { std::cerr << "csv-format: expected operation; got: \"" << operation << "\"" << std::endl; return 1; }
         while( std::getline( std::cin, line ) )
         {
             const std::string& stripped = comma::strip( line );
@@ -126,7 +124,7 @@ int main( int ac, char** av )
         }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << app_name << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << app_name << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "csv-format: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-format: unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/applications/csv-size.cpp b/csv/applications/csv-size.cpp
index 49592e31c..4400b43e3 100644
--- a/csv/applications/csv-size.cpp
+++ b/csv/applications/csv-size.cpp
@@ -32,6 +32,7 @@ int main( int ac, char** av )
 {
     try
     {
+        std::cerr << "csv-size: DEPRECATED, use echo <format> | csv-format size" << std::endl;
         command_line_options options( ac, av, usage );
         if( ac < 2 ) { usage(); }
         comma::csv::format format( options.unnamed( "--count,-c", "" )[0] );

From 3487573404410c8afad98b9dd70f1d0eb9628702 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 26 Oct 2020 12:48:12 +1100
Subject: [PATCH 0201/1056] comma-timeout-group: reflowed help text to work on
 an 80-column term

---
 util/applications/comma-timeout-group.cpp | 153 +++++++++++++---------
 1 file changed, 94 insertions(+), 59 deletions(-)

diff --git a/util/applications/comma-timeout-group.cpp b/util/applications/comma-timeout-group.cpp
index 47fcf3d42..555e7a3fc 100644
--- a/util/applications/comma-timeout-group.cpp
+++ b/util/applications/comma-timeout-group.cpp
@@ -57,68 +57,99 @@ namespace {
 void usage( bool )
 {
     static char const * const msg_general =
-        "\nRun a given command with its arguments. Kill the command if it is still running after the given"
-        "\ntime duration."
+        "\nRun a given command with its arguments. Kill the command if it is still running"
+        "\nafter the given time duration."
         "\n"
-        "\nUsage:"
-        "\n    comma-timeout-group <options> duration command <args>"
+        "\nUsage: comma-timeout-group <options> duration command <args>"
         "\n"
-        "\nA drop-in replacement of the standard timeout(1) utility for most common usage patterns."
-        "\nThe capability to wait for all processes in a process group added."
+        "\nA drop-in replacement of the standard timeout(1) utility for most common usage"
+        "\npatterns. The capability to wait for all processes in a process group added."
 #ifndef HAVE_PROCPS_DEV
-        "\nWARNING: this new capability is not available in this build. Install procps (or procps-ng)"
-        "\ndevelopment package (containing headers and library) and recompile comma-timeout-group."
+        "\n"
+        "\nWARNING: this new capability is not available in this build. Install procps"
+        "\n(or procps-ng) development package (containing headers and library) and"
+        "\nrecompile comma-timeout-group."
 #endif
-        "\nSome options of timeout (1) are not supported, and, if given, this utility exits in error."
+        "\n"
+        "\nSome options of timeout(1) are not supported, and, if given, this utility exits"
+        "\nin error."
         "\n"
         "\nOptions:"
-        "\n    -h,--help, print this help and exit"
-        "\n    -v,--verbose, chat more"
-        "\n    --report-timeout, run silently but print a message if a command times out"
-        "\n    --verbose-signal-handler, print messages on stderr when sending signals within signal handler;"
-        "\n        WARNING: generally output routines are not re-entrant and shall not be invoked in signal"
-        "\n        handlers; use for debugging but not in production code"
-        "\n    --preserve-status, exit with the same status as <command>, even when the command timed out"
-        "\n    --foreground, not supported"
-        "\n    -k, --kill-after=duration, if the command is still running this long after the initial"
-        "\n        signal was sent, send the KILL signal to finish it off"
-        "\n    --wait-for-process-group=duration, after the initial signal, wait this time for all the processes"
-        "\n        in the current process group to finish; if some processes are still left, send the KILL signal"
-        "\n        to finish them off (same as -k duration); if both this option and '-k' is given, the duration"
-        "\n        specified by '-k' takes precedence"
+        "\n    -h,--help:                 print this help and exit"
+        "\n    -v,--verbose:              chat more"
+        "\n    --report-timeout:          run silently but print a message if a command"
+        "\n                               times out"
+        "\n    --verbose-signal-handler:  print messages on stderr when sending signals"
+        "\n                               within signal handler"
+        "\n"
+        "\n               WARNING: generally output routines are not re-entrant and should"
+        "\n               not be invoked in signal handlers; use for debugging but not in"
+        "\n               production code"
+        "\n"
+        "\n    --preserve-status:         exit with the same status as <command>, even when"
+        "\n                               the command timed out"
+        "\n    --foreground:              not supported"
+        "\n    -k, --kill-after=duration: if the command is still running this long after"
+        "\n                               the initial signal was sent, send the KILL"
+        "\n                               signal to finish it off"
+        "\n    --wait-for-process-group=<duration>:"
+        "\n                               after the initial signal, wait this time for all"
+        "\n                               the processes in the current process group to"
+        "\n                               finish; if some processes are still left send"
+        "\n                               the KILL signal to finish them off (same as -k"
+        "\n                               duration); if both this option and -k is given,"
+        "\n                               the duration specified by -k takes precedence"
 #ifndef HAVE_PROCPS_DEV
-        "\n        WARNING: your version of comma-timeout-group is built without procps support, the capability to"
-        "\n        wait for process group is not available, and this options is a synonym to '-k'"
+        "\n"
+        "\n               WARNING: your version of comma-timeout-group is built without"
+        "\n               procps support, the capability to wait for process group is not"
+        "\n               available, and this option is a synonym to -k"
+        "\n"
 #endif
-        "\n    --enforce-group, enforce waiting for process groups; if comma-timeout-group is built without procps"
-        "\n        support, '--wait-for-process-group' would exit in error rather then become a synonym to '-k';"
-        "\n        this option does nothing if procps support is built in"
-        "\n    --wait-for-process-group-delay=value, when waiting for all processes in the group to finish, a delay"
-        "\n        is inserted between each parsing of the process tree; the value in microseconds is passed to"
-        "\n        usleep (2), default is 100000 (0.1 s); note that low delay values make the program more"
-        "\n        responsive at the cost of higher CPU load when parsing the process tree"
+        "\n    --enforce-group:           enforce waiting for process groups; if"
+        "\n                               comma-timeout-group is built without procps"
+        "\n                               support, --wait-for-process-group would exit in"
+        "\n                               error rather than become a synonym to -k; this"
+        "\n                               option does nothing if procps support is built in"
+        "\n    --wait-for-process-group-delay=<value>:"
+        "\n                               when waiting for all processes in the group to"
+        "\n                               finish, a delay is inserted between each parsing"
+        "\n                               of the process tree; the value in microseconds is"
+        "\n                               passed to usleep(2), default is 100000 (0.1s);"
+        "\n                               note that low delay values make the program more"
+        "\n                               responsive at the cost of higher CPU load when"
+        "\n                               parsing the process tree"
 #ifndef HAVE_PROCPS_DEV
-        "\n        WARNING: your version of comma-timeout-group is built without procps support, this option"
-        "\n        has no effect"
+        "\n"
+        "\n               WARNING: your version of comma-timeout-group is built without"
+        "\n               procps support, this option has no effect"
+        "\n"
 #endif
-        "\n    -s, --signal=signal, the signal to be sent on timeout, given as a name (HUP, SIGHUP) or number;"
-        "\n        only a sub-set of all available signal names is supported, use '--list-known-signals' to list;"
-        "\n        arbitrary signal to use can be specified as a number, see 'kill -l' for the values;"
-        "\n        by default, use SIGTERM"
-        "\n    --list-known-signals, list the supported signals, one per line, and exit"
-        "\n    --can-wait-for-process-group, if built with procps library and can wait for process groups, exit"
-        "\n        with status success, otherwise, exit with failure"
+        "\n    -s, --signal=<signal>:     the signal to be sent on timeout, given as a name"
+        "\n                               (HUP, SIGHUP) or number; only a sub-set of all"
+        "\n                               available signal names is supported, use"
+        "\n                               --list-known-signals to list; arbitrary signal"
+        "\n                               to use can be specified as a number, see"
+        "\n                               'kill -l' for the values; by default, use SIGTERM"
+        "\n    --list-known-signals:      list the supported signals and exit"
+        "\n    --can-wait-for-process-group:"
+        "\n                               if built with procps library and can wait for"
+        "\n                               process groups, exit with status success,"
+        "\n                               otherwise, exit with failure"
+        "\n"
+        "\n    All the timeout durations are specified as floating point numbers with"
+        "\n    optional suffixes 's' for seconds (default), 'm' for minutes, 'h' for hours,"
+        "\n    and 'd' for days. The --wait-for-process-group option also accepts special"
+        "\n    duration 'forever' (equal to max double) as a literal string (no quotes)."
         "\n"
-        "\nAll the timeout durations are specified as floating point numbers with optional suffixes 's' for seconds,"
-        "\n(default), 'm' for minutes, 'h' for hours, and 'd' for days. The '--wait-for-process-group' option also"
-        "\n accepts special duration 'forever' (equal to max double) given as a literal string (no quotes). If both"
-        "\n'--kill-after and --wait-for-process-group' durations are specified, the former takes precedence."
+        "\n    If both --kill-after and --wait-for-process-group durations are specified,"
+        "\n    the former takes precedence."
         "\n"
         "\nReturn value:"
-        "\n    - if the command times out, exit with status 124"
-        "\n    - if the command does not exit on the first signal, and the KILL signal is sent, exit with"
-        "\n      status 128+9"
-        "\n    - otherwise, exit with the status of command"
+        "\n    * if the command times out, exit with status 124"
+        "\n    * if the command does not exit on the first signal, and the KILL signal is"
+        "\n      sent, exit with status 128+9"
+        "\n    * otherwise, exit with the status of command"
         "\n"
         "\nExamples:"
         "\n    Run an application:"
@@ -131,21 +162,25 @@ void usage( bool )
         "\n"
         "\n    Run an application, send KILL signal in 5 seconds if does not die:"
         "\n        comma-timeout-group -k 5 10 sleep 3"
-        "\n            if the application does not exit within 5 s in response to the first signal (TERM,"
-        "\n            default), send KILL signal"
+        "\n            if the application does not exit within 5 s in response to the first"
+        "\n            signal (TERM, default), send KILL signal"
         "\n"
         "\n    Pass custom signal:"
         "\n        comma-timeout-group --signal=USR1 10 sleep 3"
-        "\n            send USR1 after 10 s timeout"
-        "\n            send the bash process the USR1 signal if it is still running in 10 s after start"
-        "\n            send the entire process group the KILL signal if it is still running after another 5 s"
+        "\n            * send USR1 after 10s timeout"
+        "\n            * send the bash process the USR1 signal if it is still running 10s"
+        "\n              after start"
+        "\n            * send the entire process group the KILL signal if it is still"
+        "\n              running after another 5s"
         "\n"
         "\n    Wait for all processes in the group:"
-        "\n        comma-timeout-group --wait-for-process-group=5 10 application"
-        "\n            or"
-        "\n        comma-timeout-group --wait-for-process-group=5 10 application"
-        "\n            wait for 5 s for all processes in the group to exit; if some are left, send KILL"
-        "\n            if your version is built without procps support, however, the call above"
+        "\n        comma-timeout-group --wait-for-process-group=5 10 cmd"
+        "\n            wait for 5 s for all processes in the group to exit; if some are"
+        "\n            left, send KILL"
+        "\n        -or-"
+        "\n        comma-timeout-group --wait-for-process-group=5 --enforce-group 10 cmd"
+        "\n            as above, but if comma-timeout-group is built without procps support"
+        "\n            exit with error"
         "\n"
         "\n";
     std::cerr << msg_general << comma::contact_info << std::endl << std::endl;

From 9a19e5e990fb9b1567216a16484fa715192979e9 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 26 Oct 2020 19:17:15 +1100
Subject: [PATCH 0202/1056] util/applications/CMakeLists.txt: don't cache
 procps result on failure

so that we can check again next time in case the dev package has been installed
---
 util/applications/CMakeLists.txt | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/util/applications/CMakeLists.txt b/util/applications/CMakeLists.txt
index daffc41a6..3b5519214 100644
--- a/util/applications/CMakeLists.txt
+++ b/util/applications/CMakeLists.txt
@@ -17,6 +17,9 @@ if( NOT WIN32 )
             if( HAVE_PROCPS_SYSTEMD )
                 set_source_files_properties( comma-timeout-group.cpp PROPERTIES COMPILE_FLAGS "-DHAVE_PROCPS_DEV -DWITH_SYSTEMD" )
             endif( HAVE_PROCPS_SYSTEMD )
+        else()
+            # unset the cached result, so that we check again next time, in case the library is installed
+            unset( HAVE_PROCPS_DEV CACHE )
         endif( HAVE_PROCPS_DEV )
         target_link_libraries(comma-timeout-group ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_name_value ${LIBPROCPS} )
         INSTALL( TARGETS comma-timeout-group RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )

From 3ae324fdd131d27841ed01390c7cfc9252e874d2 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 28 Oct 2020 13:34:53 +1100
Subject: [PATCH 0203/1056] cmake: fixing cpack...

---
 CMakeLists.txt | 30 ++++++++++++++----------------
 1 file changed, 14 insertions(+), 16 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index e21f8de81..c6fffbdc0 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -323,33 +323,31 @@ ADD_SUBDIRECTORY( python )
 #if we set them up to install to bin they might be packaged through, e.g. roughly (using GLOB):
 #install(FILES "${Boost_LIBRARY_DIRS}/*.dll" DESTINATION bin )
 
-#the following set up optional parameters for cpack
-SET(CPACK_PACKAGE_NAME "comma")
-SET(CPACK_PACKAGE_DESCRIPTION_SUMMARY "Command line utilities to manipulate various structured and unstructured data from offline or real time data.")
-SET(CPACK_PACKAGE_VENDOR "Australian Centre for Field Robotics")
-SET(CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/COPYING")
-SET(CPACK_PACKAGE_VERSION_MAJOR "1")
-SET(CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE})
-SET(CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH})
-SET(CPACK_PACKAGE_CONTACT "t.teo@acfr.usyd.edu.au")
-
+set( CPACK_PACKAGE_NAME "comma" )
+set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "command line utilities to manipulate various structured and unstructured data from offline or realtime data" )
+set( CPACK_PACKAGE_VENDOR "orthographic" )
+set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/COPYING" )
+set( CPACK_GENERATOR "RPM" CACHE STRING "cpack generator: RPM or DEB" ) # default must be a generator name cpack recognises; override with -DCPACK_GENERATOR=DEB
+set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
+set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
+set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "libzmq5 (>= 4.2.5-1), libprocps6 (>= 2:3.3.0), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
+
+# this code needs a brush-up
 # If the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
 IF( BUILD_SHARED_LIBS )
-	SET(CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig")
+    SET(CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig")
 ENDIF( BUILD_SHARED_LIBS )
-
-
 IF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET(CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy")
     SET(CPACK_RPM_POST_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-post-install.sh" )
     SET(CPACK_RPM_PRE_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-pre-install.sh" )
-	# Prevents /tmp from permission change when installing RPM package
-	SET(CPACK_RPM_EXCLUDE_FROM_AUTO_FILELIST_ADDITION "/tmp" )
+    # Prevents /tmp from permission change when installing RPM package
+    SET(CPACK_RPM_EXCLUDE_FROM_AUTO_FILELIST_ADDITION "/tmp" )
 ELSE( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET(CPACK_RPM_PACKAGE_REQUIRES "boost-thread socat psmisc recode")
 ENDIF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
 
-
 #this line finds the appropriate Visual Studio DLLS in windows. Maybe it would find other dlls if a different build tool were used. Probably should be windows only.
 INCLUDE( InstallRequiredSystemLibraries )
 

From 6e41001c2688245d8b843922f479588060a32aba Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 28 Oct 2020 16:19:03 +1100
Subject: [PATCH 0204/1056] system/apt: in progress...

---
 system/apt/Dockerfile             |  8 ++++++++
 system/apt/comma-apt-cpack        | 20 ++++++++++++++++++++
 system/apt/comma-apt-docker-build |  6 ++++++
 system/apt/comma-apt-docker-run   | 15 +++++++++++++++
 4 files changed, 49 insertions(+)
 create mode 100644 system/apt/Dockerfile
 create mode 100755 system/apt/comma-apt-cpack
 create mode 100755 system/apt/comma-apt-docker-build
 create mode 100755 system/apt/comma-apt-docker-run

diff --git a/system/apt/Dockerfile b/system/apt/Dockerfile
new file mode 100644
index 000000000..f30988c19
--- /dev/null
+++ b/system/apt/Dockerfile
@@ -0,0 +1,8 @@
+ARG version
+FROM ubuntu:${version}
+ENV DEBIAN_FRONTEND="noninteractive"
+RUN apt update \
+    && apt install software-properties-common --yes \
+    && apt install --yes ansible git build-essential cmake cmake-curses-gui
+
+# && apt-add-repository --yes --update ppa:ansible/ansible \
diff --git a/system/apt/comma-apt-cpack b/system/apt/comma-apt-cpack
new file mode 100755
index 000000000..6c894bfe6
--- /dev/null
+++ b/system/apt/comma-apt-cpack
@@ -0,0 +1,20 @@
+#!/bin/bash
+
+version_major=$1
+version_minor=$2
+version_patch=$3
+comma_dir="$4"
+[[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
+[[ -n "$version_patch" ]] || { echo "usage: $0 <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
+echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.python3.yml'..." >&2
+ansible-playbook "$comma_dir/system/ansible/install.python3.yml"
+(
+    cd ~/src/comma/build
+    echo "$0: running cmake in $( pwd )" >&2
+    cmake -DCPACK_GENERATOR=DEB -DCPACK_PACKAGE_VERSION_MAJOR=$version_major -DCPACK_PACKAGE_VERSION_MINOR=$version_minor -DCPACK_PACKAGE_VERSION_PATCH=$version_patch
+    echo "$0: running cpack in $( pwd )" >&2
+    cmake cpack
+    cd ~/src/comma/python
+    echo "$0: setting up python in $( pwd )" >&2
+    python3 setup.py --command-packages=stdeb.command bdist_deb
+)
diff --git a/system/apt/comma-apt-docker-build b/system/apt/comma-apt-docker-build
new file mode 100755
index 000000000..61de002fb
--- /dev/null
+++ b/system/apt/comma-apt-docker-build
@@ -0,0 +1,6 @@
+#!/bin/bash
+version=$1
+comma_dir="$2"
+[[ -n "$version" ]] || { echo "usage: $0 <ubuntu version> [<comma dir>]; e.g. $0 20.04" >&2; exit 1; }
+[[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
+docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/apt/Dockerfile" .
diff --git a/system/apt/comma-apt-docker-run b/system/apt/comma-apt-docker-run
new file mode 100755
index 000000000..9b6e984ae
--- /dev/null
+++ b/system/apt/comma-apt-docker-run
@@ -0,0 +1,15 @@
+#!/bin/bash
+
+ubuntu_version=$1
+comma_version_major=$2
+comma_version_minor=$3
+comma_version_patch=$4
+comma_dir="$5"
+[[ -n "$comma_version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
+[[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
+
+docker run \
+       --mount type=bind,source=$comma_dir,target=/mnt/comma \
+       --mount type=bind,source=$( pwd ),target=/root/src/comma/build \
+       ubuntu.$ubuntu_version.build.basics \
+       /mnt/comma/system/apt/comma-apt-cpack $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma

From d6aa8cc93570bfd3e23f595bb820ba8f9dafd910 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 28 Oct 2020 19:16:59 +1100
Subject: [PATCH 0205/1056] system/apt: in progress...

---
 system/apt/comma-apt-cpack      | 16 ++++++++++------
 system/apt/comma-apt-docker-run |  2 +-
 2 files changed, 11 insertions(+), 7 deletions(-)

diff --git a/system/apt/comma-apt-cpack b/system/apt/comma-apt-cpack
index 6c894bfe6..a38222604 100755
--- a/system/apt/comma-apt-cpack
+++ b/system/apt/comma-apt-cpack
@@ -1,20 +1,24 @@
 #!/bin/bash
 
+function die() { echo "$0: $@" >&2; exit 1; }
+
 version_major=$1
 version_minor=$2
 version_patch=$3
 comma_dir="$4"
 [[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
 [[ -n "$version_patch" ]] || { echo "usage: $0 <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
-echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.python3.yml'..." >&2
-ansible-playbook "$comma_dir/system/ansible/install.python3.yml"
+cd ~
+echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.python3.yml' in $( pwd )..." >&2
+ansible-playbook "$comma_dir/system/ansible/install.python3.yml" || die "failed"
 (
-    cd ~/src/comma/build
+    cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
-    cmake -DCPACK_GENERATOR=DEB -DCPACK_PACKAGE_VERSION_MAJOR=$version_major -DCPACK_PACKAGE_VERSION_MINOR=$version_minor -DCPACK_PACKAGE_VERSION_PATCH=$version_patch
+    cmake . -DCPACK_GENERATOR=DEB -DCPACK_PACKAGE_VERSION_MAJOR=$version_major -DCPACK_PACKAGE_VERSION_MINOR=$version_minor -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
-    cmake cpack
+    cmake cpack || die "failed"
     cd ~/src/comma/python
     echo "$0: setting up python in $( pwd )" >&2
-    python3 setup.py --command-packages=stdeb.command bdist_deb
+    python3 setup.py --command-packages=stdeb.command bdist_deb  || die "failed"
+    echo "$0: done" >&2
 )
diff --git a/system/apt/comma-apt-docker-run b/system/apt/comma-apt-docker-run
index 9b6e984ae..e3d6df41a 100755
--- a/system/apt/comma-apt-docker-run
+++ b/system/apt/comma-apt-docker-run
@@ -10,6 +10,6 @@ comma_dir="$5"
 
 docker run \
        --mount type=bind,source=$comma_dir,target=/mnt/comma \
-       --mount type=bind,source=$( pwd ),target=/root/src/comma/build \
+       --mount type=bind,source=$( pwd ),target=/root/build/comma \
        ubuntu.$ubuntu_version.build.basics \
        /mnt/comma/system/apt/comma-apt-cpack $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma

From b67af098de0ba9437a0527297db38f234a6501c8 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 28 Oct 2020 19:24:37 +1100
Subject: [PATCH 0206/1056] system/apt: typo fixed; in progress...

---
 system/apt/comma-apt-cpack | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/apt/comma-apt-cpack b/system/apt/comma-apt-cpack
index a38222604..54cb3bfd5 100755
--- a/system/apt/comma-apt-cpack
+++ b/system/apt/comma-apt-cpack
@@ -16,7 +16,7 @@ ansible-playbook "$comma_dir/system/ansible/install.python3.yml" || die "failed"
     echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB -DCPACK_PACKAGE_VERSION_MAJOR=$version_major -DCPACK_PACKAGE_VERSION_MINOR=$version_minor -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
-    cmake cpack || die "failed"
+    cpack || die "failed"
     cd ~/src/comma/python
     echo "$0: setting up python in $( pwd )" >&2
     python3 setup.py --command-packages=stdeb.command bdist_deb  || die "failed"

From 3b948c57edf4a662c68c9cdc040c34ea4b818a24 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 28 Oct 2020 19:34:30 +1100
Subject: [PATCH 0207/1056] system/apt: maintainer added; in progress...

---
 CMakeLists.txt | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index c6fffbdc0..e5b7f894d 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -332,6 +332,7 @@ set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "libzmq5 (>= 4.2.5-1), libprocps6 (>= 2:3.3.0), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
+set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 
 # this code needs a brush-up
 # If the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.

From 88e670f86545148bbbe17317006a72cdaba0687b Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Wed, 28 Oct 2020 19:38:39 +1100
Subject: [PATCH 0208/1056] system/apt: readme added; in progress...

---
 system/apt/readme | 16 ++++++++++++++++
 1 file changed, 16 insertions(+)
 create mode 100644 system/apt/readme

diff --git a/system/apt/readme b/system/apt/readme
new file mode 100644
index 000000000..4872a8310
--- /dev/null
+++ b/system/apt/readme
@@ -0,0 +1,16 @@
+to build docker that has ansible, cmake, etc, run:
+
+> comma-apt-docker-build 18.04 # ubuntu 18.04
+> comma-apt-docker-build 20.04 # ubuntu 20.04
+
+to build deb package e.g. for comma version 1.2.3 for ubuntu 20.04 run:
+
+> comma-apt-docker-build 20.04 1 2 3
+
+if your comma reposity is not in ~/src/comma, but e.g. in ~/my/src/comma, run:
+
+to build deb package e.g. for comma version 1.2.3 for ubuntu 20.04 run:
+
+> comma-apt-docker-build 20.04 1 2 3 ~/my/src/comma
+
+debian package will be built in your current directory

From 7d5ea9d7625f5f4dd01a4810a38c1ebc80770db4 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 28 Oct 2020 22:31:38 +1100
Subject: [PATCH 0209/1056] system/apt: readme brushed up

---
 system/apt/readme | 12 +++++-------
 1 file changed, 5 insertions(+), 7 deletions(-)

diff --git a/system/apt/readme b/system/apt/readme
index 4872a8310..a0e9ec923 100644
--- a/system/apt/readme
+++ b/system/apt/readme
@@ -1,16 +1,14 @@
-to build docker that has ansible, cmake, etc, run:
+to build docker that has ansible, cmake, etc, run (you may need to run as sudo - am not sure why; try without sudo first):
 
-> comma-apt-docker-build 18.04 # ubuntu 18.04
-> comma-apt-docker-build 20.04 # ubuntu 20.04
+> ./comma-apt-docker-build 18.04 # ubuntu 18.04
+> ./comma-apt-docker-build 20.04 # ubuntu 20.04
 
 to build deb package e.g. for comma version 1.2.3 for ubuntu 20.04 run:
 
-> comma-apt-docker-build 20.04 1 2 3
+> ./comma-apt-docker-build 20.04 1 2 3
 
 if your comma reposity is not in ~/src/comma, but e.g. in ~/my/src/comma, run:
 
-to build deb package e.g. for comma version 1.2.3 for ubuntu 20.04 run:
-
-> comma-apt-docker-build 20.04 1 2 3 ~/my/src/comma
+> ./comma-apt-docker-run 20.04 1 2 3 ~/my/src/comma
 
 debian package will be built in your current directory

From 6a783756e89f4dbf707207d1a9b08d675dd25c26 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 12:23:11 +1100
Subject: [PATCH 0210/1056] system/apt: disabled building a separate python
 package; in progress...

---
 system/apt/comma-apt-cpack      |  6 +++---
 system/apt/comma-apt-docker-run | 10 +++++++---
 2 files changed, 10 insertions(+), 6 deletions(-)

diff --git a/system/apt/comma-apt-cpack b/system/apt/comma-apt-cpack
index 54cb3bfd5..80fe95233 100755
--- a/system/apt/comma-apt-cpack
+++ b/system/apt/comma-apt-cpack
@@ -17,8 +17,8 @@ ansible-playbook "$comma_dir/system/ansible/install.python3.yml" || die "failed"
     cmake . -DCPACK_GENERATOR=DEB -DCPACK_PACKAGE_VERSION_MAJOR=$version_major -DCPACK_PACKAGE_VERSION_MINOR=$version_minor -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
     cpack || die "failed"
-    cd ~/src/comma/python
-    echo "$0: setting up python in $( pwd )" >&2
-    python3 setup.py --command-packages=stdeb.command bdist_deb  || die "failed"
+    #cd ~/src/comma/python
+    #echo "$0: setting up python in $( pwd )" >&2
+    #python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
     echo "$0: done" >&2
 )
diff --git a/system/apt/comma-apt-docker-run b/system/apt/comma-apt-docker-run
index e3d6df41a..21b54b211 100755
--- a/system/apt/comma-apt-docker-run
+++ b/system/apt/comma-apt-docker-run
@@ -8,8 +8,12 @@ comma_dir="$5"
 [[ -n "$comma_version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
 [[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
 
+rm -rf build
+mkdir build -p
 docker run \
-       --mount type=bind,source=$comma_dir,target=/mnt/comma \
-       --mount type=bind,source=$( pwd ),target=/root/build/comma \
+       --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
+       --mount "type=bind,source=$( pwd )/build,target=/root/build/comma" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/apt/comma-apt-cpack $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma
+       /mnt/comma/system/apt/comma-apt-cpack $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
+cp build/comma-$comma_version_major.$comma_version_minor.$comma_version_patch-Linux.deb .
+rm -rf build

From b6f984edf756711c25c7c46bd6c578417ab072b1 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 12:52:00 +1100
Subject: [PATCH 0211/1056] system/apt: testing package

---
 system/apt/comma-apt-docker-run                  |  4 ++--
 system/apt/comma-apt-docker-test                 | 16 ++++++++++++++++
 .../{comma-apt-cpack => comma-apt-package-make}  |  0
 system/apt/comma-apt-package-test                | 13 +++++++++++++
 system/apt/readme                                |  5 +++++
 5 files changed, 36 insertions(+), 2 deletions(-)
 create mode 100755 system/apt/comma-apt-docker-test
 rename system/apt/{comma-apt-cpack => comma-apt-package-make} (100%)
 create mode 100755 system/apt/comma-apt-package-test

diff --git a/system/apt/comma-apt-docker-run b/system/apt/comma-apt-docker-run
index 21b54b211..aba18b287 100755
--- a/system/apt/comma-apt-docker-run
+++ b/system/apt/comma-apt-docker-run
@@ -14,6 +14,6 @@ docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$( pwd )/build,target=/root/build/comma" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/apt/comma-apt-cpack $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
+       /mnt/comma/system/apt/comma-apt-package-make $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
 cp build/comma-$comma_version_major.$comma_version_minor.$comma_version_patch-Linux.deb .
-rm -rf build
+sudo rm -rf build
diff --git a/system/apt/comma-apt-docker-test b/system/apt/comma-apt-docker-test
new file mode 100755
index 000000000..e4882de8d
--- /dev/null
+++ b/system/apt/comma-apt-docker-test
@@ -0,0 +1,16 @@
+#!/bin/bash
+
+function die() { echo "$0: $@" >&2; exit 1; }
+
+package="$1"
+comma_dir="$2"
+[[ -n "$package" ]] || { echo "usage: $0 <package> [<comma dir>]" >&2; exit 1; }
+[[ -s "$package" ]] || die "file not found or empty: '$package'"
+[[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
+package_dir=$( dirname "$( realpath "$package" )" )
+
+docker run \
+       --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
+       --mount "type=bind,source=$package_dir,target=/mnt/package" \
+       ubuntu.$ubuntu_version.build.basics \
+       /mnt/comma/system/apt/comma-apt-package-test "/mnt/package/$( basename "$package" )" || { echo "$0: failed" >&2; exit 1; }
diff --git a/system/apt/comma-apt-cpack b/system/apt/comma-apt-package-make
similarity index 100%
rename from system/apt/comma-apt-cpack
rename to system/apt/comma-apt-package-make
diff --git a/system/apt/comma-apt-package-test b/system/apt/comma-apt-package-test
new file mode 100755
index 000000000..91b2eef56
--- /dev/null
+++ b/system/apt/comma-apt-package-test
@@ -0,0 +1,13 @@
+#!/bin/bash
+
+package="$1"
+[[ -n "$package" ]] || { echo "usage: $0 <package>" >&2; exit 1; }
+apt install --yes "$package"
+
+echo '======================================' >&2
+ls /usr/bin/csv-* | cat >&2
+echo '======================================' >&2
+
+csv-paste line-number | csv-to-bin ui | csv-from-bin ui | head >&2
+
+echo '======================================' >&2
diff --git a/system/apt/readme b/system/apt/readme
index a0e9ec923..60045ac16 100644
--- a/system/apt/readme
+++ b/system/apt/readme
@@ -12,3 +12,8 @@ if your comma reposity is not in ~/src/comma, but e.g. in ~/my/src/comma, run:
 > ./comma-apt-docker-run 20.04 1 2 3 ~/my/src/comma
 
 debian package will be built in your current directory
+
+test that package is ok
+
+> ./comma-apt-docker-test comma-1.0.0-Linux.deb
+

From 1fd29778d2b125d6b72db67a314192e879efa311 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 12:54:14 +1100
Subject: [PATCH 0212/1056] system/apt: testing package...

---
 system/apt/comma-apt-docker-test | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/system/apt/comma-apt-docker-test b/system/apt/comma-apt-docker-test
index e4882de8d..7c80859c9 100755
--- a/system/apt/comma-apt-docker-test
+++ b/system/apt/comma-apt-docker-test
@@ -2,9 +2,10 @@
 
 function die() { echo "$0: $@" >&2; exit 1; }
 
-package="$1"
-comma_dir="$2"
-[[ -n "$package" ]] || { echo "usage: $0 <package> [<comma dir>]" >&2; exit 1; }
+ubuntu_version="$1"
+package="$2"
+comma_dir="$3"
+[[ -n "$package" ]] || { echo "usage: $0 <ubuntu version> <package> [<comma dir>]" >&2; exit 1; }
 [[ -s "$package" ]] || die "file not found or empty: '$package'"
 [[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
 package_dir=$( dirname "$( realpath "$package" )" )

From de976d012377c0b5b966af29025771b617435e16 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 13:00:01 +1100
Subject: [PATCH 0213/1056] system/apt: renamed to system/package

---
 system/{apt => package}/Dockerfile                   |  0
 .../comma-package-docker-build}                      |  2 +-
 .../comma-package-docker-run}                        |  2 +-
 .../comma-package-docker-test}                       |  2 +-
 .../comma-package-make}                              |  0
 .../comma-package-test}                              |  4 +++-
 system/{apt => package}/readme                       | 12 ++++++------
 7 files changed, 12 insertions(+), 10 deletions(-)
 rename system/{apt => package}/Dockerfile (100%)
 rename system/{apt/comma-apt-docker-build => package/comma-package-docker-build} (80%)
 rename system/{apt/comma-apt-docker-run => package/comma-package-docker-run} (92%)
 rename system/{apt/comma-apt-docker-test => package/comma-package-docker-test} (90%)
 rename system/{apt/comma-apt-package-make => package/comma-package-make} (100%)
 rename system/{apt/comma-apt-package-test => package/comma-package-test} (73%)
 rename system/{apt => package}/readme (53%)

diff --git a/system/apt/Dockerfile b/system/package/Dockerfile
similarity index 100%
rename from system/apt/Dockerfile
rename to system/package/Dockerfile
diff --git a/system/apt/comma-apt-docker-build b/system/package/comma-package-docker-build
similarity index 80%
rename from system/apt/comma-apt-docker-build
rename to system/package/comma-package-docker-build
index 61de002fb..8c9faa137 100755
--- a/system/apt/comma-apt-docker-build
+++ b/system/package/comma-package-docker-build
@@ -3,4 +3,4 @@ version=$1
 comma_dir="$2"
 [[ -n "$version" ]] || { echo "usage: $0 <ubuntu version> [<comma dir>]; e.g. $0 20.04" >&2; exit 1; }
 [[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
-docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/apt/Dockerfile" .
+docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/package/Dockerfile" .
diff --git a/system/apt/comma-apt-docker-run b/system/package/comma-package-docker-run
similarity index 92%
rename from system/apt/comma-apt-docker-run
rename to system/package/comma-package-docker-run
index aba18b287..8eaec95ef 100755
--- a/system/apt/comma-apt-docker-run
+++ b/system/package/comma-package-docker-run
@@ -14,6 +14,6 @@ docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$( pwd )/build,target=/root/build/comma" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/apt/comma-apt-package-make $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
+       /mnt/comma/system/package/comma-package-make $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
 cp build/comma-$comma_version_major.$comma_version_minor.$comma_version_patch-Linux.deb .
 sudo rm -rf build
diff --git a/system/apt/comma-apt-docker-test b/system/package/comma-package-docker-test
similarity index 90%
rename from system/apt/comma-apt-docker-test
rename to system/package/comma-package-docker-test
index 7c80859c9..d0b888693 100755
--- a/system/apt/comma-apt-docker-test
+++ b/system/package/comma-package-docker-test
@@ -14,4 +14,4 @@ docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$package_dir,target=/mnt/package" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/apt/comma-apt-package-test "/mnt/package/$( basename "$package" )" || { echo "$0: failed" >&2; exit 1; }
+       /mnt/comma/system/package/comma-package-test "/mnt/package/$( basename "$package" )" || { echo "$0: failed" >&2; exit 1; }
diff --git a/system/apt/comma-apt-package-make b/system/package/comma-package-make
similarity index 100%
rename from system/apt/comma-apt-package-make
rename to system/package/comma-package-make
diff --git a/system/apt/comma-apt-package-test b/system/package/comma-package-test
similarity index 73%
rename from system/apt/comma-apt-package-test
rename to system/package/comma-package-test
index 91b2eef56..411c86f0f 100755
--- a/system/apt/comma-apt-package-test
+++ b/system/package/comma-package-test
@@ -1,8 +1,10 @@
 #!/bin/bash
 
+function die() { echo "$0: $@" >&2; exit 1; }
+
 package="$1"
 [[ -n "$package" ]] || { echo "usage: $0 <package>" >&2; exit 1; }
-apt install --yes "$package"
+apt install --yes "$package" || die "failed to install package '$package'"
 
 echo '======================================' >&2
 ls /usr/bin/csv-* | cat >&2
diff --git a/system/apt/readme b/system/package/readme
similarity index 53%
rename from system/apt/readme
rename to system/package/readme
index 60045ac16..5cde855c0 100644
--- a/system/apt/readme
+++ b/system/package/readme
@@ -1,19 +1,19 @@
 to build docker that has ansible, cmake, etc, run (you may need to run as sudo - am not sure why; try without sudo first):
 
-> ./comma-apt-docker-build 18.04 # ubuntu 18.04
-> ./comma-apt-docker-build 20.04 # ubuntu 20.04
+> ./comma-package-docker-build 18.04 # ubuntu 18.04
+> ./comma-package-docker-build 20.04 # ubuntu 20.04
 
 to build deb package e.g. for comma version 1.2.3 for ubuntu 20.04 run:
 
-> ./comma-apt-docker-build 20.04 1 2 3
+> ./comma-package-docker-build 20.04 1 2 3
 
 if your comma reposity is not in ~/src/comma, but e.g. in ~/my/src/comma, run:
 
-> ./comma-apt-docker-run 20.04 1 2 3 ~/my/src/comma
+> ./comma-package-docker-run 20.04 1 2 3 ~/my/src/comma
 
 debian package will be built in your current directory
 
-test that package is ok
+test that package is ok, e.g:
 
-> ./comma-apt-docker-test comma-1.0.0-Linux.deb
+> ./comma-package-docker-test 20.04 comma-1.0.0-Linux.deb
 

From 9c529d5800735ca3dfd6d4482b0c36a2d11af5cc Mon Sep 17 00:00:00 2001
From: Kent Hu <khu.1998@icloud.com>
Date: Thu, 29 Oct 2020 13:20:02 +1100
Subject: [PATCH 0214/1056] csv-random: true-random: implemented --type,
 updated usage

---
 csv/applications/csv-random.cpp | 96 +++++++++++++++++++++------------
 1 file changed, 61 insertions(+), 35 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 277d84d1f..ff415e1ae 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -79,8 +79,8 @@ static void usage( bool verbose )
     std::cerr << "operations" << std::endl;
     std::cerr << "    make: output pseudo-random numbers" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "        usage: csv-random make <options> > random.csv" << std::endl;
-    std::cerr << "               cat records.csv | csv-random make --append <options> > appended.csv" << std::endl;
+    std::cerr << "        usage: csv-random make [<options>] > random.csv" << std::endl;
+    std::cerr << "               cat records.csv | csv-random make --append [<options>] > appended.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --append; append random numbers to stdin input" << std::endl;
@@ -94,10 +94,12 @@ static void usage( bool verbose )
     std::cerr << "                 e.g. a hardware device, output will be pseudo-random" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        usage: csv-random true-random [<options>]" << std::endl;
+    std::cerr << "               cat records.csv | csv-random true-random --append <options> > appended.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --append; append random number to stdin input" << std::endl;
     std::cerr << "            --once; output random number only once" << std::endl;
+    std::cerr << "            --output-binary; output random numbers as binary, or specify --binary=<format> for stdin input" << std::endl;
     std::cerr << "            --type=<type>; default=ui; todo: supported values: ui; e.g: --type=3ui; --type=ui,ui,ui; etc" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        example" << std::endl;
@@ -147,19 +149,19 @@ namespace comma { namespace applications { namespace random {
 template < typename T >
 struct type_traits
 {
-    static T cast( T t ) { return t; }
+    static T cast( const T t ) { return t; }
 };
 
 template <>
 struct type_traits< char >
 {
-    static int cast( char t ) { return static_cast< int >( t ); }
+    static int cast( const char t ) { return static_cast< int >( t ); }
 };
 
 template <>
 struct type_traits< unsigned char >
 {
-    static unsigned int cast( unsigned char t ) { return static_cast< int >( t ); }
+    static unsigned int cast( const unsigned char t ) { return static_cast< int >( t ); }
 };
 
 namespace make {
@@ -406,58 +408,82 @@ static int run( const comma::command_line_options& options )
 
 namespace true_random {
 
-static int run( const comma::command_line_options& options )
+template < typename T >
+static int run_impl( const comma::command_line_options& options, std::size_t count )
 {
     std::random_device rd;
-    bool binary = options.exists( "--output-binary" ) || ::csv.binary();
-    if( options.exists( "--once" ) )
+    const bool binary = options.exists( "--output-binary" ) || ::csv.binary();
+    const bool flush = options.exists( "--flush" ) || ::csv.flush;
+    auto output_line_to_stdout = [&]( std::string&& initial_delimiter )
     {
-        auto r = rd();
-        if ( binary ) { std::cout.write( reinterpret_cast< char * >( &r ), sizeof( r ) ); }
-        else { std::cout << r << std::endl; }
-        return 0;
-    }
+        for( std::size_t i = 0; i < count; ++i )
+        {
+            const T r = rd();
+            if( binary ) { std::cout.write( reinterpret_cast< const char* >( &r ), sizeof( T ) ); }
+            else { std::cout << std::exchange( initial_delimiter, ::csv.delimiter ) << type_traits< T >::cast( r ); }
+        }
+        if( !binary ) { std::cout << std::endl; }
+        if( flush ) { std::cout << std::flush; }
+    };
     if( options.exists( "--append" ) )
     {
-        if( ::csv.binary() )
+        while( std::cin.good() )
         {
-            std::vector< char > buf( ::csv.format().size() );
-            while( std::cin.good() )
+            auto buf = ::csv.binary() ? std::string( ::csv.format().size(), {} ) : std::string{};
+            if( ::csv.binary() )
             {
                 std::cin.read( &buf[0], buf.size() );
-                if( std::cin.gcount() == 0 ) { break; }
-                if( std::cin.gcount() != static_cast< int >( buf.size() ) ) { std::cerr << "csv-random true-random: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
-                std::cout.write( &buf[0], buf.size() );
-                auto r = rd();
-                std::cout.write( reinterpret_cast< char* >( &r ), sizeof( r ) );
-                if( ::csv.flush ) { std::cout.flush(); }
+                if( std::cin.gcount() == 0 ) { return 0; }
+                if( std::cin.gcount() != static_cast< int >( buf.size() ) )
+                {
+                    std::cerr << "csv-random true-random: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl;
+                    return 1;
+                }
             }
-        }
-        else
-        {
-            while( std::cin.good() )
+            else
             {
-                std::string s;
-                std::getline( std::cin, s );
-                if( s.empty() ) { continue; }
-                std::cout << s << ::csv.delimiter << rd() << std::endl;
-                if( ::csv.flush ) { std::cout.flush(); }
+                std::getline( std::cin, buf );
+                if( buf.empty() ) { continue; }
             }
+            std::cout.write( &buf[0], buf.size() );
+            output_line_to_stdout( { ::csv.delimiter } );
         }
     }
     else
     {
         while( std::cout.good() )
         {
-            auto r = rd();
-            if( binary ) { std::cout.write( reinterpret_cast< char* >( &r ), sizeof( r ) ); }
-            else { std::cout << r << std::endl; }
-            if( ::csv.flush ) { std::cout.flush(); }
+            output_line_to_stdout( {} );
+            if( options.exists( "--once" ) ) { break; }
         }
     }
     return 0;
 }
 
+static int run( const comma::command_line_options& options )
+{
+    const auto format = comma::csv::format( options.value< std::string >( "--type", "ui" ) );
+    if( format.collapsed_string().find( ',' ) != std::string::npos )
+    {
+        std::cerr << "csv-random true-random: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl;
+        return 1;
+    }
+    switch( format.offset( 0 ).type ) {
+        case csv::format::int8: return run_impl< char >( options, format.count() );
+        case csv::format::uint8: return run_impl< unsigned char >( options, format.count() );
+        case csv::format::int16: return run_impl< comma::int16 >( options, format.count() );
+        case csv::format::uint16: return run_impl< comma::uint16 >( options, format.count() );
+        case csv::format::int32: return run_impl< comma::int32 >( options, format.count() );
+        case csv::format::uint32: return run_impl< comma::uint32 >( options, format.count() );
+        case csv::format::int64: return run_impl< comma::int64 >( options, format.count() );
+        case csv::format::uint64: return run_impl< comma::uint64 >( options, format.count() );
+        case csv::format::float_t: return run_impl< float >( options, format.count() );
+        case csv::format::double_t: return run_impl< double >( options, format.count() );
+        default: std::cerr << "csv-random true-random: expected type; got: '" << format.string() << "'" << std::endl;
+    }
+    return 1;
+}
+
 } // namespace true_random {
 
 } } } // namespace comma { namespace applications { namespace random {

From 021f7342124f760cbbb0b2583f8279837b2486a8 Mon Sep 17 00:00:00 2001
From: Kent Hu <khu.1998@icloud.com>
Date: Thu, 29 Oct 2020 13:39:14 +1100
Subject: [PATCH 0215/1056] csv-shape: brushed up usage

---
 csv/applications/csv-shape.cpp | 39 +++++++++++++++++-----------------
 1 file changed, 19 insertions(+), 20 deletions(-)

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index bae53b53d..e346a6186 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -55,18 +55,14 @@ static void usage( bool verbose=false )
     std::cerr << "Usage: cat data.csv | csv-shape <operation> [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
-    std::cerr << "    --binary,-b=[<format>]: in binary mode: format string of the input csv data types" << std::endl;
-    std::cerr << "    --delimiter,-d=[<char>]; default=','; in ascii mode, field separating character." << std::endl;
+    std::cerr << "    --expected-records; output the expected records for given --size and --step, and exit" << std::endl;
     std::cerr << "    --help,-h;  see this usage message" << std::endl;
+    std::cerr << "    --size,-n=<num>; number of input records in each grouping, range: 2 and above" << std::endl;
+    std::cerr << "    --step=<num>; default=1; relative offset of the records to be concatenated" << std::endl;
     std::cerr << "    --verbose,-v: more output to stderr, shows examples with --help,-h" << std::endl;
     std::cerr << std::endl;
-    if( verbose ) { std::cerr << comma::csv::format::usage() << std::endl; }
     std::cerr << "operations options" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "   common options" << std::endl;
-    std::cerr << "      --size,-n=<num>; number of input records in each grouping, range: 2 and above" << std::endl;
-    std::cerr << "      --step=<num>; default=1; relative offset of the records to be concatenated" << std::endl;
-    std::cerr << "      --expected-records; output the expected records for given --size and --step, and exit" << std::endl;
     std::cerr << "   concatenate" << std::endl;
     std::cerr << "      --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
     std::cerr << "      --reverse; output records in reverse order (e.g. b,a)" << std::endl;
@@ -77,9 +73,9 @@ static void usage( bool verbose=false )
     std::cerr << std::endl;
     if( verbose )
     {
-        std::cerr << "examples" << std::endl;   
+        std::cerr << "examples" << std::endl;
         std::cerr << "   concatenate" << std::endl;
-        std::cerr << "      non overlaping groups:" << std::endl;
+        std::cerr << "      non-overlapping groups:" << std::endl;
         std::cerr << "          concatenate each group of 5 input records into one output record." << std::endl;
         std::cerr << "          input records 1 to 5 create the first output record, input records 6-10 create the second output record, and so forth." << std::endl;
         std::cerr << "              seq 1 15 | csv-shape concatenate -n 5" << std::endl;
@@ -87,6 +83,9 @@ static void usage( bool verbose=false )
         std::cerr << "          move a sliding window of size 5 along the input records, every time the sliding window moves, make an output record from window" << std::endl;
         std::cerr << "          input records 1 to 5 create the first output record, input records 2 to 6 create the second record, input records 3 to 7 create the third record, and so forth" << std::endl;
         std::cerr << "              seq 1 10 | csv-shape concatenate -n 5 --sliding-window" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "csv options" << std::endl;
+        std::cerr << comma::csv::options::usage() << std::endl;
     }
     else
     {
@@ -114,7 +113,7 @@ class concatenate_
 {
 public:
 
-    concatenate_() 
+    concatenate_()
         : use_sliding_window_(false)
         , bidirectional_(false)
         , reverse_(false)
@@ -153,7 +152,7 @@ class concatenate_
                 if (!verify(deque)) { return 1; }
                 count_ = 0;
                 if ( looping_ ) { output_loop(deque, first, csv); }
-                deque.clear();  
+                deque.clear();
             }
             block_ = p->block;
             deque.push_back( istream.last() );
@@ -184,17 +183,17 @@ class concatenate_
     comma::uint32 expected_records_;
 
     bool verify( const std::deque<std::string>& deque )
-    { 
+    {
         if( use_sliding_window_ && count_ < step_ * ( size_ - 1 ) + 1 )
-        { 
+        {
             std::cerr << comma::verbose.app_name() << ": --size,-n=" << size_ << ", --step=" << step_ << ", expected records count (" << step_ * ( size_ - 1 ) + 1
-                      << ") is bigger than total number of input records: " << count_ << std::endl; 
-            return false; 
+                      << ") is bigger than total number of input records: " << count_ << std::endl;
+            return false;
         }
-        if ( !use_sliding_window_ && !deque.empty() ) 
-        { 
-            std::cerr << comma::verbose.app_name() << ": error, leftover tail input record found: " << deque.size() << " lines." << std::endl; 
-            return false; 
+        if ( !use_sliding_window_ && !deque.empty() )
+        {
+            std::cerr << comma::verbose.app_name() << ": error, leftover tail input record found: " << deque.size() << " lines." << std::endl;
+            return false;
         }
         return true;
     }
@@ -209,7 +208,7 @@ class concatenate_
             if(!is_binary){ std::cout << std::endl; }
             if (csv.flush) { std::cout.flush(); }
         }
-        if (bidirectional_ || reverse_ ) 
+        if (bidirectional_ || reverse_ )
         {
             std::cout.write( &( deque.back()[0] ), deque.back().size() );
             auto is = deque.crbegin(); while( ( is + 1 ) != deque.crend() ) { if(!is_binary){ std::cout << csv.delimiter; } is += step_; std::cout.write( &(*is)[0], is->size() ); }

From 75077b5c5b1cef276ebd36a47ab84564c6037388 Mon Sep 17 00:00:00 2001
From: Kent Hu <khu.1998@icloud.com>
Date: Thu, 29 Oct 2020 13:43:54 +1100
Subject: [PATCH 0216/1056] packed/detail/endian.h: void* cast changed to char*
 cast in memcpy line

---
 packed/detail/endian.h | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/packed/detail/endian.h b/packed/detail/endian.h
index 11c52363c..8f013980d 100644
--- a/packed/detail/endian.h
+++ b/packed/detail/endian.h
@@ -71,7 +71,7 @@ static_assert( sizeof( float ) == 4, "expected float of 4 bytes" );
 static_assert( sizeof( double ) == 8, "expected double of 8 bytes" );
 
 enum endiannes { little = 0, big = 1 };
-    
+
 template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating = false > struct endian_traits { typedef typename comma::integer< Size, Signed >::type type; typedef typename comma::integer< Size, false >::type uint_of_same_size; };
 template < endiannes Endianness > struct endian_traits< Endianness, 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
 template < endiannes Endianness > struct endian_traits< Endianness, 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
@@ -127,9 +127,9 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
     static const unsigned int size = Size;
 
     typedef typename endian_traits< Endianness, Size, Signed, Floating >::type type;
-    
+
     static_assert( size <= sizeof( type ), "expected size less than size of type" );
-    
+
     static_assert( Signed || !Floating, "expected signed or non-floating point type" ); // unsigned floats don't make sense
 
     typedef packed::field< endian< Endianness, Size, Signed, Floating >, typename endian_traits< Endianness, Size, Signed, Floating >::type, Size > base_type;
@@ -137,18 +137,18 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
     static type default_value() { return 0; }
 
     typedef typename endian_traits< Endianness, size, Signed, Floating >::uint_of_same_size uint_of_same_size;
-    
+
     static void pack( char* storage, type value )
     {
         uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
         *p = convert< Endianness >::from_host( *p );
-        ::memcpy( storage, ( void* )p + ( Endianness == little ? 0 : sizeof( uint_of_same_size ) - size ), size );
+        ::memcpy( storage, reinterpret_cast< char * >( p ) + ( Endianness == little ? 0 : sizeof( uint_of_same_size ) - size ), size );
     }
-    
+
     static type unpack( const char* storage ) // for floats it is a real hack, since there is no standard
     {
         uint_of_same_size i = ( !Floating && Signed && ( storage[ Endianness == little ? size - 1 : 0 ] & 0x80 ) ) ? -1 : 0;
-        ::memcpy( ( void* )&i + ( Endianness == little ? 0 : sizeof( uint_of_same_size ) - size ), storage, size );
+        ::memcpy( reinterpret_cast< char * >( &i ) + ( Endianness == little ? 0 : sizeof( uint_of_same_size ) - size ), storage, size );
         i = convert< Endianness >::to_host( i );
         return *( reinterpret_cast< type* >( &i ) );
     }

From cc91ed241e331b2d80269ae499aad9f381f55dfc Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 13:48:41 +1100
Subject: [PATCH 0217/1056] csv-random: compile error fixed

---
 csv/applications/csv-random.cpp   | 58 ++-----------------------------
 system/package/comma-package-test |  6 +---
 2 files changed, 3 insertions(+), 61 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index ff415e1ae..8e7789ee3 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -1,60 +1,6 @@
-// This file is provided in addition to comma and is not an integral
-// part of comma library.
 // Copyright (c) 2018 Vsevolod Vlaskine
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-// comma is a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-/// @author vsevolod vlaskine
+/// @authors vsevolod vlaskine, kent hu
 
 #include <algorithm>
 #include <cstring>
@@ -420,7 +366,7 @@ static int run_impl( const comma::command_line_options& options, std::size_t cou
         {
             const T r = rd();
             if( binary ) { std::cout.write( reinterpret_cast< const char* >( &r ), sizeof( T ) ); }
-            else { std::cout << std::exchange( initial_delimiter, ::csv.delimiter ) << type_traits< T >::cast( r ); }
+            else { std::cout << initial_delimiter << type_traits< T >::cast( r ); initial_delimiter = ::csv.delimiter; }
         }
         if( !binary ) { std::cout << std::endl; }
         if( flush ) { std::cout << std::flush; }
diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index 411c86f0f..2b1a50465 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -6,10 +6,6 @@ package="$1"
 [[ -n "$package" ]] || { echo "usage: $0 <package>" >&2; exit 1; }
 apt install --yes "$package" || die "failed to install package '$package'"
 
-echo '======================================' >&2
-ls /usr/bin/csv-* | cat >&2
-echo '======================================' >&2
+# todo
 
 csv-paste line-number | csv-to-bin ui | csv-from-bin ui | head >&2
-
-echo '======================================' >&2

From 28dd3b33ca56a4207e2e0b3600bac2ce255e289a Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 14:49:27 +1100
Subject: [PATCH 0218/1056] system/package: making python included in deb

---
 system/package/comma-package-make |  6 +++++-
 system/package/comma-package-test | 12 ++++++++++--
 2 files changed, 15 insertions(+), 3 deletions(-)

diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index 80fe95233..da800279d 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -14,7 +14,11 @@ ansible-playbook "$comma_dir/system/ansible/install.python3.yml" || die "failed"
 (
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
-    cmake . -DCPACK_GENERATOR=DEB -DCPACK_PACKAGE_VERSION_MAJOR=$version_major -DCPACK_PACKAGE_VERSION_MINOR=$version_minor -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  || die "failed"
+    cmake . -DCPACK_GENERATOR=DEB \
+            -DADD_PYTHON_PACKAGES_TO_RPM=ON \
+            -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \
+            -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \
+            -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
     cpack || die "failed"
     #cd ~/src/comma/python
diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index 2b1a50465..38ba9854c 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -6,6 +6,14 @@ package="$1"
 [[ -n "$package" ]] || { echo "usage: $0 <package>" >&2; exit 1; }
 apt install --yes "$package" || die "failed to install package '$package'"
 
-# todo
+echo "$0: testing basic csv utilities..."
+output=$( csv-paste line-number | head | csv-to-bin ui | csv-from-bin ui ) || die "failed: failed to run"
+expected=$( seq 0 9 )
+[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
+echo "$0: testing basic csv utilities: done"
 
-csv-paste line-number | csv-to-bin ui | csv-from-bin ui | head >&2
+echo "$0: testing csv-eval..."
+output=$( csv-paste line-number | head | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"
+expected=$( seq 1 10 )
+[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
+echo "$0: testing csv-eval: done"

From e9ae1aac0f8c62b181eb13a384fc2d5b7d5cc04d Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 14:53:08 +1100
Subject: [PATCH 0219/1056] system/ansible/install.python3.yml: building python
 packages explicitly turned on

---
 system/ansible/install.python3.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
index 2189aefd5..8064e048a 100644
--- a/system/ansible/install.python3.yml
+++ b/system/ansible/install.python3.yml
@@ -46,7 +46,7 @@
 
   - name: "comma: cmake"
     vars:
-        - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
+        - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -DBUILD_PYTHON_PACKAGES=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
     shell: "/usr/bin/cmake {{ comma_cmake_options }} {{ base }}/src/comma chdir={{ base }}/build/comma"
 
   - name: "comma: make"

From d996b7978f20c7ab207396a4a9b8c61277667bee Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 15:09:22 +1100
Subject: [PATCH 0220/1056] system/package: making 20.04 working

---
 CMakeLists.txt                          |  3 ++-
 system/package/comma-package-docker-run |  2 +-
 system/package/comma-package-make       | 17 ++++++++++++-----
 3 files changed, 15 insertions(+), 7 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index e5b7f894d..b9f6cba5f 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -331,7 +331,8 @@ set( CPACK_GENERATOR "PRM" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "libzmq5 (>= 4.2.5-1), libprocps6 (>= 2:3.3.0), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
+set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 
 # this code needs a brush-up
diff --git a/system/package/comma-package-docker-run b/system/package/comma-package-docker-run
index 8eaec95ef..534f2aa3c 100755
--- a/system/package/comma-package-docker-run
+++ b/system/package/comma-package-docker-run
@@ -14,6 +14,6 @@ docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$( pwd )/build,target=/root/build/comma" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/package/comma-package-make $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
+       /mnt/comma/system/package/comma-package-make $ubuntu_version $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
 cp build/comma-$comma_version_major.$comma_version_minor.$comma_version_patch-Linux.deb .
 sudo rm -rf build
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index da800279d..d636b6bd3 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -2,20 +2,27 @@
 
 function die() { echo "$0: $@" >&2; exit 1; }
 
-version_major=$1
-version_minor=$2
-version_patch=$3
-comma_dir="$4"
+ubuntu_version=$1
+version_major=$2
+version_minor=$3
+version_patch=$4
+comma_dir="$5"
 [[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
-[[ -n "$version_patch" ]] || { echo "usage: $0 <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
+[[ -n "$version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
 cd ~
 echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.python3.yml' in $( pwd )..." >&2
 ansible-playbook "$comma_dir/system/ansible/install.python3.yml" || die "failed"
+case $ubuntu_version in
+    18.04) libproc_version="libprocps6 (>= 2:3.3.0)" ;;
+    20.04) libproc_version="libprocps8 (>= 1)" ;;
+    *) libproc_version="libprocps8 (>= 1)" ;; # for now
+esac
 (
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB \
             -DADD_PYTHON_PACKAGES_TO_RPM=ON \
+            -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
             -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \
             -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \
             -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  || die "failed"

From 158e9be685871151e90aeec8bd2c3b42ceabdb3d Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 16:51:03 +1100
Subject: [PATCH 0221/1056] system/package: making 20.04 working...

---
 CMakeLists.txt                    | 2 +-
 system/package/comma-package-make | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index b9f6cba5f..bcefb44fc 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -331,7 +331,7 @@ set( CPACK_GENERATOR "PRM" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
-set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
+set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 for Ubuntu 20.04" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index d636b6bd3..aced2e4fa 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -14,8 +14,8 @@ echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.python3.ym
 ansible-playbook "$comma_dir/system/ansible/install.python3.yml" || die "failed"
 case $ubuntu_version in
     18.04) libproc_version="libprocps6 (>= 2:3.3.0)" ;;
-    20.04) libproc_version="libprocps8 (>= 1)" ;;
-    *) libproc_version="libprocps8 (>= 1)" ;; # for now
+    20.04) libproc_version="libprocps8" ;;
+    *) libproc_version="libprocps8" ;; # for now
 esac
 (
     cd ~/build/comma

From 7c831097a0beeb6fb6ecd59b439302588e59aa98 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 16:52:12 +1100
Subject: [PATCH 0222/1056] system/package: making 20.04 working...

---
 CMakeLists.txt                    | 2 +-
 system/package/comma-package-make | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index bcefb44fc..b9f6cba5f 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -331,7 +331,7 @@ set( CPACK_GENERATOR "PRM" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
-set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 for Ubuntu 20.04" )
+set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index aced2e4fa..d636b6bd3 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -14,8 +14,8 @@ echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.python3.ym
 ansible-playbook "$comma_dir/system/ansible/install.python3.yml" || die "failed"
 case $ubuntu_version in
     18.04) libproc_version="libprocps6 (>= 2:3.3.0)" ;;
-    20.04) libproc_version="libprocps8" ;;
-    *) libproc_version="libprocps8" ;; # for now
+    20.04) libproc_version="libprocps8 (>= 1)" ;;
+    *) libproc_version="libprocps8 (>= 1)" ;; # for now
 esac
 (
     cd ~/build/comma

From 7e3ad9356f14a49422b948bcae3eb836071ae0d8 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 16:56:30 +1100
Subject: [PATCH 0223/1056] comma-package-test: in progress...

---
 system/package/comma-package-test | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index 38ba9854c..20f5e72fa 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -12,6 +12,10 @@ expected=$( seq 0 9 )
 [[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
 echo "$0: testing basic csv utilities: done"
 
+echo "$0: testing bash utils..."
+type -p comma-application-util || die "failed: failed"
+echo "$0: testing bash utils: done"
+
 echo "$0: testing csv-eval..."
 output=$( csv-paste line-number | head | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"
 expected=$( seq 1 10 )

From ad916063a9992bbde060921225a05a89b1215fbd Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 17:12:13 +1100
Subject: [PATCH 0224/1056] comma-package-make: trying to fix python
 packaging...

---
 CMakeLists.txt                    | 3 +--
 system/package/comma-package-make | 1 +
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index b9f6cba5f..c17fed662 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -344,8 +344,7 @@ IF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET(CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy")
     SET(CPACK_RPM_POST_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-post-install.sh" )
     SET(CPACK_RPM_PRE_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-pre-install.sh" )
-    # Prevents /tmp from permission change when installing RPM package
-    SET(CPACK_RPM_EXCLUDE_FROM_AUTO_FILELIST_ADDITION "/tmp" )
+    SET(CPACK_RPM_EXCLUDE_FROM_AUTO_FILELIST_ADDITION "/tmp" ) # Prevents /tmp from permission change when installing RPM package
 ELSE( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET(CPACK_RPM_PACKAGE_REQUIRES "boost-thread socat psmisc recode")
 ENDIF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index d636b6bd3..4ebc0d2c2 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -21,6 +21,7 @@ esac
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB \
+            -DBUILD_PYTHON_PACKAGES=ON \
             -DADD_PYTHON_PACKAGES_TO_RPM=ON \
             -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
             -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \

From 9b4cc26d6d19fcec0984676ec1e21838fdce3cc0 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 17:23:07 +1100
Subject: [PATCH 0225/1056] python: packaging: installation version fixed

---
 python/comma/version.py   | 29 +----------------------------
 python/setup.py           |  5 +++--
 system/package/Dockerfile |  1 +
 3 files changed, 5 insertions(+), 30 deletions(-)

diff --git a/python/comma/version.py b/python/comma/version.py
index be136aaf5..92b04f53c 100644
--- a/python/comma/version.py
+++ b/python/comma/version.py
@@ -1,31 +1,4 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 # if you change this file, check that it still works with ../setup.py, which gets the comma version by reading this file
-__version__ = "1.0"
+__version__ = "1.0.0"
diff --git a/python/setup.py b/python/setup.py
index 05c56d2a5..e26a8f89c 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -1,14 +1,15 @@
 #!/usr/bin/env python
 
 from distutils.core import setup
+import comma.version
 
 setup(
         name                = 'comma',
-        version             = open('comma/version.py').readlines()[-1].strip().split()[-1].strip('\"'),
+        version             = comma.version.__version__,
         description         = 'comma python utilties',
         url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
-        scripts             =["comma/csv/applications/csv-eval"],
+        scripts             = ["comma/csv/applications/csv-eval"],
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma.cpp_bindings': 'comma/cpp_bindings' },
         package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] }
diff --git a/system/package/Dockerfile b/system/package/Dockerfile
index f30988c19..0fbfb24a8 100644
--- a/system/package/Dockerfile
+++ b/system/package/Dockerfile
@@ -4,5 +4,6 @@ ENV DEBIAN_FRONTEND="noninteractive"
 RUN apt update \
     && apt install software-properties-common --yes \
     && apt install --yes ansible git build-essential cmake cmake-curses-gui
+RUN apt install python3-stdeb
 
 # && apt-add-repository --yes --update ppa:ansible/ansible \

From 74231b55a113758f0f21d7856667fbe1c4b46f71 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 17:26:46 +1100
Subject: [PATCH 0226/1056] python: packaging...

---
 CMakeLists.txt                    | 2 +-
 system/package/comma-package-make | 6 +++---
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index c17fed662..01ffbbc9f 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -332,7 +332,7 @@ set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 
 # this code needs a brush-up
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index 4ebc0d2c2..fbce4a441 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -29,8 +29,8 @@ esac
             -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
     cpack || die "failed"
-    #cd ~/src/comma/python
-    #echo "$0: setting up python in $( pwd )" >&2
-    #python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
+    cd ~/src/comma/python
+    echo "$0: setting up python in $( pwd )" >&2
+    python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
     echo "$0: done" >&2
 )

From fa9c3b9d736289ba7103db155d9e22a8385b23bf Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 17:27:58 +1100
Subject: [PATCH 0227/1056] python: packaging...

---
 system/package/Dockerfile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/Dockerfile b/system/package/Dockerfile
index 0fbfb24a8..fe6b58b42 100644
--- a/system/package/Dockerfile
+++ b/system/package/Dockerfile
@@ -4,6 +4,6 @@ ENV DEBIAN_FRONTEND="noninteractive"
 RUN apt update \
     && apt install software-properties-common --yes \
     && apt install --yes ansible git build-essential cmake cmake-curses-gui
-RUN apt install python3-stdeb
+RUN apt install --yes python3-stdeb
 
 # && apt-add-repository --yes --update ppa:ansible/ansible \

From 4e7b16098a18f75ca037eb911c46c2c6bcd0ca62 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 17:44:36 +1100
Subject: [PATCH 0228/1056] python: packaging...

---
 system/package/comma-package-docker-run | 7 +------
 system/package/comma-package-make       | 2 ++
 2 files changed, 3 insertions(+), 6 deletions(-)

diff --git a/system/package/comma-package-docker-run b/system/package/comma-package-docker-run
index 534f2aa3c..f8e355f2e 100755
--- a/system/package/comma-package-docker-run
+++ b/system/package/comma-package-docker-run
@@ -8,12 +8,7 @@ comma_dir="$5"
 [[ -n "$comma_version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
 [[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
 
-rm -rf build
-mkdir build -p
 docker run \
-       --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
-       --mount "type=bind,source=$( pwd )/build,target=/root/build/comma" \
+       --mount "type=bind,source=$( pwd ),target=/root/output" \
        ubuntu.$ubuntu_version.build.basics \
        /mnt/comma/system/package/comma-package-make $ubuntu_version $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
-cp build/comma-$comma_version_major.$comma_version_minor.$comma_version_patch-Linux.deb .
-sudo rm -rf build
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index fbce4a441..d30133b9c 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -34,3 +34,5 @@ esac
     python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
     echo "$0: done" >&2
 )
+cp ~/build/comma-$version_major.$version_minor.$version_patch-Linux.deb output
+cp ~/src/comma/python/deb_dist/python3-comma*.deb output

From e5353cf00b89e69771f054750d0c1cad486e48c1 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 17:46:19 +1100
Subject: [PATCH 0229/1056] python: packaging...

---
 system/package/comma-package-docker-run | 1 +
 1 file changed, 1 insertion(+)

diff --git a/system/package/comma-package-docker-run b/system/package/comma-package-docker-run
index f8e355f2e..5daab2c5a 100755
--- a/system/package/comma-package-docker-run
+++ b/system/package/comma-package-docker-run
@@ -9,6 +9,7 @@ comma_dir="$5"
 [[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
 
 docker run \
+       --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$( pwd ),target=/root/output" \
        ubuntu.$ubuntu_version.build.basics \
        /mnt/comma/system/package/comma-package-make $ubuntu_version $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }

From 82f061d69728008eda3b7f89bbb9e0773201bfe0 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 17:48:39 +1100
Subject: [PATCH 0230/1056] python: packaging...

---
 system/package/comma-package-test | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index 20f5e72fa..bb4d3d701 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -3,7 +3,9 @@
 function die() { echo "$0: $@" >&2; exit 1; }
 
 package="$1"
-[[ -n "$package" ]] || { echo "usage: $0 <package>" >&2; exit 1; }
+python_package="$2"
+[[ -n "$python_package" ]] || { echo "usage: $0 <package> <python package>" >&2; exit 1; }
+apt install --yes "$python_package" || die "failed to install package '$python_package'"
 apt install --yes "$package" || die "failed to install package '$package'"
 
 echo "$0: testing basic csv utilities..."

From 86e6513f60ffa50eb7d95819ea038a806b1f4f40 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 17:51:48 +1100
Subject: [PATCH 0231/1056] python: packaging...

---
 system/package/comma-package-make | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index d30133b9c..93f1efdc0 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -34,5 +34,5 @@ esac
     python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
     echo "$0: done" >&2
 )
-cp ~/build/comma-$version_major.$version_minor.$version_patch-Linux.deb output
+cp ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb output
 cp ~/src/comma/python/deb_dist/python3-comma*.deb output

From 56d6b873f920e374a3851b873b769a1061a92329 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 18:01:22 +1100
Subject: [PATCH 0232/1056] python: packaging...

---
 CMakeLists.txt                           | 2 +-
 system/package/comma-package-docker-test | 8 +++++---
 2 files changed, 6 insertions(+), 4 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 01ffbbc9f..ba83344d1 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -332,7 +332,7 @@ set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 
 # this code needs a brush-up
diff --git a/system/package/comma-package-docker-test b/system/package/comma-package-docker-test
index d0b888693..d23128cc2 100755
--- a/system/package/comma-package-docker-test
+++ b/system/package/comma-package-docker-test
@@ -4,9 +4,11 @@ function die() { echo "$0: $@" >&2; exit 1; }
 
 ubuntu_version="$1"
 package="$2"
-comma_dir="$3"
-[[ -n "$package" ]] || { echo "usage: $0 <ubuntu version> <package> [<comma dir>]" >&2; exit 1; }
+python_package="$3"
+comma_dir="$4"
+[[ -n "$package" ]] || { echo "usage: $0 <ubuntu version> <package> <python package> [<comma dir>]" >&2; exit 1; }
 [[ -s "$package" ]] || die "file not found or empty: '$package'"
+[[ -s "$python_package" ]] || die "file not found or empty: '$python_package'"
 [[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
 package_dir=$( dirname "$( realpath "$package" )" )
 
@@ -14,4 +16,4 @@ docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$package_dir,target=/mnt/package" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/package/comma-package-test "/mnt/package/$( basename "$package" )" || { echo "$0: failed" >&2; exit 1; }
+       /mnt/comma/system/package/comma-package-test "/mnt/package/$( basename "$package" )" "/mnt/package/$( basename "$python_package" )" || { echo "$0: failed" >&2; exit 1; }

From ca852425c180735ee5ee956d9381e088d5dc45b8 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 19:37:30 +1100
Subject: [PATCH 0233/1056] packaging...

---
 python/comma/csv/stream.py | 2 +-
 python/setup.py            | 1 +
 system/package/Dockerfile  | 2 +-
 3 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 4cb5015bc..1a78441ba 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -134,7 +134,7 @@ def read(self, size=None):
         return self._struct_array(self._input_array, self.missing_values)
 
     def _genfromtxt( self ): # quick and dirty due to the ugliness of the change in numpy 1.14; see doc of encoding parameter in https://docs.scipy.org/doc/numpy-1.14.0/reference/generated/numpy.genfromtxt.html
-        if np.__version__ >= '1.14.0':
+        if np.__version__ >= '1.13.0': # if np.__version__ >= '1.14.0':
             return np.genfromtxt( self._ascii_buffer
                                 , dtype = self.input_dtype
                                 , delimiter = self.delimiter
diff --git a/python/setup.py b/python/setup.py
index e26a8f89c..1ec0ca7ef 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -7,6 +7,7 @@
         name                = 'comma',
         version             = comma.version.__version__,
         description         = 'comma python utilties',
+        install_requires    = [ 'numpy' ],
         url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
         scripts             = ["comma/csv/applications/csv-eval"],
diff --git a/system/package/Dockerfile b/system/package/Dockerfile
index fe6b58b42..3c7f63dbd 100644
--- a/system/package/Dockerfile
+++ b/system/package/Dockerfile
@@ -3,7 +3,7 @@ FROM ubuntu:${version}
 ENV DEBIAN_FRONTEND="noninteractive"
 RUN apt update \
     && apt install software-properties-common --yes \
-    && apt install --yes ansible git build-essential cmake cmake-curses-gui
+    && apt install --yes ansible git build-essential cmake cmake-curses-gui python3-pip
 RUN apt install --yes python3-stdeb
 
 # && apt-add-repository --yes --update ppa:ansible/ansible \

From b935a2c5057aaaf9fe405fbfcf3fc498a26349f8 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 19:39:33 +1100
Subject: [PATCH 0234/1056] packaging...

---
 python/comma/csv/stream.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 1a78441ba..4cb5015bc 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -134,7 +134,7 @@ def read(self, size=None):
         return self._struct_array(self._input_array, self.missing_values)
 
     def _genfromtxt( self ): # quick and dirty due to the ugliness of the change in numpy 1.14; see doc of encoding parameter in https://docs.scipy.org/doc/numpy-1.14.0/reference/generated/numpy.genfromtxt.html
-        if np.__version__ >= '1.13.0': # if np.__version__ >= '1.14.0':
+        if np.__version__ >= '1.14.0':
             return np.genfromtxt( self._ascii_buffer
                                 , dtype = self.input_dtype
                                 , delimiter = self.delimiter

From 9a6df561e2be7f8c0d4650f88bfb9a1a0fc25402 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 19:42:18 +1100
Subject: [PATCH 0235/1056] packaging...

---
 CMakeLists.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index ba83344d1..211b886b2 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -332,7 +332,7 @@ set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat" ) #, python3-numpy" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 
 # this code needs a brush-up

From e2c2f0d643f058847a7bf150ab954449e8c96cda Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 19:48:07 +1100
Subject: [PATCH 0236/1056] packaging...

---
 python/setup.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/setup.py b/python/setup.py
index 1ec0ca7ef..767cac36e 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -1,6 +1,6 @@
 #!/usr/bin/env python
 
-from distutils.core import setup
+from setuptools import setup # from distutils.core import setup
 import comma.version
 
 setup(

From 38a8d5eb83a9c8522020df17569629cba3e0daed Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Thu, 29 Oct 2020 20:08:39 +1100
Subject: [PATCH 0237/1056] packaging...

---
 python/CMakeLists.txt             | 2 +-
 python/setup.py                   | 2 +-
 system/package/comma-package-test | 1 +
 3 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/python/CMakeLists.txt b/python/CMakeLists.txt
index b8a695df2..2777db060 100644
--- a/python/CMakeLists.txt
+++ b/python/CMakeLists.txt
@@ -68,7 +68,7 @@ IF( PYTHON_PACKAGE_INSTALL_PREFIX )
     ENDIF( NOT WIN32 )
 ENDIF( PYTHON_PACKAGE_INSTALL_PREFIX )
 
-SET( SETUP_PY "${CMAKE_CURRENT_SOURCE_DIR}/setup.py" )
+SET( SETUP_PY "${CMAKE_CURRENT_SOURCE_DIR}/setup.py" ) # todo: uses pip instead
 
 SET( BUILD_BASE "${CMAKE_CURRENT_BINARY_DIR}/build" )
 
diff --git a/python/setup.py b/python/setup.py
index 767cac36e..6d5c87393 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -1,6 +1,6 @@
 #!/usr/bin/env python
 
-from setuptools import setup # from distutils.core import setup
+from distutils.core import setup # from setuptools import setup
 import comma.version
 
 setup(
diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index bb4d3d701..5eeb97f23 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -5,6 +5,7 @@ function die() { echo "$0: $@" >&2; exit 1; }
 package="$1"
 python_package="$2"
 [[ -n "$python_package" ]] || { echo "usage: $0 <package> <python package>" >&2; exit 1; }
+pip3 install numpy # todo! very unfortunate, but python deb package installs python3-numpy, which is wrong version and we gave up for now
 apt install --yes "$python_package" || die "failed to install package '$python_package'"
 apt install --yes "$package" || die "failed to install package '$package'"
 

From 496904994bfbb62ff41228176c4db98ccd8f90b8 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Oct 2020 22:28:47 +1100
Subject: [PATCH 0238/1056] packaging...

---
 CMakeLists.txt                    | 2 +-
 system/package/comma-package-test | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 211b886b2..d9cf51ead 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -332,7 +332,7 @@ set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat" ) #, python3-numpy" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1)" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 
 # this code needs a brush-up
diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index 5eeb97f23..5db3fb28e 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -5,7 +5,7 @@ function die() { echo "$0: $@" >&2; exit 1; }
 package="$1"
 python_package="$2"
 [[ -n "$python_package" ]] || { echo "usage: $0 <package> <python package>" >&2; exit 1; }
-pip3 install numpy # todo! very unfortunate, but python deb package installs python3-numpy, which is wrong version and we gave up for now
+# pip3 install numpy # todo! very unfortunate, but python deb package installs python3-numpy, which is wrong version and we gave up for now
 apt install --yes "$python_package" || die "failed to install package '$python_package'"
 apt install --yes "$package" || die "failed to install package '$package'"
 

From 45c387ad573fba019a6d9d0f9316d6da358ddc18 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Oct 2020 22:30:08 +1100
Subject: [PATCH 0239/1056] system/package/readme fixed; packaging...

---
 system/package/readme | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/readme b/system/package/readme
index 5cde855c0..c677fb934 100644
--- a/system/package/readme
+++ b/system/package/readme
@@ -5,7 +5,7 @@ to build docker that has ansible, cmake, etc, run (you may need to run as sudo -
 
 to build deb package e.g. for comma version 1.2.3 for ubuntu 20.04 run:
 
-> ./comma-package-docker-build 20.04 1 2 3
+> ./comma-package-docker-run 20.04 1 2 3
 
 if your comma reposity is not in ~/src/comma, but e.g. in ~/my/src/comma, run:
 

From deec795f74f3c5b7e09dcd87d3d7dfed441c4c1a Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Oct 2020 23:40:23 +1100
Subject: [PATCH 0240/1056] system/package/comma-package-test: temporary hack:
 installing numpy with pip3

---
 system/package/comma-package-test | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index 5db3fb28e..5eeb97f23 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -5,7 +5,7 @@ function die() { echo "$0: $@" >&2; exit 1; }
 package="$1"
 python_package="$2"
 [[ -n "$python_package" ]] || { echo "usage: $0 <package> <python package>" >&2; exit 1; }
-# pip3 install numpy # todo! very unfortunate, but python deb package installs python3-numpy, which is wrong version and we gave up for now
+pip3 install numpy # todo! very unfortunate, but python deb package installs python3-numpy, which is wrong version and we gave up for now
 apt install --yes "$python_package" || die "failed to install package '$python_package'"
 apt install --yes "$package" || die "failed to install package '$package'"
 

From 24ef3daef317dd32229ade92bb50d26ba91db47b Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 30 Oct 2020 00:07:27 +1100
Subject: [PATCH 0241/1056] system/package/Dockerfile: added python3-all to fix
 python packaging on ubuntu 20.04

---
 system/package/Dockerfile | 1 +
 1 file changed, 1 insertion(+)

diff --git a/system/package/Dockerfile b/system/package/Dockerfile
index 3c7f63dbd..8c868912a 100644
--- a/system/package/Dockerfile
+++ b/system/package/Dockerfile
@@ -5,5 +5,6 @@ RUN apt update \
     && apt install software-properties-common --yes \
     && apt install --yes ansible git build-essential cmake cmake-curses-gui python3-pip
 RUN apt install --yes python3-stdeb
+RUN apt install --yes python3-all
 
 # && apt-add-repository --yes --update ppa:ansible/ansible \

From 5e0701bccb55940a05311027c7fd8d2d03c795ab Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 30 Oct 2020 19:29:27 +1100
Subject: [PATCH 0242/1056] csv-play: --help: example added

---
 csv/applications/csv-play.cpp | 43 ++++++++---------------------------
 1 file changed, 9 insertions(+), 34 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 62d084c11..1e3bc6997 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author cedric wohlleber
 
@@ -50,7 +22,6 @@
 #include <fstream>
 #include <boost/thread.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../base/exception.h"
 #include "../../csv/options.h"
@@ -60,7 +31,7 @@
 #include "../../csv/applications/play/play.h"
 #include "../../csv/applications/play/multiplay.h"
 
-static void usage()
+static void usage( bool )
 {
     std::cerr << std::endl;
     std::cerr << "play back timestamped data from standard input in a real time manner" << std::endl;
@@ -117,9 +88,14 @@ static void usage()
     std::cerr << "    output multiple inputs of the same format to stdout:" << std::endl;
     std::cerr << "        csv-play \"file1.csv;-\" \"file2.csv;-\" &" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
+    std::cerr << "    use binary data (try it)" << std::endl;
+    std::cerr << "        > csv-play <( csv-paste line-number | csv-repeat --pace --period 1 | csv-time-amp | csv-to-bin t,ui --flush )';-;binary=t,ui' \\" << std::endl;
+    std::cerr << "                 <( csv-paste line-number value=0 | csv-repeat --pace --period 1 | csv-time-stamp | csv-to-bin t,2ui --flush )';tcp:8888;binary=t,2ui' \\" << std::endl;
+    std::cerr << "            | csv-from-bin t,ui" << std::endl;
+    std::cerr << "        > #in another shell, run" << std::endl;
+    std::cerr << "        > socat tcp:localhost:8888 - | csv-from-bin t,2ui" << std::endl;
     std::cerr << std::endl;
-    exit( -1 );
+    exit( 0 );
 }
 
 class key_press_handler_t
@@ -243,8 +219,7 @@ int main( int argc, char** argv )
     {
         const boost::array< comma::signal_flag::signals, 2 > signals = { { comma::signal_flag::sigint, comma::signal_flag::sigterm } };
         comma::signal_flag shutdown_flag( signals );
-        comma::command_line_options options( argc, argv );
-        if( options.exists( "--help,-h" ) ) { usage(); }
+        comma::command_line_options options( argc, argv, usage );
         options.assert_mutually_exclusive( "--speed,--slow,--slowdown" );
         double speed = options.value( "--speed", 1.0 / options.value< double >( "--slow,--slowdown", 1.0 ) );
         double resolution = options.value< double >( "--resolution", 0.01 );

From 418f629d3c3cca7536e2f57a5e065b629fe460b5 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 30 Oct 2020 19:38:10 +1100
Subject: [PATCH 0243/1056] contact_info removed

---
 application/contact_info.h                    |  38 -----
 csv/applications/csv-analyse.cpp              |   2 -
 csv/applications/csv-bin-cut.cpp              |   2 -
 csv/applications/csv-blocks.cpp               |   2 -
 csv/applications/csv-calc.cpp                 |   2 -
 csv/applications/csv-calc.new.cpp             |   2 -
 csv/applications/csv-cast.cpp                 |   2 -
 csv/applications/csv-crc.cpp                  |   2 -
 csv/applications/csv-from-bin.cpp             |   2 -
 csv/applications/csv-join.cpp                 |   2 -
 csv/applications/csv-paste.cpp                |   2 -
 csv/applications/csv-repeat.cpp               |   2 -
 csv/applications/csv-select.cpp               |   2 -
 csv/applications/csv-sort.cpp                 |   2 -
 csv/applications/csv-thin.cpp                 |   2 -
 csv/applications/csv-time-delay.cpp           |   2 -
 csv/applications/csv-time-join.cpp            |   2 -
 csv/applications/csv-time-stamp.cpp           |   2 -
 csv/applications/csv-time.cpp                 | 147 +++++++-----------
 csv/applications/csv-to-bin.cpp               |   2 -
 csv/applications/csv-units.cpp                |   2 -
 io/applications/io-bandwidth.cpp              |   2 -
 io/applications/io-buffer.cpp                 |   2 -
 io/applications/io-cat.cpp                    |   2 -
 io/applications/io-line.cpp                   |   2 -
 io/applications/io-publish.cpp                |   2 -
 io/applications/udp-client.cpp                |   2 -
 io/applications/zero-cat.cpp                  |   2 -
 .../applications/name-value-convert.cpp       |   2 -
 .../applications/name-value-from-csv.cpp      |   2 -
 name_value/applications/name-value-get.cpp    |   2 -
 .../applications/name-value-permute.cpp       |   2 -
 util/applications/comma-timeout-group.cpp     |   2 -
 33 files changed, 54 insertions(+), 193 deletions(-)
 delete mode 100644 application/contact_info.h

diff --git a/application/contact_info.h b/application/contact_info.h
deleted file mode 100644
index d4154064c..000000000
--- a/application/contact_info.h
+++ /dev/null
@@ -1,38 +0,0 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-/// @author vsevolod vlaskine
-
-#pragma once
-
-namespace comma {
-
-static const char* contact_info = "more info: https://gitlab.com/orthographic/comma#readme";
-    
-} // namespace comma {
diff --git a/csv/applications/csv-analyse.cpp b/csv/applications/csv-analyse.cpp
index a551673ca..d86a9c760 100644
--- a/csv/applications/csv-analyse.cpp
+++ b/csv/applications/csv-analyse.cpp
@@ -37,7 +37,6 @@
 #include <iostream>
 #include <map>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 
 using namespace comma;
 
@@ -115,7 +114,6 @@ static void usage( bool )
     std::cerr << std::endl;
     std::cerr << "See also: \"csv-size\", \"csv-bin-cut\"" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( -1 );
 }
diff --git a/csv/applications/csv-bin-cut.cpp b/csv/applications/csv-bin-cut.cpp
index ae1309d96..b95315d14 100644
--- a/csv/applications/csv-bin-cut.cpp
+++ b/csv/applications/csv-bin-cut.cpp
@@ -40,7 +40,6 @@
 #include <fstream>
 #include <numeric>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../csv/format.h"
 #include "../../csv/options.h"
 #include "../../string/string.h"
@@ -150,7 +149,6 @@ namespace {
             std::cerr << "Format specifications:" << std::endl;
             std::cerr << csv::format::usage() << std::endl;
         }
-        std::cerr << comma::contact_info << std::endl;
         std::cerr << std::endl;
         exit( 0 );
     }
diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index a2be3c024..ebcab1dd0 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -41,7 +41,6 @@
 
 #include <boost/unordered_map.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../csv/impl/unstructured.h"
@@ -225,7 +224,6 @@ static void usage( bool more )
     std::cerr << "            After indexing the input in reverse order, the stream is read block-by-block, with the first line given the maximal" << std::endl;
     std::cerr << "            element id in the block, essentially, the block size" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "contact info: " << comma::contact_info <<std::endl;
     std::cerr << std::endl;
     exit(0);
 }
diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 69e0cd6a2..b8abe0b97 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -21,7 +21,6 @@
 #include <boost/scoped_ptr.hpp>
 #include <boost/unordered_map.hpp>
 #include <boost/date_time/posix_time/posix_time_types.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/verbose.h"
 #include "../../base/exception.h"
 #include "../../csv/format.h"
@@ -122,7 +121,6 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | " << comma::verbose.app_name() << " --fields=a,id percentile=0.9" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( -1 );
 }
diff --git a/csv/applications/csv-calc.new.cpp b/csv/applications/csv-calc.new.cpp
index c064cc641..00d590c6d 100644
--- a/csv/applications/csv-calc.new.cpp
+++ b/csv/applications/csv-calc.new.cpp
@@ -39,7 +39,6 @@
 #include <boost/bind.hpp>
 #include <boost/function.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../csv/impl/unstructured.h"
@@ -82,7 +81,6 @@ static void usage()
     std::cerr << "examples" << std::endl;
     std::cerr << "    todo" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 1 );
 }
diff --git a/csv/applications/csv-cast.cpp b/csv/applications/csv-cast.cpp
index 7370731bc..fcf3e1b3d 100644
--- a/csv/applications/csv-cast.cpp
+++ b/csv/applications/csv-cast.cpp
@@ -39,7 +39,6 @@
 #include <cstring>
 #include <iostream>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/format.h"
 
@@ -76,7 +75,6 @@ static void usage()
     std::cerr << "    lexical cast, convert s[22],s[10],s[6] to t,2d (creates sample binary data)" << std::endl;
     std::cerr << "        echo {0..9}.2345789,3.1415 | fmt -1 | csv-time-stamp | csv-to-bin s[22],s[10],s[6] | csv-cast s[22],s[10],s[6] t,2d | csv-from-bin t,2d" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
 }
 
diff --git a/csv/applications/csv-crc.cpp b/csv/applications/csv-crc.cpp
index cdaabdc39..ff12dc6ba 100644
--- a/csv/applications/csv-crc.cpp
+++ b/csv/applications/csv-crc.cpp
@@ -42,7 +42,6 @@
 #include <boost/crc.hpp>
 #include <boost/optional.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 
 static void usage( bool )
@@ -88,7 +87,6 @@ static void usage( bool )
     std::cerr << "                         packets (binary) are valid, before output; default 0, i.e. recover on the next valid" << std::endl;
     std::cerr << "    --discard-on-recovery,--discard: discard those <n> packets accumulated during the recovery check" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 1 );
 }
diff --git a/csv/applications/csv-from-bin.cpp b/csv/applications/csv-from-bin.cpp
index 644dc4524..f901114c7 100644
--- a/csv/applications/csv-from-bin.cpp
+++ b/csv/applications/csv-from-bin.cpp
@@ -39,7 +39,6 @@
 #include <stdlib.h>
 #include <iostream>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/format.h"
 #include "../../string/string.h"
@@ -54,7 +53,6 @@ static void usage()
     std::cerr << "--precision: set precision (number of mantissa digits) for floating point types" << std::endl;
     std::cerr << csv::format::usage() << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index ae996957a..2573a630a 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -16,7 +16,6 @@
 #include <boost/optional.hpp>
 #include <boost/unordered_map.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
@@ -110,7 +109,6 @@ static void usage( bool more )
     std::cerr << "        <input:3>" << std::endl;
     std::cerr << "        <input:3>" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index 04217cd92..9be67252d 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -37,7 +37,6 @@
 #include <boost/lexical_cast.hpp>
 #include <boost/ptr_container/ptr_vector.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/format.h"
 #include "../../io/stream.h"
@@ -103,7 +102,6 @@ static void usage( bool verbose )
     std::cerr << "csv format parameters" << std::endl;
     if( verbose ) { std::cerr << comma::csv::format::usage() << std::endl; } else { std::cerr << "    run csv-paste --help --verbose for more..." << std::endl; }
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index b622a6b4b..a3efd08ca 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -34,7 +34,6 @@
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/thread/thread.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../csv/options.h"
 #include "../../csv/stream.h"
@@ -108,7 +107,6 @@ void usage( bool verbose = false )
     std::cerr << std::endl;
     std::cerr << "    { echo -e \"1\\n2\\n3\"; sleep 10; } | csv-repeat --timeout=3" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/csv/applications/csv-select.cpp b/csv/applications/csv-select.cpp
index e0fb9c1ff..f72286756 100644
--- a/csv/applications/csv-select.cpp
+++ b/csv/applications/csv-select.cpp
@@ -39,7 +39,6 @@
 #include <boost/regex.hpp>
 #include <boost/scoped_ptr.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
 #include "../../csv/impl/unstructured.h"
@@ -91,7 +90,6 @@ void usage()
     std::cerr << "    cat a.csv | csv-select --fields=t,scalar \"t;from=20120101T000000;sorted\" \"scalar;from=-10;to=20.5\"" << std::endl;
     std::cerr << "    echo hello,world | csv-select --fields=h,w \"h;regex=he.*\"" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 1 );
 }
diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index c29d5f1ef..fce62ba3f 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -16,7 +16,6 @@
 #include <boost/unordered_set.hpp>
 #include <boost/lexical_cast.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
@@ -84,7 +83,6 @@ static void usage( bool more )
     std::cerr << "        using id" << std::endl;
     std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,b,3; echo 5,b,7; echo 3,b,9 ) | csv-sort --max --min --fields=,id,a" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     if( more )
     {
diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index 310da562a..d9b892ca7 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -42,7 +42,6 @@
 #include <boost/random/uniform_real.hpp>
 #include <boost/random/variate_generator.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../io/file_descriptor.h"
@@ -83,7 +82,6 @@ static void usage( bool verbose = false )
     std::cerr << "    using timestamp from input:  cat full.csv | csv-thin --period 2 --fields t" << std::endl;
     std::cerr << "    binary data:                 cat full.bin | csv-thin 0.1 --binary 3d" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 1 );
 }
diff --git a/csv/applications/csv-time-delay.cpp b/csv/applications/csv-time-delay.cpp
index 6f80d0f30..2b715a8ae 100644
--- a/csv/applications/csv-time-delay.cpp
+++ b/csv/applications/csv-time-delay.cpp
@@ -33,7 +33,6 @@
 #include <iostream>
 #include <string>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../name_value/parser.h"
@@ -50,7 +49,6 @@ static void usage()
     std::cerr << "<options>" << std::endl;
     std::cerr << comma::csv::options::usage( "t" ) << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( -1 );
 }
diff --git a/csv/applications/csv-time-join.cpp b/csv/applications/csv-time-join.cpp
index 12754c3d1..290cbeeff 100644
--- a/csv/applications/csv-time-join.cpp
+++ b/csv/applications/csv-time-join.cpp
@@ -36,7 +36,6 @@
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/optional.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
@@ -135,7 +134,6 @@ static void usage( bool verbose )
         std::cerr << "    try --help --verbose for more examples" << std::endl;
     }
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/csv/applications/csv-time-stamp.cpp b/csv/applications/csv-time-stamp.cpp
index b77dece7e..cf77da7e3 100644
--- a/csv/applications/csv-time-stamp.cpp
+++ b/csv/applications/csv-time-stamp.cpp
@@ -40,7 +40,6 @@
 #include <string>
 #include <boost/optional.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/format.h"
 
@@ -62,7 +61,6 @@ static void usage()
     std::cerr << "    cat input.bin | csv-time-stamp --binary=3ui" << std::endl;
     std::cerr << "    cat input.bin | csv-time-stamp --size=12" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( -1 );
 }
diff --git a/csv/applications/csv-time.cpp b/csv/applications/csv-time.cpp
index 887db2cfb..8c585df14 100644
--- a/csv/applications/csv-time.cpp
+++ b/csv/applications/csv-time.cpp
@@ -1,35 +1,6 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
-/// @author vsevolod vlaskine
-/// @author mathew hounsell
+/// @authors vsevolod vlaskine mathew hounsell
 
 #include <string.h>
 #include <time.h>
@@ -43,7 +14,6 @@
 #include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/date_time/local_time/local_time.hpp>
 #include <boost/date_time/c_local_time_adjustor.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
@@ -54,57 +24,55 @@
 
 static void usage( bool )
 {
-    static char const * const msg_general =
-        "\n"
-        "\nConvert between a couple of common time representation"
-        "\n"
-        "\nUsage:"
-        "\n    cat log.csv | csv-time <options> > converted.csv"
-        "\n"
-        "\nOptions"
-        "\n    --from <what>: input format: any, iso, seconds, sql, xsd, local; default iso"
-        "\n    --to <what>: output format: iso, seconds, sql, xsd, local; default iso"
-        "\n    --delimiter,-d <delimiter> : default: ','"
-        "\n    --fields <fields> : time field names or field numbers as in \"cut\""
-        "\n                        e.g. \"1,5,7\" or \"a,b,,d\""
-        "\n                        defaults to \"a\" (first field only is datetime)"
-        "\n    --empty-as-not-a-date-time,--accept-empty,-e: if time field is empty, consider it as not-a-date-time"
-        "\n"
-        "\nNote: no --binary option, do not use this utility on binary; instead read as unsigned long-long (time in microseconds)"
-        "\n"
-        "\nTime formats"
-        "\n    - any, guess"
-        "\n            a special input format - try to convert from all those supported,"
-        "\n            default input format, will be slower"
-        "\n    - format"
-        "\n            user given time format, for e.g 'format;%Y%m%dT%H%M%S' will also convert to/from iso format"
-        "\n            see man date for details about time format specifications"
-        "\n    - iso, iso-8601-basic"
-        "\n            YYYYMMDDTHHMMSS.FFFFFF, e.g. 20140101T001122.333000"
-        "\n    - iso-always-with-fractions"
-        "\n            YYYYMMDDTHHMMSS.FFFFFF"
-        "\n            output 20140101T000000.000000, not 20140101T000000"
-        "\n    - local"
-        "\n            same as iso but converts from/to local time adjusted using current machine settings"
-        "\n    - microseconds, us"
-        "\n            microseconds since UNIX epoch as integer"
-        "\n    - seconds"
-        "\n            seconds since UNIX epoch as double"
-        "\n    - sql, posix, ieee-std-1003.1"
-        "\n            e.g. 2014-01-01 00:11:22"
-        "\n    - xsd, iso-8601-extended"
-        "\n            used in xsd:dateTime, xs:dateTime, gml and derivatives"
-        "\n            e.g. 2014-12-25T00:00:00.000Z"
-        "\n                 2014-12-25T00:00:00.000+11:00"
-        "\n                 2014-12-25T00:00:00.000+1100"
-        "\n                 2014-12-25T00:00:00.000+11"
-        "\n"
-        "\nDeprecated options:"
-        "\n    --to-seconds,--sec,-s: iso input expected; use --from, --to"
-        "\n    --to-iso-string,--iso,-i: input as seconds expected; use --from, --to"
-        "\n"
-        "\n";
-    std::cerr << msg_general << comma::contact_info << std::endl << std::endl;
+    std::cerr << "\n"
+                 "\nConvert between a couple of common time representation"
+                 "\n"
+                 "\nUsage:"
+                 "\n    cat log.csv | csv-time <options> > converted.csv"
+                 "\n"
+                 "\nOptions"
+                 "\n    --from <what>: input format: any, iso, seconds, sql, xsd, local; default iso"
+                 "\n    --to <what>: output format: iso, seconds, sql, xsd, local; default iso"
+                 "\n    --delimiter,-d <delimiter> : default: ','"
+                 "\n    --fields <fields> : time field names or field numbers as in \"cut\""
+                 "\n                        e.g. \"1,5,7\" or \"a,b,,d\""
+                 "\n                        defaults to \"a\" (first field only is datetime)"
+                 "\n    --empty-as-not-a-date-time,--accept-empty,-e: if time field is empty, consider it as not-a-date-time"
+                 "\n"
+                 "\nNote: no --binary option, do not use this utility on binary; instead read as unsigned long-long (time in microseconds)"
+                 "\n"
+                 "\nTime formats"
+                 "\n    - any, guess"
+                 "\n            a special input format - try to convert from all those supported,"
+                 "\n            default input format, will be slower"
+                 "\n    - format"
+                 "\n            user given time format, for e.g 'format;%Y%m%dT%H%M%S' will also convert to/from iso format"
+                 "\n            see man date for details about time format specifications"
+                 "\n    - iso, iso-8601-basic"
+                 "\n            YYYYMMDDTHHMMSS.FFFFFF, e.g. 20140101T001122.333000"
+                 "\n    - iso-always-with-fractions"
+                 "\n            YYYYMMDDTHHMMSS.FFFFFF"
+                 "\n            output 20140101T000000.000000, not 20140101T000000"
+                 "\n    - local"
+                 "\n            same as iso but converts from/to local time adjusted using current machine settings"
+                 "\n    - microseconds, us"
+                 "\n            microseconds since UNIX epoch as integer"
+                 "\n    - seconds"
+                 "\n            seconds since UNIX epoch as double"
+                 "\n    - sql, posix, ieee-std-1003.1"
+                 "\n            e.g. 2014-01-01 00:11:22"
+                 "\n    - xsd, iso-8601-extended"
+                 "\n            used in xsd:dateTime, xs:dateTime, gml and derivatives"
+                 "\n            e.g. 2014-12-25T00:00:00.000Z"
+                 "\n                 2014-12-25T00:00:00.000+11:00"
+                 "\n                 2014-12-25T00:00:00.000+1100"
+                 "\n                 2014-12-25T00:00:00.000+11"
+                 "\n"
+                 "\nDeprecated options:"
+                 "\n    --to-seconds,--sec,-s: iso input expected; use --from, --to"
+                 "\n    --to-iso-string,--iso,-i: input as seconds expected; use --from, --to"
+                 "\n"
+                 "\n";
     exit( 0 );
 }
 
@@ -187,11 +155,8 @@ static what_t what( const std::string& option, const comma::command_line_options
 static boost::posix_time::ptime from_string_xsd( const std::string& s )
 {
     std::string t = s;
-
-    // Set the delimiter between date and time to be what time_from_string expects
-    const size_t idx_t = t.find( 'T' );
+    const size_t idx_t = t.find( 'T' ); // Set the delimiter between date and time to be what time_from_string expects
     if ( std::string::npos != idx_t ) t[idx_t] = ' ';
-
     // Determine the timezone offset. Could be any of Z,+-hh:mm,+-hhmm,+-hh
     signed hrs = 0;
     signed mins = 0;
@@ -220,7 +185,7 @@ static boost::posix_time::ptime from_string_xsd( const std::string& s )
     }
     // Construct the time from the string and apply the offset
     boost::posix_time::ptime result = boost::posix_time::time_from_string( t );
-    result += boost::posix_time::hours(hrs) + boost::posix_time::minutes(mins);
+    result += boost::posix_time::hours( hrs ) + boost::posix_time::minutes( mins );
     return result;
 }
 
@@ -388,7 +353,6 @@ namespace comma { namespace visiting {
 template <> struct traits< input_t >
 {
     template < typename K, typename V > static void visit( const K&, const input_t& p, V& v ) { v.apply( "values", p.values ); }
-
     template < typename K, typename V > static void visit( const K&, input_t& p, V& v ) { v.apply( "values", p.values ); }
 };
 
@@ -434,8 +398,7 @@ static void init_input()
         {
             fields += comma;
             comma = ",";
-            if( keep[i] )
-                fields += "values[" + boost::lexical_cast< std::string >( size++ ) + "]";
+            if( keep[i] ) { fields += "values[" + boost::lexical_cast< std::string >( size++ ) + "]"; }
         }
     }
     else
@@ -444,9 +407,7 @@ static void init_input()
         {
             fields += comma;
             comma = ",";
-
-            if( ! names[i].empty() )
-                fields += "values[" + boost::lexical_cast< std::string >( size++ ) + "]";
+            if( ! names[i].empty() ) { fields += "values[" + boost::lexical_cast< std::string >( size++ ) + "]"; }
         }
     }
 
diff --git a/csv/applications/csv-to-bin.cpp b/csv/applications/csv-to-bin.cpp
index acf8ed667..22c8d024a 100644
--- a/csv/applications/csv-to-bin.cpp
+++ b/csv/applications/csv-to-bin.cpp
@@ -38,7 +38,6 @@
 
 #include <stdlib.h>
 #include <iostream>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../csv/format.h"
 #include "../../string/string.h"
@@ -58,7 +57,6 @@ static void usage( bool )
     std::cerr << std::endl;
     std::cerr << csv::format::usage() << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/csv/applications/csv-units.cpp b/csv/applications/csv-units.cpp
index c2bf85f77..de79a13e3 100644
--- a/csv/applications/csv-units.cpp
+++ b/csv/applications/csv-units.cpp
@@ -53,7 +53,6 @@
 #include <boost/units/base_units/angle/degree.hpp>
 
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
 #include "../../visiting/traits.h"
@@ -114,7 +113,6 @@ static void usage(char const * const txt = "")
     std::cerr << msg_general << std::endl; // endl to make this function easier to debug by flushing
     std::cerr << "\ncsv options\n" << comma::csv::options::usage() << std::endl;
     std::cerr << msg_examples << std::endl;
-    std::cerr << '\n' << comma::contact_info << '\n' << std::endl;
     exit( 1 );
 }
 
diff --git a/io/applications/io-bandwidth.cpp b/io/applications/io-bandwidth.cpp
index 86ebfef73..f774f9ec3 100644
--- a/io/applications/io-bandwidth.cpp
+++ b/io/applications/io-bandwidth.cpp
@@ -36,7 +36,6 @@
 #include <boost/circular_buffer.hpp>
 #include <boost/thread.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../io/select.h"
 #include "../../io/stream.h"
 
@@ -105,7 +104,6 @@ void usage( bool verbose = false )
     std::cerr << "            dd if=/dev/urandom bs=100 count=1 2> /dev/null; sleep 0.1" << std::endl;
     std::cerr << "        done | io-bandwidth 2> >( io-publish tcp:8888 ) | hexdump" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/io/applications/io-buffer.cpp b/io/applications/io-buffer.cpp
index f2901cfb4..23cbf7d78 100644
--- a/io/applications/io-buffer.cpp
+++ b/io/applications/io-buffer.cpp
@@ -48,7 +48,6 @@
 #include <boost/interprocess/sync/scoped_lock.hpp>
 #include <boost/algorithm/string.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../io/stream.h"
@@ -102,7 +101,6 @@ void usage( bool verbose = false )
     std::cerr << "          See 'out' operation, in this mode, the program write to standard output and exits when buffer is full." << std::endl;
     std::cerr << "          Call io-buffer multiple times to read more input data." << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 0e85ec4e7..ad2e13d68 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -40,7 +40,6 @@
 #include <boost/scoped_ptr.hpp>
 #include <boost/thread.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
@@ -104,7 +103,6 @@ void usage( bool verbose = false )
     std::cerr << "        merge line-based input with stdin" << std::endl;
     std::cerr << "            echo hello | io-cat tcp:localhost:55555 -" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/io/applications/io-line.cpp b/io/applications/io-line.cpp
index 3194ea6f9..db471345c 100644
--- a/io/applications/io-line.cpp
+++ b/io/applications/io-line.cpp
@@ -38,7 +38,6 @@
 #include <string>
 #include <vector>
  
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 
@@ -79,7 +78,7 @@ void usage( bool const verbose = false )
         "\n    ( echo xxx ; echo yy ; echo zzzz ) | io-line length | while true ; do echo 'read line:' ; io-line get || break ; done"
         "\n"
         "\n";
-    std::cerr << message << comma::contact_info << '\n' << std::endl;
+    std::cerr << message << std::endl;
     std::exit( 0 );
 }
 
diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index bda3ad29f..06a7a9908 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -39,7 +39,6 @@
 #include <boost/ptr_container/ptr_vector.hpp>
 #include <boost/scoped_ptr.hpp>
 #include <boost/thread.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../application/signal_flag.h"
 #include "../../base/last_error.h"
@@ -109,7 +108,6 @@ static void usage( bool verbose = false )
     std::cerr << "    io-publish tcp:1234 --size 24000 --on-demand --exec \"camera-cat arg1 arg2\"" << std::endl;
     std::cerr << "    io-publish tcp:1234 --size 24000 --on-demand -- camera-cat arg1 arg2" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index 232079a86..f15a61114 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -39,7 +39,6 @@
 #include <boost/asio/ip/udp.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/noncopyable.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../base/types.h"
 #include "../../csv/format.h"
@@ -60,7 +59,6 @@ void usage()
     std::cerr << "    --reuse-addr,--reuseaddr: reuse udp address/port" << std::endl;
     std::cerr << "    --timestamp: output packet timestamp (currently just system time)" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 1 );
 }
diff --git a/io/applications/zero-cat.cpp b/io/applications/zero-cat.cpp
index 52ac3750a..acec1baf2 100644
--- a/io/applications/zero-cat.cpp
+++ b/io/applications/zero-cat.cpp
@@ -41,7 +41,6 @@
 #include <boost/array.hpp>
 #include <boost/program_options.hpp>
 #include <boost/thread.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../io/publisher.h"
 #include "../../string/string.h"
@@ -116,7 +115,6 @@ void usage( boost::program_options::options_description const & description, boo
                  "\n        If outputting messages to a single pipe it is better to keep zero-cat"
                  "\n        running to minimise load and maximise throughput."
                  "\n"
-                << comma::contact_info
                 << std::endl;
 }
 
diff --git a/name_value/applications/name-value-convert.cpp b/name_value/applications/name-value-convert.cpp
index 6c0ac8d18..1aab4213f 100644
--- a/name_value/applications/name-value-convert.cpp
+++ b/name_value/applications/name-value-convert.cpp
@@ -40,7 +40,6 @@
 #include <boost/regex.hpp>
 #include <boost/version.hpp>
 #include "../../base/exception.h"
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../name_value/ptree.h"
 #include "../../name_value/serialize.h"
@@ -88,7 +87,6 @@ static void usage( bool verbose = false )
     std::cerr << "    --linewise,-l: if present, treat each input line as a record" << std::endl;
     std::cerr << "                   if absent, treat all of the input as one record" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 1 );
 }
diff --git a/name_value/applications/name-value-from-csv.cpp b/name_value/applications/name-value-from-csv.cpp
index a6302d60a..a5cb18ffc 100644
--- a/name_value/applications/name-value-from-csv.cpp
+++ b/name_value/applications/name-value-from-csv.cpp
@@ -31,7 +31,6 @@
 
 #include <iostream>
 #include <boost/lexical_cast.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../string/split.h"
 
@@ -82,7 +81,6 @@ static void usage( bool verbose = false )
     std::cerr << "    a[1]/foo/bar/baz[\"aa\"]/c=3" << std::endl;
     std::cerr << "    a[4]/foo/bar/baz[\"bb\"]/c=6" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/name_value/applications/name-value-get.cpp b/name_value/applications/name-value-get.cpp
index 17600b684..e4570b68f 100644
--- a/name_value/applications/name-value-get.cpp
+++ b/name_value/applications/name-value-get.cpp
@@ -39,7 +39,6 @@
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/regex.hpp>
 #include "../../base/exception.h"
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../name_value/ptree.h"
 #include "../../name_value/serialize.h"
@@ -89,7 +88,6 @@ static void usage( bool verbose = false )
     std::cerr << "    --linewise,-l: if present, treat each input line as a record" << std::endl;
     std::cerr << "                   if absent, treat all of the input as one record" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 1 );
 }
diff --git a/name_value/applications/name-value-permute.cpp b/name_value/applications/name-value-permute.cpp
index bd845f266..43148e1a7 100644
--- a/name_value/applications/name-value-permute.cpp
+++ b/name_value/applications/name-value-permute.cpp
@@ -32,7 +32,6 @@
 #include <boost/lexical_cast.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include "../../base/exception.h"
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../string/split.h"
 
@@ -68,7 +67,6 @@ static void usage( bool verbose = false )
     std::cerr << "          string=\"a,\";b;c" << std::endl;
     std::cerr << "          unchanged=unchanged' | name-value-permute --stdout --delimiter=';'" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/util/applications/comma-timeout-group.cpp b/util/applications/comma-timeout-group.cpp
index 555e7a3fc..5ab4eceed 100644
--- a/util/applications/comma-timeout-group.cpp
+++ b/util/applications/comma-timeout-group.cpp
@@ -47,7 +47,6 @@
 #include <boost/lexical_cast.hpp>
 #include <boost/assign/list_of.hpp>
 
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
@@ -183,7 +182,6 @@ void usage( bool )
         "\n            exit with error"
         "\n"
         "\n";
-    std::cerr << msg_general << comma::contact_info << std::endl << std::endl;
     exit( 0 );
 }
 

From 79ea52bedcc7cafaa3ce3e9f0535aa815cc1de2e Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 11:05:00 +1100
Subject: [PATCH 0244/1056] python/comma: numpy version check temporarily added
 to make csv-eval working on ubuntu 18.04 in which apt install python3-numpy
 installs numpy 1.13; this change makes csv-eval slower in ascii and thus it
 will be removed, once ubuntu 18.04 support is not required anymore

---
 python/comma/csv/stream.py | 7 +++++--
 python/comma/csv/time.py   | 2 ++
 2 files changed, 7 insertions(+), 2 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 4cb5015bc..ecdc5a2a7 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -44,6 +44,7 @@
 from .struct import struct
 
 DEFAULT_PRECISION = 12
+NUMPY_VERSION_MAJOR_, NUMPY_VERSION_MINOR_, NUMPY_VERSION_PATH_ = ( int( _ ) for _ in np.__version__.split( '.' ) )
 
 def custom_formatwarning(msg, *args): return __name__ + " warning: " + str(msg) + '\n'
 
@@ -134,7 +135,7 @@ def read(self, size=None):
         return self._struct_array(self._input_array, self.missing_values)
 
     def _genfromtxt( self ): # quick and dirty due to the ugliness of the change in numpy 1.14; see doc of encoding parameter in https://docs.scipy.org/doc/numpy-1.14.0/reference/generated/numpy.genfromtxt.html
-        if np.__version__ >= '1.14.0':
+        if NUMPY_VERSION_MAJOR_ >= 1 or NUMPY_VERSION_MINOR_ >= 14: # quick and dirty, since ubuntu 18.04 python3-numpy still install numpy 1.13; remove once move on with the version since it's waste of cpu cycles
             return np.genfromtxt( self._ascii_buffer
                                 , dtype = self.input_dtype
                                 , delimiter = self.delimiter
@@ -144,7 +145,9 @@ def _genfromtxt( self ): # quick and dirty due to the ugliness of the change in
                                 , comments = None
                                 , encoding = None )
         else:
-            return np.genfromtxt( self._ascii_buffer
+            # https://github.com/numpy/numpy/issues/10511 genfromtxt issue in numpy 1.13.x
+            from io import BytesIO
+            return np.genfromtxt( BytesIO( bytes( '\n'.join( self._ascii_buffer ).encode( 'utf-8' ) ) ) if major == 1 and minor == 13 else self._ascii_buffer
                                 , dtype = self.input_dtype
                                 , delimiter = self.delimiter
                                 , converters = self.ascii_converters
diff --git a/python/comma/csv/time.py b/python/comma/csv/time.py
index b1deaa33f..c11003f09 100644
--- a/python/comma/csv/time.py
+++ b/python/comma/csv/time.py
@@ -42,6 +42,7 @@
 POSITIVE_INFINITY = np.datetime64('294247-01-09T04:00:54.775807')
 NEGATIVE_INFINITY = np.datetime64('-290308-12-22T19:59:05.224191')
 BASESTRING = basestring if sys.version_info.major < 3 else str # sigh...
+NUMPY_VERSION_MAJOR_, NUMPY_VERSION_MINOR_, NUMPY_VERSION_PATH_ = ( int( _ ) for _ in np.__version__.split( '.' ) )
 
 def is_undefined(numpy_time): return str(numpy_time) == str(NOT_A_DATE_TIME)
 
@@ -65,6 +66,7 @@ def to_numpy(t):
     >>> to_numpy('')
     numpy.datetime64('NaT')
     """
+    if NUMPY_VERSION_MAJOR_ == 1 and NUMPY_VERSION_MINOR_ < 14 and isinstance( t, bytes ): t = t.decode( 'utf-8' ) # quick and dirty, since ubuntu 18.04 python3-numpy still install numpy 1.13; remove once move on with the version since it's waste of cpu cycles
     if t in ['', 'not-a-date-time']: return NOT_A_DATE_TIME
     if t in ['+infinity', '+inf', 'infinity', 'inf']: return POSITIVE_INFINITY
     if t in ['-infinity', '-inf']: return NEGATIVE_INFINITY

From fc5902db46238861704469b9b44ecbfb24b5e15c Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 11:08:49 +1100
Subject: [PATCH 0245/1056] python/comma/csv: a minor bug fixed

---
 python/comma/csv/stream.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index ecdc5a2a7..ebe0375d5 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -135,7 +135,7 @@ def read(self, size=None):
         return self._struct_array(self._input_array, self.missing_values)
 
     def _genfromtxt( self ): # quick and dirty due to the ugliness of the change in numpy 1.14; see doc of encoding parameter in https://docs.scipy.org/doc/numpy-1.14.0/reference/generated/numpy.genfromtxt.html
-        if NUMPY_VERSION_MAJOR_ >= 1 or NUMPY_VERSION_MINOR_ >= 14: # quick and dirty, since ubuntu 18.04 python3-numpy still install numpy 1.13; remove once move on with the version since it's waste of cpu cycles
+        if NUMPY_VERSION_MAJOR_ > 1 or NUMPY_VERSION_MINOR_ >= 14: # quick and dirty, since ubuntu 18.04 python3-numpy still install numpy 1.13; remove once move on with the version since it's waste of cpu cycles
             return np.genfromtxt( self._ascii_buffer
                                 , dtype = self.input_dtype
                                 , delimiter = self.delimiter

From 068d71e31afe6efb729cce391633e2d967d1fb74 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 11:23:34 +1100
Subject: [PATCH 0246/1056] system/package/readme: typo fixed

---
 system/package/readme | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/readme b/system/package/readme
index c677fb934..316c27bb4 100644
--- a/system/package/readme
+++ b/system/package/readme
@@ -15,5 +15,5 @@ debian package will be built in your current directory
 
 test that package is ok, e.g:
 
-> ./comma-package-docker-test 20.04 comma-1.0.0-Linux.deb
+> ./comma-package-docker-test 20.04 comma-1.0.0-Linux.deb python3-comma_1.0.0-1_all.deb
 

From 3ddb1e244188ab8a0eee96cc6142d6515556a76e Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 11:25:08 +1100
Subject: [PATCH 0247/1056] system/package/comma-package-docker-test: typo
 fixed

---
 system/package/comma-package-docker-test | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/comma-package-docker-test b/system/package/comma-package-docker-test
index d23128cc2..3c9eb490e 100755
--- a/system/package/comma-package-docker-test
+++ b/system/package/comma-package-docker-test
@@ -6,7 +6,7 @@ ubuntu_version="$1"
 package="$2"
 python_package="$3"
 comma_dir="$4"
-[[ -n "$package" ]] || { echo "usage: $0 <ubuntu version> <package> <python package> [<comma dir>]" >&2; exit 1; }
+[[ -n "$python_package" ]] || { echo "usage: $0 <ubuntu version> <package> <python package> [<comma dir>]" >&2; exit 1; }
 [[ -s "$package" ]] || die "file not found or empty: '$package'"
 [[ -s "$python_package" ]] || die "file not found or empty: '$python_package'"
 [[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"

From 2351d8b7cc62fb2ef74846ce14ae1939fcec6b84 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 11:26:41 +1100
Subject: [PATCH 0248/1056] system/package/comma-package-test: removed manual
 numpy installation with pip3

---
 system/package/comma-package-test | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index 5eeb97f23..615d9bd81 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -5,7 +5,7 @@ function die() { echo "$0: $@" >&2; exit 1; }
 package="$1"
 python_package="$2"
 [[ -n "$python_package" ]] || { echo "usage: $0 <package> <python package>" >&2; exit 1; }
-pip3 install numpy # todo! very unfortunate, but python deb package installs python3-numpy, which is wrong version and we gave up for now
+#pip3 install numpy # todo! very unfortunate, but python deb package installs python3-numpy, which is wrong version and we gave up for now
 apt install --yes "$python_package" || die "failed to install package '$python_package'"
 apt install --yes "$package" || die "failed to install package '$package'"
 

From ae0014f5d3f4fcd56d35dfda1feb291987bb4623 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 11:43:34 +1100
Subject: [PATCH 0249/1056] system/package: trying to make it work for ubuntu
 18.04 with numpy 1.13...

---
 python/comma/csv/stream.py        | 29 +----------------------------
 python/comma/csv/time.py          | 29 +----------------------------
 system/package/comma-package-test |  2 +-
 3 files changed, 3 insertions(+), 57 deletions(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index ebe0375d5..99aafe877 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -1,31 +1,4 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import print_function
 import copy
@@ -44,7 +17,7 @@
 from .struct import struct
 
 DEFAULT_PRECISION = 12
-NUMPY_VERSION_MAJOR_, NUMPY_VERSION_MINOR_, NUMPY_VERSION_PATH_ = ( int( _ ) for _ in np.__version__.split( '.' ) )
+NUMPY_VERSION_MAJOR_, NUMPY_VERSION_MINOR_, NUMPY_VERSION_PATCH_ = ( int( _ ) for _ in np.__version__.split( '.' ) )
 
 def custom_formatwarning(msg, *args): return __name__ + " warning: " + str(msg) + '\n'
 
diff --git a/python/comma/csv/time.py b/python/comma/csv/time.py
index c11003f09..742773092 100644
--- a/python/comma/csv/time.py
+++ b/python/comma/csv/time.py
@@ -1,31 +1,4 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import absolute_import
 import numpy as np
@@ -42,7 +15,7 @@
 POSITIVE_INFINITY = np.datetime64('294247-01-09T04:00:54.775807')
 NEGATIVE_INFINITY = np.datetime64('-290308-12-22T19:59:05.224191')
 BASESTRING = basestring if sys.version_info.major < 3 else str # sigh...
-NUMPY_VERSION_MAJOR_, NUMPY_VERSION_MINOR_, NUMPY_VERSION_PATH_ = ( int( _ ) for _ in np.__version__.split( '.' ) )
+NUMPY_VERSION_MAJOR_, NUMPY_VERSION_MINOR_, NUMPY_VERSION_PATCH_ = ( int( _ ) for _ in np.__version__.split( '.' ) )
 
 def is_undefined(numpy_time): return str(numpy_time) == str(NOT_A_DATE_TIME)
 
diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index 615d9bd81..c06d6cc21 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -20,7 +20,7 @@ type -p comma-application-util || die "failed: failed"
 echo "$0: testing bash utils: done"
 
 echo "$0: testing csv-eval..."
-output=$( csv-paste line-number | head | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"
+output=$( seq 0 9 | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"
 expected=$( seq 1 10 )
 [[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
 echo "$0: testing csv-eval: done"

From 80bbe096c543227ea8068a00db8bd0db32ffa9f7 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 11:53:05 +1100
Subject: [PATCH 0250/1056] numpy version added to --help, since it has been
 causing so much pain

---
 python/comma/csv/applications/csv_eval.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index a6abff2af..1d406afd9 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -15,7 +15,8 @@
 
 description = """
 evaluate numerical expressions and append computed values to csv stream
-"""
+
+using numpy version """ + np.__version__ + "\n"
 
 notes_and_examples = """
 input fields:

From 397bf1e210c0dbbc37664123d5806a6b00d9345b Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 11:56:40 +1100
Subject: [PATCH 0251/1056] numpy version added to --help, since it has been
 causing so much pain

---
 system/package/comma-package-test | 13 ++++++++-----
 1 file changed, 8 insertions(+), 5 deletions(-)

diff --git a/system/package/comma-package-test b/system/package/comma-package-test
index c06d6cc21..250fe74f9 100755
--- a/system/package/comma-package-test
+++ b/system/package/comma-package-test
@@ -9,18 +9,21 @@ python_package="$2"
 apt install --yes "$python_package" || die "failed to install package '$python_package'"
 apt install --yes "$package" || die "failed to install package '$package'"
 
-echo "$0: testing basic csv utilities..."
+echo "$0: testing basic csv utilities..." >&2
 output=$( csv-paste line-number | head | csv-to-bin ui | csv-from-bin ui ) || die "failed: failed to run"
 expected=$( seq 0 9 )
 [[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
-echo "$0: testing basic csv utilities: done"
+echo "$0: testing basic csv utilities: done" >&2
 
 echo "$0: testing bash utils..."
 type -p comma-application-util || die "failed: failed"
-echo "$0: testing bash utils: done"
+echo "$0: testing bash utils: done" >&2
 
-echo "$0: testing csv-eval..."
+echo "$0: running csv-eval --help (for reference)..." >&2
+csv-eval --help
+
+echo "$0: testing csv-eval..." >&2
 output=$( seq 0 9 | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"
 expected=$( seq 1 10 )
 [[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
-echo "$0: testing csv-eval: done"
+echo "$0: testing csv-eval: done" >&2

From f323ca2beafa0eb065a122db253ee15520370625 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 12:00:46 +1100
Subject: [PATCH 0252/1056] system/package: trying to make it work for ubuntu
 18.04 with numpy 1.13...

---
 python/comma/csv/stream.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/comma/csv/stream.py b/python/comma/csv/stream.py
index 99aafe877..3bdc89b81 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/stream.py
@@ -120,7 +120,7 @@ def _genfromtxt( self ): # quick and dirty due to the ugliness of the change in
         else:
             # https://github.com/numpy/numpy/issues/10511 genfromtxt issue in numpy 1.13.x
             from io import BytesIO
-            return np.genfromtxt( BytesIO( bytes( '\n'.join( self._ascii_buffer ).encode( 'utf-8' ) ) ) if major == 1 and minor == 13 else self._ascii_buffer
+            return np.genfromtxt( BytesIO( bytes( '\n'.join( self._ascii_buffer ).encode( 'utf-8' ) ) ) if NUMPY_VERSION_MAJOR_ == 1 and NUMPY_VERSION_MINOR_ == 13 else self._ascii_buffer
                                 , dtype = self.input_dtype
                                 , delimiter = self.delimiter
                                 , converters = self.ascii_converters

From 8cd000649ca385cd839ccf0853f40d7a17e83427 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Nov 2020 12:26:49 +1100
Subject: [PATCH 0253/1056] system/package: fixing packaging for ubuntu 20.04

---
 system/package/Dockerfile | 1 +
 1 file changed, 1 insertion(+)

diff --git a/system/package/Dockerfile b/system/package/Dockerfile
index 8c868912a..f9e25ee2c 100644
--- a/system/package/Dockerfile
+++ b/system/package/Dockerfile
@@ -6,5 +6,6 @@ RUN apt update \
     && apt install --yes ansible git build-essential cmake cmake-curses-gui python3-pip
 RUN apt install --yes python3-stdeb
 RUN apt install --yes python3-all
+RUN apt install --yes dh-python
 
 # && apt-add-repository --yes --update ppa:ansible/ansible \

From 38e50362f0b8ccdb1a34e63e59980b314cb3b662 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 3 Nov 2020 22:27:12 +1100
Subject: [PATCH 0254/1056] io-line, io-console: --help fixed

---
 io/applications/io-console.cpp | 29 +----------------------------
 io/applications/io-line.cpp    | 29 +----------------------------
 2 files changed, 2 insertions(+), 56 deletions(-)

diff --git a/io/applications/io-console.cpp b/io/applications/io-console.cpp
index 5ff2525d8..4e8206310 100644
--- a/io/applications/io-console.cpp
+++ b/io/applications/io-console.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <termios.h>
 #include <iostream>
@@ -51,7 +24,7 @@ int main( int argc, char** argv )
 
         if ( vm.count( "help" ) )
         {
-            std::cerr << "take arrow keys, output key numeric values to stdout" << std::endl;
+            std::cerr << "take key presses, output key numeric values to stdout" << std::endl;
             std::cerr << "usage: io-console [<options>]" << std::endl;
             std::cerr << description << std::endl;
             return 1;
diff --git a/io/applications/io-line.cpp b/io/applications/io-line.cpp
index db471345c..7617634f0 100644
--- a/io/applications/io-line.cpp
+++ b/io/applications/io-line.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author mathew hounsell
 
@@ -43,7 +16,7 @@
 
 void usage( bool const verbose = false )
 {
-    static char const * const message =
+    std::cerr <<
         "\n"
         "\nA toolkit for quick access to ascii line-based input stream"
         "\n"

From 48431a964131b0c5992be4ad198bae9bf50c42f4 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 4 Nov 2020 00:06:40 +1100
Subject: [PATCH 0255/1056] name-value-calc: --help fixed

---
 name_value/applications/name-value-calc | 78 +++++++------------------
 1 file changed, 20 insertions(+), 58 deletions(-)

diff --git a/name_value/applications/name-value-calc b/name_value/applications/name-value-calc
index 0dc525d72..261d85d78 100755
--- a/name_value/applications/name-value-calc
+++ b/name_value/applications/name-value-calc
@@ -1,51 +1,22 @@
 #!/bin/bash
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 name=$( basename $0 )
 
-source $( which comma-application-util ) || { echo "$name: cannot source 'comma-application-util'" >&2; exit 1; }
+source $( type -p comma-application-util )
 
 simple_usage()
 {
-    cat <<EOF
-Usage: $name <file1> <file2> ... [--add|--sub|--other-operations] [-h|--help]
-       ${name//?/ } [--json] [--strict] [--details] [--exclude path]
-EOF
-    if [[ $# != 0 ]]; then exit $1; fi
+    cat <<eof >&2
+Usage: name-value-calc <file1> <file2> ... [--add|--sub|--other-operations] [-h|--help] [--json] [--strict] [--details] [--exclude <path>]
+eof
 }
 
 usage()
 {
     simple_usage
-    cat >&2 <<EOF
+    cat <<eof >&2
 
 Perform simple calculations on corresponding values in multiple name=value or .json input files.
 
@@ -89,40 +60,36 @@ Notes on comparison:
 
 Examples:
 
-    $name f1 f2 f3 --add
+    name-value-calc f1 f2 f3 --add
         -- add all values in f1, f2 and f3
 
-    $name f1.json --sub f2.json --json
+    name-value-calc f1.json --sub f2.json --json
         -- subtract all values in f2.json from f1.json (output in .json format)
 
-    $name f1.json f2.json --sub --json
+    name-value-calc f1.json f2.json --sub --json
         -- same as above; placement of the operation option does not matter
 
-    v=\$( $name f1 f2 --less )
+    v=\$( name-value-calc f1 f2 --less )
         -- capture the comparison result in a variable; v is 1 if comparison is true
 
-    (( $($name f1 --less f2) == 1 )) && echo "f1 < f2" || echo "f1 is not < f2"
+    (( \$( name-value-calc f1 --less f2 ) == 1 )) && echo "f1 < f2" || echo "f1 is not < f2"
         -- compares values in f1 and f2 and reports the outcome
 
-    $name f1 f2 --sub --strict > outfile
-    (( $? == 0 )) || exit 1
+    name-value-calc f1 f2 --sub --strict > outfile
+    (( \$? == 0 )) || exit 1
         -- will fail if the first input file contains string data (operation '-' is not
            defined for strings)
 
-    $name f1 f2 --sub --strict --exclude "path/to/string" > outfile
+    name-value-calc f1 f2 --sub --strict --exclude "path/to/string" > outfile
         -- specifically exclude a specified data path from the operation, e.g., because
            the '-' operation is not defined for strings
 
-EOF
-    if [[ $# != 0 ]]; then exit $1; fi
+eof
+    exit
 }
 
-function bye()
-{
-    if [[ -z $1 ]] ; then exit 1 ; else exit $1; fi
-}
+function bye() { [[ -n "$1" ]] || exit 1; exit $1; } # exit with status $1; default to 1 when no status is given
 
-# arguments are an error message to print
 function die()
 {
     echo "$name: $*" >&2
@@ -134,12 +101,7 @@ function inlist()
 {
     local value="$1"
     local list="$2"
-    local c
-    for c in $list ; do
-        if [[ "$c" == "$value" ]]; then
-            return 0
-        fi
-    done
+    for c in $list ; do [[ "$c" != "$value" ]] || return 0; done
     return 1
 }
 
@@ -241,7 +203,7 @@ function invert_grep()
     echo $?
 }
 
-if [[ $# == 0 ]]; then simple_usage 1; fi
+[[ $# > 0 ]] || { simple_usage; exit 1; }
 
 input_files=()
 operation=
@@ -253,7 +215,7 @@ debug=1
 
 while [[ $# -gt 0 ]]; do
     case "$1" in
-        -h|--help)                usage 0;;
+        -h|--help)                usage;;
         --add)                    operation="+";;
         --sub|--subtract)         operation="-";;
         --mul|--mult|--multiply)  operation="*";;
@@ -281,7 +243,7 @@ done
 binary_operands=( "-" "/" "//" "<" "<=" ">" ">=" "==" "!=" )
 logical_operands=( "<" "<=" ">" ">=" "==" "!=" )
 
-if [[ ${#input_files[@]} == 0 ]]; then simple_usage 1; fi
+[[ ${#input_files[@]} != 0 ]] || { simple_usage; exit 1; }
 if [[ ${#input_files[@]} == 1 ]]; then echo "$name: at least two input files required" >&2; exit 1; fi
 if [[ -z "$operation" ]]; then echo "$name: operation must be specified (e.g. --subtract)" >&2; exit 1; fi
 if binary_op "$operation" && [[ ${#input_files[@]} > 2 ]]; then echo "$name: only two input files permitted with $operation operation"; exit 1; fi

From 7969c4f9fc5c079fd5c280c36a533855921c22a4 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 6 Nov 2020 11:12:11 +1100
Subject: [PATCH 0256/1056] name-value-apply: --help improved

---
 name_value/applications/name-value-apply | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/name_value/applications/name-value-apply b/name_value/applications/name-value-apply
index d6d8a5ca3..a5f540966 100755
--- a/name_value/applications/name-value-apply
+++ b/name_value/applications/name-value-apply
@@ -23,7 +23,10 @@ function usage()
 {
     cat >&2 <<EOF
 
-derive a config from multiple input configs
+take multiple path-value inputs, apply on top of each other
+    
+e.g: assume we have a default config file and then the user would like to set just some values and leave
+     the rest as default; then we simply apply the user's config on top of default as in examples below
 
 usage
     name-value-apply [<options>] <files...>

From 35786d95cf9d650f73630f7e1eb79963328bcd52 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 Nov 2020 11:51:46 +1100
Subject: [PATCH 0257/1056] name-value-to-csv: --unindexed-stream implemented;
 a basic test added

---
 name_value/applications/name-value-to-csv.cpp | 52 +++++++------------
 .../unindexed_stream/expected                 |  5 ++
 .../unindexed_fields/unindexed_stream/input   |  1 +
 .../unindexed_fields/unindexed_stream/test    |  3 ++
 4 files changed, 28 insertions(+), 33 deletions(-)
 create mode 100644 name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected
 create mode 100644 name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input
 create mode 100755 name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/test

diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index d52114b4f..0abe2d4d9 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -1,31 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2020 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
@@ -52,6 +26,7 @@ static void usage( bool )
     std::cerr << "    --fields,-f=<fields>; fields to output" << std::endl;
     std::cerr << "    --prefix,--path,-p=[<prefix>]; optional prefix" << std::endl;
     std::cerr << "    --unindexed-fields=<fields>; if no --fields specified, output unindexed fields once, if --fields specified, append given unindexed fields to all records" << std::endl;
+    std::cerr << "    --unindexed-stream; read a stream of key-value pairs, on every input record output all up-to-date values of fields present in --unindexed-fields, see example below" << std::endl;
     std::cerr << "    --unsorted; the input data is not sorted by index" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
@@ -72,18 +47,24 @@ static void usage( bool )
     std::cerr << std::endl;
     std::cerr << "    unindexed fields" << std::endl;
     std::cerr << "        todo" << std::endl;
+    std::cerr << "    unindexed fields with --unindexed-stream" << std::endl;
+    std::cerr << "        > ( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream" << std::endl;
+    std::cerr << "        1," << std::endl;
+    std::cerr << "        1,3" << std::endl;
+    std::cerr << "        2,3" << std::endl;
+    std::cerr << "        2,4" << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
 
 typedef std::unordered_map< std::string, std::string > values_t;
 
-static std::string join( const std::vector< std::string >& fields, values_t& values, char delimiter )
+static std::string join( const std::vector< std::string >& fields, values_t& values, char delimiter, bool clear = true )
 {
     std::ostringstream oss;
     std::string comma;
     for( const auto& f: fields ) { oss << comma << values[f]; comma = delimiter; } // quick and dirty as everything else
-    values.clear();
+    if( clear ) { values.clear(); }
     return oss.str();
 }
 
@@ -92,10 +73,12 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
+        options.assert_mutually_exclusive( "--fields", "--unindexed-stream" );
         std::string fs = options.value< std::string >( "--fields,-f", "" );
         std::vector< std::string > fields = comma::split( fs, ',' );
         std::vector< std::string > unindexed_fields;
         std::string ufs = options.value< std::string >( "--unindexed-fields", "" );
+        bool unindexed_stream = options.exists( "--unindexed-stream" );
         std::unordered_set< std::string > unindexed_fields_set;
         if( !ufs.empty() )
         { 
@@ -105,8 +88,6 @@ int main( int ac, char** av )
         if( fields[0].empty() && unindexed_fields.empty() ) { std::cerr << "name-value-to-csv: please specify --fields or --unindexed-fields" << std::endl; return 1; }
         bool unindexed = fields[0].empty();
         values_t unindexed_values;
-        options.assert_mutually_exclusive( "--unsorted", "--unindexed,--no-index" );
-        options.assert_mutually_exclusive( "--unindexed,--no-index", "--unindexed-fields" );
         bool unsorted = options.exists( "--unsorted" );
         char delimiter = options.value( "--delimiter,-d", ',' );
         char equal_sign = options.value( "--equal-sign,-e", '=' );
@@ -122,7 +103,12 @@ int main( int ac, char** av )
             auto e = s.find_first_of( equal_sign ); // todo: use boost::spirit
             if( e == std::string::npos ) { std::cerr << "name-value-to-csv: expected path-value pair; got: '" << s << "'" << std::endl; return 1; }
             std::string name = s.substr( 0, e );
-            if( unindexed_fields_set.find( name ) != unindexed_fields_set.end() ) { unindexed_values[name] = s.substr( e + 1 ); continue; }
+            if( unindexed_fields_set.find( name ) != unindexed_fields_set.end() )
+            {
+                unindexed_values[name] = s.substr( e + 1 );
+                if( unindexed_stream ) { std::cout << join( unindexed_fields, unindexed_values, delimiter, false ) << std::endl; }
+                continue;
+            }
             if( name.substr( 0, prefix.size() ) != prefix ) { continue; }
             if( unindexed )
             {
@@ -141,7 +127,7 @@ int main( int ac, char** av )
             values[name.substr( b + 2 )] = s.substr( e + 1 );
             index = current_index;
         }
-        if( unindexed )
+        if( unindexed && !unindexed_stream )
         { 
             std::cout << join( unindexed_fields, unindexed_values, delimiter ) << std::endl;
         }
diff --git a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected
new file mode 100644
index 000000000..ff8f6058c
--- /dev/null
+++ b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected
@@ -0,0 +1,5 @@
+unindexed_stream/basics[0]/output/line[0]="1,"
+unindexed_stream/basics[0]/output/line[1]="1,3"
+unindexed_stream/basics[0]/output/line[2]="2,3"
+unindexed_stream/basics[0]/output/line[3]="2,4"
+unindexed_stream/basics[0]/status=0
diff --git a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input
new file mode 100644
index 000000000..f7a0dbf62
--- /dev/null
+++ b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input
@@ -0,0 +1 @@
+unindexed_stream/basics[0]="( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream"
\ No newline at end of file
diff --git a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/test b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/test
new file mode 100755
index 000000000..988ba14ee
--- /dev/null
+++ b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+comma_test_commands

From 03005b644da4b01e7ae7621a1087916007bb9096 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 Nov 2020 16:31:30 +1100
Subject: [PATCH 0258/1056] name-value-to-csv: --unindexed-stream-update
 implemented

---
 name_value/applications/name-value-to-csv.cpp    | 16 ++++++++++++----
 .../unindexed_fields/unindexed_stream/expected   | 12 +++++++++---
 .../unindexed_fields/unindexed_stream/input      |  3 ++-
 3 files changed, 23 insertions(+), 8 deletions(-)

diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index 0abe2d4d9..cadd823e4 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -26,7 +26,8 @@ static void usage( bool )
     std::cerr << "    --fields,-f=<fields>; fields to output" << std::endl;
     std::cerr << "    --prefix,--path,-p=[<prefix>]; optional prefix" << std::endl;
     std::cerr << "    --unindexed-fields=<fields>; if no --fields specified, output unindexed fields once, if --fields specified, append given unindexed fields to all records" << std::endl;
-    std::cerr << "    --unindexed-stream; read a stream of key-value pairs, on every input record output all up-to-date values of fields present in --unindexed-fields, see example below" << std::endl;
+    std::cerr << "    --unindexed-stream,--stream; read a stream of key-value pairs, on every input record output csv record with the field value set and other fields empty, see example below" << std::endl;
+    std::cerr << "    --unindexed-stream-update,--update; read a stream of key-value pairs, on every input record output all up-to-date values of fields present in --unindexed-fields, see example below" << std::endl;
     std::cerr << "    --unsorted; the input data is not sorted by index" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
@@ -50,6 +51,12 @@ static void usage( bool )
     std::cerr << "    unindexed fields with --unindexed-stream" << std::endl;
     std::cerr << "        > ( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream" << std::endl;
     std::cerr << "        1," << std::endl;
+    std::cerr << "        ,3" << std::endl;
+    std::cerr << "        2," << std::endl;
+    std::cerr << "        ,4" << std::endl;
+    std::cerr << "    unindexed fields with --unindexed-stream-update" << std::endl;
+    std::cerr << "        > ( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream-update" << std::endl;
+    std::cerr << "        1," << std::endl;
     std::cerr << "        1,3" << std::endl;
     std::cerr << "        2,3" << std::endl;
     std::cerr << "        2,4" << std::endl;
@@ -73,12 +80,13 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        options.assert_mutually_exclusive( "--fields", "--unindexed-stream" );
+        options.assert_mutually_exclusive( "--fields", "--unindexed-stream,--stream,--unindexed-stream-update,--update" );
         std::string fs = options.value< std::string >( "--fields,-f", "" );
         std::vector< std::string > fields = comma::split( fs, ',' );
         std::vector< std::string > unindexed_fields;
         std::string ufs = options.value< std::string >( "--unindexed-fields", "" );
-        bool unindexed_stream = options.exists( "--unindexed-stream" );
+        bool unindexed_stream_update = options.exists( "--unindexed-stream-update,--update" );
+        bool unindexed_stream = options.exists( "--unindexed-stream,--stream" ) || unindexed_stream_update;
         std::unordered_set< std::string > unindexed_fields_set;
         if( !ufs.empty() )
         { 
@@ -106,7 +114,7 @@ int main( int ac, char** av )
             if( unindexed_fields_set.find( name ) != unindexed_fields_set.end() )
             {
                 unindexed_values[name] = s.substr( e + 1 );
-                if( unindexed_stream ) { std::cout << join( unindexed_fields, unindexed_values, delimiter, false ) << std::endl; }
+                if( unindexed_stream ) { std::cout << join( unindexed_fields, unindexed_values, delimiter, !unindexed_stream_update ) << std::endl; }
                 continue;
             }
             if( name.substr( 0, prefix.size() ) != prefix ) { continue; }
diff --git a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected
index ff8f6058c..2d3b5bd94 100644
--- a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected
+++ b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected
@@ -1,5 +1,11 @@
 unindexed_stream/basics[0]/output/line[0]="1,"
-unindexed_stream/basics[0]/output/line[1]="1,3"
-unindexed_stream/basics[0]/output/line[2]="2,3"
-unindexed_stream/basics[0]/output/line[3]="2,4"
+unindexed_stream/basics[0]/output/line[1]=",3"
+unindexed_stream/basics[0]/output/line[2]="2,"
+unindexed_stream/basics[0]/output/line[3]=",4"
 unindexed_stream/basics[0]/status=0
+
+unindexed_stream/basics[1]/output/line[0]="1,"
+unindexed_stream/basics[1]/output/line[1]="1,3"
+unindexed_stream/basics[1]/output/line[2]="2,3"
+unindexed_stream/basics[1]/output/line[3]="2,4"
+unindexed_stream/basics[1]/status=0
diff --git a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input
index f7a0dbf62..20cea67ab 100644
--- a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input
+++ b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input
@@ -1 +1,2 @@
-unindexed_stream/basics[0]="( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream"
\ No newline at end of file
+unindexed_stream/basics[0]="( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream"
+unindexed_stream/basics[1]="( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream-update"
\ No newline at end of file

From eb15c7efabc655363530a10e5cece77ead376541 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 Nov 2020 17:08:20 +1100
Subject: [PATCH 0259/1056] comma-application-swiss-util: first cut done;
 debugging...

---
 bash/comma-application-swiss-util | 70 +++++++++++++++++++++++++++++++
 bash/comma-application-util       | 28 +------------
 2 files changed, 71 insertions(+), 27 deletions(-)
 create mode 100644 bash/comma-application-swiss-util

diff --git a/bash/comma-application-swiss-util b/bash/comma-application-swiss-util
new file mode 100644
index 000000000..08a620507
--- /dev/null
+++ b/bash/comma-application-swiss-util
@@ -0,0 +1,70 @@
+#!/bin/bash
+
+# Copyright (c) 2020 Vsevolod Vlaskine
+
+source $( type -p comma-application-util )
+
+function comma-application-swiss-init()
+{
+    local name=$( basename "$0" )
+    [[ -n "$1" ]] || { echo "$name: please specify operation" >&2; exit 1; }
+    comma_application_swiss_operation="$1"
+    if comma_options_help $@; then
+        if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
+            if [[ $( type -t usage ) == "function" ]]; then usage; else comma-application-swiss-usage; fi
+        else
+            echo
+            echo "usage: $( basename $0 ) ${comma_application_swiss_operation} [<options>]"
+            echo
+            comma-application-swiss-usage-operation "${comma_application_swiss_operation}"
+            echo
+        fi >&2
+        exit 0
+    fi
+    function say() { echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
+    function die() { say "$@"; exit 1; }
+    [[ $( type -t ${comma_application_swiss_operation}-run ) == "function" ]] || die "expected operation, got '${comma_application_swiss_operation}'" # quick and dirty
+    if [[ $( type -t common-options ) == "function" ]]; then
+        local options; options=$( common-options | comma-options-to-name-value "$@" ) || die "invalid options"
+        eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
+        #(( !options_verbose )) || verbose_option="--verbose"
+        #(( !options_input_fields )) || { eval "echo \$${operation//-/_}_input_fields"; exit 0; } # quick and dirty
+        #(( !options_input_format )) || { eval "echo \$${operation//-/_}_input_format"; exit 0; } # quick and dirty
+        #(( !options_output_fields )) || { eval "echo \$${operation//-/_}_output_fields"; exit 0; } # quick and dirty
+        #(( !options_output_format )) || { eval "echo \$${operation//-/_}_output_format"; exit 0; } # quick and dirty
+    fi
+    if [[ $( type -t ${comma_application_swiss_operation}-options ) == "function" ]]; then
+        local operation_options; operation_options=$( ${comma_application_swiss_operation}-options | comma-options-to-name-value "$@" ) || die "invalid options"
+        eval "$( grep -v '^"' <<< "$operation_options" | sed 's#^#options_#' | comma_path_value_mangle )"
+    fi
+}
+
+function comma-application-swiss-usage-operation()
+{
+    local operation="$1"
+    local found=0
+    echo "${comma_application_swiss_operation}"
+    [[ $( type -t ${comma_application_swiss_operation}-description ) != "function" ]] || { ${comma_application_swiss_operation}-description | sed 's#^#    #'; found=1; }
+    [[ $( type -t ${comma_application_swiss_operation}-usage ) != "function" ]] || { echo "    usage"; ${comma_application_swiss_operation}-usage | sed 's#^#        #'; found=1; }
+    [[ $( type -t common-options ) != "function" ]] || { echo "    common options"; common-options | sed 's#^#        #'; found=1; }
+    [[ $( type -t ${comma_application_swiss_operation}-options ) != "function" ]] || { echo "    options"; ${comma_application_swiss_operation}-options | sed 's#^#        #'; found=1; }
+    [[ $( type -t ${comma_application_swiss_operation}-examples ) != "function" ]] || { echo "    examples"; ${comma_application_swiss_operation}-examples | sed 's#^#        #'; found=1; }
+    (( ! found )) || return 0
+    echo "    expected operation, got: '${comma_application_swiss_operation}', see --help with no other options for more information"
+    return 1
+}
+
+function comma-application-swiss-usage()
+{
+    echo
+    echo "usage: $( basename "$0" ) <operation> <options>"
+    [[ $( type -t common-options ) != "function" ]] || { echo; echo "common options"; common-options | sed 's#^#   #'; }
+    echo; echo "available operations: $@"
+    echo; echo "operations"
+    for operation in $@; do
+        comma-application-swiss-usage-operation "${comma_application_swiss_operation}" | sed 's#^#    #'
+        echo
+    done
+}
+
+function comma-application-swiss-run() { ${comma_application_swiss_operation}-run "$@"; }
\ No newline at end of file
diff --git a/bash/comma-application-util b/bash/comma-application-util
index ab656d7b8..7e1bfa817 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -1,33 +1,7 @@
 #!/bin/bash
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+# Copyright (c) 2020 Vsevolod Vlaskine
 
 ## @page comma-application-util comma-application-util
 # this script is designed to be included in another script directly, for example:

From 7c37c3005e3486b18bc09a2e146f4699ef6c3722 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 Nov 2020 20:29:05 +1100
Subject: [PATCH 0260/1056] bash/cmake: comma-application-swiss-util made
 installable

---
 bash/CMakeLists.txt | 19 ++++++++++---------
 1 file changed, 10 insertions(+), 9 deletions(-)

diff --git a/bash/CMakeLists.txt b/bash/CMakeLists.txt
index 49d6ee611..31477f6e1 100644
--- a/bash/CMakeLists.txt
+++ b/bash/CMakeLists.txt
@@ -1,13 +1,14 @@
-INSTALL( PROGRAMS comma-application-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-log-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-name-value-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-progress-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-resources-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-sync-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-units-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-application-swiss-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-application-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-log-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-name-value-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-progress-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-resources-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-sync-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-units-util DESTINATION ${comma_INSTALL_BIN_DIR} )
 
 if( comma_BUILD_APPLICATIONS )
     add_subdirectory( applications )
 endif( comma_BUILD_APPLICATIONS )
-ADD_SUBDIRECTORY( process )
-ADD_SUBDIRECTORY( misc )
+add_subdirectory( process )
+add_subdirectory( misc )

From 79a2ff4e8d78d85f695d93077b09907a83115e3f Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 13 Nov 2020 21:32:52 +1100
Subject: [PATCH 0261/1056] name-value-convert: bug fixed

---
 name_value/impl/json_writer.h | 64 +++++++----------------------------
 1 file changed, 13 insertions(+), 51 deletions(-)

diff --git a/name_value/impl/json_writer.h b/name_value/impl/json_writer.h
index 619c5cb05..d6d0833bf 100644
--- a/name_value/impl/json_writer.h
+++ b/name_value/impl/json_writer.h
@@ -1,69 +1,41 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_NAME_VALUE_JSON_WRITER_H_
-#define COMMA_NAME_VALUE_JSON_WRITER_H_
+#pragma once
 
+#include <algorithm>
 #include <iostream>
 #include <sstream>
 #include <string>
-#include <algorithm>
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/lexical_cast.hpp>
 #include "../../base/exception.h"
 
-
 namespace comma { namespace name_value { namespace impl {
 
-// NOTE: assume valid json.
-template< typename C > void json_remove_quotes( std::basic_string< C >& json_text )
+template< typename C > void json_remove_quotes( std::basic_string< C >& json_text ) // assuming valid json
 {
     using string_type = std::basic_string< C >;
-
     string_type const true_str( std::initializer_list< C >{ 't', 'r', 'u', 'e' } );
     string_type const false_str( std::initializer_list< C >{ 'f', 'a', 'l', 's', 'e' } );
-
     auto source = json_text.begin();
     auto target = json_text.cbegin();
-
     while( target != json_text.cend() )
     {
         auto value_begin = std::find( target, json_text.cend(), '"' );
         while( target != value_begin ) { *source++ = *target++; }
         if( json_text.cend() == value_begin ) { break; }
-
         auto value_end = value_begin;
-        do { value_end = std::find( value_end + 1, json_text.cend(), '"' ); } while( '\\' == *( value_end - 1 ) );
+        //do { value_end = std::find( value_end + 1, json_text.cend(), '"' ); } while( '\\' == *( value_end - 1 ) );
+        while( true )
+        {
+            value_end = std::find( value_end + 1, json_text.cend(), '"' );
+            auto i = value_end - 1;
+            if( *i != '\\' || *( i - 1 ) == '\\' ) { break; } // hyper quick and dirty fix, sigh
+        }
         auto next_token = std::find_if_not( value_end + 1, json_text.cend(), []( C ch ) { return ' ' == ch || '\t' == ch || '\n' == ch; } );
-
         bool quoted = true;
         if( ':' != *next_token )
         {
@@ -71,7 +43,6 @@ template< typename C > void json_remove_quotes( std::basic_string< C >& json_tex
             if( true_str == value || false_str == value ) { quoted = false; }
             else { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} }
         }
-
         if( !quoted ) { value_begin++; }
         while( value_begin != value_end ) { *source++ = *value_begin++; }
         if( !quoted ) { value_end++; } 
@@ -90,7 +61,6 @@ inline void remove_quotes( std::string& s )
     std::string value;
     struct looking_for { enum what { first_quote, second_quote, escaped, colon }; };
     looking_for::what state = looking_for::first_quote;
-
     for( char* source = &s[0]; source != end; ++source )
     {
         switch( state )
@@ -112,15 +82,9 @@ inline void remove_quotes( std::string& s )
                 bool skip = false;
                 switch( *source )
                 {
-                    case ' ': case '\t': case '\n':
-                        skip=true;
-                        // todo
-                        break;
-                    case ':':
-                        break;
-                    default:
-                        try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} // hyper quick and dirty for now
-                        
+                    case ' ': case '\t': case '\n': skip=true; break;
+                    case ':': break;
+                    default: try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} // hyper quick and dirty for now
                 }
                 if( skip ) { break; }
                 if( quoted ) { *target++ = '"'; ++size; }
@@ -149,5 +113,3 @@ template<class Ptree> void write_json(std::basic_ostream< typename Ptree::key_ty
 }
  
 } } }
-
-#endif //COMMA_NAME_VALUE_JSON_WRITER_H_

From d0a545915964ac6f987a97593dd6d0b01715cac3 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Mon, 16 Nov 2020 12:58:43 +1100
Subject: [PATCH 0262/1056] comma-application-swiss-util: source guard added

---
 bash/comma-application-swiss-util | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/bash/comma-application-swiss-util b/bash/comma-application-swiss-util
index 08a620507..e772b88a0 100644
--- a/bash/comma-application-swiss-util
+++ b/bash/comma-application-swiss-util
@@ -2,6 +2,9 @@
 
 # Copyright (c) 2020 Vsevolod Vlaskine
 
+[[ -n "$comma_application_swiss_util_include_guard_" ]] && return 0
+readonly comma_application_swiss_util_include_guard_=1
+
 source $( type -p comma-application-util )
 
 function comma-application-swiss-init()
@@ -67,4 +70,4 @@ function comma-application-swiss-usage()
     done
 }
 
-function comma-application-swiss-run() { ${comma_application_swiss_operation}-run "$@"; }
\ No newline at end of file
+function comma-application-swiss-run() { ${comma_application_swiss_operation}-run "$@"; }

From 945a8a2aee754b4dcf9eff15a4384bfd891b5853 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Mon, 16 Nov 2020 15:26:50 +1100
Subject: [PATCH 0263/1056] comma-application-swiss-util: removed; code moved
 to comma-application-util

---
 bash/CMakeLists.txt               |  1 -
 bash/comma-application-swiss-util | 73 -----------------------------
 bash/comma-application-util       | 76 ++++++++++++++++++++++++++++++-
 3 files changed, 74 insertions(+), 76 deletions(-)
 delete mode 100644 bash/comma-application-swiss-util

diff --git a/bash/CMakeLists.txt b/bash/CMakeLists.txt
index 31477f6e1..4f3460a12 100644
--- a/bash/CMakeLists.txt
+++ b/bash/CMakeLists.txt
@@ -1,4 +1,3 @@
-install( PROGRAMS comma-application-swiss-util DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-application-util DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-log-util DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-name-value-util DESTINATION ${comma_INSTALL_BIN_DIR} )
diff --git a/bash/comma-application-swiss-util b/bash/comma-application-swiss-util
deleted file mode 100644
index e772b88a0..000000000
--- a/bash/comma-application-swiss-util
+++ /dev/null
@@ -1,73 +0,0 @@
-#!/bin/bash
-
-# Copyright (c) 2020 Vsevolod Vlaskine
-
-[[ -n "$comma_application_swiss_util_include_guard_" ]] && return 0
-readonly comma_application_swiss_util_include_guard_=1
-
-source $( type -p comma-application-util )
-
-function comma-application-swiss-init()
-{
-    local name=$( basename "$0" )
-    [[ -n "$1" ]] || { echo "$name: please specify operation" >&2; exit 1; }
-    comma_application_swiss_operation="$1"
-    if comma_options_help $@; then
-        if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
-            if [[ $( type -t usage ) == "function" ]]; then usage; else comma-application-swiss-usage; fi
-        else
-            echo
-            echo "usage: $( basename $0 ) ${comma_application_swiss_operation} [<options>]"
-            echo
-            comma-application-swiss-usage-operation "${comma_application_swiss_operation}"
-            echo
-        fi >&2
-        exit 0
-    fi
-    function say() { echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
-    function die() { say "$@"; exit 1; }
-    [[ $( type -t ${comma_application_swiss_operation}-run ) == "function" ]] || die "expected operation, got '${comma_application_swiss_operation}'" # quick and dirty
-    if [[ $( type -t common-options ) == "function" ]]; then
-        local options; options=$( common-options | comma-options-to-name-value "$@" ) || die "invalid options"
-        eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
-        #(( !options_verbose )) || verbose_option="--verbose"
-        #(( !options_input_fields )) || { eval "echo \$${operation//-/_}_input_fields"; exit 0; } # quick and dirty
-        #(( !options_input_format )) || { eval "echo \$${operation//-/_}_input_format"; exit 0; } # quick and dirty
-        #(( !options_output_fields )) || { eval "echo \$${operation//-/_}_output_fields"; exit 0; } # quick and dirty
-        #(( !options_output_format )) || { eval "echo \$${operation//-/_}_output_format"; exit 0; } # quick and dirty
-    fi
-    if [[ $( type -t ${comma_application_swiss_operation}-options ) == "function" ]]; then
-        local operation_options; operation_options=$( ${comma_application_swiss_operation}-options | comma-options-to-name-value "$@" ) || die "invalid options"
-        eval "$( grep -v '^"' <<< "$operation_options" | sed 's#^#options_#' | comma_path_value_mangle )"
-    fi
-}
-
-function comma-application-swiss-usage-operation()
-{
-    local operation="$1"
-    local found=0
-    echo "${comma_application_swiss_operation}"
-    [[ $( type -t ${comma_application_swiss_operation}-description ) != "function" ]] || { ${comma_application_swiss_operation}-description | sed 's#^#    #'; found=1; }
-    [[ $( type -t ${comma_application_swiss_operation}-usage ) != "function" ]] || { echo "    usage"; ${comma_application_swiss_operation}-usage | sed 's#^#        #'; found=1; }
-    [[ $( type -t common-options ) != "function" ]] || { echo "    common options"; common-options | sed 's#^#        #'; found=1; }
-    [[ $( type -t ${comma_application_swiss_operation}-options ) != "function" ]] || { echo "    options"; ${comma_application_swiss_operation}-options | sed 's#^#        #'; found=1; }
-    [[ $( type -t ${comma_application_swiss_operation}-examples ) != "function" ]] || { echo "    examples"; ${comma_application_swiss_operation}-examples | sed 's#^#        #'; found=1; }
-    (( ! found )) || return 0
-    echo "    expected operation, got: '${comma_application_swiss_operation}', see --help with no other options for more information"
-    return 1
-}
-
-function comma-application-swiss-usage()
-{
-    echo
-    echo "usage: $( basename "$0" ) <operation> <options>"
-    [[ $( type -t common-options ) != "function" ]] || { echo; echo "common options"; common-options | sed 's#^#   #'; }
-    echo; echo "available operations: $@"
-    echo; echo "operations"
-    for operation in $@; do
-        comma-application-swiss-usage-operation "${comma_application_swiss_operation}" | sed 's#^#    #'
-        echo
-    done
-}
-
-function comma-application-swiss-run() { ${comma_application_swiss_operation}-run "$@"; }
diff --git a/bash/comma-application-util b/bash/comma-application-util
index 7e1bfa817..0b3a92e0e 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -17,8 +17,7 @@
 [[ -n "$comma_application_util_include_guard_" ]] && return 0
 readonly comma_application_util_include_guard_=1
 
-source $( type -p comma-name-value-util ) \
-    || { echo "$name: cannot source 'comma-name-value-util' from '$BASH_SOURCE'" >&2; exit 1; }
+source $( type -p comma-name-value-util ) || { echo "$name: cannot source 'comma-name-value-util' from '$BASH_SOURCE'" >&2; exit 1; }
 
 ## @page comma_options_from_name_value comma_options_from_name_value
 # @section comma_options_from_name_value
@@ -203,3 +202,76 @@ function comma_tee_function()
     io-tee "${file_and_options[@]}" "$functions ${functions:+;} $command" "${command_args[@]}"
 }
 export -f comma_tee_function
+
+function comma-application-swiss-init()
+{
+    local name=$( basename "$0" )
+    [[ -n "$1" ]] || { echo "$name: please specify operation" >&2; exit 1; }
+    comma_application_swiss_operation="$1"
+    if comma_options_help $@; then
+        if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
+            if [[ $( type -t usage ) == "function" ]]; then usage; else comma-application-swiss-usage; fi
+        else
+            echo
+            echo "usage: $( basename $0 ) ${comma_application_swiss_operation} [<options>]"
+            echo
+            comma-application-swiss-usage-operation "${comma_application_swiss_operation}"
+            echo
+        fi >&2
+        exit 0
+    fi
+    function say() { echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
+    function die() { say "$@"; exit 1; }
+    [[ $( type -t ${comma_application_swiss_operation}-run ) == "function" ]] || die "expected operation, got '${comma_application_swiss_operation}'" # quick and dirty
+    if [[ $( type -t common-options ) == "function" ]]; then
+        local options; options=$( common-options | comma-options-to-name-value "$@" ) || die "invalid options"
+        eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
+        #(( !options_verbose )) || verbose_option="--verbose"
+        #(( !options_input_fields )) || { eval "echo \$${operation//-/_}_input_fields"; exit 0; } # quick and dirty
+        #(( !options_input_format )) || { eval "echo \$${operation//-/_}_input_format"; exit 0; } # quick and dirty
+        #(( !options_output_fields )) || { eval "echo \$${operation//-/_}_output_fields"; exit 0; } # quick and dirty
+        #(( !options_output_format )) || { eval "echo \$${operation//-/_}_output_format"; exit 0; } # quick and dirty
+    fi
+    if [[ $( type -t ${comma_application_swiss_operation}-options ) == "function" ]]; then
+        local operation_options; operation_options=$( ${comma_application_swiss_operation}-options | comma-options-to-name-value "$@" ) || die "invalid options"
+        eval "$( grep -v '^"' <<< "$operation_options" | sed 's#^#options_#' | comma_path_value_mangle )"
+    fi
+}
+
+export -f comma-application-swiss-init
+
+function comma-application-swiss-usage-operation()
+{
+    local operation="$1"
+    local found=0
+    echo "${comma_application_swiss_operation}"
+    [[ $( type -t ${comma_application_swiss_operation}-description ) != "function" ]] || { ${comma_application_swiss_operation}-description | sed 's#^#    #'; found=1; }
+    [[ $( type -t ${comma_application_swiss_operation}-usage ) != "function" ]] || { echo "    usage"; ${comma_application_swiss_operation}-usage | sed 's#^#        #'; found=1; }
+    [[ $( type -t common-options ) != "function" ]] || { echo "    common options"; common-options | sed 's#^#        #'; found=1; }
+    [[ $( type -t ${comma_application_swiss_operation}-options ) != "function" ]] || { echo "    options"; ${comma_application_swiss_operation}-options | sed 's#^#        #'; found=1; }
+    [[ $( type -t ${comma_application_swiss_operation}-examples ) != "function" ]] || { echo "    examples"; ${comma_application_swiss_operation}-examples | sed 's#^#        #'; found=1; }
+    (( ! found )) || return 0
+    echo "    expected operation, got: '${comma_application_swiss_operation}', see --help with no other options for more information"
+    return 1
+}
+
+export -f comma-application-swiss-usage-operation
+
+function comma-application-swiss-usage()
+{
+    echo
+    echo "usage: $( basename "$0" ) <operation> <options>"
+    [[ $( type -t common-options ) != "function" ]] || { echo; echo "common options"; common-options | sed 's#^#   #'; }
+    echo; echo "available operations: $@"
+    echo; echo "operations"
+    for operation in $@; do
+        comma-application-swiss-usage-operation "${comma_application_swiss_operation}" | sed 's#^#    #'
+        echo
+    done
+}
+
+export -f comma-application-swiss-usage
+
+function comma-application-swiss-run() { ${comma_application_swiss_operation}-run "$@"; }
+
+export -f comma-application-swiss-run

From cb329cb79699809cb95edfb4a6c45262f6a52909 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Mon, 16 Nov 2020 18:41:11 +1100
Subject: [PATCH 0264/1056] bash/comma-application-util: swiss in progress...

---
 bash/comma-application-util | 11 +++++++----
 1 file changed, 7 insertions(+), 4 deletions(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 0b3a92e0e..878084db9 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -206,6 +206,7 @@ export -f comma_tee_function
 function comma-application-swiss-init()
 {
     local name=$( basename "$0" )
+    local common_options=$( cat )
     [[ -n "$1" ]] || { echo "$name: please specify operation" >&2; exit 1; }
     comma_application_swiss_operation="$1"
     if comma_options_help $@; then
@@ -223,8 +224,8 @@ function comma-application-swiss-init()
     function say() { echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
     function die() { say "$@"; exit 1; }
     [[ $( type -t ${comma_application_swiss_operation}-run ) == "function" ]] || die "expected operation, got '${comma_application_swiss_operation}'" # quick and dirty
-    if [[ $( type -t common-options ) == "function" ]]; then
-        local options; options=$( common-options | comma-options-to-name-value "$@" ) || die "invalid options"
+    if [[ -n "$common_options" ]]; then
+        local options; options=$( echo "$common_options" | comma-options-to-name-value "$@" ) || die "invalid options"
         eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
         #(( !options_verbose )) || verbose_option="--verbose"
         #(( !options_input_fields )) || { eval "echo \$${operation//-/_}_input_fields"; exit 0; } # quick and dirty
@@ -243,11 +244,12 @@ export -f comma-application-swiss-init
 function comma-application-swiss-usage-operation()
 {
     local operation="$1"
+    local common_options=$( cat )
     local found=0
     echo "${comma_application_swiss_operation}"
     [[ $( type -t ${comma_application_swiss_operation}-description ) != "function" ]] || { ${comma_application_swiss_operation}-description | sed 's#^#    #'; found=1; }
     [[ $( type -t ${comma_application_swiss_operation}-usage ) != "function" ]] || { echo "    usage"; ${comma_application_swiss_operation}-usage | sed 's#^#        #'; found=1; }
-    [[ $( type -t common-options ) != "function" ]] || { echo "    common options"; common-options | sed 's#^#        #'; found=1; }
+    [[ -z "$common_options" ]] || { echo "    common options"; echo "$common_options" | sed 's#^#        #'; found=1; }
     [[ $( type -t ${comma_application_swiss_operation}-options ) != "function" ]] || { echo "    options"; ${comma_application_swiss_operation}-options | sed 's#^#        #'; found=1; }
     [[ $( type -t ${comma_application_swiss_operation}-examples ) != "function" ]] || { echo "    examples"; ${comma_application_swiss_operation}-examples | sed 's#^#        #'; found=1; }
     (( ! found )) || return 0
@@ -259,9 +261,10 @@ export -f comma-application-swiss-usage-operation
 
 function comma-application-swiss-usage()
 {
+    local common_options=$( cat )
     echo
     echo "usage: $( basename "$0" ) <operation> <options>"
-    [[ $( type -t common-options ) != "function" ]] || { echo; echo "common options"; common-options | sed 's#^#   #'; }
+    [[ -z "$common_options" ]] || { echo; echo "common options"; echo "$common_options" | sed 's#^#   #'; }
     echo; echo "available operations: $@"
     echo; echo "operations"
     for operation in $@; do

From 9d1d892122693efa258eb04daa0e184384110bef Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 17 Nov 2020 10:42:18 +1100
Subject: [PATCH 0265/1056] comma-test-run: --max-parallel: -P alias added

---
 util/applications/comma-test-run | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 9aaa742e6..0cd3b7df8 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -102,7 +102,7 @@ function description_resources()
     cat <<EOF
 --estimate-resources; in serial mode, accumulates performance data using comma-top into 'output/performance.csv' files;
   note: file may be empty for very short tests
---max-parallel=[<N>]; run up to N tests in parallel; default: $max_parallel
+--max-parallel,-P=[<N>]; run up to N tests in parallel; default: $max_parallel
 --max-memory-main=[<N>]; limit on main memory, in MB; default: $max_memory_main
 --max-memory-shared=[<N>]; limit on shared memory, in MB; default: $max_memory_shared
 --max-wait-time=[<time>]; maximal time to wait for available CPUs before failing a test, default: ${max_wait_time}

From cd6af4280cdf1386cec355ed7e8b78685088f312 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 17 Nov 2020 10:42:56 +1100
Subject: [PATCH 0266/1056] comma-application-util: comma-application-init:
 first cut implemented; debugging...

---
 bash/comma-application-util | 39 +++++++++++++++++++++++++++++++++++--
 1 file changed, 37 insertions(+), 2 deletions(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 878084db9..d397b903d 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -203,20 +203,55 @@ function comma_tee_function()
 }
 export -f comma_tee_function
 
+function comma-application-init()
+{
+    local name=$( basename "$0" )
+    local prologue="$1"
+    local epilogue="$2"
+    local common_options=$( cat )
+    if comma_options_help $@; then
+    
+        [[ -z "$prologue" ]] || $prologue >&2
+        cat <<eof >&2
+
+usage: $name [<options>]
+
+options
+$( "$common_options" | sed 's#^#    #' )
+
+eof
+        [[ -z "$epilogue" ]] || $epilogue >&2
+        exit 0
+    fi
+    function say() { echo "$name: $@" >&2; }
+    function die() { say "$@"; exit 1; }
+    local options; options=$( echo "$common_options" | comma-options-to-name-value "$@" ) || die "invalid options"
+    eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
+    declare -a options_unnamed
+    mapfile -t options_unnamed < <( grep '^"' <<< "$options" )
+    
+}
+
+export -f comma-application-init
+
 function comma-application-swiss-init()
 {
     local name=$( basename "$0" )
+    local prologue="$1"
+    local epilogue="$2"
     local common_options=$( cat )
     [[ -n "$1" ]] || { echo "$name: please specify operation" >&2; exit 1; }
     comma_application_swiss_operation="$1"
     if comma_options_help $@; then
         if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
-            if [[ $( type -t usage ) == "function" ]]; then usage; else comma-application-swiss-usage; fi
+            [[ -z "$prologue" ]] || $prologue >&2
+            comma-application-swiss-usage
+            [[ -z "$epilogue" ]] || $epilogue >&2
         else
             echo
             echo "usage: $( basename $0 ) ${comma_application_swiss_operation} [<options>]"
             echo
-            comma-application-swiss-usage-operation "${comma_application_swiss_operation}"
+            echo "$common_options" | comma-application-swiss-usage-operation "${comma_application_swiss_operation}"
             echo
         fi >&2
         exit 0

From f9dad65aa85f28632ba3b8a42c324698b0f4934f Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 17 Nov 2020 12:56:12 +1100
Subject: [PATCH 0267/1056] comma-application-util: comma-application-init: bug
 fixed; debugging...

---
 bash/comma-application-util                   | 16 +++++------
 .../comma_status_ok/expected                  |  0
 .../comma_status_ok/test                      |  0
 util/applications/comma-test-run              | 27 -------------------
 4 files changed, 6 insertions(+), 37 deletions(-)
 rename bash/test/{ => comma-application-util}/comma_status_ok/expected (100%)
 rename bash/test/{ => comma-application-util}/comma_status_ok/test (100%)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index d397b903d..57196c391 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -210,17 +210,16 @@ function comma-application-init()
     local epilogue="$2"
     local common_options=$( cat )
     if comma_options_help $@; then
-    
-        [[ -z "$prologue" ]] || $prologue >&2
+        [[ "$( type -t prologue )" != "function" ]] || { echo; prologue; } >&2 # optional hook: call only if the caller defined a prologue function
         cat <<eof >&2
 
 usage: $name [<options>]
 
 options
-$( "$common_options" | sed 's#^#    #' )
+$( sed 's#^#    #' <<< "$common_options" )
 
 eof
-        [[ -z "$epilogue" ]] || $epilogue >&2
+        [[ "$( type -t epilogue )" != "function" ]] || { epilogue; echo; } >&2 # optional hook: call only if the caller defined an epilogue function
         exit 0
     fi
     function say() { echo "$name: $@" >&2; }
@@ -229,7 +228,6 @@ eof
     eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
     declare -a options_unnamed
     mapfile -t options_unnamed < <( grep '^"' <<< "$options" )
-    
 }
 
 export -f comma-application-init
@@ -237,16 +235,14 @@ export -f comma-application-init
 function comma-application-swiss-init()
 {
     local name=$( basename "$0" )
-    local prologue="$1"
-    local epilogue="$2"
     local common_options=$( cat )
     [[ -n "$1" ]] || { echo "$name: please specify operation" >&2; exit 1; }
     comma_application_swiss_operation="$1"
     if comma_options_help $@; then
         if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
-            [[ -z "$prologue" ]] || $prologue >&2
+            [[ "$( type -p prologue )" == "function" ]] || { echo; prologue; } >&2
             comma-application-swiss-usage
-            [[ -z "$epilogue" ]] || $epilogue >&2
+            [[ "$( type -p epilogue )" == "function" ]] || { epilogue; echo; } >&2
         else
             echo
             echo "usage: $( basename $0 ) ${comma_application_swiss_operation} [<options>]"
@@ -284,7 +280,7 @@ function comma-application-swiss-usage-operation()
     echo "${comma_application_swiss_operation}"
     [[ $( type -t ${comma_application_swiss_operation}-description ) != "function" ]] || { ${comma_application_swiss_operation}-description | sed 's#^#    #'; found=1; }
     [[ $( type -t ${comma_application_swiss_operation}-usage ) != "function" ]] || { echo "    usage"; ${comma_application_swiss_operation}-usage | sed 's#^#        #'; found=1; }
-    [[ -z "$common_options" ]] || { echo "    common options"; echo "$common_options" | sed 's#^#        #'; found=1; }
+    [[ -z "$common_options" ]] || { echo "    common options"; sed 's#^#        #' <<< "$common_options"; found=1; }
     [[ $( type -t ${comma_application_swiss_operation}-options ) != "function" ]] || { echo "    options"; ${comma_application_swiss_operation}-options | sed 's#^#        #'; found=1; }
     [[ $( type -t ${comma_application_swiss_operation}-examples ) != "function" ]] || { echo "    examples"; ${comma_application_swiss_operation}-examples | sed 's#^#        #'; found=1; }
     (( ! found )) || return 0
diff --git a/bash/test/comma_status_ok/expected b/bash/test/comma-application-util/comma_status_ok/expected
similarity index 100%
rename from bash/test/comma_status_ok/expected
rename to bash/test/comma-application-util/comma_status_ok/expected
diff --git a/bash/test/comma_status_ok/test b/bash/test/comma-application-util/comma_status_ok/test
similarity index 100%
rename from bash/test/comma_status_ok/test
rename to bash/test/comma-application-util/comma_status_ok/test
diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 0cd3b7df8..2dcc5b32d 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -1,33 +1,6 @@
 #!/bin/bash
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 name=$( basename $0 )
 

From 94661e2f0ed907a1ca0d596320d79aea5b2d8c4d Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 17 Nov 2020 13:21:36 +1100
Subject: [PATCH 0268/1056] comma-application-util: comma-application-init:
 basic unit test added

---
 bash/comma-application-util                   |  4 +-
 .../comma-application-init/application        | 24 ++++++++
 .../comma-application-init/expected           | 60 +++++++++++++++++++
 .../comma-application-init/input              |  9 +++
 4 files changed, 95 insertions(+), 2 deletions(-)
 create mode 100755 bash/test/comma-application-util/comma-application-init/application
 create mode 100644 bash/test/comma-application-util/comma-application-init/expected
 create mode 100644 bash/test/comma-application-util/comma-application-init/input

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 57196c391..ec07d0553 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -226,8 +226,8 @@ eof
     function die() { say "$@"; exit 1; }
     local options; options=$( echo "$common_options" | comma-options-to-name-value "$@" ) || die "invalid options"
     eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
-    declare -a options_unnamed
-    mapfile -t options_unnamed < <( grep '^"' <<< "$options" )
+    # declare -a options_unnamed
+    mapfile -t options_unnamed < <( grep '^"' <<< "$options" | sed -e 's#^"##' -e 's#"$##' )
 }
 
 export -f comma-application-init
diff --git a/bash/test/comma-application-util/comma-application-init/application b/bash/test/comma-application-util/comma-application-init/application
new file mode 100755
index 000000000..001411dcf
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-init/application
@@ -0,0 +1,24 @@
+#!/bin/bash
+
+source $( type -p comma-application-util )
+
+function prologue() { echo "sample application: print parsed command line option values and exit"; } # picked up by comma-application-init when help is requested
+
+function epilogue() { echo "example: ./application some unnamed --mandatory blah stuff"; } # picked up by comma-application-init when help is requested
+
+function options-description() # option descriptions, fed to comma-application-init on stdin
+{
+    cat <<eof
+--defaulting,-d=<value>; default=hello; default value
+--flag; flag option
+--mandatory,-m=<value>; this is mandatory option
+--optional,-o=[<value>]; this is optional option
+eof
+}
+
+comma-application-init "$@" < <( options-description ) || exit 1 # "$@" quoted so that arguments containing whitespace are passed through unsplit
+echo "options/defaulting=$options_defaulting"
+echo "options/flag=$options_flag"
+echo "options/mandatory=$options_mandatory"
+echo "options/optional=$options_optional"
+for (( i = 0; i < ${#options_unnamed[@]}; ++i )); do echo "options/unnamed[$i]=${options_unnamed[$i]}"; done
diff --git a/bash/test/comma-application-util/comma-application-init/expected b/bash/test/comma-application-util/comma-application-init/expected
new file mode 100644
index 000000000..7d5c81924
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-init/expected
@@ -0,0 +1,60 @@
+help/output/line[0]=""
+help/output/line[1]="sample application: print parsed command line option values and exit"
+help/output/line[2]=""
+help/output/line[3]="usage: application [<options>]"
+help/output/line[4]=""
+help/output/line[5]="options"
+help/output/line[6]="--defaulting,-d=<value>; default=hello; default value"
+help/output/line[7]="--flag; flag option"
+help/output/line[8]="--mandatory,-m=<value>; this is mandatory option"
+help/output/line[9]="--optional,-o=[<value>]; this is optional option"
+help/output/line[10]=""
+help/output/line[11]="example: ./application some unnamed --mandatory blah stuff"
+help/status=0
+
+options/mandatory[0]/output/line[0]="options/defaulting=hello"
+options/mandatory[0]/output/line[1]="options/flag="
+options/mandatory[0]/output/line[2]="options/mandatory=blah"
+options/mandatory[0]/output/line[3]="options/optional="
+options/mandatory[0]/status=0
+options/mandatory[1]/output=""
+options/mandatory[1]/status=1
+
+options/optional[0]/output/line[0]="options/defaulting=hello"
+options/optional[0]/output/line[1]="options/flag="
+options/optional[0]/output/line[2]="options/mandatory=blah"
+options/optional[0]/output/line[3]="options/optional="
+options/optional[0]/status=0
+options/optional[1]/output/line[0]="options/defaulting=hello"
+options/optional[1]/output/line[1]="options/flag="
+options/optional[1]/output/line[2]="options/mandatory=blah"
+options/optional[1]/output/line[3]="options/optional=bye"
+options/optional[1]/status=0
+
+options/flag[0]/output/line[0]="options/defaulting=hello"
+options/flag[0]/output/line[1]="options/flag="
+options/flag[0]/output/line[2]="options/mandatory=blah"
+options/flag[0]/output/line[3]="options/optional="
+options/flag[0]/status=0
+options/flag[1]/output/line[0]="options/defaulting=hello"
+options/flag[1]/output/line[1]="options/flag=1"
+options/flag[1]/output/line[2]="options/mandatory=blah"
+options/flag[1]/output/line[3]="options/optional="
+options/flag[1]/status=0
+
+options/unnamed[0]/output/line[0]="options/defaulting=hello"
+options/unnamed[0]/output/line[1]="options/flag="
+options/unnamed[0]/output/line[2]="options/mandatory=blah"
+options/unnamed[0]/output/line[3]="options/optional="
+options/unnamed[0]/output/line[4]="options/unnamed[0]=a"
+options/unnamed[0]/output/line[5]="options/unnamed[1]=b"
+options/unnamed[0]/output/line[6]="options/unnamed[2]=c"
+options/unnamed[0]/status=0
+options/unnamed[1]/output/line[0]="options/defaulting=hello"
+options/unnamed[1]/output/line[1]="options/flag=1"
+options/unnamed[1]/output/line[2]="options/mandatory=blah"
+options/unnamed[1]/output/line[3]="options/optional="
+options/unnamed[1]/output/line[4]="options/unnamed[0]=a"
+options/unnamed[1]/output/line[5]="options/unnamed[1]=b"
+options/unnamed[1]/output/line[6]="options/unnamed[2]=c"
+options/unnamed[1]/status=0
diff --git a/bash/test/comma-application-util/comma-application-init/input b/bash/test/comma-application-util/comma-application-init/input
new file mode 100644
index 000000000..9ab3eccd0
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-init/input
@@ -0,0 +1,9 @@
+help="./application -h 2>&1"
+options/mandatory[0]="./application --mandatory blah"
+options/mandatory[1]="./application"
+options/optional[0]="./application --mandatory blah"
+options/optional[1]="./application --mandatory blah --optional bye"
+options/flag[0]="./application --mandatory blah"
+options/flag[1]="./application --mandatory blah --flag"
+options/unnamed[0]="./application a b --mandatory blah c"
+options/unnamed[1]="./application a b --mandatory blah --flag c"

From d93e6a1f2f6d41d58a9fad523c4760bd3ea5a6ee Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 17 Nov 2020 14:17:00 +1100
Subject: [PATCH 0269/1056] comma-application-util:
 comma-application-swiss-init: first cut done; debugging...

---
 bash/comma-application-util | 29 +++++++++++++++--------------
 1 file changed, 15 insertions(+), 14 deletions(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index ec07d0553..bc6b7e6fe 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -237,17 +237,14 @@ function comma-application-swiss-init()
     local name=$( basename "$0" )
     local common_options=$( cat )
     [[ -n "$1" ]] || { echo "$name: please specify operation" >&2; exit 1; }
-    comma_application_swiss_operation="$1"
+    comma_application_swiss_operation="$1" # todo? quick and dirty, allow --help anywhere on the command line?
     if comma_options_help $@; then
         if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
             [[ "$( type -p prologue )" == "function" ]] || { echo; prologue; } >&2
             comma-application-swiss-usage
             [[ "$( type -p epilogue )" == "function" ]] || { epilogue; echo; } >&2
         else
-            echo
-            echo "usage: $( basename $0 ) ${comma_application_swiss_operation} [<options>]"
-            echo
-            echo "$common_options" | comma-application-swiss-usage-operation "${comma_application_swiss_operation}"
+            echo "$common_options" | comma-application-swiss-usage-operation "${comma_application_swiss_operation}" || exit 1
             echo
         fi >&2
         exit 0
@@ -275,16 +272,20 @@ export -f comma-application-swiss-init
 function comma-application-swiss-usage-operation()
 {
     local operation="$1"
+    [[ $( type -t ${operation}-run ) == "function" ]] || { echo "$( basename $0 ): expected operation, got: '${comma_application_swiss_operation}', see --help with no other options for more information" >&2; return 1; } # quick and dirty
     local common_options=$( cat )
     local found=0
-    echo "${comma_application_swiss_operation}"
-    [[ $( type -t ${comma_application_swiss_operation}-description ) != "function" ]] || { ${comma_application_swiss_operation}-description | sed 's#^#    #'; found=1; }
-    [[ $( type -t ${comma_application_swiss_operation}-usage ) != "function" ]] || { echo "    usage"; ${comma_application_swiss_operation}-usage | sed 's#^#        #'; found=1; }
+    echo
+    echo "usage: $( basename $0 ) ${comma_application_swiss_operation} [<options>]"
+    echo
+    echo "${operation}"
+    [[ $( type -t ${operation}-description ) != "function" ]] || { ${operation}-description | sed 's#^#    #'; found=1; }
+    [[ $( type -t ${operation}-usage ) != "function" ]] || { echo "    usage"; ${operation}-usage | sed 's#^#        #'; found=1; }
     [[ -z "$common_options" ]] || { echo "    common options"; sed 's#^#        #' <<< "$common_options"; found=1; }
-    [[ $( type -t ${comma_application_swiss_operation}-options ) != "function" ]] || { echo "    options"; ${comma_application_swiss_operation}-options | sed 's#^#        #'; found=1; }
-    [[ $( type -t ${comma_application_swiss_operation}-examples ) != "function" ]] || { echo "    examples"; ${comma_application_swiss_operation}-examples | sed 's#^#        #'; found=1; }
+    [[ $( type -t ${operation}-options ) != "function" ]] || { echo "    options"; ${operation}-options | sed 's#^#        #'; found=1; }
+    [[ $( type -t ${operation}-examples ) != "function" ]] || { echo "    examples"; ${operation}-examples | sed 's#^#        #'; found=1; }
     (( ! found )) || return 0
-    echo "    expected operation, got: '${comma_application_swiss_operation}', see --help with no other options for more information"
+    echo "$( basename $0 ): expected operation, got: '${operation}', see --help with no other options for more information" >&2
     return 1
 }
 
@@ -296,10 +297,10 @@ function comma-application-swiss-usage()
     echo
     echo "usage: $( basename "$0" ) <operation> <options>"
     [[ -z "$common_options" ]] || { echo; echo "common options"; echo "$common_options" | sed 's#^#   #'; }
-    echo; echo "available operations: $@"
+    echo; echo "available operations: ${operations[@]}"
     echo; echo "operations"
-    for operation in $@; do
-        comma-application-swiss-usage-operation "${comma_application_swiss_operation}" | sed 's#^#    #'
+    for operation in ${operations[@]}; do
+        comma-application-swiss-usage-operation "${operation}" | sed 's#^#    #'
         echo
     done
 }

From f5ea8f536eb31dc1861397b1b814956bb18ac389 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod@abysssolutions.com.au>
Date: Tue, 17 Nov 2020 14:27:37 +1100
Subject: [PATCH 0270/1056] comma-application-util:
 comma-application-swiss-init: basic regression test added

---
 .../comma-application-swiss-init/application  | 24 ++++++
 .../comma-application-swiss-init/expected     | 73 +++++++++++++++++++
 .../comma-application-swiss-init/input        | 10 +++
 3 files changed, 107 insertions(+)
 create mode 100755 bash/test/comma-application-util/comma-application-swiss-init/application
 create mode 100644 bash/test/comma-application-util/comma-application-swiss-init/expected
 create mode 100644 bash/test/comma-application-util/comma-application-swiss-init/input

diff --git a/bash/test/comma-application-util/comma-application-swiss-init/application b/bash/test/comma-application-util/comma-application-swiss-init/application
new file mode 100755
index 000000000..bd9db9fb4
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-swiss-init/application
@@ -0,0 +1,24 @@
+#!/bin/bash
+# regression fixture for comma-application-swiss-init: for a given operation, print the parsed option values
+source "$( type -p comma-application-util )"
+
+operations=( lol roll ) # iterated by comma-application-swiss-usage to list and describe operations
+
+function prologue() { echo "sample application: for a given operation, print parsed command line option values and exit"; } # printed first on --help
+
+function epilogue() { echo "example: ./application lol"; } # printed last on --help
+
+function options-description() { echo "--some-common-option=[<value>]; default=hello; a sample common option"; } # common options, piped to the init call below
+
+function lol-description() { echo "laugh out loud"; } # <operation>-description/-usage/-options are looked up by name when help is printed
+function lol-usage() { echo "specialised usage: ./application lol [<options>]"; }
+function lol-options() { echo "--how-loud=<value>; default=0; how loud to laugh in dB"; }
+function lol-run() { echo "lol/options/how_loud=$options_how_loud"; } # <operation>-run must exist for the operation to be accepted
+
+function roll-description() { echo "roll on the floor"; } # note: no roll-usage function is defined for this operation
+function roll-options() { echo "--screaming; roll on the floor screaming"; }
+function roll-run() { echo "roll/options/screaming=$options_screaming"; }
+
+comma-application-swiss-init "$@" < <( options-description ) || exit 1 # "$@" quoted: arguments with whitespace are forwarded intact
+echo "options/some_common_option=$options_some_common_option"
+comma-application-swiss-run "$@"
diff --git a/bash/test/comma-application-util/comma-application-swiss-init/expected b/bash/test/comma-application-util/comma-application-swiss-init/expected
new file mode 100644
index 000000000..333a82693
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-swiss-init/expected
@@ -0,0 +1,73 @@
+help[0]/output/line[0]=""
+help[0]/output/line[1]="sample application: for a given operation, print parsed command line option values and exit"
+help[0]/output/line[2]=""
+help[0]/output/line[3]="usage: application <operation> <options>"
+help[0]/output/line[4]=""
+help[0]/output/line[5]="available operations: lol roll"
+help[0]/output/line[6]=""
+help[0]/output/line[7]="operations"
+help[0]/output/line[8]=""
+help[0]/output/line[9]="usage: application --help [<options>]"
+help[0]/output/line[10]=""
+help[0]/output/line[11]="lol"
+help[0]/output/line[12]="laugh out loud"
+help[0]/output/line[13]="usage"
+help[0]/output/line[14]="specialised usage: ./application lol [<options>]"
+help[0]/output/line[15]="options"
+help[0]/output/line[16]="--how-loud=<value>; default=0; how loud to laugh in dB"
+help[0]/output/line[17]=""
+help[0]/output/line[18]=""
+help[0]/output/line[19]="usage: application --help [<options>]"
+help[0]/output/line[20]=""
+help[0]/output/line[21]="roll"
+help[0]/output/line[22]="roll on the floor"
+help[0]/output/line[23]="options"
+help[0]/output/line[24]="--screaming; roll on the floor screaming"
+help[0]/output/line[25]=""
+help[0]/output/line[26]="example: ./application lol"
+help[0]/status=0
+
+help[1]/output/line[0]=""
+help[1]/output/line[1]="usage: application lol [<options>]"
+help[1]/output/line[2]=""
+help[1]/output/line[3]="lol"
+help[1]/output/line[4]="laugh out loud"
+help[1]/output/line[5]="usage"
+help[1]/output/line[6]="specialised usage: ./application lol [<options>]"
+help[1]/output/line[7]="common options"
+help[1]/output/line[8]="--some-common-option=[<value>]; default=hello; a sample common option"
+help[1]/output/line[9]="options"
+help[1]/output/line[10]="--how-loud=<value>; default=0; how loud to laugh in dB"
+help[1]/status=0
+
+help[2]/output/line[0]=""
+help[2]/output/line[1]="usage: application roll [<options>]"
+help[2]/output/line[2]=""
+help[2]/output/line[3]="roll"
+help[2]/output/line[4]="roll on the floor"
+help[2]/output/line[5]="common options"
+help[2]/output/line[6]="--some-common-option=[<value>]; default=hello; a sample common option"
+help[2]/output/line[7]="options"
+help[2]/output/line[8]="--screaming; roll on the floor screaming"
+help[2]/status=0
+
+help[3]/status=1
+
+run/lol[0]/output/line[0]="options/some_common_option=hello"
+run/lol[0]/output/line[1]="lol/options/how_loud=0"
+run/lol[0]/status=0
+
+run/lol[1]/output/line[0]="options/some_common_option=blah"
+run/lol[1]/output/line[1]="lol/options/how_loud=120"
+run/lol[1]/status=0
+
+run/roll[0]/output/line[0]="options/some_common_option=hello"
+run/roll[0]/output/line[1]="roll/options/screaming="
+run/roll[0]/status=0
+
+run/roll[1]/output/line[0]="options/some_common_option=hello"
+run/roll[1]/output/line[1]="roll/options/screaming=1"
+run/roll[1]/status=0
+
+run/fall[0]/output=""
+run/fall[0]/status=1
diff --git a/bash/test/comma-application-util/comma-application-swiss-init/input b/bash/test/comma-application-util/comma-application-swiss-init/input
new file mode 100644
index 000000000..2aa5d0237
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-swiss-init/input
@@ -0,0 +1,10 @@
+help[0]="./application --help 2>&1"
+help[1]="./application lol --help 2>&1"
+help[2]="./application roll --help 2>&1"
+help[3]="./application fall --help 2>&1"
+
+run/lol[0]="./application lol"
+run/lol[1]="./application lol --some-common-option blah --how-loud=120"
+run/roll[0]="./application roll"
+run/roll[1]="./application roll --screaming"
+run/fall[0]="./application fall"

From 8e844abb7d63cf38541065cd86ad66805ce4983a Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 18 Nov 2020 00:16:25 +1100
Subject: [PATCH 0271/1056] bash/test: forgotten test file added

---
 bash/comma-application-util | 8 ++++----
 bash/test/test              | 3 +++
 2 files changed, 7 insertions(+), 4 deletions(-)
 create mode 100755 bash/test/test

diff --git a/bash/comma-application-util b/bash/comma-application-util
index bc6b7e6fe..5563e6954 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -210,7 +210,7 @@ function comma-application-init()
     local epilogue="$2"
     local common_options=$( cat )
     if comma_options_help $@; then
-        [[ "$( type -p prologue )" == "function" ]] || { echo; prologue; } >&2
+        [[ "$( type -t prologue )" != "function" ]] || { echo; prologue; } >&2
         cat <<eof >&2
 
 usage: $name [<options>]
@@ -219,7 +219,7 @@ options
 $( sed 's#^#    #' <<< "$common_options" )
 
 eof
-        [[ "$( type -p epilogue )" == "function" ]] || { epilogue; echo; } >&2
+        [[ "$( type -t epilogue )" != "function" ]] || { epilogue; echo; } >&2
         exit 0
     fi
     function say() { echo "$name: $@" >&2; }
@@ -240,9 +240,9 @@ function comma-application-swiss-init()
     comma_application_swiss_operation="$1" # todo? quick and dirty, allow --help anywhere on the command line?
     if comma_options_help $@; then
         if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
-            [[ "$( type -p prologue )" == "function" ]] || { echo; prologue; } >&2
+            [[ "$( type -t prologue )" != "function" ]] || { echo; prologue; } >&2
             comma-application-swiss-usage
-            [[ "$( type -p epilogue )" == "function" ]] || { epilogue; echo; } >&2
+            [[ "$( type -t epilogue )" != "function" ]] || { epilogue; echo; } >&2
         else
             echo "$common_options" | comma-application-swiss-usage-operation "${comma_application_swiss_operation}" || exit 1
             echo
diff --git a/bash/test/test b/bash/test/test
new file mode 100755
index 000000000..639918470
--- /dev/null
+++ b/bash/test/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+source "$( type -p comma-test-util )" # quoted so that a path containing whitespace stays a single argument
+comma_test_commands # not defined in this script; presumably provided by comma-test-util - confirm

From ca95e22e943acf6b689b74b5866fcd77e296efb4 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 18 Nov 2020 12:33:51 +1100
Subject: [PATCH 0272/1056] bash/comma-application-util: application name fixed

---
 bash/comma-application-util | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 5563e6954..541e3d17a 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -205,7 +205,7 @@ export -f comma_tee_function
 
 function comma-application-init()
 {
-    local name=$( basename "$0" )
+    comma_application_name=$( basename "$0" )
     local prologue="$1"
     local epilogue="$2"
     local common_options=$( cat )
@@ -222,7 +222,7 @@ eof
         [[ "$( type -t epilogue )" != "function" ]] || { epilogue; echo; } >&2
         exit 0
     fi
-    function say() { echo "$name: $@" >&2; }
+    function say() { echo "$comma_application_name: $@" >&2; }
     function die() { say "$@"; exit 1; }
     local options; options=$( echo "$common_options" | comma-options-to-name-value "$@" ) || die "invalid options"
     eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"

From 8fc52be84133a7b97864e352fb78118db53d1735 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 18 Nov 2020 17:54:17 +1100
Subject: [PATCH 0273/1056] comma-application-util: typo fixed

---
 bash/comma-application-util | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 541e3d17a..f26e46227 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -213,7 +213,7 @@ function comma-application-init()
         [[ "$( type -t prologue )" != "function" ]] || { echo; prologue; } >&2
         cat <<eof >&2
 
-usage: $name [<options>]
+usage: $comma_application_name [<options>]
 
 options
 $( sed 's#^#    #' <<< "$common_options" )

From 572f268d1b0f0773a22441df2ca8a54266ec78a8 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 20 Nov 2020 12:47:33 +1100
Subject: [PATCH 0274/1056] bash/comma-application-util: saymore() and
 verbose() added to application template functions

---
 bash/comma-application-util | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index f26e46227..6ba28d3f0 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -223,6 +223,8 @@ eof
         exit 0
     fi
     function say() { echo "$comma_application_name: $@" >&2; }
+    function saymore() { (( ! options_verbose )) || echo "$comma_application_name: $@" >&2; }
+    function verbose() { (( ! options_verbose )) || echo "$comma_application_name: $@" >&2; }
     function die() { say "$@"; exit 1; }
     local options; options=$( echo "$common_options" | comma-options-to-name-value "$@" ) || die "invalid options"
     eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
@@ -250,6 +252,8 @@ function comma-application-swiss-init()
         exit 0
     fi
     function say() { echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
+    function saymore() { (( ! options_verbose )) || echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
+    function verbose() { (( ! options_verbose )) || echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
     function die() { say "$@"; exit 1; }
     [[ $( type -t ${comma_application_swiss_operation}-run ) == "function" ]] || die "expected operation, got '${comma_application_swiss_operation}'" # quick and dirty
     if [[ -n "$common_options" ]]; then

From a5ef3383bba25164d6093c8242c01fc43ba97779 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 20 Nov 2020 13:33:17 +1100
Subject: [PATCH 0275/1056] bash/comma-application-util: --verbose common
 option added; --help improved

---
 bash/comma-application-util                   | 50 +++++++------
 .../comma-application-init/expected           |  5 +-
 .../comma-application-swiss-init/expected     | 74 +++++++++----------
 3 files changed, 66 insertions(+), 63 deletions(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 6ba28d3f0..8440c82b1 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -203,6 +203,15 @@ function comma_tee_function()
 }
 export -f comma_tee_function
 
+function comma-application-common-options() # print option descriptions that comma-application-init and comma-application-swiss-init append to the caller's own
+{
+    cat <<eof
+--verbose,-v; output more messages to stderr
+eof
+}
+
+export -f comma-application-common-options # export the function so that child bash processes can call it
+
 function comma-application-init()
 {
     comma_application_name=$( basename "$0" )
@@ -216,7 +225,7 @@ function comma-application-init()
 usage: $comma_application_name [<options>]
 
 options
-$( sed 's#^#    #' <<< "$common_options" )
+$( ( [[ -z "$common_options" ]] || echo "$common_options"; comma-application-common-options ) | sed 's#^#    #' )
 
 eof
         [[ "$( type -t epilogue )" != "function" ]] || { epilogue; echo; } >&2
@@ -226,7 +235,7 @@ eof
     function saymore() { (( ! options_verbose )) || echo "$comma_application_name: $@" >&2; }
     function verbose() { (( ! options_verbose )) || echo "$comma_application_name: $@" >&2; }
     function die() { say "$@"; exit 1; }
-    local options; options=$( echo "$common_options" | comma-options-to-name-value "$@" ) || die "invalid options"
+    local options; options=$( ( echo "$common_options"; comma-application-common-options ) | comma-options-to-name-value "$@" ) || die "invalid options"
     eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
     # declare -a options_unnamed
     mapfile -t options_unnamed < <( grep '^"' <<< "$options" | sed -e 's#^"##' -e 's#"$##' )
@@ -242,11 +251,11 @@ function comma-application-swiss-init()
     comma_application_swiss_operation="$1" # todo? quick and dirty, allow --help anywhere on the command line?
     if comma_options_help $@; then
         if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
-            [[ "$( type -t prologue )" != "function" ]] || { echo; prologue; } >&2
-            comma-application-swiss-usage
-            [[ "$( type -t epilogue )" != "function" ]] || { epilogue; echo; } >&2
+            [[ "$( type -t prologue )" != "function" ]] || { echo; prologue; }
+            echo "$common_options" | comma-application-swiss-usage >&2
+            [[ "$( type -t epilogue )" != "function" ]] || { epilogue; echo; }
         else
-            echo "$common_options" | comma-application-swiss-usage-operation "${comma_application_swiss_operation}" || exit 1
+            { [[ -z "$common_options" ]] || echo "$common_options"; comma-application-common-options; } | comma-application-swiss-usage-operation "${comma_application_swiss_operation}" || exit 1
             echo
         fi >&2
         exit 0
@@ -256,15 +265,13 @@ function comma-application-swiss-init()
     function verbose() { (( ! options_verbose )) || echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
     function die() { say "$@"; exit 1; }
     [[ $( type -t ${comma_application_swiss_operation}-run ) == "function" ]] || die "expected operation, got '${comma_application_swiss_operation}'" # quick and dirty
-    if [[ -n "$common_options" ]]; then
-        local options; options=$( echo "$common_options" | comma-options-to-name-value "$@" ) || die "invalid options"
-        eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
-        #(( !options_verbose )) || verbose_option="--verbose"
-        #(( !options_input_fields )) || { eval "echo \$${operation//-/_}_input_fields"; exit 0; } # quick and dirty
-        #(( !options_input_format )) || { eval "echo \$${operation//-/_}_input_format"; exit 0; } # quick and dirty
-        #(( !options_output_fields )) || { eval "echo \$${operation//-/_}_output_fields"; exit 0; } # quick and dirty
-        #(( !options_output_format )) || { eval "echo \$${operation//-/_}_output_format"; exit 0; } # quick and dirty
-    fi
+    local options; options=$( ( echo "$common_options"; comma-application-common-options ) | comma-options-to-name-value "$@" ) || die "invalid options"
+    eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
+    #(( !options_verbose )) || verbose_option="--verbose"
+    #(( !options_input_fields )) || { eval "echo \$${operation//-/_}_input_fields"; exit 0; } # quick and dirty
+    #(( !options_input_format )) || { eval "echo \$${operation//-/_}_input_format"; exit 0; } # quick and dirty
+    #(( !options_output_fields )) || { eval "echo \$${operation//-/_}_output_fields"; exit 0; } # quick and dirty
+    #(( !options_output_format )) || { eval "echo \$${operation//-/_}_output_format"; exit 0; } # quick and dirty
     if [[ $( type -t ${comma_application_swiss_operation}-options ) == "function" ]]; then
         local operation_options; operation_options=$( ${comma_application_swiss_operation}-options | comma-options-to-name-value "$@" ) || die "invalid options"
         eval "$( grep -v '^"' <<< "$operation_options" | sed 's#^#options_#' | comma_path_value_mangle )"
@@ -279,13 +286,11 @@ function comma-application-swiss-usage-operation()
     [[ $( type -t ${operation}-run ) == "function" ]] || { echo "$( basename $0 ): expected operation, got: '${comma_application_swiss_operation}', see --help with no other options for more information" >&2; return 1; } # quick and dirty
     local common_options=$( cat )
     local found=0
-    echo
-    echo "usage: $( basename $0 ) ${comma_application_swiss_operation} [<options>]"
-    echo
-    echo "${operation}"
+    if [[ -z "$common_options" ]]; then echo "${operation}"; else echo "$( basename "$0" ) ${operation}"; fi # uber quick and dirty for now
     [[ $( type -t ${operation}-description ) != "function" ]] || { ${operation}-description | sed 's#^#    #'; found=1; }
-    [[ $( type -t ${operation}-usage ) != "function" ]] || { echo "    usage"; ${operation}-usage | sed 's#^#        #'; found=1; }
-    [[ -z "$common_options" ]] || { echo "    common options"; sed 's#^#        #' <<< "$common_options"; found=1; }
+    if [[ $( type -t ${operation}-usage ) == "function" ]]; then echo "    usage"; ${operation}-usage | sed 's#^#        #'; found=1
+    else echo "    usage: $( basename $0 ) ${comma_application_swiss_operation} [<options>]"; fi
+    [[ -z "$common_options" ]] || { echo "    common options"; echo "$common_options" | sed 's#^#        #'; }
     [[ $( type -t ${operation}-options ) != "function" ]] || { echo "    options"; ${operation}-options | sed 's#^#        #'; found=1; }
     [[ $( type -t ${operation}-examples ) != "function" ]] || { echo "    examples"; ${operation}-examples | sed 's#^#        #'; found=1; }
     (( ! found )) || return 0
@@ -300,7 +305,8 @@ function comma-application-swiss-usage()
     local common_options=$( cat )
     echo
     echo "usage: $( basename "$0" ) <operation> <options>"
-    [[ -z "$common_options" ]] || { echo; echo "common options"; echo "$common_options" | sed 's#^#   #'; }
+    echo; echo "common options"
+    { [[ -z "$common_options" ]] || echo "$common_options"; comma-application-common-options; } | sed 's#^#   #'
     echo; echo "available operations: ${operations[@]}"
     echo; echo "operations"
     for operation in ${operations[@]}; do
diff --git a/bash/test/comma-application-util/comma-application-init/expected b/bash/test/comma-application-util/comma-application-init/expected
index 7d5c81924..c60f7fcb7 100644
--- a/bash/test/comma-application-util/comma-application-init/expected
+++ b/bash/test/comma-application-util/comma-application-init/expected
@@ -8,8 +8,9 @@ help/output/line[6]="--defaulting,-d=<value>; default=hello; default value"
 help/output/line[7]="--flag; flag option"
 help/output/line[8]="--mandatory,-m=<value>; this is mandatory option"
 help/output/line[9]="--optional,-o=[<value>]; this is optional option"
-help/output/line[10]=""
-help/output/line[11]="example: ./application some unnamed --mandatory blah stuff"
+help/output/line[10]="--verbose,-v; output more messages to stderr"
+help/output/line[11]=""
+help/output/line[12]="example: ./application some unnamed --mandatory blah stuff"
 help/status=0
 
 options/mandatory[0]/output/line[0]="options/defaulting=hello"
diff --git a/bash/test/comma-application-util/comma-application-swiss-init/expected b/bash/test/comma-application-util/comma-application-swiss-init/expected
index 333a82693..38c190c8b 100644
--- a/bash/test/comma-application-util/comma-application-swiss-init/expected
+++ b/bash/test/comma-application-util/comma-application-swiss-init/expected
@@ -3,52 +3,48 @@ help[0]/output/line[1]="sample application: for a given operation, print parsed
 help[0]/output/line[2]=""
 help[0]/output/line[3]="usage: application <operation> <options>"
 help[0]/output/line[4]=""
-help[0]/output/line[5]="available operations: lol roll"
-help[0]/output/line[6]=""
-help[0]/output/line[7]="operations"
+help[0]/output/line[5]="common options"
+help[0]/output/line[6]="--some-common-option=[<value>]; default=hello; a sample common option"
+help[0]/output/line[7]="--verbose,-v; output more messages to stderr"
 help[0]/output/line[8]=""
-help[0]/output/line[9]="usage: application --help [<options>]"
+help[0]/output/line[9]="available operations: lol roll"
 help[0]/output/line[10]=""
-help[0]/output/line[11]="lol"
-help[0]/output/line[12]="laugh out loud"
-help[0]/output/line[13]="usage"
-help[0]/output/line[14]="specialised usage: ./application lol [<options>]"
-help[0]/output/line[15]="options"
-help[0]/output/line[16]="--how-loud=<value>; default=0; how loud to laugh in dB"
-help[0]/output/line[17]=""
+help[0]/output/line[11]="operations"
+help[0]/output/line[12]="lol"
+help[0]/output/line[13]="laugh out loud"
+help[0]/output/line[14]="usage"
+help[0]/output/line[15]="specialised usage: ./application lol [<options>]"
+help[0]/output/line[16]="options"
+help[0]/output/line[17]="--how-loud=<value>; default=0; how loud to laugh in dB"
 help[0]/output/line[18]=""
-help[0]/output/line[19]="usage: application --help [<options>]"
-help[0]/output/line[20]=""
-help[0]/output/line[21]="roll"
-help[0]/output/line[22]="roll on the floor"
-help[0]/output/line[23]="options"
-help[0]/output/line[24]="--screaming; roll on the floor screaming"
-help[0]/output/line[25]=""
-help[0]/output/line[26]="example: ./application lol"
+help[0]/output/line[19]="roll"
+help[0]/output/line[20]="roll on the floor"
+help[0]/output/line[21]="usage: application --help [<options>]"
+help[0]/output/line[22]="options"
+help[0]/output/line[23]="--screaming; roll on the floor screaming"
+help[0]/output/line[24]=""
+help[0]/output/line[25]="example: ./application lol"
 help[0]/status=0
 
-help[1]/output/line[0]=""
-help[1]/output/line[1]="usage: application lol [<options>]"
-help[1]/output/line[2]=""
-help[1]/output/line[3]="lol"
-help[1]/output/line[4]="laugh out loud"
-help[1]/output/line[5]="usage"
-help[1]/output/line[6]="specialised usage: ./application lol [<options>]"
-help[1]/output/line[7]="common options"
-help[1]/output/line[8]="--some-common-option=[<value>]; default=hello; a sample common option"
-help[1]/output/line[9]="options"
-help[1]/output/line[10]="--how-loud=<value>; default=0; how loud to laugh in dB"
+help[1]/output/line[0]="application lol"
+help[1]/output/line[1]="laugh out loud"
+help[1]/output/line[2]="usage"
+help[1]/output/line[3]="specialised usage: ./application lol [<options>]"
+help[1]/output/line[4]="common options"
+help[1]/output/line[5]="--some-common-option=[<value>]; default=hello; a sample common option"
+help[1]/output/line[6]="--verbose,-v; output more messages to stderr"
+help[1]/output/line[7]="options"
+help[1]/output/line[8]="--how-loud=<value>; default=0; how loud to laugh in dB"
 help[1]/status=0
 
-help[2]/output/line[0]=""
-help[2]/output/line[1]="usage: application roll [<options>]"
-help[2]/output/line[2]=""
-help[2]/output/line[3]="roll"
-help[2]/output/line[4]="roll on the floor"
-help[2]/output/line[5]="common options"
-help[2]/output/line[6]="--some-common-option=[<value>]; default=hello; a sample common option"
-help[2]/output/line[7]="options"
-help[2]/output/line[8]="--screaming; roll on the floor screaming"
+help[2]/output/line[0]="application roll"
+help[2]/output/line[1]="roll on the floor"
+help[2]/output/line[2]="usage: application roll [<options>]"
+help[2]/output/line[3]="common options"
+help[2]/output/line[4]="--some-common-option=[<value>]; default=hello; a sample common option"
+help[2]/output/line[5]="--verbose,-v; output more messages to stderr"
+help[2]/output/line[6]="options"
+help[2]/output/line[7]="--screaming; roll on the floor screaming"
 help[2]/status=0
 
 help[3]/status=1

From 6073e76bafd39f2c10db739f16ad16fe8e13d449 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 21 Nov 2020 13:45:01 +1100
Subject: [PATCH 0276/1056] csv-paste: --begin: handling negative values
 implemented

---
 csv/applications/csv-paste.cpp | 52 ++++++++--------------------------
 1 file changed, 12 insertions(+), 40 deletions(-)

diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index 9be67252d..6aeb894a7 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -85,7 +57,7 @@ static void usage( bool verbose )
     std::cerr << "    value : value=<csv values>[;binary=<format>]; specify size or format, if binary" << std::endl;
     std::cerr << "    line-number[;<options>] : add the line number; as ui, if binary (quick and dirty, will override the file named \"line-number\")" << std::endl;
     std::cerr << "        options" << std::endl;
-    std::cerr << "            --begin <index>: start line number count at <index>; default: 0" << std::endl;
+    std::cerr << "            --begin <index>: start line number count at <index>, can be negative; default: 0" << std::endl;
     std::cerr << "            --block-size,--size=<size>: number of records with the same line number; default: 1" << std::endl;
     std::cerr << "                 WARNING: --size: deprecated, since it is confusing for files" << std::endl;
     std::cerr << "            --index; instead of block number output record index in the block" << std::endl;
@@ -203,11 +175,11 @@ class line_number : public source
                 comma::uint32 size;
                 bool index;
                 bool reverse;
-                comma::uint32 step;
-                comma::uint32 begin;
+                comma::int32 step;
+                comma::int32 begin;
                 std::string format;
                 
-                options( boost::optional< comma::uint32 > b = boost::optional< comma::uint32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false, unsigned int s = 1 )
+                options( const boost::optional< comma::int32 >& b = boost::optional< comma::int32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false, int s = 1 )
                     : size( size )
                     , index( index )
                     , reverse( reverse )
@@ -218,23 +190,23 @@ class line_number : public source
                 
                 options( const std::string& properties, const comma::command_line_options& o ) // quick and dirty: use visiting instead
                 {
-                    options defaults( boost::optional< comma::uint32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ), o.value< comma::uint32 >( "--step", 1 ) );
+                    options defaults( boost::optional< comma::int32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ), o.value< comma::int32 >( "--step", 1 ) );
                     comma::name_value::map map( properties, ';', '=' );
                     size = map.value< comma::uint32 >( map.get().find( "block-size" ) != map.get().end() ? "block-size" : "size", defaults.size ); // quick and dirty
                     index = map.value< bool >( "index", defaults.index );
                     reverse = map.value< bool >( "reverse", defaults.reverse );
-                    step = map.value< comma::uint32 >( "step", defaults.step );
-                    auto b = map.optional< comma::uint32 >( "begin" );
-                    if( !b ) { b = o.optional< comma::uint32 >( "--begin" ); }
+                    step = map.value< comma::int32 >( "step", defaults.step );
+                    auto b = map.optional< comma::int32 >( "begin" );
+                    if( !b ) { b = o.optional< comma::int32 >( "--begin" ); }
                     begin = begin_( b );
                     format = map.value< std::string >( "binary", "" );
                     if( !format.empty() && format != "ui" ) { std::cerr << "csv-paste: currently only ui supported for line-number; got: '" << format << "'" << std::endl; exit( 1 ); } // quick and dirty for now
                 }
                 
             private:
-                comma::uint32 begin_( const boost::optional< comma::uint32 >& b )
+                comma::int32 begin_( const boost::optional< comma::int32 >& b ) // todo! handle size correctly for negative values for begin and step
                 {
-                    if( index && reverse && b && ( *b + step ) < size * step ) { COMMA_THROW( comma::exception, "for --reverse --index, for --size " << size << " expected --begin not less than " << ( size - 1 ) << "; got: " << *b ); }
+                    if( index && reverse && b && ( *b + step ) < int( size ) * step ) { COMMA_THROW( comma::exception, "for --reverse --index, for --size " << size << " expected --begin not less than " << ( size - 1 ) << "; got: " << *b ); }
                     return b ? *b : reverse ? ( size - 1 ) * step : 0;
                 }
         };
@@ -256,7 +228,7 @@ class line_number : public source
         
         const char* read( char* buf ) // quick and dirty
         {
-            comma::csv::format::traits< comma::uint32 >::to_bin( value_, buf );
+            comma::csv::format::traits< comma::int32 >::to_bin( value_, buf );
             update_();
             return buf;
         }
@@ -264,7 +236,7 @@ class line_number : public source
     private:
         options options_;
         comma::uint32 count_;
-        comma::uint32 value_;
+        comma::int32 value_;
         std::string serialized_;
         
         void update_()

From 055fc901d520cfb440a04f76893fb4e6d440b4c9 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 23 Nov 2020 17:18:53 +1100
Subject: [PATCH 0277/1056] csv-shuffle: number of fields check added in ascii
 mode

---
 csv/applications/csv-shuffle.cpp | 27 +++++++++++++--------------
 1 file changed, 13 insertions(+), 14 deletions(-)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 197e0af12..274de4a2f 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -81,22 +81,21 @@ int main( int ac, char** av )
                 for( const auto& offset: offsets ) { std::cout.write( &buf[ offset.first ], offset.second ); }
                 if( csv.flush ) { std::cout.flush(); }
             }
+            return 0;
         }
-        else
+        std::vector< unsigned int > indices;
+        for( const auto& field: output_fields ) { indices.push_back( find_( field ) ); }
+        while( std::cin.good() && !std::cin.eof() )
         {
-            std::vector< unsigned int > indices;
-            for( const auto& field: output_fields ) { indices.push_back( find_( field ) ); }
-            while( std::cin.good() && !std::cin.eof() )
-            {
-                std::string line;
-                std::getline( std::cin, line );
-                if( !line.empty() && *line.rbegin() == '\r' ) { line = line.substr( 0, line.length() - 1 ); } // windows... sigh...
-                if( line.empty() ) { continue; }
-                const auto& v = comma::split( line, csv.delimiter );
-                std::string delimiter;
-                for( auto index: indices ) { std::cout << delimiter << v[index]; delimiter = csv.delimiter; }
-                std::cout << std::endl;
-            }
+            std::string line;
+            std::getline( std::cin, line );
+            if( !line.empty() && *line.rbegin() == '\r' ) { line = line.substr( 0, line.length() - 1 ); } // windows... sigh...
+            if( line.empty() ) { continue; }
+            const auto& v = comma::split( line, csv.delimiter );
+            if( v.size() < input_fields.size() ) { std::cerr << "csv-shuffle: expected at least " << input_fields.size() << " fields, got only " << v.size() << " in record \"" << line << "\"" << std::endl; return 1; }
+            std::string delimiter;
+            for( auto index: indices ) { std::cout << delimiter << v[index]; delimiter = csv.delimiter; }
+            std::cout << std::endl;
         }
         return 0;
     }

From 55eb282aa6f7a7eb961e66ab5c1b62927c552246 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 4 Dec 2020 14:16:22 +1100
Subject: [PATCH 0278/1056] ansible: gawk dependency added

---
 system/ansible/install.python3.yml | 1 +
 system/ansible/install.yml         | 1 +
 2 files changed, 2 insertions(+)

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
index 8064e048a..30f3ed6f7 100644
--- a/system/ansible/install.python3.yml
+++ b/system/ansible/install.python3.yml
@@ -17,6 +17,7 @@
       - git
       - cmake-curses-gui
       - cmake
+      - gawk
       - perl
       - python
       - libboost-all-dev
diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index 2ddad404c..02ec72734 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -17,6 +17,7 @@
       - git
       - cmake-curses-gui
       - cmake
+      - gawk
       - perl
       - python
       - libboost-all-dev

From 71963f53abc754c80e12159b68128cff8cc73e4e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 4 Dec 2020 14:27:58 +1100
Subject: [PATCH 0279/1056] ansible: net-tools added to dependencies

---
 system/ansible/install.python3.yml | 1 +
 system/ansible/install.yml         | 1 +
 2 files changed, 2 insertions(+)

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
index 30f3ed6f7..a2f87be08 100644
--- a/system/ansible/install.python3.yml
+++ b/system/ansible/install.python3.yml
@@ -19,6 +19,7 @@
       - cmake
       - gawk
       - perl
+      - net-tools
       - python
       - libboost-all-dev
       - socat
diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index 02ec72734..c55c72009 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -18,6 +18,7 @@
       - cmake-curses-gui
       - cmake
       - gawk
+      - net-tools
       - perl
       - python
       - libboost-all-dev

From 0029c24b58331a14222736856f5866e72f56268d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 4 Dec 2020 14:30:05 +1100
Subject: [PATCH 0280/1056] ansible: slight refactoring

---
 system/ansible/install.python3.yml | 7 ++++++-
 system/ansible/install.yml         | 7 ++++++-
 2 files changed, 12 insertions(+), 2 deletions(-)

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
index a2f87be08..7c85e8dcc 100644
--- a/system/ansible/install.python3.yml
+++ b/system/ansible/install.python3.yml
@@ -19,7 +19,6 @@
       - cmake
       - gawk
       - perl
-      - net-tools
       - python
       - libboost-all-dev
       - socat
@@ -30,6 +29,12 @@
       - libprocps-dev
       - recode
       
+  - name: "install comma regressions test dependencies"
+    become: true
+    apt: pkg={{ item }} state=present update_cache=yes
+    with_items:
+      - net-tools
+      
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory
     with_items:
diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index c55c72009..734951d76 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -18,7 +18,6 @@
       - cmake-curses-gui
       - cmake
       - gawk
-      - net-tools
       - perl
       - python
       - libboost-all-dev
@@ -29,6 +28,12 @@
       - python-numpy
       - libprocps-dev
       - recode
+
+  - name: "install comma regressions test dependencies"
+    become: true
+    apt: pkg={{ item }} state=present update_cache=yes
+    with_items:
+      - net-tools
       
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory

From df8beb74245515fb0a13b7a9744ea351cb54f66c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 4 Dec 2020 14:37:25 +1100
Subject: [PATCH 0281/1056] ansible: moreutils added to dependencies

---
 system/ansible/install.python3.yml | 1 +
 system/ansible/install.yml         | 1 +
 2 files changed, 2 insertions(+)

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
index 7c85e8dcc..03637a052 100644
--- a/system/ansible/install.python3.yml
+++ b/system/ansible/install.python3.yml
@@ -34,6 +34,7 @@
     apt: pkg={{ item }} state=present update_cache=yes
     with_items:
       - net-tools
+      - moreutils
       
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory
diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index 734951d76..881201edc 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -34,6 +34,7 @@
     apt: pkg={{ item }} state=present update_cache=yes
     with_items:
       - net-tools
+      - moreutils
       
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory

From ca62fc5489e775521f8c90fe87be39b849ccf02e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 4 Dec 2020 17:53:41 +1100
Subject: [PATCH 0282/1056] ansible: pv added as dependency for comma
 regression test

---
 system/ansible/install.python3.yml | 3 ++-
 system/ansible/install.yml         | 3 ++-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
index 03637a052..fcbe2c851 100644
--- a/system/ansible/install.python3.yml
+++ b/system/ansible/install.python3.yml
@@ -33,8 +33,9 @@
     become: true
     apt: pkg={{ item }} state=present update_cache=yes
     with_items:
-      - net-tools
       - moreutils
+      - net-tools
+      - pv
       
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory
diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index 881201edc..eed77cf05 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -33,8 +33,9 @@
     become: true
     apt: pkg={{ item }} state=present update_cache=yes
     with_items:
-      - net-tools
       - moreutils
+      - net-tools
+      - pv
       
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory

From da3a0968948dcec3de536429c6142703660c9821 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 4 Dec 2020 20:30:40 +1100
Subject: [PATCH 0283/1056] csv-paste: trivial refactoring

---
 csv/applications/csv-paste.cpp | 29 ++++++++++++++---------------
 1 file changed, 14 insertions(+), 15 deletions(-)

diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index 6aeb894a7..e421d87f9 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -316,27 +316,26 @@ int main( int ac, char** av )
                 std::cout.write( &buffer[0], buffer.size() );
                 if( flush ) { std::cout.flush(); }
             }
+            return 0;
         }
-        else
+        while( !head || ( *head )-- )
         {
-            while( !head || ( *head )-- )
+            std::ostringstream oss;
+            unsigned int streams = 0;
+            for( unsigned int i = 0; i < sources.size(); ++i )
             {
-                std::ostringstream oss;
-                unsigned int streams = 0;
-                for( unsigned int i = 0; i < sources.size(); ++i )
+                const std::string* s = sources[i].read();
+                if( s == nullptr )
                 {
-                    const std::string* s = sources[i].read();
-                    if( s == nullptr )
-                    {
-                        if( streams == 0 ) { return 0; }
-                        std::cerr << "csv-paste: unexpected end of file in " << unnamed[i] << std::endl; return 1;
-                    }
-                    if( sources[i].is_stream() ) { ++streams; }
-                    if( i > 0 ) { oss << delimiter; }
-                    oss << *s;
+                    if( streams == 0 ) { return 0; }
+                    std::cerr << "csv-paste: unexpected end of file in " << unnamed[i] << std::endl;
+                    return 1;
                 }
-                std::cout << oss.str() << std::endl;
+                if( sources[i].is_stream() ) { ++streams; }
+                if( i > 0 ) { oss << delimiter; }
+                oss << *s;
             }
+            std::cout << oss.str() << std::endl;
         }
         return 0;
     }

From c997e46eb7463ee1450b33af84ae2b445c1ec626 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 7 Dec 2020 17:36:34 +1100
Subject: [PATCH 0284/1056] name_value/test/eval: fixed in a quick and dirty
 way (was failing, since the test is too sensitive and expects the error
 messages from python to match; but depending on python version, the error
 messages may vary); todo: refactor the test completely to remove assumptions
 about the python error messages?

---
 name_value/test/eval/test | 16 +++++++++++++---
 1 file changed, 13 insertions(+), 3 deletions(-)

diff --git a/name_value/test/eval/test b/name_value/test/eval/test
index 580bdc23a..36189340f 100755
--- a/name_value/test/eval/test
+++ b/name_value/test/eval/test
@@ -31,7 +31,7 @@ total_count=0
 python_version="$( python -c "from __future__ import print_function; import sys; print( sys.version_info.major )" )" # sigh...
 python_prefix="python${python_version}:"
 
-for input in $data_dir/input*; do
+for input in $data_dir/input_*; do # for input in $data_dir/input*; do
     (( ++total_count ))
     suffix=${input#*input_}
     if (( verbose )); then echo "$name: running test $suffix" >&2; fi
@@ -47,8 +47,18 @@ for input in $data_dir/input*; do
     if ! cmp --quiet $stdout $data_dir/stdout_$suffix; then
         echo "$name: test failed for input_$suffix (stdout is different):" >&2
         diff $stdout $data_dir/stdout_$suffix >&2
-    elif ! cmp --quiet <( echo "$actual_stderr" ) <( echo "$expected_stderr" ); then
-        diff <( echo "$actual_stderr" ) <( echo "$expected_stderr" ) >&2
+    elif [[ "$actual_stderr" != "$expected_stderr" ]]; then # quick and dirty; sigh...
+        # quick and dirty; sigh... error messages keep changing from one python version to the next
+        if (( python_version == 2 )) || [[ "$( cut -d: -f3 <<< "$actual_stderr" )" != "$( cut -d: -f3 <<< "$expected_stderr" )" ]]; then
+            echo "expected error message:" >&2
+            echo "$expected_stderr" | sed 's#^#    #' >&2
+            echo "actual error message:" >&2
+            echo "$actual_stderr" | sed 's#^#    #' >&2
+        else
+            (( ++pass_count ))
+            if (( verbose )); then echo "$name: test $suffix passed" >&2; fi
+            echo $(basename "$input" )"=\"pass\""
+        fi
     else
         (( ++pass_count ))
         if (( verbose )); then echo "$name: test $suffix passed" >&2; fi

From d0eb4c27ce45c5bbbada112de6f8188983d2f544 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 9 Dec 2020 11:18:49 +1100
Subject: [PATCH 0285/1056] io/test/io-publish/on-demand: instrumented with
 debug messages, since test fails on ubuntu 20.04

---
 io/test/io-publish/on-demand/input | 12 ++++++++++--
 io/test/io-publish/test            | 10 +++++-----
 2 files changed, 15 insertions(+), 7 deletions(-)

diff --git a/io/test/io-publish/on-demand/input b/io/test/io-publish/on-demand/input
index fd04a154e..562b9d507 100644
--- a/io/test/io-publish/on-demand/input
+++ b/io/test/io-publish/on-demand/input
@@ -1,10 +1,11 @@
 # because we source these files into the test script, we can use functions from the test script
 
-port=42643
+port=42743
 options="--on-demand"
 test_duration=40
 report_interval=0.5
 
+# yes | csv-repeat --pace --period 0.25
 function exec_cmd()
 {
     yes
@@ -13,25 +14,32 @@ export -f exec_cmd
 
 function read_port()
 {
-    echo "test: creating reader" >&2
+    echo "test: creating reader..." >&2
     socat tcp:localhost:$port -
+    echo "test: created reader" >&2
 }
 
 function client_cmd()
 {
     sleep 5
+    echo "test: starting client 1 of 3..." >&2
     read_port &
     first_client_pid=$!
+    echo "test: started client 1 of 3 with pid $first_client_pid" >&2
     sleep 5
+    echo "test: starting client 2 of 3..." >&2
     read_port &
     second_client_pid=$!
+    echo "test: started client 2 of 3 with pid $second_client_pid" >&2
     sleep 5
     kill_pid_and_children $first_client_pid
     sleep 5
     kill_pid_and_children $second_client_pid
     sleep 5
+    echo "test: starting client 3 of 3..." >&2
     read_port &
     third_client_pid=$!
+    echo "test: started client 3 of 3 with pid $third_client_pid" >&2
     sleep 5
     kill_pid_and_children $third_client_pid
     sleep 5
diff --git a/io/test/io-publish/test b/io/test/io-publish/test
index f88757263..d5ddc8630 100755
--- a/io/test/io-publish/test
+++ b/io/test/io-publish/test
@@ -15,11 +15,11 @@ function kill_pid_and_children()
 {
     pid=$1
     local child_pids=$( pgrep -P $pid )
-    echo "killing children: $child_pids" >&2
-    [[ $child_pids ]] && kill $child_pids
-    echo "killing $pid" >&2
+    if [[ -n "$child_pids" ]]; then echo "killing children with pid(s): $child_pids" >&2; kill $child_pids; fi
+    echo "test: killing $pid" >&2
     kill $pid 2> /dev/null
     wait $pid
+    echo "test: killed $pid" >&2
 }
 
 [[ -d output ]] || mkdir output
@@ -33,7 +33,7 @@ else
     io-publish tcp:$port $options &
 fi
 io_publish_pid=$!
-echo "io_publish_pid=$io_publish_pid" >&2
+echo "test: io_publish_pid: $io_publish_pid port: $port" >&2
 
 if [[ $( type -t client_cmd ) == "function" ]]; then
     sleep 1                     # allow time for io-publish to open the port
@@ -60,7 +60,7 @@ done | sed 's/,$//;s/,[^,]* <defunct>//g' | grep -v ",bash$" | uniq \
 if [[ $client_cmd_pid ]]; then
     kill_pid_and_children $client_cmd_pid
 fi
-echo "killing io-publish: $io_publish_pid" >&2
+echo "test: killing io-publish: $io_publish_pid" >&2
 kill_pid_and_children $io_publish_pid
 
 if [[ -f client.out ]]; then

From f6ae541a58ba434a5e64e433abe3df6f410c783c Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 9 Dec 2020 11:19:32 +1100
Subject: [PATCH 0286/1056] csv-repeat/test: use first timestamp as offset for
 all timestamps

this removes a small bit of delay compared to taking a timestamp at the start
of the test, and so makes the comparison with expected values more accurate
and reliable
---
 csv/test/csv-repeat/test | 9 ++++-----
 1 file changed, 4 insertions(+), 5 deletions(-)

diff --git a/csv/test/csv-repeat/test b/csv/test/csv-repeat/test
index 3f960c7ab..324c6ae59 100755
--- a/csv/test/csv-repeat/test
+++ b/csv/test/csv-repeat/test
@@ -14,10 +14,8 @@ time_fields=t,$( csv-fields clear --except time <<< $output_fields )
 
 for mode in ascii binary; do
 
-    now=$( echo "1" | csv-time-stamp | csv-shuffle --fields=t, --output-fields=t | csv-time --to seconds )
-
-    csv_eval_expr="t-=$now"
-    [[ $append =~ time ]] && csv_eval_expr+="; time-=$now"
+    csv_eval_expr="t-=init_t"
+    [[ $append =~ time ]] && csv_eval_expr+="; time-=init_t"
 
     while IFS=, read data pause; do
         echo $data
@@ -31,7 +29,8 @@ for mode in ascii binary; do
               csv-repeat --timeout=$timeout $period_option $append_option
           fi \
         | csv-time-stamp | csv-time --fields $time_fields --to seconds \
-        | csv-eval --fields=$time_fields "$csv_eval_expr" --flush \
+        | gawk 'BEGIN { FS="," } { if( init_t == 0 ) init_t=$1; print $0,init_t }' OFS=, \
+        | csv-eval --fields=$time_fields,init_t "$csv_eval_expr" --flush \
         | name-value-from-csv --fields=timestamp,$output_fields --line-number --prefix=$mode \
         | csv-quote -d = --unquote
 

From 9d949c7a7565e704eaea4904ef4d619acc843eca Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 9 Dec 2020 11:25:15 +1100
Subject: [PATCH 0287/1056] io/test/io-publish/on-demand: port reverted to what
 it used to be

---
 io/test/io-publish/on-demand/input | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/test/io-publish/on-demand/input b/io/test/io-publish/on-demand/input
index 562b9d507..731c9dc4e 100644
--- a/io/test/io-publish/on-demand/input
+++ b/io/test/io-publish/on-demand/input
@@ -1,6 +1,6 @@
 # because we source these files into the test script, we can use functions from the test script
 
-port=42743
+port=42643
 options="--on-demand"
 test_duration=40
 report_interval=0.5

From 5dc00f4311f73ab128e9f0bd105eabf70855e442 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 9 Dec 2020 14:21:07 +1100
Subject: [PATCH 0288/1056] csv-repeat/test: reverse order of input data

it's clearer what the output should be when the pause comes first
---
 csv/test/csv-repeat/append/all/input       | 12 ++++++------
 csv/test/csv-repeat/append/repeating/input | 11 ++++++-----
 csv/test/csv-repeat/append/time/input      | 12 ++++++------
 csv/test/csv-repeat/period/input           | 12 ++++++------
 csv/test/csv-repeat/test                   |  4 ++--
 csv/test/csv-repeat/timeout/input          | 12 ++++++------
 6 files changed, 32 insertions(+), 31 deletions(-)

diff --git a/csv/test/csv-repeat/append/all/input b/csv/test/csv-repeat/append/all/input
index a39a3c325..b69e23b5f 100644
--- a/csv/test/csv-repeat/append/all/input
+++ b/csv/test/csv-repeat/append/all/input
@@ -3,9 +3,9 @@ period=0.1
 append="repeating,time"
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.55
-123,0.01
-456,0.55
-"
+0,123
+0.01,456
+0.01,789
+0.55,123
+0.01,456
+0.55,999"
diff --git a/csv/test/csv-repeat/append/repeating/input b/csv/test/csv-repeat/append/repeating/input
index 49ada6517..c527d02d9 100644
--- a/csv/test/csv-repeat/append/repeating/input
+++ b/csv/test/csv-repeat/append/repeating/input
@@ -3,9 +3,10 @@ period=0.1
 append="repeating"
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.55
-123,0.01
-456,0.55
+0,123
+0.01,456
+0.01,789
+0.55,123
+0.01,456
+0.55,999
 "
diff --git a/csv/test/csv-repeat/append/time/input b/csv/test/csv-repeat/append/time/input
index 4710d985e..03de5148d 100644
--- a/csv/test/csv-repeat/append/time/input
+++ b/csv/test/csv-repeat/append/time/input
@@ -3,9 +3,9 @@ period=0.1
 append="time"
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.55
-123,0.01
-456,0.55
-"
+0,123
+0.01,456
+0.01,789
+0.55,123
+0.01,456
+0.55,999"
diff --git a/csv/test/csv-repeat/period/input b/csv/test/csv-repeat/period/input
index 82f37d0f4..b3ff2bc79 100644
--- a/csv/test/csv-repeat/period/input
+++ b/csv/test/csv-repeat/period/input
@@ -2,9 +2,9 @@ timeout=0.3
 period=0.1
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.48
-123,0.01
-456,0.49
-"
+0,123
+0.01,456
+0.01,789
+0.48,123
+0.01,456
+0.49,999"
diff --git a/csv/test/csv-repeat/test b/csv/test/csv-repeat/test
index 324c6ae59..94f7999b9 100755
--- a/csv/test/csv-repeat/test
+++ b/csv/test/csv-repeat/test
@@ -17,9 +17,9 @@ for mode in ascii binary; do
     csv_eval_expr="t-=init_t"
     [[ $append =~ time ]] && csv_eval_expr+="; time-=init_t"
 
-    while IFS=, read data pause; do
-        echo $data
+    while IFS=, read pause data; do
         sleep $pause
+        echo $data
     done <<< "$data" \
         | if [[ $mode == "binary" ]]; then
               csv-to-bin $format --flush \
diff --git a/csv/test/csv-repeat/timeout/input b/csv/test/csv-repeat/timeout/input
index 67127068f..1aa54a871 100644
--- a/csv/test/csv-repeat/timeout/input
+++ b/csv/test/csv-repeat/timeout/input
@@ -1,9 +1,9 @@
 timeout=0.3
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.48
-123,0.01
-456,0.49
-"
+0,123
+0.01,456
+0.01,789
+0.48,123
+0.01,456
+0.49,999"

From fa7f6962b453b5d25c14d0454d5b1b584acf1bd8 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 9 Dec 2020 14:27:53 +1100
Subject: [PATCH 0289/1056] csv-repeat/test: timestamp data immediately after
 csv-repeat runs

which should improve timestamping accuracy
---
 csv/test/csv-repeat/test | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/csv/test/csv-repeat/test b/csv/test/csv-repeat/test
index 94f7999b9..5976114e2 100755
--- a/csv/test/csv-repeat/test
+++ b/csv/test/csv-repeat/test
@@ -24,11 +24,12 @@ for mode in ascii binary; do
         | if [[ $mode == "binary" ]]; then
               csv-to-bin $format --flush \
                   | csv-repeat --timeout=$timeout $period_option $append_option --binary=$format \
-                  | csv-from-bin $output_format --flush
+                  | csv-time-stamp --binary $output_format \
+                  | csv-from-bin t,$output_format --flush
           else
-              csv-repeat --timeout=$timeout $period_option $append_option
+              csv-repeat --timeout=$timeout $period_option $append_option | csv-time-stamp
           fi \
-        | csv-time-stamp | csv-time --fields $time_fields --to seconds \
+        | csv-time --fields $time_fields --to seconds \
         | gawk 'BEGIN { FS="," } { if( init_t == 0 ) init_t=$1; print $0,init_t }' OFS=, \
         | csv-eval --fields=$time_fields,init_t "$csv_eval_expr" --flush \
         | name-value-from-csv --fields=timestamp,$output_fields --line-number --prefix=$mode \

From bea9a21c0887ab5a5621e64f4eb8bc2bfe5b7c91 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 9 Dec 2020 15:30:57 +1100
Subject: [PATCH 0290/1056] csv-repeat/test: have a small delay at the start

so that all the applications in the pipeline can be loaded thus reducing
errors in timestamps
---
 csv/test/csv-repeat/append/all/input       | 2 +-
 csv/test/csv-repeat/append/repeating/input | 2 +-
 csv/test/csv-repeat/append/time/input      | 2 +-
 csv/test/csv-repeat/period/input           | 2 +-
 csv/test/csv-repeat/timeout/input          | 2 +-
 5 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/csv/test/csv-repeat/append/all/input b/csv/test/csv-repeat/append/all/input
index b69e23b5f..04a7f90fe 100644
--- a/csv/test/csv-repeat/append/all/input
+++ b/csv/test/csv-repeat/append/all/input
@@ -3,7 +3,7 @@ period=0.1
 append="repeating,time"
 format=ui
 data="
-0,123
+0.20,123
 0.01,456
 0.01,789
 0.55,123
diff --git a/csv/test/csv-repeat/append/repeating/input b/csv/test/csv-repeat/append/repeating/input
index c527d02d9..ff35214a0 100644
--- a/csv/test/csv-repeat/append/repeating/input
+++ b/csv/test/csv-repeat/append/repeating/input
@@ -3,7 +3,7 @@ period=0.1
 append="repeating"
 format=ui
 data="
-0,123
+0.20,123
 0.01,456
 0.01,789
 0.55,123
diff --git a/csv/test/csv-repeat/append/time/input b/csv/test/csv-repeat/append/time/input
index 03de5148d..f301085f3 100644
--- a/csv/test/csv-repeat/append/time/input
+++ b/csv/test/csv-repeat/append/time/input
@@ -3,7 +3,7 @@ period=0.1
 append="time"
 format=ui
 data="
-0,123
+0.20,123
 0.01,456
 0.01,789
 0.55,123
diff --git a/csv/test/csv-repeat/period/input b/csv/test/csv-repeat/period/input
index b3ff2bc79..0f912c422 100644
--- a/csv/test/csv-repeat/period/input
+++ b/csv/test/csv-repeat/period/input
@@ -2,7 +2,7 @@ timeout=0.3
 period=0.1
 format=ui
 data="
-0,123
+0.20,123
 0.01,456
 0.01,789
 0.48,123
diff --git a/csv/test/csv-repeat/timeout/input b/csv/test/csv-repeat/timeout/input
index 1aa54a871..197070675 100644
--- a/csv/test/csv-repeat/timeout/input
+++ b/csv/test/csv-repeat/timeout/input
@@ -1,7 +1,7 @@
 timeout=0.3
 format=ui
 data="
-0,123
+0.20,123
 0.01,456
 0.01,789
 0.48,123

From cc3ad20aa9aded15d2370e8a6c272a5480e4e97f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 9 Dec 2020 15:44:27 +1100
Subject: [PATCH 0291/1056] io-publish: --on-demand --exec: fixed properly;
 don't even know how it worked before

---
 io/applications/io-publish.cpp     | 78 +++++++++++-------------------
 io/test/io-publish/on-demand/input |  1 -
 io/test/io-publish/test            |  2 +
 3 files changed, 29 insertions(+), 52 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 06a7a9908..8ce55bded 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -1,31 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2020 Vsevolod Vlaskine
 
 /// @authors cedric wohlleber, vsevolod vlaskine, dave jennings
 
@@ -36,6 +10,8 @@
 
 #include <boost/bind.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
+#include <boost/iostreams/device/file_descriptor.hpp>
+#include <boost/iostreams/stream.hpp>
 #include <boost/ptr_container/ptr_vector.hpp>
 #include <boost/scoped_ptr.hpp>
 #include <boost/thread.hpp>
@@ -69,9 +45,9 @@ static void usage( bool verbose = false )
     std::cerr << "    --multiplier,-m: multiplier for packet size, default is 1. The actual packet size will be m * s" << std::endl;
     std::cerr << "    --no-discard: if present, do blocking write to every open stream" << std::endl;
     std::cerr << "    --no-flush: if present, do not flush the output stream (use on high bandwidth sources)" << std::endl;
-    std::cerr << "    --exec=[<cmd>]: read from cmd rather than stdin" << std::endl;
-    std::cerr << "    -- [<cmd>]: alternate syntax for specifying a command (simplifies quoting)" << std::endl;
-    std::cerr << "    --on-demand: only run <cmd> when a client is connected" << std::endl;
+    std::cerr << "    --exec=[<command>]: read from <command> rather than stdin" << std::endl;
+    std::cerr << "    -- [<command>]: alternate syntax for specifying a command (simplifies quoting)" << std::endl;
+    std::cerr << "    --on-demand: only run <command> when a client is connected" << std::endl;
     std::cerr << std::endl;
     std::cerr << "client options" << std::endl;
     std::cerr << "    --exit-on-no-clients,-e: once the last client disconnects, exit" << std::endl;
@@ -244,13 +220,12 @@ class publish
 class command
 {
     public:
-        command( const std::string& cmd )
-            : cmd_( cmd )
-            , child_pid_( -1 )
+        command( const std::string& command ): command_( command ), child_pid_( -1 )
         {
-            comma::verbose << "launching " << cmd << std::endl;
+            comma::verbose << "launching command: " << command << std::endl;
             int fd[2];
             if( ::pipe( fd ) == -1 ) { comma::last_error::to_exception( "couldn't open pipe" ); } // create a pipe to send the child stdout to the parent stdin
+            fd_ = fd[0];
             pid_t pid = fork();
             if( pid == -1 ) { comma::last_error::to_exception( "failed to fork()" ); }
             if( pid == 0 )
@@ -259,36 +234,38 @@ class command
                 while( ( dup2( fd[1], STDOUT_FILENO ) == -1 ) && ( errno == EINTR ) ) {} // connect pipe input to stdout in child
                 ::close( fd[1] );     // no longer need fd[1], now that it's duped
                 ::close( fd[0] );     // don't need pipe output in the child
-                ::execlp( "bash", "bash", "-c", &cmd_[0], NULL );
+                ::execlp( "bash", "bash", "-c", &command_[0], NULL );
                 std::cerr << "io-publish: failed to exec child: errno " << comma::last_error::value() << " - " << comma::last_error::to_string() << std::endl;
                 exit( 1 );
             }
             child_pid_ = pid;
-            while( ( ::dup2( fd[0], STDIN_FILENO ) == -1 ) && ( errno == EINTR ) ) {} // connect pipe output to stdin in parent
-            ::close( fd[0] ); // no longer need fd[0], now that it's duped
+            comma::verbose << "launched command with pid: " << pid << std::endl;
+            ::close( STDIN_FILENO );
             ::close( fd[1] ); // don't need pipe input in the parent
         }
+        
+        int fd() const { return fd_; }
 
         ~command()
         {
-            comma::verbose << "killing child pid " << child_pid_ << " for " << cmd_ << "..." << std::endl;
+            comma::verbose << "killing child pid " << child_pid_ << " for " << command_ << "..." << std::endl;
             ::kill( -child_pid_, SIGTERM );
             comma::verbose << "waiting for pid " << child_pid_ << "..." << std::endl;
             if( ::waitpid( -child_pid_, NULL, 0 ) < 0 ) { comma::verbose << "warning: waiting for pid " << child_pid_ << " failed" << std::endl; }
-            while( std::getchar() >= 0 ); // todo: lame, but select or c-style reading produce bizarre results; investigate further
+            while( std::getchar() >= 0 ); // todo: lame, but select or c-style reading produce bizarre results; investigate sometime
             comma::verbose << "waiting for pid " << child_pid_ << " done" << std::endl;
         }
 
     private:
-        std::string cmd_;
+        std::string command_;
         pid_t child_pid_;
+        int fd_;
 };
 
 int main( int ac, char** av )
 {
     try
     {
-        //comma::command_line_options options( ac, av, usage );
         std::vector< std::string > head, tail;
         for( int i = 0; i < ac && std::string( "--" ) != av[i]; ++i ) { head.push_back( av[i] ); }
         for( int i = head.size() + 1; i < ac; ++i ) { tail.push_back( av[i] ); }
@@ -319,18 +296,17 @@ int main( int ac, char** av )
         else
         {
             bool done = false;
+            int fd[2];
+            if( ::pipe( fd ) == -1 ) { comma::last_error::to_exception( "couldn't open pipe" ); } // create a pipe to send the child stdout to the parent stdin
             while( !done && !is_shutdown )
             {
-                if( !on_demand || p.num_clients() > 0 )
-                {
-                    command cmd( exec_command );
-                    while( std::cin.good() && !is_shutdown && p.read( std::cin ) );
-                    if( !on_demand ) { done = true; }
-                }
-                else
-                {
-                    ::sleep( 0.1 );
-                }
+                if( on_demand && p.num_clients() == 0 ) { ::sleep( 0.1 ); continue; }
+                comma::verbose << "number of clients: " << p.num_clients() << std::endl;
+                command cmd( exec_command );
+                typedef boost::iostreams::file_descriptor_source fd_t;
+                boost::iostreams::stream< fd_t > is( fd_t( cmd.fd(), boost::iostreams::never_close_handle ) );
+                while( is.good() && !is_shutdown && p.read( is ) );
+                if( !on_demand ) { break; }
             }
         }
         //ProfilerStop(); }
diff --git a/io/test/io-publish/on-demand/input b/io/test/io-publish/on-demand/input
index 731c9dc4e..4fdc5e2ab 100644
--- a/io/test/io-publish/on-demand/input
+++ b/io/test/io-publish/on-demand/input
@@ -5,7 +5,6 @@ options="--on-demand"
 test_duration=40
 report_interval=0.5
 
-# yes | csv-repeat --pace --period 0.25
 function exec_cmd()
 {
     yes
diff --git a/io/test/io-publish/test b/io/test/io-publish/test
index d5ddc8630..42987104b 100755
--- a/io/test/io-publish/test
+++ b/io/test/io-publish/test
@@ -37,6 +37,7 @@ echo "test: io_publish_pid: $io_publish_pid port: $port" >&2
 
 if [[ $( type -t client_cmd ) == "function" ]]; then
     sleep 1                     # allow time for io-publish to open the port
+    echo "test: running client command..." >&2
     client_cmd > /dev/null &
     client_cmd_pid=$!
     echo "client_cmd_pid=$client_cmd_pid" >&2
@@ -64,5 +65,6 @@ echo "test: killing io-publish: $io_publish_pid" >&2
 kill_pid_and_children $io_publish_pid
 
 if [[ -f client.out ]]; then
+    echo "test: outputting $( realpath client.out )" >&2
     cat client.out | name-value-from-csv line --prefix output -n -d @
 fi

From 81904195ed749850765ec79b835ca349bee6129e Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 9 Dec 2020 16:29:41 +1100
Subject: [PATCH 0292/1056] csv-repeat/test: change smallest interval in period
 test from 0.01 to 0.1s

0.01s is too small for a bash-driven test using sleep to be reliable
---
 csv/test/csv-repeat/period/expected | 36 ++++++++++++++---------------
 csv/test/csv-repeat/period/input    | 14 +++++------
 2 files changed, 25 insertions(+), 25 deletions(-)

diff --git a/csv/test/csv-repeat/period/expected b/csv/test/csv-repeat/period/expected
index a233be089..3f3faac3c 100644
--- a/csv/test/csv-repeat/period/expected
+++ b/csv/test/csv-repeat/period/expected
@@ -1,37 +1,37 @@
-ascii[0]/timestamp=0.00 +/- 0.03
+ascii[0]/timestamp=0.0 +/- 0.03
 ascii[0]/data=123
-ascii[1]/timestamp=0.01 +/- 0.03
+ascii[1]/timestamp=0.1 +/- 0.03
 ascii[1]/data=456
-ascii[2]/timestamp=0.02 +/- 0.03
+ascii[2]/timestamp=0.2 +/- 0.03
 ascii[2]/data=789
-ascii[3]/timestamp=0.32 +/- 0.03
+ascii[3]/timestamp=0.5 +/- 0.03
 ascii[3]/data=789
-ascii[4]/timestamp=0.42 +/- 0.03
+ascii[4]/timestamp=0.7 +/- 0.03
 ascii[4]/data=789
-ascii[5]/timestamp=0.50 +/- 0.03
+ascii[5]/timestamp=0.8 +/- 0.03
 ascii[5]/data=123
-ascii[6]/timestamp=0.51 +/- 0.03
+ascii[6]/timestamp=0.9 +/- 0.03
 ascii[6]/data=456
-ascii[7]/timestamp=0.81 +/- 0.03
+ascii[7]/timestamp=1.2 +/- 0.03
 ascii[7]/data=456
-ascii[8]/timestamp=0.91 +/- 0.03
+ascii[8]/timestamp=1.4 +/- 0.03
 ascii[8]/data=456
 
-binary[0]/timestamp=0.00 +/- 0.03
+binary[0]/timestamp=0.0 +/- 0.03
 binary[0]/data=123
-binary[1]/timestamp=0.01 +/- 0.03
+binary[1]/timestamp=0.1 +/- 0.03
 binary[1]/data=456
-binary[2]/timestamp=0.02 +/- 0.03
+binary[2]/timestamp=0.2 +/- 0.03
 binary[2]/data=789
-binary[3]/timestamp=0.32 +/- 0.03
+binary[3]/timestamp=0.5 +/- 0.03
 binary[3]/data=789
-binary[4]/timestamp=0.42 +/- 0.03
+binary[4]/timestamp=0.7 +/- 0.03
 binary[4]/data=789
-binary[5]/timestamp=0.50 +/- 0.03
+binary[5]/timestamp=0.8 +/- 0.03
 binary[5]/data=123
-binary[6]/timestamp=0.51 +/- 0.03
+binary[6]/timestamp=0.9 +/- 0.03
 binary[6]/data=456
-binary[7]/timestamp=0.81 +/- 0.03
+binary[7]/timestamp=1.2 +/- 0.03
 binary[7]/data=456
-binary[8]/timestamp=0.91 +/- 0.03
+binary[8]/timestamp=1.4 +/- 0.03
 binary[8]/data=456
diff --git a/csv/test/csv-repeat/period/input b/csv/test/csv-repeat/period/input
index 0f912c422..f2e0a2acc 100644
--- a/csv/test/csv-repeat/period/input
+++ b/csv/test/csv-repeat/period/input
@@ -1,10 +1,10 @@
 timeout=0.3
-period=0.1
+period=0.2
 format=ui
 data="
-0.20,123
-0.01,456
-0.01,789
-0.48,123
-0.01,456
-0.49,999"
+0.2,123
+0.1,456
+0.1,789
+0.6,123
+0.1,456
+1.0,999"

From aa9cd84da20b822e6cda3edd89158b0cbfadae07 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 9 Dec 2020 16:49:32 +1100
Subject: [PATCH 0293/1056] io-publish: if --on-demand, require --exec

---
 io/applications/io-publish.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 8ce55bded..a89782b54 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -291,6 +291,7 @@ int main( int ac, char** av )
         //ProfilerStart( "io-publish.prof" ); {
         if( exec_command.empty() )
         {
+            if( on_demand ) { std::cerr << "io-publish: got --on-demand; please specify --exec <command> or -- <command>" << std::endl; return 1; }
             while( std::cin.good() && !is_shutdown ) { if( !p.read( std::cin ) && exit_on_no_clients ) { break; } }
         }
         else

From 255952ad7cad1f2947c1bd73c26b1323fe9c04f3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 9 Dec 2020 16:57:02 +1100
Subject: [PATCH 0294/1056] io-publish: message improved

---
 io/applications/io-publish.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index a89782b54..d3728a07a 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -291,7 +291,7 @@ int main( int ac, char** av )
         //ProfilerStart( "io-publish.prof" ); {
         if( exec_command.empty() )
         {
-            if( on_demand ) { std::cerr << "io-publish: got --on-demand; please specify --exec <command> or -- <command>" << std::endl; return 1; }
+            if( on_demand ) { std::cerr << "io-publish: got --on-demand; please specify --exec <command> or -- <command>, or remove --on-demand" << std::endl; return 1; }
             while( std::cin.good() && !is_shutdown ) { if( !p.read( std::cin ) && exit_on_no_clients ) { break; } }
         }
         else

From 92b67588b6f3b3e02a0ecda71f02b88f030ec075 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 9 Dec 2020 18:07:06 +1100
Subject: [PATCH 0295/1056] csv-time-stamp/test: preheat the cache, so that
 timestamps are more accurate

---
 csv/test/csv-time-stamp/test | 25 ++++++++++++++++---------
 1 file changed, 16 insertions(+), 9 deletions(-)

diff --git a/csv/test/csv-time-stamp/test b/csv/test/csv-time-stamp/test
index fd3691851..e10c00d8d 100755
--- a/csv/test/csv-time-stamp/test
+++ b/csv/test/csv-time-stamp/test
@@ -4,8 +4,6 @@ source $( type -p comma-application-util )
 
 comma_path_value_to_var < <( cat )
 
-now=$( date -u +%Y%m%dT%H%M%S.%N | csv-time --from iso --to seconds )
-
 input_fn=cat
 output_fn=cat
 if [[ $options =~ --binary|--size ]]; then
@@ -13,13 +11,22 @@ if [[ $options =~ --binary|--size ]]; then
     output_fn="csv-from-bin t,$format"
 fi
 
+function timestamper()
+{
+    local now=$( date -u +%Y%m%dT%H%M%S.%N | csv-time --from iso --to seconds )
+    $input_fn \
+        | csv-time-stamp $options \
+        | $output_fn | csv-time --from iso --to seconds \
+        | csv-eval --fields=t "d=t-$now" \
+        | name-value-from-csv --prefix=output --line-number --fields=t,$fields,d \
+        | csv-quote --unquote --delimiter='='
+}
+
+# prime the system to load everything from disk, so that timestamp comparison is more accurate
+
+echo "dummy" | timestamper >/dev/null 2>&1
+
 # put a small delay between the outputting of each line,
 # so the timestamps are different
 
-echo -e $input | while read line; do echo $line; sleep 0.1; done \
-    | $input_fn \
-    | csv-time-stamp $options \
-    | $output_fn | csv-time --from iso --to seconds \
-    | csv-eval --fields=t "d=t-$now" \
-    | name-value-from-csv --prefix=output --line-number --fields=t,$fields,d \
-    | csv-quote --unquote --delimiter='='
+echo -e $input | while read line; do echo $line; sleep 0.1; done | timestamper

From caab7ee6294643f307d7ceecb417c8fb656c1535 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 9 Dec 2020 18:08:07 +1100
Subject: [PATCH 0296/1056] csv-time-join/tests/realtime: allow +/-1 on
 results, as timing is a little variable

---
 csv/test/csv-time-join/realtime/simple/expected         | 4 ++--
 csv/test/csv-time-join/realtime/timestamp-only/expected | 4 ++--
 csv/test/csv-time-join/test                             | 3 ++-
 3 files changed, 6 insertions(+), 5 deletions(-)

diff --git a/csv/test/csv-time-join/realtime/simple/expected b/csv/test/csv-time-join/realtime/simple/expected
index 557a39cf2..ebc28fe03 100644
--- a/csv/test/csv-time-join/realtime/simple/expected
+++ b/csv/test/csv-time-join/realtime/simple/expected
@@ -1,2 +1,2 @@
-num_records="10"
-num_fields="4"
+num_records=10 +/- 1
+num_fields=4
diff --git a/csv/test/csv-time-join/realtime/timestamp-only/expected b/csv/test/csv-time-join/realtime/timestamp-only/expected
index df5c38113..373fa6438 100644
--- a/csv/test/csv-time-join/realtime/timestamp-only/expected
+++ b/csv/test/csv-time-join/realtime/timestamp-only/expected
@@ -1,2 +1,2 @@
-num_records="10"
-num_fields="3"
+num_records=10 +/- 1
+num_fields=3
diff --git a/csv/test/csv-time-join/test b/csv/test/csv-time-join/test
index 07f0ab933..2a0e3b47b 100755
--- a/csv/test/csv-time-join/test
+++ b/csv/test/csv-time-join/test
@@ -33,7 +33,8 @@ cat $input \
     | if [[ $options =~ --realtime ]]; then
           sed 's/[^,]//g' | wc -lc | tr -s ' ' | sed 's/^ //' | tr ' ' , \
               | csv-eval --fields=lines,chars "chars = chars / lines" \
-              | name-value-from-csv -f num_records,num_fields
+              | name-value-from-csv -f num_records,num_fields \
+              | csv-quote --unquote -d =
       else
           name-value-from-csv -f line -d : -n -p output
       fi

From d03e376053f857838139c69ef8d89033305b5cea Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 9 Dec 2020 20:16:33 +1100
Subject: [PATCH 0297/1056] io-publish: minor refactoring in preparation for
 master property implementation

---
 io/applications/io-publish.cpp | 26 +++++++++++++-------------
 io/impl/publisher.cpp          | 28 ----------------------------
 2 files changed, 13 insertions(+), 41 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index d3728a07a..389eb430f 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -7,12 +7,11 @@
 #include <signal.h>
 #include <sys/wait.h>
 #include <unistd.h>
-
+#include <memory>
 #include <boost/bind.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/iostreams/device/file_descriptor.hpp>
 #include <boost/iostreams/stream.hpp>
-#include <boost/ptr_container/ptr_vector.hpp>
 #include <boost/scoped_ptr.hpp>
 #include <boost/thread.hpp>
 #include "../../application/command_line_options.h"
@@ -91,7 +90,7 @@ static void usage( bool verbose = false )
 class publish
 {
     public:
-        typedef comma::synchronized< boost::ptr_vector< comma::io::publisher > > publishers_t;
+        typedef comma::synchronized< std::vector< std::unique_ptr< comma::io::publisher > > > publishers_t;
         
         typedef publishers_t::scoped_transaction transaction_t;
         
@@ -116,12 +115,13 @@ class publish
             sigaction( SIGPIPE, NULL, &old_action );
             sigaction( SIGPIPE, &new_action, NULL );
             transaction_t t( publishers_ );
+            t->resize( filenames.size() );
             for( std::size_t i = 0; i < filenames.size(); ++i )
             {
-                t->push_back( new comma::io::publisher( filenames[i]
-                                                      , is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii
-                                                      , !discard
-                                                      , flush ));
+                ( *t )[i].reset( new comma::io::publisher( filenames[i]
+                                                         , is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii
+                                                         , !discard
+                                                         , flush ) );
             }
             acceptor_thread_.reset( new boost::thread( boost::bind( &publish::accept_, boost::ref( *this ))));
         }
@@ -131,7 +131,7 @@ class publish
             is_shutdown_ = true;
             acceptor_thread_->join();
             transaction_t t( publishers_ );
-            { for( std::size_t i = 0; i < t->size(); ++i ) { ( *t )[i].close(); } }
+            { for( std::size_t i = 0; i < t->size(); ++i ) { ( *t )[i]->close(); } }
         }
         
         bool read( std::istream& input )
@@ -148,7 +148,7 @@ class publish
                 if( !input.good() ) { return false; }
             }
             transaction_t t( publishers_ );
-            for( std::size_t i = 0; i < t->size(); ++i ) { ( *t )[i].write( &buffer_[0], buffer_.size(), false ); }
+            for( std::size_t i = 0; i < t->size(); ++i ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); }
             return handle_sizes_( t );
         }
 
@@ -157,14 +157,14 @@ class publish
     private:
         bool is_binary_() const { return packet_size_ > 0; }
         
-        bool handle_sizes_( transaction_t& t )
+        bool handle_sizes_( transaction_t& t ) // todo? why pass transaction? it doen not seem going out of scope at the point of call; remove?
         {
             if( !output_number_of_clients_ && !report_no_clients_ ) { return true; }
             unsigned int total = 0;
             bool changed = false;
             for( unsigned int i = 0; i < t->size(); ++i )
             {
-                unsigned int size = ( *t )[i].size();
+                unsigned int size = ( *t )[i]->size();
                 total += size;
                 if( sizes_[i] == size ) { continue; }
                 sizes_[i] = size;
@@ -191,7 +191,7 @@ class publish
             comma::io::select select;
             {
                 transaction_t t( publishers_ );
-                for( unsigned int i = 0; i < t->size(); ++i ) { if( ( *t )[i].acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i].acceptor_file_descriptor() ); } }
+                for( unsigned int i = 0; i < t->size(); ++i ) { if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); } }
             }
             while( !is_shutdown_ )
             {
@@ -199,7 +199,7 @@ class publish
                 transaction_t t( publishers_ );
                 for( unsigned int i = 0; i < t->size(); ++i )
                 {
-                    if( select.read().ready( ( *t )[i].acceptor_file_descriptor() ) ) { ( *t )[i].accept(); }
+                    if( select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) ) { ( *t )[i]->accept(); }
                 }
                 handle_sizes_( t );
             }
diff --git a/io/impl/publisher.cpp b/io/impl/publisher.cpp
index 5511ddbee..48bec03b6 100644
--- a/io/impl/publisher.cpp
+++ b/io/impl/publisher.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author cedric wohlleber
 

From 708e5688dbf9b5013b83fc25b5daedb5cd4bcf30 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 9 Dec 2020 22:27:08 +1100
Subject: [PATCH 0298/1056] io-publish: implementing secondary endpoints...

---
 io/applications/io-publish.cpp | 51 ++++++++++++++++++++++++++--------
 1 file changed, 39 insertions(+), 12 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 389eb430f..fdbf81618 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -19,6 +19,7 @@
 #include "../../base/last_error.h"
 #include "../../io/file_descriptor.h"
 #include "../../io/publisher.h"
+#include "../../name_value/map.h"
 #include "../../string/string.h"
 #include "../../sync/synchronized.h"
 
@@ -94,7 +95,14 @@ class publish
         
         typedef publishers_t::scoped_transaction transaction_t;
         
-        publish( const std::vector< std::string >& filenames
+        struct endpoint
+        {
+            std::string address;
+            bool secondary;
+            endpoint( const std::string& address = "", bool secondary = false ): secondary( secondary ) {}
+        };
+        
+        publish( const std::vector< std::string >& endpoints
                , unsigned int packet_size
                , bool discard
                , bool flush
@@ -105,23 +113,25 @@ class publish
             , output_number_of_clients_( output_number_of_clients )
             , report_no_clients_( report_no_clients )
             , got_first_client_ever_( false )
-            , sizes_( filenames.size(), 0 )
+            , sizes_( endpoints.size(), 0 )
             , num_clients_( 0 )
             , is_shutdown_( false )
         {
+            for( unsigned int i = 0; i < endpoints.size(); ++i )
+            {
+                comma::name_value::map m( endpoints[i], "address", ';', '=' );
+                endpoints_.push_back( endpoint( m.value< std::string >( "address" ), !m.exists( "primary" ) && m.exists( "secondary" ) ) ); // todo? quick and dirty; better usage semantics?
+            }
             struct sigaction new_action, old_action;
             new_action.sa_handler = SIG_IGN;
             sigemptyset( &new_action.sa_mask );
             sigaction( SIGPIPE, NULL, &old_action );
             sigaction( SIGPIPE, &new_action, NULL );
             transaction_t t( publishers_ );
-            t->resize( filenames.size() );
-            for( std::size_t i = 0; i < filenames.size(); ++i )
+            t->resize( endpoints.size() );
+            for( std::size_t i = 0; i < endpoints.size(); ++i )
             {
-                ( *t )[i].reset( new comma::io::publisher( filenames[i]
-                                                         , is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii
-                                                         , !discard
-                                                         , flush ) );
+                if( !endpoints_[i].secondary ) { ( *t )[i].reset( new comma::io::publisher( endpoints[i], is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
             }
             acceptor_thread_.reset( new boost::thread( boost::bind( &publish::accept_, boost::ref( *this ))));
         }
@@ -131,7 +141,7 @@ class publish
             is_shutdown_ = true;
             acceptor_thread_->join();
             transaction_t t( publishers_ );
-            { for( std::size_t i = 0; i < t->size(); ++i ) { ( *t )[i]->close(); } }
+            { for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } } }
         }
         
         bool read( std::istream& input )
@@ -148,7 +158,7 @@ class publish
                 if( !input.good() ) { return false; }
             }
             transaction_t t( publishers_ );
-            for( std::size_t i = 0; i < t->size(); ++i ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); }
+            for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
             return handle_sizes_( t );
         }
 
@@ -162,10 +172,12 @@ class publish
             if( !output_number_of_clients_ && !report_no_clients_ ) { return true; }
             unsigned int total = 0;
             bool changed = false;
+            has_primary_clients_ = false;
             for( unsigned int i = 0; i < t->size(); ++i )
             {
-                unsigned int size = ( *t )[i]->size();
+                unsigned int size = ( *t )[i] ? ( *t )[i]->size() : 0;
                 total += size;
+                if( !endpoints_[i].secondary && size > 0 ) { has_primary_clients_ = true; }
                 if( sizes_[i] == size ) { continue; }
                 sizes_[i] = size;
                 changed = true;
@@ -191,7 +203,11 @@ class publish
             comma::io::select select;
             {
                 transaction_t t( publishers_ );
-                for( unsigned int i = 0; i < t->size(); ++i ) { if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); } }
+                for( unsigned int i = 0; i < t->size(); ++i )
+                {
+                    if( !( *t )[i] ) { continue; }
+                    if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
+                }
             }
             while( !is_shutdown_ )
             {
@@ -199,12 +215,22 @@ class publish
                 transaction_t t( publishers_ );
                 for( unsigned int i = 0; i < t->size(); ++i )
                 {
+                    if( !( *t )[i] ) { continue; }
                     if( select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) ) { ( *t )[i]->accept(); }
                 }
                 handle_sizes_( t );
+                if( has_primary_clients_ )
+                {
+                    // todo: restore secondary acceptors
+                }
+                else
+                {
+                    // todo: reset secondary acceptors
+                }
             }
         }
         
+        std::vector< endpoint > endpoints_;
         publishers_t publishers_;
         std::string buffer_;
         unsigned int packet_size_;
@@ -212,6 +238,7 @@ class publish
         bool report_no_clients_;
         bool got_first_client_ever_;
         std::vector< unsigned int > sizes_;
+        bool has_primary_clients_;
         unsigned int num_clients_;
         boost::scoped_ptr< boost::thread > acceptor_thread_;
         bool is_shutdown_;

From 9bf6424a92545b2aa402b9dff0acd16990d54082 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 9 Dec 2020 23:37:08 +1100
Subject: [PATCH 0299/1056] io-publish: secondary streams: first cut
 implemented; debugging...

---
 io/applications/io-publish.cpp | 54 ++++++++++++++++++++++++----------
 1 file changed, 39 insertions(+), 15 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index fdbf81618..6a3a9125f 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -72,12 +72,19 @@ static void usage( bool verbose = false )
     std::cerr << "               but might take a while to notice that a client has gone." << std::endl;
     std::cerr << "               This affects --output-number-of-clients and --on-demand." << std::endl;
     std::cerr << std::endl;
-    std::cerr << "output streams" << std::endl;
-    std::cerr << "    tcp:<port>: e.g. tcp:1234" << std::endl;
-    std::cerr << "    udp:<port>: e.g. udp:1234 (todo)" << std::endl;
-    std::cerr << "    local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket" << std::endl;
-    std::cerr << "    <named pipe name>: named pipe, which will be re-opened, if client reconnects" << std::endl;
-    std::cerr << "    <filename>: a regular file" << std::endl;
+    std::cerr << "output streams: <address>[;<options>]" << std::endl;
+    std::cerr << "    <address>" << std::endl;
+    std::cerr << "        tcp:<port>: e.g. tcp:1234" << std::endl;
+    std::cerr << "        udp:<port>: e.g. udp:1234 (todo)" << std::endl;
+    std::cerr << "        local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket" << std::endl;
+    std::cerr << "        <named pipe name>: named pipe, which will be re-opened, if client reconnects" << std::endl;
+    std::cerr << "        <filename>: a regular file" << std::endl;
+    std::cerr << "        -: stdout" << std::endl;
+    std::cerr << "    <options>" << std::endl;
+    std::cerr << "        primary (default): clients always can connect to the 'primary' stream" << std::endl;
+    std::cerr << "        secondary: clients can connect to the 'secondary' stream, only if there are existing clients on a primary stream" << std::endl;
+    std::cerr << "                   if a client connects to a 'primary' stream, 'secondary' streams will be opened" << std::endl;
+    std::cerr << "                   if last client on a 'primary' stream disconnects, 'secondary' streams will be closed" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    cat data | io-publish tcp:1234 --size 100" << std::endl;
@@ -99,7 +106,7 @@ class publish
         {
             std::string address;
             bool secondary;
-            endpoint( const std::string& address = "", bool secondary = false ): secondary( secondary ) {}
+            endpoint( const std::string& address = "", bool secondary = false ): address( address ), secondary( secondary ) {}
         };
         
         publish( const std::vector< std::string >& endpoints
@@ -108,7 +115,9 @@ class publish
                , bool flush
                , bool output_number_of_clients
                , bool report_no_clients )
-            : buffer_( packet_size, '\0' )
+            : discard_( discard )
+            , flush_( flush )
+            , buffer_( packet_size, '\0' )
             , packet_size_( packet_size )
             , output_number_of_clients_( output_number_of_clients )
             , report_no_clients_( report_no_clients )
@@ -117,11 +126,15 @@ class publish
             , num_clients_( 0 )
             , is_shutdown_( false )
         {
+            bool has_primary_stream = false;
             for( unsigned int i = 0; i < endpoints.size(); ++i )
             {
                 comma::name_value::map m( endpoints[i], "address", ';', '=' );
-                endpoints_.push_back( endpoint( m.value< std::string >( "address" ), !m.exists( "primary" ) && m.exists( "secondary" ) ) ); // todo? quick and dirty; better usage semantics?
+                bool secondary = !m.exists( "primary" ) && m.exists( "secondary" );
+                endpoints_.push_back( endpoint( m.value< std::string >( "address" ), secondary ) ); // todo? quick and dirty; better usage semantics?
+                if( !secondary ) { has_primary_stream = true; }
             }
+            if( !has_primary_stream ) { std::cerr << "io-publish: please specify at least one primary stream" << std::endl; exit( 1 ); }
             struct sigaction new_action, old_action;
             new_action.sa_handler = SIG_IGN;
             sigemptyset( &new_action.sa_mask );
@@ -131,7 +144,7 @@ class publish
             t->resize( endpoints.size() );
             for( std::size_t i = 0; i < endpoints.size(); ++i )
             {
-                if( !endpoints_[i].secondary ) { ( *t )[i].reset( new comma::io::publisher( endpoints[i], is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
+                if( !endpoints_[i].secondary ) { ( *t )[i].reset( new comma::io::publisher( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
             }
             acceptor_thread_.reset( new boost::thread( boost::bind( &publish::accept_, boost::ref( *this ))));
         }
@@ -141,7 +154,7 @@ class publish
             is_shutdown_ = true;
             acceptor_thread_->join();
             transaction_t t( publishers_ );
-            { for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } } }
+            for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } }
         }
         
         bool read( std::istream& input )
@@ -215,22 +228,33 @@ class publish
                 transaction_t t( publishers_ );
                 for( unsigned int i = 0; i < t->size(); ++i )
                 {
-                    if( !( *t )[i] ) { continue; }
-                    if( select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) ) { ( *t )[i]->accept(); }
+                    if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) ) { ( *t )[i]->accept(); }
                 }
                 handle_sizes_( t );
                 if( has_primary_clients_ )
                 {
-                    // todo: restore secondary acceptors
+                    for( unsigned int i = 0; i < t->size(); ++i )
+                    {
+                        if( !endpoints_[i].secondary || ( *t )[i] ) { continue; }
+                        ( *t )[i].reset( new comma::io::publisher( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard_, flush_ ) );
+                        if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
+                    }
                 }
                 else
                 {
-                    // todo: reset secondary acceptors
+                    for( unsigned int i = 0; i < t->size(); ++i )
+                    {
+                        if( !endpoints_[i].secondary || !( *t )[i] ) { continue; }
+                        select.read().remove( ( *t )[i]->acceptor_file_descriptor() );
+                        ( *t )[i].reset();
+                    }
                 }
             }
         }
         
         std::vector< endpoint > endpoints_;
+        bool discard_;
+        bool flush_;
         publishers_t publishers_;
         std::string buffer_;
         unsigned int packet_size_;

From 39a46261fc0a5502c259b858945a578f7bc6b6dc Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 10 Dec 2020 09:34:24 +1100
Subject: [PATCH 0300/1056] io-publish: secondary streams: --help: example
 added; debugging...

---
 io/applications/io-publish.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 6a3a9125f..c3010b4c9 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -85,6 +85,7 @@ static void usage( bool verbose = false )
     std::cerr << "        secondary: clients can connect to the 'secondary' stream, only if there are existing clients on a primary stream" << std::endl;
     std::cerr << "                   if a client connects to a 'primary' stream, 'secondary' streams will be opened" << std::endl;
     std::cerr << "                   if last client on a 'primary' stream disconnects, 'secondary' streams will be closed" << std::endl;
+    std::cerr << "                   e.g: io-publish tcp:8888 'tcp:9999;secondary'" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    cat data | io-publish tcp:1234 --size 100" << std::endl;

From d8fb1eb5d2b0d14f48f1ea777aac500381bd2976 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 10 Dec 2020 14:52:14 +1100
Subject: [PATCH 0301/1056] csv/test: added csv-to-from-bin

motivated by failure of:
$ echo -64 | csv-to-bin b | csv-from-bin b
on ARM processors. It outputs 192.

The underlying reason is that plain char is unsigned on ARM, so the byte written for -64 is read back as 192.
---
 csv/test/csv-to-from-bin/expected | 4 ++++
 csv/test/csv-to-from-bin/input    | 8 ++++++++
 csv/test/csv-to-from-bin/test     | 7 +++++++
 3 files changed, 19 insertions(+)
 create mode 100644 csv/test/csv-to-from-bin/expected
 create mode 100644 csv/test/csv-to-from-bin/input
 create mode 100755 csv/test/csv-to-from-bin/test

diff --git a/csv/test/csv-to-from-bin/expected b/csv/test/csv-to-from-bin/expected
new file mode 100644
index 000000000..2d2e0e82b
--- /dev/null
+++ b/csv/test/csv-to-from-bin/expected
@@ -0,0 +1,4 @@
+#python
+
+for n in range( number_of( test )):
+    expect test[n]/output == test[n]/input
diff --git a/csv/test/csv-to-from-bin/input b/csv/test/csv-to-from-bin/input
new file mode 100644
index 000000000..be15fceac
--- /dev/null
+++ b/csv/test/csv-to-from-bin/input
@@ -0,0 +1,8 @@
+b 0,64,127,-64,-127
+ub 0,64,127,128,255
+w 0,64,127,-64,-127,-1000,1000
+uw 0,64,127,128,255,1000,3000
+i 0,64,127,-64,-127,-1000,1000,-1000000000,1000000000
+ui 0,64,127,128,255,1000,3000,1000000000,3000000000
+l 0,64,127,-64,-127,-1000,1000,-1000000000,1000000000,-10000000000,10000000000
+ul 0,64,127,128,255,1000,3000,1000000000,3000000000,10000000000,30000000000
diff --git a/csv/test/csv-to-from-bin/test b/csv/test/csv-to-from-bin/test
new file mode 100755
index 000000000..25c74455f
--- /dev/null
+++ b/csv/test/csv-to-from-bin/test
@@ -0,0 +1,7 @@
+#!/bin/bash
+
+while read format data; do
+    for x in $( tr , ' ' <<< $data ); do
+        echo $format,$x,$( echo $x | csv-to-bin $format | csv-from-bin $format )
+    done
+done | name-value-from-csv format,input,output --prefix test --line-number

From fb76e60404ba9f7d4a49ef0b5e08edc97ce2152b Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 10 Dec 2020 14:54:10 +1100
Subject: [PATCH 0302/1056] csv/format.cpp: correctly handle signed byte format
 on ARM

Compilers on ARM processors default to unsigned for char type, unlike x86
which defaults to signed. Handle the difference with an explicit cast.
---
 csv/format.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/format.cpp b/csv/format.cpp
index 048535ed6..956e1ceaf 100644
--- a/csv/format.cpp
+++ b/csv/format.cpp
@@ -302,7 +302,7 @@ static std::size_t bin_to_csv( std::ostringstream& oss, const char* buf, format:
     switch( type ) // todo: tear down bin_to_csv, use format::traits
     {
         case format::int8:
-            oss << static_cast< int >( *buf );
+            oss << static_cast< int >( static_cast< signed char >( *buf ));
             return sizeof( char );
         case format::uint8:
             oss << static_cast< unsigned int >( static_cast< unsigned char >( *buf ) );

From 76cb4923bb36acbe11ede2733ac7ed9b332a7d1e Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 10 Dec 2020 16:06:54 +1100
Subject: [PATCH 0303/1056] csv/test/format_test.cpp: added tests for signed
 and unsigned bytes

---
 csv/test/format_test.cpp | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/csv/test/format_test.cpp b/csv/test/format_test.cpp
index 28ea7f599..e3a08c7da 100644
--- a/csv/test/format_test.cpp
+++ b/csv/test/format_test.cpp
@@ -41,6 +41,14 @@ TEST( csv, format )
         try { comma::csv::format f( "%" ); EXPECT_TRUE( false ); } catch ( ... ) {}
         try { comma::csv::format f( "blah" ); EXPECT_TRUE( false ); } catch ( ... ) {}
     }
+    {
+        comma::csv::format f( "%ub" );
+        EXPECT_EQ( f.bin_to_csv( f.csv_to_bin( "64" ) ), "64" );
+    }
+    {
+        comma::csv::format f( "%b" );
+        EXPECT_EQ( f.bin_to_csv( f.csv_to_bin( "-64" ) ), "-64" );
+    }
     {
         comma::csv::format f( "%uw" );
         EXPECT_EQ( f.bin_to_csv( f.csv_to_bin( "1234" ) ), "1234" );

From c3d7d0f1893150781d88d15fba05ca741a00a2f9 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 10 Dec 2020 21:27:00 +1100
Subject: [PATCH 0304/1056] io-topics: topics_from_config(): refactored;
 publish: secondary/address, secondary/port added

---
 io/applications/io-topics | 31 ++++++++++++++++++++-----------
 1 file changed, 20 insertions(+), 11 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 2ff6ad9e7..a2077e807 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -120,6 +120,8 @@ binary
 command
 on_demand
 port
+secondary/address
+secondary/port
 size
 eof
 }
@@ -132,6 +134,8 @@ binary; if publisher publishes binary data, the binary format of the data, overr
 command; command for the publisher to run
 on_demand; if present, same meaning as io-publish --on-demand
 port; tcp port for publishing, unless address field is present
+secondary/address; if present, passed verbatim to io-publish as '<address>;secondary', in this case secondary/port is ignored
+secondary/port; if present and secondary/address is not, secondary tcp port for publishing, passed to io-publish as 'tcp:<port>;secondary'
 size; if publisher publishes binary data, size of the binary record, if no binary attribute given
 eof
 }
@@ -216,24 +220,26 @@ eof
 
 function publish_command()
 {
-    [[ -n "$topic_command" ]] || die "command not specified for topic '$topic' in files ${configs[@]}"
-    [[ -n "$topic_address" || -n "$topic_port" ]] || die "neither address nor port specified for topic '$topic' in files ${configs[@]}"
+    [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
+    [[ -n "$topic_address" || -n "$topic_port" ]] || die "topic '$topic': neither address nor port specified in files ${configs[@]}"
     [[ -n "$topic_address" ]] || topic_address="tcp:$topic_port"
+    [[ -n "$topic_secondary_address" ]] || { [[ -z "$topic_secondary_port" ]] || topic_secondary_address="tcp:$topic_secondary_port"; }
+    [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
     if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
-    local cmd="io-publish $topic_address $size_option $on_demand -- $topic_command"
+    local cmd="io-publish $topic_address $topic_secondary_address $size_option $on_demand -- $topic_command"
     verbose "$cmd"
     echo "$cmd"
 }
 
 function set_topic_address()
 {
-    [[ -n "$topic_address" || ( -n "$topic_host" && -n "$topic_port" ) ]] || die "neither address nor host/port specified for topic '$topic' in files ${configs[@]}"
+    [[ -n "$topic_address" || ( -n "$topic_host" && -n "$topic_port" ) ]] || die "topic '$topic': neither address nor host/port specified in files ${configs[@]}"
     [[ -n "$topic_address" ]] || topic_address="tcp:$topic_host:$topic_port"
 }
 
 function cat_command()
 {
-    [[ -n "$topic_command" ]] || die "command not specified for topic '$topic' in files ${configs[@]}"
+    [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
     set_topic_address
     if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     if [[ -n "$topic_flush" ]]; then flush_option="--flush"; else unset flush_option; fi # todo! make flush default?!
@@ -270,14 +276,13 @@ function log_command()
         if [[ -n "$topic_connect_attempts" ]]; then connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
         if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
         if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
-        #if [[ -n "$options_verbose" ]]; then say "--> verbose set"; else say "--> verbose not set"; fi
         cmd="io-cat $topic_address $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_index | csv-split -t $period $size_option $suffix_option $flush_option"
     fi
     local path
     [[ -z "$topic_path" ]] || path+="$topic_path/"
     path+="$options_log_dir/$topic"
     [[ -z "$topic_restart" ]] || cmd="io_topics_log_run_forever \"$cmd\""
-    (( "$options_dry_run" )) || mkdir -p $path || die "failed to make directory $path for topic $topic"
+    (( "$options_dry_run" )) || mkdir -p $path || die "topic '$topic': failed to make directory $path"
     cmd="( cd $path && $cmd )"
     echo "bash -c $cmd"
 }
@@ -291,9 +296,13 @@ function cat_config()
 
 function topics_from_config() # quick and dirty
 {
-    if [[ -n "$options_topics_from_all_configs" ]]; then egrep -e "/address=|/port=|/command=" <<< "$config" | cut -d= -f1 | sed -e 's#/address$##' -e 's#/port$##' -e 's#/command$##' | uniq; return; fi
-    grep '=""' <<< "$master_config" | cut -d= -f1
-    for path in $( grep -v '=""' <<< "$master_config" | cut -d= -f1 ); do dirname $path; done | uniq # todo: don't do it just through the dirname? join with operation fields and filter by them instead
+    local expression="/address=|/port=|/command=|/secondary/address=|/secondary/port="
+    function grep_by_topic_config_fields() { egrep -e "$expression" | cut -d= -f1 | sed -e 's#/secondary/address$##' -e 's#/secondary/port$##' -e 's#/address$##' -e 's#/port$##' -e 's#/command$##'; }
+    [[ -z "$options_topics_from_all_configs" ]] || { grep_by_topic_config_fields <<< "$config" | sort --unique; return; }
+    {
+        { grep '=""' <<< "$master_config"; grep -v '=""' <<< "$master_config" | egrep -v -e "$expression" | csv-strings dirname --emplace; } | cut -d= -f1 # quick and dirty, is it even correct?
+        grep_by_topic_config_fields <<< "$master_config"
+    } | sort --unique
 }
 
 function read_configs()
@@ -331,7 +340,7 @@ for topic in ${topics[@]}; do
     if [[ -n "$topic_binary" ]]; then size_option="--size $( csv-size $topic_binary )"
     elif [[ -n "$topic_size" ]]; then size_option="--size $topic_size"
     else unset size_option; fi
-    cmd="$( ${operation}_command $topic )" || die "on topic $topic: making command failed"
+    cmd="$( ${operation}_command $topic )" || die "topic $topic: making command failed"
     commands+=( "$cmd" )
 done
 say "will run 'comma_execute_and_wait --group' with commands:"

From 12bc12f1995307f843fc4602c98dca39605fcbf1 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 10 Dec 2020 21:32:58 +1100
Subject: [PATCH 0305/1056] io-topics: publish: example with secondary port
 added

---
 io/applications/io-topics | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index a2077e807..9b9b07a58 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -69,6 +69,12 @@ examples
             3
             4
             
+        secondary address or port with --dry-run (try it without dry run)
+            > io-topics publish --config <( echo "a/command=csv-paste line-number"; echo "a/port=12345"; echo "b/command=csv-paste line-number"; echo "b/port=12346"; echo "b/secondary/port=8888"; echo "b/on_demand=1" ) --dry-run
+            io-topics: publish: will run 'comma_execute_and_wait --group' with commands:
+            io-topics: publish:     io-publish tcp:12345    -- csv-paste line-number
+            io-topics: publish:     io-publish tcp:12346 tcp:8888;secondary  --on-demand -- csv-paste line-number
+            
     cat
         run publisher
             > io-topics publish --config <( echo "a/command=csv-paste line-number"; echo "a/port=12345"; echo "b/command=csv-paste line-number"; echo "b/port=12346"; echo "b/on_demand=1" )

From 46ec4dcbe7aca19c9b98f10246e64afcf3719f25 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Dec 2020 09:43:51 +1100
Subject: [PATCH 0306/1056] io-topics: adding host field

---
 io/applications/io-topics | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 9b9b07a58..54d513359 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -302,8 +302,8 @@ function cat_config()
 
 function topics_from_config() # quick and dirty
 {
-    local expression="/address=|/port=|/command=|/secondary/address=|/secondary/port="
-    function grep_by_topic_config_fields() { egrep -e "$expression" | cut -d= -f1 | sed -e 's#/secondary/address$##' -e 's#/secondary/port$##' -e 's#/address$##' -e 's#/port$##' -e 's#/command$##'; }
+    local expression="/address=|/host=|/port=|/command=|/secondary/address=|/secondary/host|/secondary/port="
+    function grep_by_topic_config_fields() { egrep -e "$expression" | cut -d= -f1 | sed -e 's#/secondary/address$##' -e 's#/secondary/host$##' -e 's#/secondary/port$##' -e 's#/address$##' -e 's#/host$##' -e 's#/port$##' -e 's#/command$##'; }
     [[ -z "$options_topics_from_all_configs" ]] || { grep_by_topic_config_fields <<< "$config" | sort --unique; return; }
     {
         { grep '=""' <<< "$master_config"; grep -v '=""' <<< "$master_config" | egrep -v -e "$expression" | csv-strings dirname --emplace; } | cut -d= -f1 # quick and dirty, is it even correct?
@@ -324,6 +324,7 @@ function get_topics()
     topics=( ${unnamed[@]:1} )
     if (( ${#topics[@]} == 0 )); then topics=( $( topics_from_config ) ); fi
     (( ${#topics[@]} > 0 )) || die "no topics in config files ${configs[@]}"
+    verbose "topics: ${topics[@]}"
 }
 
 (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )) && usage

From 69a7daa342460321abf26670839e7c0f673394ff Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 29 Dec 2020 11:13:05 +1100
Subject: [PATCH 0307/1056] mistakenly removed copyright notice restored

---
 bash/comma-application-util        | 27 +++++++++++++++++++++++++++
 csv/applications/csv-calc.cpp      | 27 +++++++++++++++++++++++++++
 csv/applications/csv-crc.cpp       |  1 -
 csv/applications/csv-enumerate.cpp | 27 +++++++++++++++++++++++++++
 csv/applications/csv-fields.cpp    | 27 +++++++++++++++++++++++++++
 csv/applications/csv-format.cpp    | 27 +++++++++++++++++++++++++++
 csv/applications/csv-join.cpp      | 27 +++++++++++++++++++++++++++
 csv/applications/csv-paste.cpp     | 27 +++++++++++++++++++++++++++
 csv/applications/csv-play.cpp      | 27 +++++++++++++++++++++++++++
 csv/applications/csv-select.cpp    |  1 -
 csv/applications/csv-shuffle.cpp   | 30 ++++++++++++++++++++++++++++++
 csv/applications/csv-size.cpp      | 27 +++++++++++++++++++++++++++
 csv/applications/csv-sort.cpp      | 27 +++++++++++++++++++++++++++
 csv/applications/csv-strings.cpp   | 23 -----------------------
 csv/applications/csv-time.cpp      | 29 ++++++++++++++++++++++++++++-
 csv/applications/csv-units.cpp     |  3 +--
 io/applications/io-console.cpp     | 27 +++++++++++++++++++++++++++
 io/applications/io-ls.cpp          | 29 +++++++++++++++++++++++++++++
 io/applications/io-publish.cpp     | 27 +++++++++++++++++++++++++++
 io/applications/io-topics          | 30 ++++++++++++++++++++++++++++++
 io/applications/zero-publish       | 29 +++++++++++++++++++++++++++++
 21 files changed, 471 insertions(+), 28 deletions(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 8440c82b1..76db1f92f 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -1,7 +1,34 @@
 #!/bin/bash
 
+# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
 # Copyright (c) 2020 Vsevolod Vlaskine
+# All rights reserved.
+#
+# Redistribution and use in source and binary forms, with or without
+# modification, are permitted provided that the following conditions are met:
+# 1. Redistributions of source code must retain the above copyright
+#    notice, this list of conditions and the following disclaimer.
+# 2. Redistributions in binary form must reproduce the above copyright
+#    notice, this list of conditions and the following disclaimer in the
+#    documentation and/or other materials provided with the distribution.
+# 3. Neither the name of the University of Sydney nor the
+#    names of its contributors may be used to endorse or promote products
+#    derived from this software without specific prior written permission.
+#
+# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 ## @page comma-application-util comma-application-util
 # this script is designed to be included in another script directly, for example:
diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index b8abe0b97..630e6fc10 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -1,5 +1,32 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // Copyright (c) 2020 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
diff --git a/csv/applications/csv-crc.cpp b/csv/applications/csv-crc.cpp
index ff12dc6ba..637bd4775 100644
--- a/csv/applications/csv-crc.cpp
+++ b/csv/applications/csv-crc.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 /// @author james underwood
 
diff --git a/csv/applications/csv-enumerate.cpp b/csv/applications/csv-enumerate.cpp
index 31f6f0226..459c40719 100644
--- a/csv/applications/csv-enumerate.cpp
+++ b/csv/applications/csv-enumerate.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
diff --git a/csv/applications/csv-fields.cpp b/csv/applications/csv-fields.cpp
index d8e46c66a..f2f705901 100644
--- a/csv/applications/csv-fields.cpp
+++ b/csv/applications/csv-fields.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
diff --git a/csv/applications/csv-format.cpp b/csv/applications/csv-format.cpp
index 2f1812d8b..f9cbc8bd4 100644
--- a/csv/applications/csv-format.cpp
+++ b/csv/applications/csv-format.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index 2573a630a..302e5300b 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index e421d87f9..1fbc51677 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 1e3bc6997..ebaa2d151 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author cedric wohlleber
 
diff --git a/csv/applications/csv-select.cpp b/csv/applications/csv-select.cpp
index f72286756..66ef2c3fc 100644
--- a/csv/applications/csv-select.cpp
+++ b/csv/applications/csv-select.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #include <iostream>
diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 274de4a2f..9df07b8ef 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -1,5 +1,35 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // Copyright (c) 2020 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2011 The University of Sydney
+
+/// @author vsevolod vlaskine
 
 #ifdef WIN32
 #include <fcntl.h>
diff --git a/csv/applications/csv-size.cpp b/csv/applications/csv-size.cpp
index 4400b43e3..d37a6cb32 100644
--- a/csv/applications/csv-size.cpp
+++ b/csv/applications/csv-size.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index fce62ba3f..d896aedc3 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @authors matthew imhoff, dewey nguyen, vsevolod vlaskine
 
diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index 8ca0e9b50..78e0e0258 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -1,27 +1,4 @@
 // Copyright (c) 2018 Vsevolod Vlaskine
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
diff --git a/csv/applications/csv-time.cpp b/csv/applications/csv-time.cpp
index 8c585df14..8a73940f8 100644
--- a/csv/applications/csv-time.cpp
+++ b/csv/applications/csv-time.cpp
@@ -1,6 +1,33 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-/// @authors vsevolod vlaskine mathew hounsell
+/// @authors vsevolod vlaskine, mathew hounsell
 
 #include <string.h>
 #include <time.h>
diff --git a/csv/applications/csv-units.cpp b/csv/applications/csv-units.cpp
index de79a13e3..cea524656 100644
--- a/csv/applications/csv-units.cpp
+++ b/csv/applications/csv-units.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 /// @author kai huang
 
@@ -50,7 +49,7 @@
 #include <boost/units/base_units/us/mile.hpp>
 #include <boost/units/base_units/metric/knot.hpp>
 #include <boost/units/base_units/angle/radian.hpp>
-#include <boost/units/base_units/angle/degree.hpp>
+#include <boost/units/base_units/angle/degree.hpp>
 
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
diff --git a/io/applications/io-console.cpp b/io/applications/io-console.cpp
index 4e8206310..fc12de231 100644
--- a/io/applications/io-console.cpp
+++ b/io/applications/io-console.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <termios.h>
 #include <iostream>
diff --git a/io/applications/io-ls.cpp b/io/applications/io-ls.cpp
index 80c5b8308..05ad1fe2a 100644
--- a/io/applications/io-ls.cpp
+++ b/io/applications/io-ls.cpp
@@ -1,3 +1,32 @@
+// This file is part of comma, a generic and flexible library
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
 #include "../../application/command_line_options.h"
 #include "../../application/verbose.h"
 #include "../../csv/stream.h"
diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index c3010b4c9..ab9ec23de 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -1,5 +1,32 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // Copyright (c) 2020 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @authors cedric wohlleber, vsevolod vlaskine, dave jennings
 
diff --git a/io/applications/io-topics b/io/applications/io-topics
index 54d513359..e96f2dea8 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -1,5 +1,35 @@
 #!/bin/bash
 
+# This file is part of comma, a generic and flexible library
+# Copyright (c) 2011 The University of Sydney
+# Copyright (c) 2020 Vsevolod Vlaskine
+# All rights reserved.
+#
+# Redistribution and use in source and binary forms, with or without
+# modification, are permitted provided that the following conditions are met:
+# 1. Redistributions of source code must retain the above copyright
+#    notice, this list of conditions and the following disclaimer.
+# 2. Redistributions in binary form must reproduce the above copyright
+#    notice, this list of conditions and the following disclaimer in the
+#    documentation and/or other materials provided with the distribution.
+# 3. Neither the name of the University of Sydney nor the
+#    names of its contributors may be used to endorse or promote products
+#    derived from this software without specific prior written permission.
+#
+# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
 scriptname=$( basename $0 )
 
 source $( type -p comma-application-util ) || { echo "io-topics: could not source 'comma-application-util'" >&2; exit 1; }
diff --git a/io/applications/zero-publish b/io/applications/zero-publish
index e0c51def5..7fcef8c5c 100644
--- a/io/applications/zero-publish
+++ b/io/applications/zero-publish
@@ -1,5 +1,34 @@
 #!/bin/bash
 
+# This file is part of comma, a generic and flexible library
+# Copyright (c) 2011 The University of Sydney
+# All rights reserved.
+#
+# Redistribution and use in source and binary forms, with or without
+# modification, are permitted provided that the following conditions are met:
+# 1. Redistributions of source code must retain the above copyright
+#    notice, this list of conditions and the following disclaimer.
+# 2. Redistributions in binary form must reproduce the above copyright
+#    notice, this list of conditions and the following disclaimer in the
+#    documentation and/or other materials provided with the distribution.
+# 3. Neither the name of the University of Sydney nor the
+#    names of its contributors may be used to endorse or promote products
+#    derived from this software without specific prior written permission.
+#
+# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
 function usage()
 {
     echo "publish data on tcp in a packet-based manner"

From 8375f720c0afbbecc0ff2ef45ba06cb8befd074d Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 29 Dec 2020 11:17:38 +1100
Subject: [PATCH 0308/1056] trivial compilation error fixed

---
 csv/applications/csv-units.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-units.cpp b/csv/applications/csv-units.cpp
index cea524656..18f3eb8a4 100644
--- a/csv/applications/csv-units.cpp
+++ b/csv/applications/csv-units.cpp
@@ -49,7 +49,7 @@
 #include <boost/units/base_units/us/mile.hpp>
 #include <boost/units/base_units/metric/knot.hpp>
 #include <boost/units/base_units/angle/radian.hpp>
-// Copyright (c) 2011 The University of Sydney#include <boost/units/base_units/angle/degree.hpp>
+#include <boost/units/base_units/angle/degree.hpp>
 
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"

From 8b44965bbbfe7ddf782d9eb8f70a225c7b0b0ce7 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 29 Dec 2020 19:32:06 +1100
Subject: [PATCH 0309/1056] io-topics: a bug fixed: binary option handled
 correctly now

---
 io/applications/io-topics | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index e96f2dea8..1bab20b65 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -336,7 +336,8 @@ function topics_from_config() # quick and dirty
     function grep_by_topic_config_fields() { egrep -e "$expression" | cut -d= -f1 | sed -e 's#/secondary/address$##' -e 's#/secondary/host$##' -e 's#/secondary/port$##' -e 's#/address$##' -e 's#/host$##' -e 's#/port$##' -e 's#/command$##'; }
     [[ -z "$options_topics_from_all_configs" ]] || { grep_by_topic_config_fields <<< "$config" | sort --unique; return; }
     {
-        { grep '=""' <<< "$master_config"; grep -v '=""' <<< "$master_config" | egrep -v -e "$expression" | csv-strings dirname --emplace; } | cut -d= -f1 # quick and dirty, is it even correct?
+        grep '=""' <<< "$master_config" | cut -d= -f1
+        grep -v '=""' <<< "$master_config" | egrep -v -e "$expression" | cut -d= -f1 | csv-strings dirname --emplace # quick and dirty, is it even correct?
         grep_by_topic_config_fields <<< "$master_config"
     } | sort --unique
 }

From 1e273c3fc5427e5c37dafa77fce7567bbab5c2a1 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 29 Dec 2020 20:14:55 +1100
Subject: [PATCH 0310/1056] io-topics: publish: input topic field: basics done;
 more extensive configuration: todo

---
 io/applications/io-topics | 32 ++++++++++++++++++++++----------
 1 file changed, 22 insertions(+), 10 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 1bab20b65..9dbebc7ab 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -148,12 +148,13 @@ function die() { say "$@"; exit 1; }
 
 function list_topic_fields() { :; }
 
-function publish_topic_fields()
+function publish_topic_fields() # todo: flush field? flush is default behaviour in io-publish, which is inconsistent with log and cat operations and thus introducing flush in publish might be confusing
 {
     cat <<eof
 address
 binary
 command
+input
 on_demand
 port
 secondary/address
@@ -168,6 +169,7 @@ function publish_topic_fields_help()
 address; if present, passed verbatim to io-publish, in this case port attribute ignored
 binary; if publisher publishes binary data, the binary format of the data, overrides size
 command; command for the publisher to run
+input; input topic for publish command to read on stdin
 on_demand; if present, same meaning as io-publish --on-demand
 port; tcp port for publishing, unless address field is present
 secondary/address; if present, passed verbatim to io-publish as '<address>;secondary', in this case port attribute ignored
@@ -263,6 +265,7 @@ function publish_command()
     [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
     if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     local cmd="io-publish $topic_address $topic_secondary_address $size_option $on_demand -- $topic_command"
+    [[ -z "$topic_input" ]] || cmd="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --connect-period=1 --connect-attempts=unlimited --flush | $cmd" # todo! quick and dirty, expose connect parameters and flush (?) in config?
     verbose "$cmd"
     echo "$cmd"
 }
@@ -275,14 +278,17 @@ function set_topic_address()
 
 function cat_command()
 {
-    [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
+    local topic=$1
+    local ignore_command=$2
+    (( ignore_command )) || [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
     set_topic_address
     if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     if [[ -n "$topic_flush" ]]; then flush_option="--flush"; else unset flush_option; fi # todo! make flush default?!
     if [[ -n "$topic_connect_attempts" ]]; then connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
     if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
     if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
-    local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_command" # todo? comma_execute_and_wait?
+    local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option" # todo? comma_execute_and_wait?
+    (( ignore_command )) || cmd+=" | $topic_command"
     verbose "$cmd"
     echo "$cmd"
 }
@@ -358,6 +364,18 @@ function get_topics()
     verbose "topics: ${topics[@]}"
 }
 
+function set_topic_variables()
+{
+    local operation="$1"
+    local topic="$2"
+    eval "$( ${operation}_topic_fields | comma_path_mangle | sed 's#^#unset topic_#' )" # todo: quick and dirty, watch performance
+    eval "$( grep $topic <<< "$config" | grep -v "^$topic/command" | sed "s#^$topic/#topic/#" | comma_path_value_mangle )"
+    topic_command="$( grep ^$topic/command <<< "$master_config" | cut -d= -f1 --complement | sed -e 's#^"##' -e 's#"$##'  )" # quick and dirty
+    if [[ -n "$topic_binary" ]]; then size_option="--size $( csv-size $topic_binary )"
+    elif [[ -n "$topic_size" ]]; then size_option="--size $topic_size"
+    else unset size_option; fi
+}
+
 (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )) && usage
 operation=$1
 [[ $( type -t ${operation}_topic_fields ) == "function" ]] || die "expected operation, got '$operation'" # quick and dirty
@@ -371,13 +389,7 @@ get_topics
 if [[ $operation == "list" ]]; then for topic in ${topics[@]}; do echo $topic; done; exit; fi
 commands=()
 for topic in ${topics[@]}; do
-    eval "$( ${operation}_topic_fields | comma_path_mangle | sed 's#^#unset topic_#' )" # todo: quick and dirty, watch performance
-    eval "$( grep $topic <<< "$config" | grep -v "^$topic/command" | sed "s#^$topic/#topic/#" | comma_path_value_mangle )"
-    topic_command="$( grep ^$topic/command <<< "$master_config" | cut -d= -f1 --complement | sed -e 's#^"##' -e 's#"$##'  )"
-    #[[ -n "$topic_command" ]] || die "command not specified for topic '$topic' in files ${configs[@]}"
-    if [[ -n "$topic_binary" ]]; then size_option="--size $( csv-size $topic_binary )"
-    elif [[ -n "$topic_size" ]]; then size_option="--size $topic_size"
-    else unset size_option; fi
+    set_topic_variables "$operation" "$topic"
     cmd="$( ${operation}_command $topic )" || die "topic $topic: making command failed"
     commands+=( "$cmd" )
 done

From 32bb3387d012cbb89aeb302aa52556a9789ce011 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 29 Dec 2020 21:44:25 +1100
Subject: [PATCH 0311/1056] io-topics: publish: input: basics seem working...

---
 io/applications/io-topics | 9 +++++----
 1 file changed, 5 insertions(+), 4 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 9dbebc7ab..fc0bfb8a6 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -264,8 +264,9 @@ function publish_command()
     [[ -n "$topic_secondary_address" ]] || { [[ -z "$topic_secondary_port" ]] || topic_secondary_address="tcp:$topic_secondary_port"; }
     [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
     if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
-    local cmd="io-publish $topic_address $topic_secondary_address $size_option $on_demand -- $topic_command"
-    [[ -z "$topic_input" ]] || cmd="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --connect-period=1 --connect-attempts=unlimited --flush | $cmd" # todo! quick and dirty, expose connect parameters and flush (?) in config?
+    local cmd="io-publish $topic_address $topic_secondary_address $size_option $on_demand -- "
+    if [[ -z "$topic_input" ]]; then local cmd+="$topic_command"
+    else cmd+="bash -c '$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --connect-period=1 --connect-attempts=unlimited --flush --verbose | $topic_command'"; fi # todo! quick and dirty, expose connect parameters and flush (?) in config?
     verbose "$cmd"
     echo "$cmd"
 }
@@ -287,8 +288,8 @@ function cat_command()
     if [[ -n "$topic_connect_attempts" ]]; then connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
     if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
     if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
-    local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option" # todo? comma_execute_and_wait?
-    (( ignore_command )) || cmd+=" | $topic_command"
+    if (( ignore_command )); then local cmd="io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option"
+    else local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_command"; fi # todo? comma_execute_and_wait?
     verbose "$cmd"
     echo "$cmd"
 }

From ac7c0975681876599f3090eacb650016e5eea757 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 30 Dec 2020 12:45:17 +1100
Subject: [PATCH 0312/1056] io-topics: publish: input: goes crazy when input is
 a secondary topic or when the server disconnects; debugging...

---
 io/applications/io-topics | 68 +++++++++++++++++++++------------------
 1 file changed, 37 insertions(+), 31 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index fc0bfb8a6..a067be2cf 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -256,6 +256,34 @@ function log_options()
 eof
 }
 
+function io_topics_restart_topic()
+{
+    local is_shutdown=0
+    trap "local is_shutdown=1" HUP INT TERM
+    while (( ! is_shutdown )) ; do bash -c "$@"; sleep 0.1; done # quick and dirty
+}
+
+export -f io_topics_restart_topic
+
+function set_topic_address()
+{
+    [[ -n "$topic_address" || ( -n "$topic_host" && -n "$topic_port" ) ]] || die "topic '$topic': neither address nor host/port specified in files ${configs[@]}"
+    [[ -n "$topic_address" ]] || topic_address="tcp:$topic_host:$topic_port"
+    [[ -n "$topic_address" ]] || die "topic: '$topic': failed to set topic address"
+}
+
+function set_topic_variables()
+{
+    local operation="$1"
+    local topic="$2"
+    eval "$( ${operation}_topic_fields | comma_path_mangle | sed 's#^#unset topic_#' )" # todo: quick and dirty, watch performance
+    eval "$( grep $topic <<< "$config" | grep -v "^$topic/command" | sed "s#^$topic/#topic/#" | comma_path_value_mangle )"
+    topic_command="$( grep ^$topic/command <<< "$master_config" | cut -d= -f1 --complement | sed -e 's#^"##' -e 's#"$##'  )" # quick and dirty
+    if [[ -n "$topic_binary" ]]; then size_option="--size $( csv-size $topic_binary )"
+    elif [[ -n "$topic_size" ]]; then size_option="--size $topic_size"
+    else unset size_option; fi
+}
+
 function publish_command()
 {
     [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
@@ -265,18 +293,17 @@ function publish_command()
     [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
     if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     local cmd="io-publish $topic_address $topic_secondary_address $size_option $on_demand -- "
-    if [[ -z "$topic_input" ]]; then local cmd+="$topic_command"
-    else cmd+="bash -c '$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --connect-period=1 --connect-attempts=unlimited --flush --verbose | $topic_command'"; fi # todo! quick and dirty, expose connect parameters and flush (?) in config?
+    if [[ -z "$topic_input" ]]; then
+        cmd+="$topic_command"
+    else
+        #cmd+="bash -c '$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --connect-period=1 --connect-attempts=1 --flush --verbose | $topic_command'" || die "topic '$topic': failed to configure input topic '$topic_input'" # todo! quick and dirty, expose connect parameters and flush (?) in config?
+        cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --connect-period=1 --connect-attempts=1 --flush --verbose | $topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"
+        cmd="bash -c io_topics_restart_topic '$cmd'"
+    fi
     verbose "$cmd"
     echo "$cmd"
 }
 
-function set_topic_address()
-{
-    [[ -n "$topic_address" || ( -n "$topic_host" && -n "$topic_port" ) ]] || die "topic '$topic': neither address nor host/port specified in files ${configs[@]}"
-    [[ -n "$topic_address" ]] || topic_address="tcp:$topic_host:$topic_port"
-}
-
 function cat_command()
 {
     local topic=$1
@@ -294,15 +321,6 @@ function cat_command()
     echo "$cmd"
 }
 
-function io_topics_log_run_forever()
-{
-    local is_shutdown=0
-    trap "local is_shutdown=1" HUP INT TERM
-    while (( ! is_shutdown )) ; do bash -c "$@"; sleep 0.1; done # quick and dirty
-}
-
-export -f io_topics_log_run_forever
-
 function log_command()
 {
     [[ -n "$options_log_dir" ]] || die "please specify --log-dir"
@@ -324,7 +342,7 @@ function log_command()
     local path
     [[ -z "$topic_path" ]] || path+="$topic_path/"
     path+="$options_log_dir/$topic"
-    [[ -z "$topic_restart" ]] || cmd="io_topics_log_run_forever \"$cmd\""
+    [[ -z "$topic_restart" ]] || cmd="io_topics_restart_topic \"$cmd\""
     (( "$options_dry_run" )) || mkdir -p $path || die "topic '$topic': failed to make directory $path"
     cmd="( cd $path && $cmd )"
     echo "bash -c $cmd"
@@ -365,18 +383,6 @@ function get_topics()
     verbose "topics: ${topics[@]}"
 }
 
-function set_topic_variables()
-{
-    local operation="$1"
-    local topic="$2"
-    eval "$( ${operation}_topic_fields | comma_path_mangle | sed 's#^#unset topic_#' )" # todo: quick and dirty, watch performance
-    eval "$( grep $topic <<< "$config" | grep -v "^$topic/command" | sed "s#^$topic/#topic/#" | comma_path_value_mangle )"
-    topic_command="$( grep ^$topic/command <<< "$master_config" | cut -d= -f1 --complement | sed -e 's#^"##' -e 's#"$##'  )" # quick and dirty
-    if [[ -n "$topic_binary" ]]; then size_option="--size $( csv-size $topic_binary )"
-    elif [[ -n "$topic_size" ]]; then size_option="--size $topic_size"
-    else unset size_option; fi
-}
-
 (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )) && usage
 operation=$1
 [[ $( type -t ${operation}_topic_fields ) == "function" ]] || die "expected operation, got '$operation'" # quick and dirty
@@ -391,7 +397,7 @@ if [[ $operation == "list" ]]; then for topic in ${topics[@]}; do echo $topic; d
 commands=()
 for topic in ${topics[@]}; do
     set_topic_variables "$operation" "$topic"
-    cmd="$( ${operation}_command $topic )" || die "topic $topic: making command failed"
+    cmd="$( ${operation}_command $topic )" || die "topic '$topic': making command failed"
     commands+=( "$cmd" )
 done
 say "will run 'comma_execute_and_wait --group' with commands:"

From 550c47a8f0ab03d988385d058378a2d14f0fa141 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 30 Dec 2020 19:09:56 +1100
Subject: [PATCH 0313/1056] io-publish: on-demand vs exited command handling
 implemented; io::publisher::disconnect_all() implemented

---
 io/applications/io-publish.cpp | 26 +++++++++++++++--------
 io/impl/publisher.cpp          | 39 +++++++++++++++++++++++++++-------
 io/impl/publisher.h            |  3 ++-
 io/publisher.cpp               |  2 ++
 io/publisher.h                 |  3 +++
 5 files changed, 55 insertions(+), 18 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index ab9ec23de..36b3c8a80 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -142,13 +142,13 @@ class publish
                , bool discard
                , bool flush
                , bool output_number_of_clients
-               , bool report_no_clients )
+               , bool update_no_clients )
             : discard_( discard )
             , flush_( flush )
             , buffer_( packet_size, '\0' )
             , packet_size_( packet_size )
             , output_number_of_clients_( output_number_of_clients )
-            , report_no_clients_( report_no_clients )
+            , update_no_clients_( update_no_clients )
             , got_first_client_ever_( false )
             , sizes_( endpoints.size(), 0 )
             , num_clients_( 0 )
@@ -185,6 +185,13 @@ class publish
             for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } }
         }
         
+        void disconnect_all()
+        {
+            transaction_t t( publishers_ );
+            for( auto& p: *t ) { if( p ) { p->disconnect_all(); } }
+            handle_sizes_( t ); // quick and dirty
+        }
+        
         bool read( std::istream& input )
         {
             if( is_binary_() )
@@ -199,10 +206,10 @@ class publish
                 if( !input.good() ) { return false; }
             }
             transaction_t t( publishers_ );
-            for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
+            for( auto& p: *t ) { if( p ) { p->write( &buffer_[0], buffer_.size(), false ); } } // for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
             return handle_sizes_( t );
         }
-
+        
         unsigned int num_clients() const { return num_clients_; }
 
     private:
@@ -210,7 +217,7 @@ class publish
         
         bool handle_sizes_( transaction_t& t ) // todo? why pass transaction? it doen not seem going out of scope at the point of call; remove?
         {
-            if( !output_number_of_clients_ && !report_no_clients_ ) { return true; }
+            if( !output_number_of_clients_ && !update_no_clients_ ) { return true; }
             unsigned int total = 0;
             bool changed = false;
             has_primary_clients_ = false;
@@ -231,7 +238,7 @@ class publish
                 for( unsigned int i = 0; i < sizes_.size(); ++i ) { std::cout << ',' << sizes_[i]; }
                 std::cout << std::endl;
             }
-            if( report_no_clients_ )
+            if( update_no_clients_ )
             {
                 if( total > 0 ) { got_first_client_ever_ = true; }
                 else if( got_first_client_ever_ ) { std::cerr << "io-publish: the last client exited" << std::endl; return false; }
@@ -252,7 +259,7 @@ class publish
             }
             while( !is_shutdown_ )
             {
-                select.wait( boost::posix_time::millisec( 100 ) ); // arbitrary timeout
+                select.wait( boost::posix_time::millisec( 100 ) ); // todo? make timeout configurable?
                 transaction_t t( publishers_ );
                 for( unsigned int i = 0; i < t->size(); ++i )
                 {
@@ -287,7 +294,7 @@ class publish
         std::string buffer_;
         unsigned int packet_size_;
         bool output_number_of_clients_;
-        bool report_no_clients_;
+        bool update_no_clients_;
         bool got_first_client_ever_;
         std::vector< unsigned int > sizes_;
         bool has_primary_clients_;
@@ -380,13 +387,14 @@ int main( int ac, char** av )
             if( ::pipe( fd ) == -1 ) { comma::last_error::to_exception( "couldn't open pipe" ); } // create a pipe to send the child stdout to the parent stdin
             while( !done && !is_shutdown )
             {
-                if( on_demand && p.num_clients() == 0 ) { ::sleep( 0.1 ); continue; }
+                if( on_demand && p.num_clients() == 0 ) { ::sleep( 0.1 ); continue; } // todo? make timeout configurable?
                 comma::verbose << "number of clients: " << p.num_clients() << std::endl;
                 command cmd( exec_command );
                 typedef boost::iostreams::file_descriptor_source fd_t;
                 boost::iostreams::stream< fd_t > is( fd_t( cmd.fd(), boost::iostreams::never_close_handle ) );
                 while( is.good() && !is_shutdown && p.read( is ) );
                 if( !on_demand ) { break; }
+                p.disconnect_all();
             }
         }
         //ProfilerStop(); }
diff --git a/io/impl/publisher.cpp b/io/impl/publisher.cpp
index 48bec03b6..f155e77b8 100644
--- a/io/impl/publisher.cpp
+++ b/io/impl/publisher.cpp
@@ -1,4 +1,31 @@
+// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author cedric wohlleber
 
@@ -24,13 +51,7 @@ namespace comma { namespace io { namespace impl {
 class file_acceptor : public acceptor
 {
     public:
-        file_acceptor( const std::string& name, io::mode::value mode )
-            : name_( name )
-            , mode_( mode )
-            , closed_( true )
-            , fd_( io::invalid_file_descriptor )
-        {
-        }
+        file_acceptor( const std::string& name, io::mode::value mode ): name_( name ), mode_( mode ), closed_( true ), fd_( io::invalid_file_descriptor ) {}
 
         ~file_acceptor()
         {
@@ -254,9 +275,11 @@ unsigned int publisher::write( const char* buf, std::size_t size, bool do_accept
 void publisher::close()
 {
     if( acceptor_ ) { acceptor_->close(); }
-    while( streams_.begin() != streams_.end() ) { remove_( streams_.begin() ); }
+    disconnect_all();
 }
 
+void publisher::disconnect_all() { while( streams_.begin() != streams_.end() ) { remove_( streams_.begin() ); } }
+
 unsigned int publisher::accept()
 {
     if( !acceptor_ ) { return 0; }
diff --git a/io/impl/publisher.h b/io/impl/publisher.h
index 0e0e37d81..4540ec79d 100644
--- a/io/impl/publisher.h
+++ b/io/impl/publisher.h
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
 #ifndef COMMA_IO_IMPL_PUBLISHER_H_
@@ -83,6 +82,8 @@ class publisher
         }
 
         void close();
+        
+        void disconnect_all();
 
         std::size_t size() const;
 
diff --git a/io/publisher.cpp b/io/publisher.cpp
index 486780099..2bf0d01bd 100644
--- a/io/publisher.cpp
+++ b/io/publisher.cpp
@@ -44,6 +44,8 @@ unsigned int publisher::accept() { return pimpl_->accept(); }
 
 void publisher::close() { pimpl_->close(); }
 
+void publisher::disconnect_all() { pimpl_->disconnect_all(); }
+
 std::size_t publisher::size() const { return pimpl_->size(); }
 
 file_descriptor publisher::acceptor_file_descriptor() const { return pimpl_->acceptor_ ? pimpl_->acceptor().fd() : comma::io::invalid_file_descriptor; }
diff --git a/io/publisher.h b/io/publisher.h
index a40c45aac..564011028 100644
--- a/io/publisher.h
+++ b/io/publisher.h
@@ -75,6 +75,9 @@ class publisher : public boost::noncopyable
 
         /// close
         void close();
+        
+        /// disconnect all existing clients
+        void disconnect_all();
 
         /// return current number of connected clients
         std::size_t size() const;

From b305e10f4286f2180c65d55e9a57afb2fbb929f0 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 30 Dec 2020 21:47:52 +1100
Subject: [PATCH 0314/1056] io-topics: publish: forming command (hopefully)
 fixed

---
 io/applications/io-topics | 9 ++-------
 1 file changed, 2 insertions(+), 7 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index a067be2cf..e839bfe9d 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -293,13 +293,8 @@ function publish_command()
     [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
     if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     local cmd="io-publish $topic_address $topic_secondary_address $size_option $on_demand -- "
-    if [[ -z "$topic_input" ]]; then
-        cmd+="$topic_command"
-    else
-        #cmd+="bash -c '$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --connect-period=1 --connect-attempts=1 --flush --verbose | $topic_command'" || die "topic '$topic': failed to configure input topic '$topic_input'" # todo! quick and dirty, expose connect parameters and flush (?) in config?
-        cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --connect-period=1 --connect-attempts=1 --flush --verbose | $topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"
-        cmd="bash -c io_topics_restart_topic '$cmd'"
-    fi
+    if [[ -z "$topic_input" ]]; then cmd+="$topic_command"
+    else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
     verbose "$cmd"
     echo "$cmd"
 }

From 65f9933248fc85eb05f2f05c92ef8a645387323e Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 31 Dec 2020 10:39:37 +1100
Subject: [PATCH 0315/1056] io-topics: typo in help fixed

---
 io/applications/io-topics | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index e839bfe9d..cade6892e 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -196,7 +196,7 @@ eof
 function cat_topic_fields_help()
 {
     cat <<eof
-address; if present, passed verbatim to io-publish, in this case port attribute ignored
+address; if present, passed verbatim to io-cat, in this case port attribute ignored
 binary; if data is binary, the binary format of the data, overrides size
 command; command for the client to run
 connect_attempts; number of connect attemtps
@@ -231,7 +231,7 @@ eof
 function log_topic_fields_help()
 {
     cat <<eof
-address; if present, passed verbatim to io-publish, in this case port attribute ignored
+address; if present, passed verbatim to io-cat, in this case port attribute ignored
 binary; if data is binary, the binary format of the data, overrides size
 command; optional command for the logger to run instead of default logger
 connect_attempts; number of connect attemtps

From 96879c5c669bb6c716ad17d0faf0ca4c9f36cca9 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 31 Dec 2020 10:42:57 +1100
Subject: [PATCH 0316/1056] io-topics: typo in help fixed

---
 io/applications/io-topics | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index cade6892e..3c6a218d6 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -199,7 +199,7 @@ function cat_topic_fields_help()
 address; if present, passed verbatim to io-cat, in this case port attribute ignored
 binary; if data is binary, the binary format of the data, overrides size
 command; command for the client to run
-connect_attempts; number of connect attemtps
+connect_attempts; number of connect attempts
 connect_period; time in seconds between connect attempts
 flush; flush output on each record, default: buffer output
 host; tcp host for publishing, unless address field is present
@@ -234,7 +234,7 @@ function log_topic_fields_help()
 address; if present, passed verbatim to io-cat, in this case port attribute ignored
 binary; if data is binary, the binary format of the data, overrides size
 command; optional command for the logger to run instead of default logger
-connect_attempts; number of connect attemtps
+connect_attempts; number of connect attempts
 connect_period; time in seconds between connect attempts
 flush; flush output on each record, default: buffer output
 host; tcp host for publishing, unless address field is present

From 41c4ac507816cfa2637dd1332942fc90cfabd2b3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 11 Jan 2021 13:12:57 +1100
Subject: [PATCH 0317/1056] system/package/comma-package-docker-build: usage
 fixed when running with sudo

---
 system/package/Dockerfile                 | 3 ++-
 system/package/comma-package-docker-build | 2 ++
 system/package/readme                     | 4 +++-
 3 files changed, 7 insertions(+), 2 deletions(-)

diff --git a/system/package/Dockerfile b/system/package/Dockerfile
index f9e25ee2c..8139bd50b 100644
--- a/system/package/Dockerfile
+++ b/system/package/Dockerfile
@@ -2,7 +2,8 @@ ARG version
 FROM ubuntu:${version}
 ENV DEBIAN_FRONTEND="noninteractive"
 RUN apt update \
-    && apt install software-properties-common --yes \
+    && apt install --yes apt-utils \
+    && apt install --yes software-properties-common \
     && apt install --yes ansible git build-essential cmake cmake-curses-gui python3-pip
 RUN apt install --yes python3-stdeb
 RUN apt install --yes python3-all
diff --git a/system/package/comma-package-docker-build b/system/package/comma-package-docker-build
index 8c9faa137..a9156fa43 100755
--- a/system/package/comma-package-docker-build
+++ b/system/package/comma-package-docker-build
@@ -3,4 +3,6 @@ version=$1
 comma_dir="$2"
 [[ -n "$version" ]] || { echo "usage: $0 <ubuntu version> [<comma dir>]; e.g. $0 20.04" >&2; exit 1; }
 [[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
+[[ -n "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly" >&2; exit 1; }
+echo "docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f '$comma_dir/system/package/Dockerfile' ." >&2
 docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/package/Dockerfile" .
diff --git a/system/package/readme b/system/package/readme
index 316c27bb4..9c134db4d 100644
--- a/system/package/readme
+++ b/system/package/readme
@@ -1,4 +1,6 @@
-to build docker that has ansible, cmake, etc, run (you may need to run as sudo - am not sure why; try without sudo first):
+to build docker that has ansible, cmake, etc, run
+
+(you may need to run as sudo, unless you set up your docker running without sudo; see e.g: https://www.digitalocean.com/community/tutorials/how-to-install-and-use-docker-on-ubuntu-20-04)
 
 > ./comma-package-docker-build 18.04 # ubuntu 18.04
 > ./comma-package-docker-build 20.04 # ubuntu 20.04

From 772dde58a6fa5a6e04a2b4d59c5d5b2b72ac997c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 11 Jan 2021 13:41:36 +1100
Subject: [PATCH 0318/1056] system/package/comma-package-docker-*: made more
 verbose

---
 system/package/comma-package-docker-build | 3 ++-
 system/package/comma-package-docker-run   | 1 +
 2 files changed, 3 insertions(+), 1 deletion(-)

diff --git a/system/package/comma-package-docker-build b/system/package/comma-package-docker-build
index a9156fa43..124fa69f3 100755
--- a/system/package/comma-package-docker-build
+++ b/system/package/comma-package-docker-build
@@ -3,6 +3,7 @@ version=$1
 comma_dir="$2"
 [[ -n "$version" ]] || { echo "usage: $0 <ubuntu version> [<comma dir>]; e.g. $0 20.04" >&2; exit 1; }
 [[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
-[[ -n "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly" >&2; exit 1; }
+[[ -d "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly (since you seem to either run with sudo or have comma not in '$comma_dir')" >&2; exit 1; }
+echo "$0: running:" >&2
 echo "docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f '$comma_dir/system/package/Dockerfile' ." >&2
 docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/package/Dockerfile" .
diff --git a/system/package/comma-package-docker-run b/system/package/comma-package-docker-run
index 5daab2c5a..bab3b8d23 100755
--- a/system/package/comma-package-docker-run
+++ b/system/package/comma-package-docker-run
@@ -7,6 +7,7 @@ comma_version_patch=$4
 comma_dir="$5"
 [[ -n "$comma_version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
 [[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
+[[ -d "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly (since you seem to either run with sudo or have comma not in '$comma_dir')" >&2; exit 1; }
 
 docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \

From 226cf517d6ee67c2831f006a57cde7815a98300c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 11 Jan 2021 13:46:58 +1100
Subject: [PATCH 0319/1056] system/package: comma-package-docker-test: made
 more verbose; readme: minor typo fixed; todo comments added

---
 system/package/comma-package-docker-test | 2 ++
 system/package/comma-package-make        | 1 +
 system/package/readme                    | 2 +-
 3 files changed, 4 insertions(+), 1 deletion(-)

diff --git a/system/package/comma-package-docker-test b/system/package/comma-package-docker-test
index 3c9eb490e..a2212949b 100755
--- a/system/package/comma-package-docker-test
+++ b/system/package/comma-package-docker-test
@@ -11,6 +11,8 @@ comma_dir="$4"
 [[ -s "$python_package" ]] || die "file not found or empty: '$python_package'"
 [[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
 package_dir=$( dirname "$( realpath "$package" )" )
+[[ -d "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly (since you seem to either run with sudo or have comma not in '$comma_dir')" >&2; exit 1; }
+# todo: optionally run full regression test
 
 docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index 93f1efdc0..c62c3c40c 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -32,6 +32,7 @@ esac
     cd ~/src/comma/python
     echo "$0: setting up python in $( pwd )" >&2
     python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
+    # todo: optionally run full regression test
     echo "$0: done" >&2
 )
 cp ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb output
diff --git a/system/package/readme b/system/package/readme
index 9c134db4d..c9f525a06 100644
--- a/system/package/readme
+++ b/system/package/readme
@@ -17,5 +17,5 @@ debian package will be built in your current directory
 
 test that package is ok, e.g:
 
-> ./comma-package-docker-test 20.04 comma-1.0.0-Linux.deb python3-comma_1.0.0-1_all.deb
+> ./comma-package-docker-test 20.04 comma-1.2.3-Linux.deb python3-comma_1.2.3-1_all.deb
 

From bd7879363bdbcb9b8ffe248eb03d8c394387d703 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Sun, 17 Jan 2021 12:19:22 +1100
Subject: [PATCH 0320/1056] csv-thin: simplify test of --deterministic flag

---
 csv/test/csv-thin/deterministic/expected | 10 +++++-----
 csv/test/csv-thin/deterministic/test     |  3 +--
 2 files changed, 6 insertions(+), 7 deletions(-)

diff --git a/csv/test/csv-thin/deterministic/expected b/csv/test/csv-thin/deterministic/expected
index fb91f8dbe..ae7ab26f6 100644
--- a/csv/test/csv-thin/deterministic/expected
+++ b/csv/test/csv-thin/deterministic/expected
@@ -1,5 +1,5 @@
-output[0]/n="3"
-output[1]/n="7"
-output[2]/n="11"
-output[3]/n="15"
-output[4]/n="19"
+output[0]/n="4"
+output[1]/n="8"
+output[2]/n="12"
+output[3]/n="16"
+output[4]/n="20"
diff --git a/csv/test/csv-thin/deterministic/test b/csv/test/csv-thin/deterministic/test
index 52bf9b4bc..bfe06923f 100755
--- a/csv/test/csv-thin/deterministic/test
+++ b/csv/test/csv-thin/deterministic/test
@@ -1,2 +1 @@
-csv-paste line-number | head -20 | csv-thin 0.25 --deterministic \
-    | name-value-from-csv --fields n --prefix output --line-number
+seq 20 | csv-thin 0.25 --deterministic | name-value-from-csv --fields n --prefix output --line-number

From 903e8e956e8f3ef795c49e7ec34b033cd12512cd Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Sun, 17 Jan 2021 12:23:49 +1100
Subject: [PATCH 0321/1056] csv-thin: move --deterministic test to top-level

it's simple enough that it doesn't need its own folder
---
 csv/test/csv-thin/deterministic/expected | 5 -----
 csv/test/csv-thin/deterministic/test     | 1 -
 csv/test/csv-thin/expected               | 2 ++
 csv/test/csv-thin/input                  | 1 +
 4 files changed, 3 insertions(+), 6 deletions(-)
 delete mode 100644 csv/test/csv-thin/deterministic/expected
 delete mode 100755 csv/test/csv-thin/deterministic/test

diff --git a/csv/test/csv-thin/deterministic/expected b/csv/test/csv-thin/deterministic/expected
deleted file mode 100644
index ae7ab26f6..000000000
--- a/csv/test/csv-thin/deterministic/expected
+++ /dev/null
@@ -1,5 +0,0 @@
-output[0]/n="4"
-output[1]/n="8"
-output[2]/n="12"
-output[3]/n="16"
-output[4]/n="20"
diff --git a/csv/test/csv-thin/deterministic/test b/csv/test/csv-thin/deterministic/test
deleted file mode 100755
index bfe06923f..000000000
--- a/csv/test/csv-thin/deterministic/test
+++ /dev/null
@@ -1 +0,0 @@
-seq 20 | csv-thin 0.25 --deterministic | name-value-from-csv --fields n --prefix output --line-number
diff --git a/csv/test/csv-thin/expected b/csv/test/csv-thin/expected
index 176eff035..01b70a6eb 100644
--- a/csv/test/csv-thin/expected
+++ b/csv/test/csv-thin/expected
@@ -1,3 +1,5 @@
+deterministic[0]/output="4,8,12,16,20,"
+deterministic[0]/status=0
 random/deterministic[0]/output="1,3,5,7,9,"
 random/deterministic[0]/status=0
 random/inverted[0]/output="1,2,3,4,5,6,7,8,9,10,"
diff --git a/csv/test/csv-thin/input b/csv/test/csv-thin/input
index b3d4aa61c..905183713 100644
--- a/csv/test/csv-thin/input
+++ b/csv/test/csv-thin/input
@@ -1,2 +1,3 @@
+deterministic[0]="seq 20 | csv-thin 0.25 --deterministic | tr '\\\n' ','"
 random/deterministic[0]="seq 10 | csv-thin 0.5 --invert --deterministic | tr '\\\n' ','"
 random/inverted[0]="( seq 10 | csv-thin 0.5; seq 10 | csv-thin 0.5 --invert ) | csv-sort --fields i | tr '\\\n' ','"

From 344a395f1b7b3f7a0cf0a9d79b6e9cae9c76240d Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Sun, 17 Jan 2021 13:18:22 +1100
Subject: [PATCH 0322/1056] csv-thin: minor logic fix for --period option

if timestamp is equal to next_time we should output it
---
 csv/applications/csv-thin.cpp            | 2 +-
 csv/test/csv-thin/period/ascii/expected  | 4 ++--
 csv/test/csv-thin/period/binary/expected | 4 ++--
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index d9b892ca7..ed7f6e5c1 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -152,7 +152,7 @@ static bool keep() { return skip() == invert; }
 static bool skip_by_timestamp( boost::posix_time::ptime timestamp )
 {
     static boost::posix_time::ptime next_time = timestamp;
-    if( timestamp <= next_time ) { return true; }
+    if( timestamp < next_time ) { return true; }
     next_time += *period;
     return false;
 }
diff --git a/csv/test/csv-thin/period/ascii/expected b/csv/test/csv-thin/period/ascii/expected
index 768041874..b25ec4ecf 100644
--- a/csv/test/csv-thin/period/ascii/expected
+++ b/csv/test/csv-thin/period/ascii/expected
@@ -1,5 +1,5 @@
-output[0]/t="20180608T175915.180390703"
-output[0]/n="1"
+output[0]/t="20180608T175915.168851696"
+output[0]/n="0"
 output[1]/t="20180608T175915.271129830"
 output[1]/n="9"
 output[2]/t="20180608T175915.375231419"
diff --git a/csv/test/csv-thin/period/binary/expected b/csv/test/csv-thin/period/binary/expected
index 7f1c01d9b..27fa96e35 100644
--- a/csv/test/csv-thin/period/binary/expected
+++ b/csv/test/csv-thin/period/binary/expected
@@ -1,5 +1,5 @@
-output[0]/t="20180608T175915.180390"
-output[0]/n="1"
+output[0]/t="20180608T175915.168851"
+output[0]/n="0"
 output[1]/t="20180608T175915.271129"
 output[1]/n="9"
 output[2]/t="20180608T175915.375231"

From 234ceb98dfd687804dd24a08a28173d4159b9785 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Sun, 17 Jan 2021 12:50:47 +1100
Subject: [PATCH 0323/1056] csv-thin: added tests for irregular input, with
 gaps and jumps

all tests pass with current application except jump-forward,
which currently fails
---
 .../period/irregular/baseline/expected        | 12 ++++
 .../csv-thin/period/irregular/baseline/input  | 60 +++++++++++++++++++
 .../period/irregular/gaps-01/expected         | 12 ++++
 .../csv-thin/period/irregular/gaps-01/input   | 47 +++++++++++++++
 .../period/irregular/gaps-02/expected         | 12 ++++
 .../csv-thin/period/irregular/gaps-02/input   | 48 +++++++++++++++
 .../period/irregular/jump-backward/expected   |  6 ++
 .../period/irregular/jump-backward/input      | 60 +++++++++++++++++++
 .../period/irregular/jump-forward/expected    | 12 ++++
 .../period/irregular/jump-forward/input       | 60 +++++++++++++++++++
 csv/test/csv-thin/period/irregular/test       |  1 +
 11 files changed, 330 insertions(+)
 create mode 100644 csv/test/csv-thin/period/irregular/baseline/expected
 create mode 100644 csv/test/csv-thin/period/irregular/baseline/input
 create mode 100644 csv/test/csv-thin/period/irregular/gaps-01/expected
 create mode 100644 csv/test/csv-thin/period/irregular/gaps-01/input
 create mode 100644 csv/test/csv-thin/period/irregular/gaps-02/expected
 create mode 100644 csv/test/csv-thin/period/irregular/gaps-02/input
 create mode 100644 csv/test/csv-thin/period/irregular/jump-backward/expected
 create mode 100644 csv/test/csv-thin/period/irregular/jump-backward/input
 create mode 100644 csv/test/csv-thin/period/irregular/jump-forward/expected
 create mode 100644 csv/test/csv-thin/period/irregular/jump-forward/input
 create mode 100755 csv/test/csv-thin/period/irregular/test

diff --git a/csv/test/csv-thin/period/irregular/baseline/expected b/csv/test/csv-thin/period/irregular/baseline/expected
new file mode 100644
index 000000000..ddd2da28f
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/baseline/expected
@@ -0,0 +1,12 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.0"
+output[1]/n="10"
+output[2]/t="20210117T120002.0"
+output[2]/n="20"
+output[3]/t="20210117T120003.0"
+output[3]/n="30"
+output[4]/t="20210117T120004.0"
+output[4]/n="40"
+output[5]/t="20210117T120005.0"
+output[5]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/baseline/input b/csv/test/csv-thin/period/irregular/baseline/input
new file mode 100644
index 000000000..c1e23e235
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/baseline/input
@@ -0,0 +1,60 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.3,3
+20210117T120000.4,4
+20210117T120000.5,5
+20210117T120000.6,6
+20210117T120000.7,7
+20210117T120000.8,8
+20210117T120000.9,9
+20210117T120001.0,10
+20210117T120001.1,11
+20210117T120001.2,12
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.5,15
+20210117T120001.6,16
+20210117T120001.7,17
+20210117T120001.8,18
+20210117T120001.9,19
+20210117T120002.0,20
+20210117T120002.1,21
+20210117T120002.2,22
+20210117T120002.3,23
+20210117T120002.4,24
+20210117T120002.5,25
+20210117T120002.6,26
+20210117T120002.7,27
+20210117T120002.8,28
+20210117T120002.9,29
+20210117T120003.0,30
+20210117T120003.1,31
+20210117T120003.2,32
+20210117T120003.3,33
+20210117T120003.4,34
+20210117T120003.5,35
+20210117T120003.6,36
+20210117T120003.7,37
+20210117T120003.8,38
+20210117T120003.9,39
+20210117T120004.0,40
+20210117T120004.1,41
+20210117T120004.2,42
+20210117T120004.3,43
+20210117T120004.4,44
+20210117T120004.5,45
+20210117T120004.6,46
+20210117T120004.7,47
+20210117T120004.8,48
+20210117T120004.9,49
+20210117T120005.0,50
+20210117T120005.1,51
+20210117T120005.2,52
+20210117T120005.3,53
+20210117T120005.4,54
+20210117T120005.5,55
+20210117T120005.6,56
+20210117T120005.7,57
+20210117T120005.8,58
+20210117T120005.9,59
diff --git a/csv/test/csv-thin/period/irregular/gaps-01/expected b/csv/test/csv-thin/period/irregular/gaps-01/expected
new file mode 100644
index 000000000..ddd2da28f
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/gaps-01/expected
@@ -0,0 +1,12 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.0"
+output[1]/n="10"
+output[2]/t="20210117T120002.0"
+output[2]/n="20"
+output[3]/t="20210117T120003.0"
+output[3]/n="30"
+output[4]/t="20210117T120004.0"
+output[4]/n="40"
+output[5]/t="20210117T120005.0"
+output[5]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/gaps-01/input b/csv/test/csv-thin/period/irregular/gaps-01/input
new file mode 100644
index 000000000..28da4540f
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/gaps-01/input
@@ -0,0 +1,47 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.8,8
+20210117T120000.9,9
+20210117T120001.0,10
+20210117T120001.1,11
+20210117T120001.2,12
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.7,17
+20210117T120002.0,20
+20210117T120002.1,21
+20210117T120002.2,22
+20210117T120002.3,23
+20210117T120002.8,28
+20210117T120002.9,29
+20210117T120003.0,30
+20210117T120003.1,31
+20210117T120003.2,32
+20210117T120003.3,33
+20210117T120003.4,34
+20210117T120003.5,35
+20210117T120003.6,36
+20210117T120003.7,37
+20210117T120003.8,38
+20210117T120003.9,39
+20210117T120004.0,40
+20210117T120004.1,41
+20210117T120004.2,42
+20210117T120004.3,43
+20210117T120004.4,44
+20210117T120004.5,45
+20210117T120004.6,46
+20210117T120004.7,47
+20210117T120004.8,48
+20210117T120004.9,49
+20210117T120005.0,50
+20210117T120005.1,51
+20210117T120005.2,52
+20210117T120005.3,53
+20210117T120005.4,54
+20210117T120005.5,55
+20210117T120005.6,56
+20210117T120005.7,57
+20210117T120005.8,58
+20210117T120005.9,59
diff --git a/csv/test/csv-thin/period/irregular/gaps-02/expected b/csv/test/csv-thin/period/irregular/gaps-02/expected
new file mode 100644
index 000000000..1f56535f5
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/gaps-02/expected
@@ -0,0 +1,12 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.3"
+output[1]/n="13"
+output[2]/t="20210117T120002.0"
+output[2]/n="20"
+output[3]/t="20210117T120003.0"
+output[3]/n="30"
+output[4]/t="20210117T120004.4"
+output[4]/n="44"
+output[5]/t="20210117T120005.0"
+output[5]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/gaps-02/input b/csv/test/csv-thin/period/irregular/gaps-02/input
new file mode 100644
index 000000000..b390c96ad
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/gaps-02/input
@@ -0,0 +1,48 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.3,3
+20210117T120000.4,4
+20210117T120000.5,5
+20210117T120000.6,6
+20210117T120000.7,7
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.5,15
+20210117T120001.8,18
+20210117T120001.9,19
+20210117T120002.0,20
+20210117T120002.1,21
+20210117T120002.2,22
+20210117T120002.3,23
+20210117T120002.4,24
+20210117T120002.5,25
+20210117T120002.6,26
+20210117T120002.7,27
+20210117T120002.8,28
+20210117T120002.9,29
+20210117T120003.0,30
+20210117T120003.1,31
+20210117T120003.2,32
+20210117T120003.3,33
+20210117T120003.4,34
+20210117T120003.5,35
+20210117T120003.6,36
+20210117T120003.7,37
+20210117T120003.8,38
+20210117T120004.4,44
+20210117T120004.5,45
+20210117T120004.6,46
+20210117T120004.7,47
+20210117T120004.8,48
+20210117T120004.9,49
+20210117T120005.0,50
+20210117T120005.1,51
+20210117T120005.2,52
+20210117T120005.3,53
+20210117T120005.4,54
+20210117T120005.5,55
+20210117T120005.6,56
+20210117T120005.7,57
+20210117T120005.8,58
+20210117T120005.9,59
diff --git a/csv/test/csv-thin/period/irregular/jump-backward/expected b/csv/test/csv-thin/period/irregular/jump-backward/expected
new file mode 100644
index 000000000..b5667b240
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/jump-backward/expected
@@ -0,0 +1,6 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.0"
+output[1]/n="10"
+output[2]/t="20210117T120002.0"
+output[2]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/jump-backward/input b/csv/test/csv-thin/period/irregular/jump-backward/input
new file mode 100644
index 000000000..e35a4988a
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/jump-backward/input
@@ -0,0 +1,60 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.3,3
+20210117T120000.4,4
+20210117T120000.5,5
+20210117T120000.6,6
+20210117T120000.7,7
+20210117T120000.8,8
+20210117T120000.9,9
+20210117T120001.0,10
+20210117T120001.1,11
+20210117T120001.2,12
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.5,15
+20210117T120001.6,16
+20210117T120001.7,17
+20210117T120001.8,18
+20210117T120001.9,19
+20210117T110059.0,20
+20210117T110059.1,21
+20210117T110059.2,22
+20210117T110059.3,23
+20210117T110059.4,24
+20210117T110059.5,25
+20210117T110059.6,26
+20210117T110059.7,27
+20210117T110059.8,28
+20210117T110059.9,29
+20210117T120000.0,30
+20210117T120000.1,31
+20210117T120000.2,32
+20210117T120000.3,33
+20210117T120000.4,34
+20210117T120000.5,35
+20210117T120000.6,36
+20210117T120000.7,37
+20210117T120000.8,38
+20210117T120000.9,39
+20210117T120001.0,40
+20210117T120001.1,41
+20210117T120001.2,42
+20210117T120001.3,43
+20210117T120001.4,44
+20210117T120001.5,45
+20210117T120001.6,46
+20210117T120001.7,47
+20210117T120001.8,48
+20210117T120001.9,49
+20210117T120002.0,50
+20210117T120002.1,51
+20210117T120002.2,52
+20210117T120002.3,53
+20210117T120002.4,54
+20210117T120002.5,55
+20210117T120002.6,56
+20210117T120002.7,57
+20210117T120002.8,58
+20210117T120002.9,59
diff --git a/csv/test/csv-thin/period/irregular/jump-forward/expected b/csv/test/csv-thin/period/irregular/jump-forward/expected
new file mode 100644
index 000000000..1e319278e
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/jump-forward/expected
@@ -0,0 +1,12 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.0"
+output[1]/n="10"
+output[2]/t="20210117T120102.0"
+output[2]/n="20"
+output[3]/t="20210117T120103.0"
+output[3]/n="30"
+output[4]/t="20210117T120104.0"
+output[4]/n="40"
+output[5]/t="20210117T120105.0"
+output[5]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/jump-forward/input b/csv/test/csv-thin/period/irregular/jump-forward/input
new file mode 100644
index 000000000..f98d8dc66
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/jump-forward/input
@@ -0,0 +1,60 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.3,3
+20210117T120000.4,4
+20210117T120000.5,5
+20210117T120000.6,6
+20210117T120000.7,7
+20210117T120000.8,8
+20210117T120000.9,9
+20210117T120001.0,10
+20210117T120001.1,11
+20210117T120001.2,12
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.5,15
+20210117T120001.6,16
+20210117T120001.7,17
+20210117T120001.8,18
+20210117T120001.9,19
+20210117T120102.0,20
+20210117T120102.1,21
+20210117T120102.2,22
+20210117T120102.3,23
+20210117T120102.4,24
+20210117T120102.5,25
+20210117T120102.6,26
+20210117T120102.7,27
+20210117T120102.8,28
+20210117T120102.9,29
+20210117T120103.0,30
+20210117T120103.1,31
+20210117T120103.2,32
+20210117T120103.3,33
+20210117T120103.4,34
+20210117T120103.5,35
+20210117T120103.6,36
+20210117T120103.7,37
+20210117T120103.8,38
+20210117T120103.9,39
+20210117T120104.0,40
+20210117T120104.1,41
+20210117T120104.2,42
+20210117T120104.3,43
+20210117T120104.4,44
+20210117T120104.5,45
+20210117T120104.6,46
+20210117T120104.7,47
+20210117T120104.8,48
+20210117T120104.9,49
+20210117T120105.0,50
+20210117T120105.1,51
+20210117T120105.2,52
+20210117T120105.3,53
+20210117T120105.4,54
+20210117T120105.5,55
+20210117T120105.6,56
+20210117T120105.7,57
+20210117T120105.8,58
+20210117T120105.9,59
diff --git a/csv/test/csv-thin/period/irregular/test b/csv/test/csv-thin/period/irregular/test
new file mode 100755
index 000000000..5e645c4bc
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/test
@@ -0,0 +1 @@
+csv-thin --period 1 --fields t | name-value-from-csv --fields t,n --prefix output --line-number

From 62f2adf5f6592c6606e00ad314006db456045d8f Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Sun, 17 Jan 2021 13:00:42 +1100
Subject: [PATCH 0324/1056] csv-thin: added test for slow input (slower than
 --period)

---
 csv/test/csv-thin/period/slow/expected | 24 ++++++++++++++++++++++++
 csv/test/csv-thin/period/slow/input    | 12 ++++++++++++
 csv/test/csv-thin/period/slow/test     |  1 +
 3 files changed, 37 insertions(+)
 create mode 100644 csv/test/csv-thin/period/slow/expected
 create mode 100644 csv/test/csv-thin/period/slow/input
 create mode 100755 csv/test/csv-thin/period/slow/test

diff --git a/csv/test/csv-thin/period/slow/expected b/csv/test/csv-thin/period/slow/expected
new file mode 100644
index 000000000..a894b6eaa
--- /dev/null
+++ b/csv/test/csv-thin/period/slow/expected
@@ -0,0 +1,24 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120000.5"
+output[1]/n="5"
+output[2]/t="20210117T120001.0"
+output[2]/n="10"
+output[3]/t="20210117T120001.5"
+output[3]/n="15"
+output[4]/t="20210117T120002.0"
+output[4]/n="20"
+output[5]/t="20210117T120002.5"
+output[5]/n="25"
+output[6]/t="20210117T120003.0"
+output[6]/n="30"
+output[7]/t="20210117T120003.5"
+output[7]/n="35"
+output[8]/t="20210117T120004.0"
+output[8]/n="40"
+output[9]/t="20210117T120004.5"
+output[9]/n="45"
+output[10]/t="20210117T120005.0"
+output[10]/n="50"
+output[11]/t="20210117T120005.5"
+output[11]/n="55"
diff --git a/csv/test/csv-thin/period/slow/input b/csv/test/csv-thin/period/slow/input
new file mode 100644
index 000000000..041668da6
--- /dev/null
+++ b/csv/test/csv-thin/period/slow/input
@@ -0,0 +1,12 @@
+20210117T120000.0,0
+20210117T120000.5,5
+20210117T120001.0,10
+20210117T120001.5,15
+20210117T120002.0,20
+20210117T120002.5,25
+20210117T120003.0,30
+20210117T120003.5,35
+20210117T120004.0,40
+20210117T120004.5,45
+20210117T120005.0,50
+20210117T120005.5,55
diff --git a/csv/test/csv-thin/period/slow/test b/csv/test/csv-thin/period/slow/test
new file mode 100755
index 000000000..86cc14297
--- /dev/null
+++ b/csv/test/csv-thin/period/slow/test
@@ -0,0 +1 @@
+csv-thin --period 0.1 --fields t | name-value-from-csv --fields t,n --prefix output --line-number

From c90235696e920b85004fbd8ab39aaf6630999f3d Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Sun, 17 Jan 2021 13:27:37 +1100
Subject: [PATCH 0325/1056] csv-thin: handle timestamp jumps in --period option

---
 csv/applications/csv-thin.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index ed7f6e5c1..9637d3d64 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -153,7 +153,7 @@ static bool skip_by_timestamp( boost::posix_time::ptime timestamp )
 {
     static boost::posix_time::ptime next_time = timestamp;
     if( timestamp < next_time ) { return true; }
-    next_time += *period;
+    while( next_time <= timestamp ) { next_time += *period; }
     return false;
 }
 

From 541f0ae54b6761b8f8d834edc0a64d05a2a4fc7c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 21 Jan 2021 15:17:25 +1100
Subject: [PATCH 0326/1056] cmake: minor refactoring

---
 CMakeLists.txt | 11 ++++++-----
 1 file changed, 6 insertions(+), 5 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index d9cf51ead..a7eef706e 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -326,6 +326,8 @@ ADD_SUBDIRECTORY( python )
 set( CPACK_PACKAGE_NAME "comma" )
 set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "command line utilities to manipulate various structured and unstructured data from offline or realtime data" )
 set( CPACK_PACKAGE_VENDOR "orthographic" )
+set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma" )
+set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/COPYING" )
 set( CPACK_GENERATOR "PRM" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
@@ -333,7 +335,6 @@ set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1)" )
-set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 
 # this code needs a brush-up
 # If the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
@@ -341,10 +342,10 @@ IF( BUILD_SHARED_LIBS )
     SET(CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig")
 ENDIF( BUILD_SHARED_LIBS )
 IF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
-    SET(CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy")
-    SET(CPACK_RPM_POST_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-post-install.sh" )
-    SET(CPACK_RPM_PRE_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-pre-install.sh" )
-    SET(CPACK_RPM_EXCLUDE_FROM_AUTO_FILELIST_ADDITION "/tmp" ) # Prevents /tmp from permission change when installing RPM package
+    SET( CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy" )
+    SET( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-post-install.sh" )
+    SET( CPACK_RPM_PRE_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-pre-install.sh" )
+    SET( CPACK_RPM_EXCLUDE_FROM_AUTO_FILELIST_ADDITION "/tmp" ) # Prevents /tmp from permission change when installing RPM package
 ELSE( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET(CPACK_RPM_PACKAGE_REQUIRES "boost-thread socat psmisc recode")
 ENDIF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )

From b0e80f8359a6c595cedcbdad5fbdf6a322512ceb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 21 Jan 2021 15:17:39 +1100
Subject: [PATCH 0327/1056] csv-repeat: --pace: binary mode fixed

---
 csv/applications/csv-repeat.cpp | 38 ++++++++++++++++++++++++++++++---
 1 file changed, 35 insertions(+), 3 deletions(-)

diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index a3efd08ca..f2456ff6d 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -155,6 +155,8 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
         bool ignore_eof = options.exists( "--ignore-eof,--ignoreeof,--yes" );
+        options.assert_mutually_exclusive( "--pace", "--ignore-eof,--ignoreeof,--yes" );
+        options.assert_mutually_exclusive( "--timestamped,pace" );
         if( ignore_eof && !options.exists( "--period" ) ) { std::cerr << "csv-repeat: got --ignore-oef, thus please specify --period" << std::endl; return 1; }
         comma::csv::options csv = comma::csv::options( options );
         boost::scoped_ptr< comma::csv::output_stream< output_t > > ostream;
@@ -271,6 +273,39 @@ int main( int ac, char** av )
             repeat( to );
             return 0;
         }
+        if( options.exists( "--pace" ) )
+        {
+            if( !period ) { std::cerr << "csv-repeat: for --pace, please specify --period" << std::endl; return 1; }
+            std::size_t record_size = csv.binary() ? csv.format().size() : 0;
+            if( record_size == 0 )
+            {
+                while( std::cin.good() && !std::cin.eof() )
+                {
+                    std::string line;
+                    std::getline( std::cin, line );
+                    if( line.empty() ) { break; }
+                    std::cout << line;
+                    if( ostream ) { std::cout << csv.delimiter; ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), false ) ); }
+                    else { std::cout << std::endl; }
+                    boost::this_thread::sleep( *period );
+                }
+            }
+            else
+            {
+                std::vector< char > buf( record_size );
+                while( std::cin.good() && !std::cin.eof() ) // todo? quick and dirty; improve reading performance
+                {
+                    std::cin.read( &buf[0], record_size );
+                    if( std::cin.gcount() <= 0 ) { break; }
+                    if( std::cin.gcount() < int( record_size ) ) { std::cerr << "csv-repeat: expected " << record_size << " byte(s); got only: " << std::cin.gcount() << std::endl; return 1; }
+                    std::cout.write( &buf[0], record_size );
+                    std::cout.flush();
+                    if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), false ) ); }
+                    boost::this_thread::sleep( *period );
+                }
+            }
+            return 0;
+        }
         std::size_t record_size = csv.binary() ? csv.format().size() : 0;
         std::vector< char > buffer( csv.binary() ? ( 65536ul / record_size + 1 ) * record_size : 0 );
         char* buffer_begin = &buffer[0];
@@ -286,8 +321,6 @@ int main( int ac, char** av )
         std::string last_line;
         std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
         bool repeating = false;
-        bool pace = options.exists( "--pace" );
-        if( pace && !period ) { std::cerr << "csv-repeat: for --pace, please specify --period" << std::endl; return 1; }
         while( is->good() && !end_of_stream )
         {
             select.wait( repeating ? *period : timeout );
@@ -329,7 +362,6 @@ int main( int ac, char** av )
                     else { std::cout << std::endl; }
                 }
                 end_of_stream = repeating = false;
-                if( pace ) { boost::this_thread::sleep( *period ); } // todo: quick and dirty; fix it properly for --pace, to make sure sleep happens after each record only once
             }
             if( !is->good() || end_of_stream ) { break; }
             if( repeating )

From 88defa7c7041ae637020ae48af0a9f462664267a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 21 Jan 2021 15:19:04 +1100
Subject: [PATCH 0328/1056] csv-repeat: --pace: typo fixed: flush() called at
 the right place

---
 csv/applications/csv-repeat.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index f2456ff6d..910d112da 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -299,8 +299,8 @@ int main( int ac, char** av )
                     if( std::cin.gcount() <= 0 ) { break; }
                     if( std::cin.gcount() < int( record_size ) ) { std::cerr << "csv-repeat: expected " << record_size << " byte(s); got only: " << std::cin.gcount() << std::endl; return 1; }
                     std::cout.write( &buf[0], record_size );
-                    std::cout.flush();
                     if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), false ) ); }
+                    std::cout.flush();
                     boost::this_thread::sleep( *period );
                 }
             }

From 124643cdaaac1ea593e54e62dfaf1cd7d6697bb2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 29 Jan 2021 22:11:44 +1100
Subject: [PATCH 0329/1056] csv-eval: error message improved

---
 python/comma/csv/applications/csv_eval.py | 23 ++++++++++++++++++-----
 1 file changed, 18 insertions(+), 5 deletions(-)

diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 1d406afd9..0ca4f909e 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -475,6 +475,15 @@ def check_output_fields(fields, input_fields):
     invalid_output_fields = set(fields).intersection(input_fields)
     if invalid_output_fields: raise csv_eval_error( "output field(s) '{}' should not contain input fields '{}'".format(','.join(invalid_output_fields), ','.join(input_fields)) )
 
+def _numbered( s, line ):
+    t = s.split( '\n' )
+    return '\n'.join( [ '          {} {}\t{}'.format( '*' if i + 1 == line else ' ', i + 1, t[i] ) for i in range( len( t ) ) ] )
+
+def _code_error( what, c, e ):
+    t = e.__traceback__
+    while t is not None: line = t.tb_lineno; t = t.tb_next # todo: quick and dirty, is there a better way?
+    print( "csv-eval: {}: line {}: {}: {}\n{}".format( what, line, type( e ).__name__, str( e ), _numbered( c, line ) ), file = sys.stderr )
+
 def evaluate(stream):
     def disperse( var, fields, do_copy = False ):
         if do_copy: return '\n'.join( "{f} = copy( {v}['{f}'] )".format( v = var, f = f ) for f in fields )
@@ -519,8 +528,10 @@ def collect( var, fields ): return '\n'.join("{v}['{f}'] = {f}".format( v = var,
                 if stream.args.init_fields: init = stream.args.init_t(size)
                 if stream.args.update_fields: update = stream.update_t(size)
                 if stream.args.output_fields: output = stream.output_t(size)
-                exec( init_code, env, { '_init': init, '_input': input, '_update': update, '_output': output } )
-            exec( code, env, { '_init': init, '_input': input, '_update': update, '_output': output } )
+                try: exec( init_code, env, { '_init': init, '_input': input, '_update': update, '_output': output } )
+                except Exception as e: _code_error( "init expressions", init_code_string, e ); raise
+            try: exec( code, env, { '_init': init, '_input': input, '_update': update, '_output': output } )
+            except Exception as e: _code_error( "expressions", code_string, e ); raise
             if stream.args.update_fields: update_buffer(stream.input, update)
             if stream.args.output_fields: stream.output.write(output)
             else: stream.input.dump()
@@ -536,8 +547,9 @@ def select(stream):
     is_shutdown = comma.signal.is_shutdown()
     if stream.args.first_line: input = stream.input.read_from_line(stream.args.first_line)
     while not is_shutdown:
-        if input is not None: 
-            mask = eval(code, env, {f: input[f] for f in fields})
+        if input is not None:
+            try: mask = eval(code, env, {f: input[f] for f in fields})
+            except Exception as e: _code_error( "select expression", stream.args.select, e ); raise
             stream.input.dump(mask=mask)
         input = stream.input.read()
         if input is None: break
@@ -552,7 +564,8 @@ def exit_if(stream):
     if stream.args.first_line: input = stream.input.read_from_line(stream.args.first_line)
     while not is_shutdown:
         if input is not None:
-            mask = eval(code, env, {f: input[f] for f in fields})
+            try: mask = eval( code, env, { f: input[f] for f in fields } )
+            except Exception as e: _code_error( "exit-if expression", stream.args.select, e ); raise
             if mask:
                 if not stream.args.with_error: sys.exit()
                 name = os.path.basename(sys.argv[0])

From a4c234232c873f9c273619d7f98e07fd77318a6c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 30 Jan 2021 19:36:00 +1100
Subject: [PATCH 0330/1056] name-value-convert, name-value-get:
 --quote-numbers: added logic for json; basic regression test added

---
 .../applications/name-value-convert.cpp       | 57 +++++--------
 name_value/applications/name-value-get.cpp    | 68 ++++++----------
 name_value/impl/json_writer.h                 | 81 ++++++-------------
 name_value/test/name-value-convert/expected   |  4 +
 name_value/test/name-value-convert/input      |  4 +
 name_value/test/test                          |  6 ++
 6 files changed, 82 insertions(+), 138 deletions(-)
 create mode 100644 name_value/test/name-value-convert/expected
 create mode 100644 name_value/test/name-value-convert/input
 create mode 100755 name_value/test/test

diff --git a/name_value/applications/name-value-convert.cpp b/name_value/applications/name-value-convert.cpp
index 1aab4213f..b228f76d8 100644
--- a/name_value/applications/name-value-convert.cpp
+++ b/name_value/applications/name-value-convert.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #include <iostream>
@@ -63,21 +62,24 @@ static void usage( bool verbose = false )
     std::cerr << "    xml: xml data" << std::endl;
     std::cerr << "    path-value: path=value-style data; e.g. x/a=1,x/b=2,y=3" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "name/path-value options:" << std::endl;
+    std::cerr << "name/path-value options" << std::endl;
     std::cerr << "    --equal-sign,-e=<equal sign>: default '='" << std::endl;
     std::cerr << "    --delimiter,-d=<delimiter>: default ','" << std::endl;
     std::cerr << "    --no-brackets: show indices as path elements e.g. y/0/x/z/1=\"a\"" << std::endl;
-    std::cerr << "          by default array items will be shown with index e.g. y[0]/x/z[1]=\"a\"" << std::endl;
+    std::cerr << "                   by default array items will be shown with index e.g. y[0]/x/z[1]=\"a\"" << std::endl;
+    std::cerr << "    --unquote-numbers,--unquote: unquote the numbers and booleans" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "path-value options:" << std::endl;
+    std::cerr << "path-value output options" << std::endl;
     std::cerr << "    --take-last: if paths are repeated, take last path=value" << std::endl;
     std::cerr << "    --verify-unique,--unique-input: ensure that all input paths are unique (takes precedence over --take-last)" << std::endl;
-    std::cerr << "    --unquote-numbers,--unquote: unquote the numbers and booleans" << std::endl;
     std::cerr << std::endl;
     std::cerr <<      "warning: if paths are repeated, output value selected from these inputs in not deterministic" << std::endl;
     std::cerr << std::endl;
     std::cerr << "json options" << std::endl;
     std::cerr << "    --minify: if present, output minified json" << std::endl;
+    std::cerr << "    --quote-numbers,--quote: force quoting the numbers and booleans" << std::endl;
+    std::cerr << "                             unfortunately, historically path-value and xml quote numbers by default and json unquotes numbers by default" << std::endl;
+    std::cerr << "                             this default behaviour is left unchaged to keep backward compatibility" << std::endl;
     std::cerr << std::endl;
     std::cerr << "xml options" << std::endl;
     std::cerr << "    --indented: if present, output indented xml" << std::endl;
@@ -87,17 +89,16 @@ static void usage( bool verbose = false )
     std::cerr << "    --linewise,-l: if present, treat each input line as a record" << std::endl;
     std::cerr << "                   if absent, treat all of the input as one record" << std::endl;
     std::cerr << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 static comma::property_tree::xml_writer_settings_t xml_writer_settings;
-
 static char equal_sign;
 static char path_value_delimiter;
 static bool linewise;
 static bool minify_json;
 static bool unquote_numbers;
+static bool quote_numbers;
 typedef comma::property_tree::path_mode path_mode;
 static path_mode indices_mode = comma::property_tree::disabled;
 static bool use_index = true;
@@ -127,19 +128,13 @@ template <> struct traits< info >
 template <> struct traits< json >
 {
     static void input( std::istream& is, boost::property_tree::ptree& ptree ) { boost::property_tree::read_json( is, ptree ); }
-    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode ) { comma::name_value::impl::write_json( os, ptree, !minify_json ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode ) { comma::name_value::impl::write_json( os, ptree, !minify_json, !quote_numbers ); }
 };
 
 template <> struct traits< xml >
 {
-    static void input( std::istream& is, boost::property_tree::ptree& ptree ) 
-    { 
-        comma::property_tree::read_xml( is, ptree ); 
-    }
-    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode )
-    {
-        comma::property_tree::write_xml( os, ptree, xml_writer_settings);
-    }
+    static void input( std::istream& is, boost::property_tree::ptree& ptree ) { comma::property_tree::read_xml( is, ptree ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode ) { comma::property_tree::write_xml( os, ptree, xml_writer_settings ); }
 };
 
 template <> struct traits< path_value > // quick and dirty
@@ -171,7 +166,9 @@ int main( int ac, char** av )
         equal_sign = options.value( "--equal-sign,-e", '=' );
         linewise = options.exists( "--linewise,-l" );
         minify_json = options.exists( "--minify" );
+        options.assert_mutually_exclusive( "--unquote-numbers,--unquote", "--quote-numbers,--quote" );
         unquote_numbers = options.exists( "--unquote-numbers,--unquote" );
+        quote_numbers = options.exists( "--quote-numbers,--quote" ) && !unquote_numbers; // todo: quick and dirty, combine logic, it sucks now that there is different logic for json and everything else
         if ( options.exists( "--take-last" ) ) check_type = comma::property_tree::path_value::take_last;
         if ( options.exists( "--verify-unique,--unique-input" ) ) check_type = comma::property_tree::path_value::unique_input;
         xml_writer_settings.indent_count = options.value( "--indent", options.exists( "--indented" ) ? 4 : 0 );
@@ -240,26 +237,10 @@ int main( int ac, char** av )
         }
         return 0;
     }
-    catch( boost::property_tree::ptree_bad_data& ex )
-    {
-        std::cerr << "name-value-convert: bad data: " << ex.what() << std::endl;
-    }
-    catch( boost::property_tree::ptree_bad_path& ex )
-    {
-        std::cerr << "name-value-convert: bad path: " << ex.what() << std::endl;
-    }
-    catch( boost::property_tree::ptree_error& ex )
-    {
-        boost::regex e( "<unspecified file>" );
-        std::cerr << "name-value-convert: parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl;
-    }
-    catch( std::exception& ex )
-    {
-        std::cerr << "name-value-convert: " << ex.what() << std::endl;
-    }
-    catch( ... )
-    {
-        std::cerr << "name-value-convert: unknown exception" << std::endl;
-    }
+    catch( boost::property_tree::ptree_bad_data& ex ) { std::cerr << "name-value-convert: bad data: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_bad_path& ex ) { std::cerr << "name-value-convert: bad path: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_error& ex ) { boost::regex e( "<unspecified file>" ); std::cerr << "name-value-convert: parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "name-value-convert: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "name-value-convert: unknown exception" << std::endl; }
     return 1;
 }
diff --git a/name_value/applications/name-value-get.cpp b/name_value/applications/name-value-get.cpp
index e4570b68f..060a1300a 100644
--- a/name_value/applications/name-value-get.cpp
+++ b/name_value/applications/name-value-get.cpp
@@ -71,18 +71,22 @@ static void usage( bool verbose = false )
     std::cerr << "    xml: xml data" << std::endl;
     std::cerr << "    path-value: path=value-style data; e.g. x/a=1,x/b=2,y=3" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "name/path-value options:" << std::endl;
+    std::cerr << "name/path-value options" << std::endl;
     std::cerr << "    --equal-sign,-e=<equal sign>: default '='" << std::endl;
     std::cerr << "    --delimiter,-d=<delimiter>: default ','" << std::endl;
-    std::cerr << "    --output-path: if path-value, output path (for regex)" << std::endl;
+    std::cerr << "    --minify: if present, output minified json" << std::endl;
     std::cerr << "    --no-brackets: show indices as path elements e.g. y/0/x/z/1=\"a\"" << std::endl;
-    std::cerr << "          by default array items will be shown with index e.g. y[0]/x/z[1]=\"a\"" << std::endl;
+    std::cerr << "                   by default array items will be shown with index e.g. y[0]/x/z[1]=\"a\"" << std::endl;
+    std::cerr << "    --output-path: if path-value, output path (for regex)" << std::endl;
+    std::cerr << "    --quote-numbers,--quote: force quoting the numbers and booleans" << std::endl;
+    std::cerr << "                             unfortunately, historically path-value and xml quote numbers by default and json unquotes numbers by default" << std::endl;
+    std::cerr << "                             this default behaviour is left unchaged to keep backward compatibility" << std::endl;
+    std::cerr << "    --unquote-numbers,--unquote: unquote the numbers and booleans" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "path-value options:" << std::endl;
+    std::cerr << "path-value output options" << std::endl;
     std::cerr << "    --take-last: if paths are repeated, take last path=value" << std::endl;
     std::cerr << "    --verify-unique,--unique-input: ensure that all input paths are unique (takes precedence over --take-last)" << std::endl;
-    std::cerr << "    --unquote-numbers,--unquote: unquote the numbers and booleans" << std::endl;
-    std::cerr << "warning: if paths are repeated, output value selected from these inputs in not deterministic" << std::endl;
+    std::cerr << "    warning: if paths are repeated, output value selected from these inputs in not deterministic" << std::endl;
     std::cerr << std::endl;
     std::cerr << "data flow options:" << std::endl;
     std::cerr << "    --linewise,-l: if present, treat each input line as a record" << std::endl;
@@ -95,9 +99,11 @@ static void usage( bool verbose = false )
 static char equal_sign;
 static char path_value_delimiter;
 static bool linewise;
+static bool minify;
 static bool option_regex;
 static bool output_path;
 static bool unquote_numbers;
+static bool quote_numbers;
 typedef comma::property_tree::path_mode path_mode;
 static path_mode indices_mode = comma::property_tree::disabled;
 static comma::property_tree::path_value::check_repeated_paths check_type( comma::property_tree::path_value::no_check );
@@ -126,7 +132,7 @@ template <> struct traits< info >
 template <> struct traits< json >
 {
     static void input( std::istream& is, boost::property_tree::ptree& ptree ) { boost::property_tree::read_json( is, ptree ); }
-    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const std::string& ) { comma::name_value::impl::write_json( os, ptree ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const std::string& ) { comma::name_value::impl::write_json( os, ptree, minify, !quote_numbers ); }
 };
 
 template <> struct traits< xml >
@@ -233,7 +239,7 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        path_strings = options.unnamed( "--linewise,-l,--output-path,--use-buffer,--regex", "--from,--to,--equal-sign,-e,--delimiter,-d" );
+        path_strings = options.unnamed( "--linewise,-l,--minify,--output-path,--use-buffer,--regex,--quote-numbers,--quote,--unquote-numbers,--unquote", "-.*" );
         if( path_strings.empty() ) { std::cerr << std::endl << "name-value-get: xpath missing" << std::endl; usage(); }
         path_regex.resize( path_strings.size() );
         paths.resize( path_strings.size() );
@@ -241,21 +247,17 @@ int main( int ac, char** av )
         option_regex = options.exists( "--regex" );
         for( std::size_t i = 0; i < path_strings.size(); ++i )
         {
-            if ( is_regex_(path_strings[i]) )
-            {
-                path_regex[i] = boost::regex( path_strings[i], boost::regex::extended );
-                has_regex = true;
-            }
-            else
-            { 
-                paths[i] = boost::property_tree::ptree::path_type( path_strings[i], '/' ); 
-            }
+            if( is_regex_( path_strings[i] ) ) { path_regex[i] = boost::regex( path_strings[i], boost::regex::extended ); has_regex = true; }
+            else {  paths[i] = boost::property_tree::ptree::path_type( path_strings[i], '/' ); }
         }
         boost::optional< std::string > from = options.optional< std::string >( "--from" );
         std::string to = options.value< std::string >( "--to", "path-value" );
         equal_sign = options.value( "--equal-sign,-e", '=' );
         linewise = options.exists( "--linewise,-l" );
+        minify = options.exists( "--minify" );
+        options.assert_mutually_exclusive( "--unquote-numbers,--unquote", "--quote-numbers,--quote" );
         unquote_numbers = options.exists( "--unquote-numbers,--unquote" );
+        quote_numbers = options.exists( "--quote-numbers,--quote" ) && !unquote_numbers; // todo: quick and dirty, combine logic, it sucks now that there is different logic for json and everything else
         if ( options.exists( "--take-last" ) ) check_type = comma::property_tree::path_value::take_last;
         if ( options.exists( "--verify-unique,--unique-input" ) ) check_type = comma::property_tree::path_value::unique_input;
         boost::optional< char > delimiter = options.optional< char >( "--delimiter,-d" );
@@ -308,7 +310,6 @@ int main( int ac, char** av )
                         case '"' : quoted = !quoted; break;
                         case '\n': if( !quoted ) { s[i] = ' '; } break;
                     }
-
                 }
                 std::cout << s << std::endl;
             }
@@ -319,29 +320,12 @@ int main( int ac, char** av )
             input( std::cin, ptree );
             if( has_regex ) { match_regex_( std::cout, ptree ); } else { match_( std::cout, ptree ); }
         }
+        return 0;
     }
-    catch( boost::property_tree::ptree_bad_data& ex )
-    {
-        std::cerr << "name-value-convert: bad data: " << ex.what() << std::endl;
-    }
-    catch( boost::property_tree::ptree_bad_path& ex )
-    {
-        std::cerr << "name-value-convert: bad path: " << ex.what() << std::endl;
-    }
-    catch( boost::property_tree::ptree_error& ex )
-    {
-        boost::regex e( "<unspecified file>" );
-        std::cerr << "name-value-convert: parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl;
-    }
-    catch( std::exception& ex )
-    {
-        std::cerr << std::endl << "name-value-get: " << ex.what() << std::endl << std::endl;
-        return 1;
-    }
-    catch( ... )
-    {
-        std::cerr << std::endl << "name-value-get: unknown exception" << std::endl << std::endl;
-        return 1;
-    }
-    return 0;
+    catch( boost::property_tree::ptree_bad_data& ex ) { std::cerr << "name-value-convert: bad data: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_bad_path& ex ) { std::cerr << "name-value-convert: bad path: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_error& ex ) { boost::regex e( "<unspecified file>" ); std::cerr << "name-value-convert: parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl; }
+    catch( std::exception& ex ) { std::cerr << std::endl << "name-value-get: " << ex.what() << std::endl << std::endl; }
+    catch( ... ) { std::cerr << std::endl << "name-value-get: unknown exception" << std::endl << std::endl; }
+    return 1;
 }
diff --git a/name_value/impl/json_writer.h b/name_value/impl/json_writer.h
index d6d0833bf..238572a39 100644
--- a/name_value/impl/json_writer.h
+++ b/name_value/impl/json_writer.h
@@ -11,15 +11,17 @@
 #include <string>
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/lexical_cast.hpp>
+#include <boost/regex.hpp>
 #include "../../base/exception.h"
 
 namespace comma { namespace name_value { namespace impl {
 
-template< typename C > void json_remove_quotes( std::basic_string< C >& json_text ) // assuming valid json
+template< typename C > inline void json_remove_quotes( std::basic_string< C >& json_text ) // assuming valid json
 {
     using string_type = std::basic_string< C >;
-    string_type const true_str( std::initializer_list< C >{ 't', 'r', 'u', 'e' } );
-    string_type const false_str( std::initializer_list< C >{ 'f', 'a', 'l', 's', 'e' } );
+    static string_type const true_str( std::initializer_list< C >{ 't', 'r', 'u', 'e' } );
+    static string_type const false_str( std::initializer_list< C >{ 'f', 'a', 'l', 's', 'e' } );
+    static boost::regex number_like_string( "^0[0-9][0-9]*$" );
     auto source = json_text.begin();
     auto target = json_text.cbegin();
     while( target != json_text.cend() )
@@ -40,8 +42,21 @@ template< typename C > void json_remove_quotes( std::basic_string< C >& json_tex
         if( ':' != *next_token )
         {
             auto const value = std::string( value_begin + 1, value_end );
-            if( true_str == value || false_str == value ) { quoted = false; }
-            else { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} }
+            if( true_str == value || false_str == value )
+            {
+                quoted = false;
+            }
+            else if( !boost::regex_match( value, number_like_string ) ) // to avoid unquoting strings like "01234"
+            {
+                try // todo? try to avoid lexical_cast+exception to improve performace?
+                {
+                    boost::lexical_cast< double >( value );
+                    quoted = false;
+                }
+                catch ( ... )
+                {
+                }
+            } 
         }
         if( !quoted ) { value_begin++; }
         while( value_begin != value_end ) { *source++ = *value_begin++; }
@@ -53,62 +68,12 @@ template< typename C > void json_remove_quotes( std::basic_string< C >& json_tex
     json_text.erase( source, json_text.cend() );
 }
 
-inline void remove_quotes( std::string& s )
-{
-    unsigned int size = 0;
-    char* end = &s[0] + s.length();
-    char* target = &s[0];
-    std::string value;
-    struct looking_for { enum what { first_quote, second_quote, escaped, colon }; };
-    looking_for::what state = looking_for::first_quote;
-    for( char* source = &s[0]; source != end; ++source )
-    {
-        switch( state )
-        {
-            case looking_for::first_quote:
-                if( *source == '"' ) { state = looking_for::second_quote; } else { *target++ = *source; ++size; }
-                break;
-            case looking_for::second_quote:
-                if( *source == '"' ) { state = looking_for::colon; }
-                else { value += *source; if( *source == '\\' ) { state = looking_for::escaped; } }
-                break;
-            case looking_for::escaped:
-                value += *source;
-                state = looking_for::second_quote;
-                break;
-            case looking_for::colon:
-            {
-                bool quoted = true;
-                bool skip = false;
-                switch( *source )
-                {
-                    case ' ': case '\t': case '\n': skip=true; break;
-                    case ':': break;
-                    default: try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} // hyper quick and dirty for now
-                }
-                if( skip ) { break; }
-                if( quoted ) { *target++ = '"'; ++size; }
-                ::memcpy( target, &value[0], value.size() );
-                target += value.size();
-                size += value.size();
-                if( quoted ) { *target++ = '"'; ++size; }
-                *target++ = *source;
-                ++size;
-                value.clear();
-                state = looking_for::first_quote;
-                break;
-            }
-        }
-    }
-    s.resize( size );
-}
-
-template<class Ptree> void write_json(std::basic_ostream< typename Ptree::key_type::value_type > &stream, const Ptree &ptree, bool const pretty = true )
+template< class PTree > void write_json( std::basic_ostream< typename PTree::key_type::value_type > &stream, const PTree &ptree, bool const pretty = true, bool unquote_numbers = true )
 {
-    std::basic_ostringstream< typename Ptree::key_type::value_type > string_stream;
+    std::basic_ostringstream< typename PTree::key_type::value_type > string_stream;
     boost::property_tree::write_json( string_stream, ptree, pretty );
     auto json_text = string_stream.str();
-    json_remove_quotes( json_text );
+    if( unquote_numbers ) { json_remove_quotes( json_text ); }
     stream << json_text << std::flush;
 }
  
diff --git a/name_value/test/name-value-convert/expected b/name_value/test/name-value-convert/expected
new file mode 100644
index 000000000..7718840e8
--- /dev/null
+++ b/name_value/test/name-value-convert/expected
@@ -0,0 +1,4 @@
+quoting[0]/output='{"a":"01"}'
+quoting[1]/output='{"a":"1"}'
+quoting[2]/output='a="1"'
+quoting[3]/output='a="1"'
diff --git a/name_value/test/name-value-convert/input b/name_value/test/name-value-convert/input
new file mode 100644
index 000000000..61fc46fad
--- /dev/null
+++ b/name_value/test/name-value-convert/input
@@ -0,0 +1,4 @@
+quoting[0]="echo a=01 | name-value-convert --to json --minify"
+quoting[1]="echo a=1 | name-value-convert --to json --quote-numbers --minify"
+quoting[2]="echo a=1 | name-value-convert --to json --minify | name-value-convert"
+quoting[3]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert"
diff --git a/name_value/test/test b/name_value/test/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/name_value/test/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands

From a192deafead4c4f8819cd4f5eb255a882fcc287c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 30 Jan 2021 19:50:30 +1100
Subject: [PATCH 0331/1056] name-value-convert, name-value-get: bug fixed; more
 tests added

---
 name_value/impl/json_writer.h               | 17 ++---------------
 name_value/ptree.cpp                        |  7 +++----
 name_value/test/name-value-convert/expected | 11 ++++++++---
 name_value/test/name-value-convert/input    | 11 ++++++++---
 4 files changed, 21 insertions(+), 25 deletions(-)

diff --git a/name_value/impl/json_writer.h b/name_value/impl/json_writer.h
index 238572a39..7308cd8da 100644
--- a/name_value/impl/json_writer.h
+++ b/name_value/impl/json_writer.h
@@ -42,21 +42,8 @@ template< typename C > inline void json_remove_quotes( std::basic_string< C >& j
         if( ':' != *next_token )
         {
             auto const value = std::string( value_begin + 1, value_end );
-            if( true_str == value || false_str == value )
-            {
-                quoted = false;
-            }
-            else if( !boost::regex_match( value, number_like_string ) ) // to avoid unquoting strings like "01234"
-            {
-                try // todo? try to avoid lexical_cast+exception to improve performace?
-                {
-                    boost::lexical_cast< double >( value );
-                    quoted = false;
-                }
-                catch ( ... )
-                {
-                }
-            } 
+            if( true_str == value || false_str == value ) { quoted = false; }
+            else if( !boost::regex_match( value, number_like_string ) ) { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} } // todo? try to avoid lexical_cast+exception to improve performance?
         }
         if( !quoted ) { value_begin++; }
         while( value_begin != value_end ) { *source++ = *value_begin++; }
diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index d7184952f..a42a6c985 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 /// @author vsevolod vlaskine
 
@@ -40,6 +39,7 @@
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
+#include <boost/regex.hpp>
 #include <boost/unordered_set.hpp>
 #include "../base/exception.h"
 #include "../base/types.h"
@@ -47,7 +47,6 @@
 #include "../xpath/xpath.h"
 #include "../visiting/visit.h"
 #include "../visiting/while.h"
-
 #include "ptree.h"
 
 namespace comma {
@@ -140,15 +139,15 @@ namespace comma { namespace impl {
 
 static void ptree_output_value_( std::ostream& os, const std::string& value, bool is_begin, const xpath& path, char equal_sign, char delimiter, const std::string& root, bool const unquote_numbers )
 {
+    static boost::regex number_like_string( "^0[0-9][0-9]*$" );
     if( !is_begin ) { os << delimiter; }
     if( root != "" ) { os << root << "/"; }
     os << path.to_string() << equal_sign;
-
     bool quoted = true;
     if( unquote_numbers )
     { 
         if( "true" == value || "false" == value ) { quoted = false; }
-        else { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} }
+        else if( !boost::regex_match( value, number_like_string ) ) { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} }
     }
     if( quoted ) { os << '"' << value << '"'; } else { os << value; }
 }
diff --git a/name_value/test/name-value-convert/expected b/name_value/test/name-value-convert/expected
index 7718840e8..d8170fca7 100644
--- a/name_value/test/name-value-convert/expected
+++ b/name_value/test/name-value-convert/expected
@@ -1,4 +1,9 @@
 quoting[0]/output='{"a":"01"}'
-quoting[1]/output='{"a":"1"}'
-quoting[2]/output='a="1"'
-quoting[3]/output='a="1"'
+quoting[1]/output='a="01"'
+quoting[2]/output='a="01"'
+quoting[3]/output='{"a":1}'
+quoting[5]/output='a="1"'
+quoting[6]/output='a=1'
+quoting[4]/output='{"a":"1"}'
+quoting[5]/output='a="1"'
+quoting[6]/output='a=1'
diff --git a/name_value/test/name-value-convert/input b/name_value/test/name-value-convert/input
index 61fc46fad..54cdf54fb 100644
--- a/name_value/test/name-value-convert/input
+++ b/name_value/test/name-value-convert/input
@@ -1,4 +1,9 @@
 quoting[0]="echo a=01 | name-value-convert --to json --minify"
-quoting[1]="echo a=1 | name-value-convert --to json --quote-numbers --minify"
-quoting[2]="echo a=1 | name-value-convert --to json --minify | name-value-convert"
-quoting[3]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert"
+quoting[1]="echo a=01 | name-value-convert --to json --minify | name-value-convert"
+quoting[2]="echo a=01 | name-value-convert --to json --minify | name-value-convert --unquote-numbers"
+quoting[3]="echo a=1 | name-value-convert --to json --minify"
+quoting[5]="echo a=1 | name-value-convert --to json --minify | name-value-convert"
+quoting[6]="echo a=1 | name-value-convert --to json --minify | name-value-convert --unquote-numbers"
+quoting[4]="echo a=1 | name-value-convert --to json --quote-numbers --minify"
+quoting[5]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert"
+quoting[6]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert --unquote-numbers"

From 4cedd5c7510f110ab139a6f639006d52a87c83b6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Feb 2021 16:17:31 +1100
Subject: [PATCH 0332/1056] system/packages: building with shared libraries
 turned on; readme updated

---
 system/package/comma-package-make | 1 +
 system/package/readme             | 2 +-
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index c62c3c40c..36c0a6258 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -23,6 +23,7 @@ esac
     cmake . -DCPACK_GENERATOR=DEB \
             -DBUILD_PYTHON_PACKAGES=ON \
             -DADD_PYTHON_PACKAGES_TO_RPM=ON \
+            -DBUILD_SHARED_LIBS=ON \
             -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
             -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \
             -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \
diff --git a/system/package/readme b/system/package/readme
index c9f525a06..9fda7985a 100644
--- a/system/package/readme
+++ b/system/package/readme
@@ -9,7 +9,7 @@ to build deb package e.g. for comma version 1.2.3 for ubuntu 20.04 run:
 
 > ./comma-package-docker-run 20.04 1 2 3
 
-if your comma reposity is not in ~/src/comma, but e.g. in ~/my/src/comma, run:
+if your comma repository is not in ~/src/comma, but e.g. in ~/my/src/comma, run (you also need to specify the comma directory if you run as sudo, since the default location is ~):
 
 > ./comma-package-docker-run 20.04 1 2 3 ~/my/src/comma
 

From 05a41f1a25443dcd658124644c0ff43a069a87bc Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Feb 2021 17:27:09 +1100
Subject: [PATCH 0333/1056] system/packages: more cmake flags explicitly
 defined

---
 system/package/comma-package-make | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index 36c0a6258..94eeb2f43 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -24,6 +24,10 @@ esac
             -DBUILD_PYTHON_PACKAGES=ON \
             -DADD_PYTHON_PACKAGES_TO_RPM=ON \
             -DBUILD_SHARED_LIBS=ON \
+            -DBUILD_TESTS=OFF \
+            -DBUILD_TESTS=OFF \
+            -DCMAKE_INSTALL_PREFIX=/usr \
+            -DINSTALL_TESTS=OFF \
             -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
             -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \
             -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \

From 7880709edcb0d2979b0eb7b865ee521f66cb0195 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Feb 2021 20:33:19 +1100
Subject: [PATCH 0334/1056] system/package: cpack: building python packages
 switched off

---
 system/package/comma-package-make | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index 94eeb2f43..0a952f0c4 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -22,7 +22,7 @@ esac
     echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB \
             -DBUILD_PYTHON_PACKAGES=ON \
-            -DADD_PYTHON_PACKAGES_TO_RPM=ON \
+            -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
             -DBUILD_SHARED_LIBS=ON \
             -DBUILD_TESTS=OFF \
             -DBUILD_TESTS=OFF \

From aba8fabbb3fb5cc0badab684380f15967291d432 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Feb 2021 20:41:02 +1100
Subject: [PATCH 0335/1056] cmake: minor change

---
 CMakeLists.txt                       | 12 +++++++-----
 etc/bash_completion.d/CMakeLists.txt |  1 -
 system/package/comma-package-make    |  1 +
 3 files changed, 8 insertions(+), 6 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index a7eef706e..8209ac955 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -287,9 +287,8 @@ INCLUDE( ${CMAKE_CURRENT_SOURCE_DIR}/CMakeFiles/generate_${PROJECT_NAME}_config.
 CONFIGURE_FILE( ${PROJECT_SOURCE_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake.in
                 ${PROJECT_BINARY_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake COPYONLY IMMEDIATE )
 
-SET( comma_PACKAGE_CMAKEFILES ${comma_PACKAGE_CMAKEFILES} ${PROJECT_BINARY_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake )
-INSTALL( FILES ${comma_PACKAGE_CMAKEFILES}
-         DESTINATION ${comma_INSTALL_PACKAGE_DIR} )
+set( comma_PACKAGE_CMAKEFILES ${comma_PACKAGE_CMAKEFILES} ${PROJECT_BINARY_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake )
+install( FILES ${comma_PACKAGE_CMAKEFILES} DESTINATION ${comma_INSTALL_PACKAGE_DIR} )
 
 #-----------------------------------------------------------------------------
 # add sources
@@ -315,9 +314,12 @@ if( comma_BUILD_XML )
 endif( comma_BUILD_XML )
 add_subdirectory( xpath )
 
-ADD_SUBDIRECTORY( etc/bash_completion.d )
+option( INSTALL_BASH_COMPLETION "install the BASH completion scripts" ON )
+if( INSTALL_BASH_COMPLETION )
+    add_subdirectory( etc/bash_completion.d )
+endif( INSTALL_BASH_COMPLETION )
 
-ADD_SUBDIRECTORY( python )
+add_subdirectory( python )
 
 #in future, may need to add third party dlls somehow, if they are linked as dlls. Not needed for statically linking to boost.
 #if we set them up to install to bin they might be packaged through, e.g. roughly (using GLOB):
diff --git a/etc/bash_completion.d/CMakeLists.txt b/etc/bash_completion.d/CMakeLists.txt
index 78be444a2..de41cd163 100644
--- a/etc/bash_completion.d/CMakeLists.txt
+++ b/etc/bash_completion.d/CMakeLists.txt
@@ -1,5 +1,4 @@
 IF (UNIX)
-    OPTION( INSTALL_BASH_COMPLETION "Install the BASH completion scripts." ON )
     SET( INSTALL_BASH_COMPLETION_DIR /etc/bash_completion.d
          CACHE PATH "Location in which to install the bash completion scripts.")
     IF( INSTALL_BASH_COMPLETION )
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index 0a952f0c4..553925e3d 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -27,6 +27,7 @@ esac
             -DBUILD_TESTS=OFF \
             -DBUILD_TESTS=OFF \
             -DCMAKE_INSTALL_PREFIX=/usr \
+            -DINSTALL_BASH_COMPLETION=OFF \
             -DINSTALL_TESTS=OFF \
             -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
             -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \

From d22bfe837ea6a6a36e9fc67628154355896d2524 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Feb 2021 20:51:10 +1100
Subject: [PATCH 0336/1056] cpack: adding debian definitions to make lintian
 happy

---
 CMakeLists.txt | 34 ++++++++++++++++++----------------
 1 file changed, 18 insertions(+), 16 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 8209ac955..c8416dd6a 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -252,33 +252,33 @@ SET( comma_ALL_LIBRARIES
         debug comma_name_value-d
         optimized comma_name_value )
 
-IF(WIN32)
-    SET( comma_ALL_EXTERNAL_LIBRARIES Ws2_32.lib )
-ENDIF(WIN32)
+if(WIN32)
+    set( comma_ALL_EXTERNAL_LIBRARIES Ws2_32.lib )
+endif(WIN32)
 
-IF(UNIX AND NOT QNXNTO AND NOT APPLE)
-    SET( comma_ALL_EXTERNAL_LIBRARIES rt pthread )
-ENDIF(UNIX AND NOT QNXNTO AND NOT APPLE)
+if( UNIX AND NOT QNXNTO AND NOT APPLE )
+    set( comma_ALL_EXTERNAL_LIBRARIES rt pthread c )
+endif( UNIX AND NOT QNXNTO AND NOT APPLE )
 
-SET( comma_ALL_EXTERNAL_LIBRARIES ${Boost_LIBRARIES} ${comma_ALL_EXTERNAL_LIBRARIES} )
+set( comma_ALL_EXTERNAL_LIBRARIES ${Boost_LIBRARIES} ${comma_ALL_EXTERNAL_LIBRARIES} )
 
-IF( comma_BUILD_ZEROMQ )
-    SET( comma_ALL_EXTERNAL_LIBRARIES ${comma_ALL_EXTERNAL_LIBRARIES} ${ZeroMQ_LIBRARY} )
-ENDIF( comma_BUILD_ZEROMQ )
+if( comma_BUILD_ZEROMQ )
+    set( comma_ALL_EXTERNAL_LIBRARIES ${comma_ALL_EXTERNAL_LIBRARIES} ${ZeroMQ_LIBRARY} )
+endif( comma_BUILD_ZEROMQ )
 
-IF( BUILD_CPP_PYTHON_BINDINGS )
-    SET( comma_ALL_EXTERNAL_LIBRARIES ${comma_ALL_EXTERNAL_LIBRARIES} ${PYTHON_LIBRARY} )
-ENDIF( BUILD_CPP_PYTHON_BINDINGS )
+if( BUILD_CPP_PYTHON_BINDINGS )
+    set( comma_ALL_EXTERNAL_LIBRARIES ${comma_ALL_EXTERNAL_LIBRARIES} ${PYTHON_LIBRARY} )
+endif( BUILD_CPP_PYTHON_BINDINGS )
 
-SET( comma_ALL_LIBRARIES ${comma_ALL_LIBRARIES} ${comma_ALL_LIBRARIES} ${comma_ALL_EXTERNAL_LIBRARIES} ) # as gcc parses library list only once
-SET( comma_EXTERNAL_INCLUDES ${Boost_INCLUDE_DIRS} )
+set( comma_ALL_LIBRARIES ${comma_ALL_LIBRARIES} ${comma_ALL_LIBRARIES} ${comma_ALL_EXTERNAL_LIBRARIES} ) # as gcc parses library list only once
+set( comma_EXTERNAL_INCLUDES ${Boost_INCLUDE_DIRS} )
 
 CONFIGURE_FILE(
     "${CMAKE_CURRENT_SOURCE_DIR}/CMakeFiles/cmake_uninstall.cmake.in"
     "${CMAKE_CURRENT_BINARY_DIR}/cmake_uninstall.cmake"
     IMMEDIATE @ONLY)
 
-ADD_CUSTOM_TARGET(uninstall COMMAND ${CMAKE_COMMAND} -P ${CMAKE_CURRENT_BINARY_DIR}/cmake_uninstall.cmake)
+ADD_CUSTOM_TARGET( uninstall COMMAND ${CMAKE_COMMAND} -P ${CMAKE_CURRENT_BINARY_DIR}/cmake_uninstall.cmake )
 
 FILE( GLOB comma_PACKAGE_CMAKEFILES ${CMAKE_CURRENT_SOURCE_DIR}/CMakeFiles/*.cmake )
 
@@ -328,7 +328,9 @@ add_subdirectory( python )
 set( CPACK_PACKAGE_NAME "comma" )
 set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "command line utilities to manipulate various structured and unstructured data from offline or realtime data" )
 set( CPACK_PACKAGE_VENDOR "orthographic" )
+set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "command line utilities to manipulate various structured and unstructured data from offline or realtime data" ) # lintian gets upset
 set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma" )
+set( CPACK_DEBIAN_PACKAGE_MAINTAINER "vsevolod vlaskine" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/COPYING" )
 set( CPACK_GENERATOR "PRM" CACHE STRING "cpack generator: PRM or DEB" )

From 47b059a2b058c8dfe4e5651e50294802695cf7be Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Feb 2021 21:03:59 +1100
Subject: [PATCH 0337/1056] fixing python packaging...

---
 python/setup.py                   | 18 ++++++++++++++++--
 system/package/comma-package-make |  6 +++---
 2 files changed, 19 insertions(+), 5 deletions(-)

diff --git a/python/setup.py b/python/setup.py
index 6d5c87393..a7df7db9c 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -6,12 +6,26 @@
 setup(
         name                = 'comma',
         version             = comma.version.__version__,
+        classifiers = [
+          'Development Status :: 4 - Beta',
+          'Environment :: Console',
+          'Intended Audience :: End Users/Desktop',
+          'Intended Audience :: Developers',
+          'License :: OSI Approved :: BSD 3-Clause',
+          'Operating System :: MacOS :: MacOS X',
+          'Operating System :: Microsoft :: Windows',
+          'Operating System :: POSIX',
+          'Programming Language :: Python',
+          'Topic :: Communications :: Email'
+        ],
         description         = 'comma python utilties',
         install_requires    = [ 'numpy' ],
         url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
-        scripts             = ["comma/csv/applications/csv-eval"],
+        maintainer          = 'vsevolod vlaskine',
+        maintainer_email    = 'vsevolod.vlaskine@gmail.com',
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma.cpp_bindings': 'comma/cpp_bindings' },
-        package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] }
+        package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] },
+        scripts             = [ "comma/csv/applications/csv-eval" ]
      )
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index 553925e3d..8dd8043dd 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -18,6 +18,9 @@ case $ubuntu_version in
     *) libproc_version="libprocps8 (>= 1)" ;; # for now
 esac
 (
+    cd ~/src/comma/python
+    echo "$0: setting up python in $( pwd )" >&2
+    python3 setup.py --command-packages=stdeb.command --copyright-file=../COPYING bdist_deb || die "failed"
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB \
@@ -35,9 +38,6 @@ esac
             -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
     cpack || die "failed"
-    cd ~/src/comma/python
-    echo "$0: setting up python in $( pwd )" >&2
-    python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
     # todo: optionally run full regression test
     echo "$0: done" >&2
 )

From b39c6f71006ee7a2cb02e3e5f482e47c06cf6b24 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Feb 2021 23:34:10 +1100
Subject: [PATCH 0338/1056] packaging csv-eval...

---
 python/setup.py                   | 4 ++--
 system/package/comma-package-make | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/python/setup.py b/python/setup.py
index a7df7db9c..8e69a4204 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -7,7 +7,6 @@
         name                = 'comma',
         version             = comma.version.__version__,
         classifiers = [
-          'Development Status :: 4 - Beta',
           'Environment :: Console',
           'Intended Audience :: End Users/Desktop',
           'Intended Audience :: Developers',
@@ -18,10 +17,11 @@
           'Programming Language :: Python',
           'Topic :: Communications :: Email'
         ],
-        description         = 'comma python utilties',
+        description         = 'comma python utilities',
         install_requires    = [ 'numpy' ],
         url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
+        long_description    = 'comma python utilities for offline and streamed csv and fixed width data',
         maintainer          = 'vsevolod vlaskine',
         maintainer_email    = 'vsevolod.vlaskine@gmail.com',
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
diff --git a/system/package/comma-package-make b/system/package/comma-package-make
index 8dd8043dd..dffe1da22 100755
--- a/system/package/comma-package-make
+++ b/system/package/comma-package-make
@@ -20,7 +20,7 @@ esac
 (
     cd ~/src/comma/python
     echo "$0: setting up python in $( pwd )" >&2
-    python3 setup.py --command-packages=stdeb.command --copyright-file=../COPYING bdist_deb || die "failed"
+    python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB \

From a728e6392ff481dc41230989317fd4843206c45f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Feb 2021 23:46:25 +1100
Subject: [PATCH 0339/1056] fixing packaging...

---
 CMakeLists.txt       | 3 ++-
 COPYING => copyright | 0
 2 files changed, 2 insertions(+), 1 deletion(-)
 rename COPYING => copyright (100%)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index c8416dd6a..e16be18fc 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -289,6 +289,7 @@ CONFIGURE_FILE( ${PROJECT_SOURCE_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake.in
 
 set( comma_PACKAGE_CMAKEFILES ${comma_PACKAGE_CMAKEFILES} ${PROJECT_BINARY_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake )
 install( FILES ${comma_PACKAGE_CMAKEFILES} DESTINATION ${comma_INSTALL_PACKAGE_DIR} )
+install( FILES ${PROJECT_SOURCE_DIR}/copyright DESTINATION share/doc/comma ) # quick and dirty
 
 #-----------------------------------------------------------------------------
 # add sources
@@ -332,7 +333,7 @@ set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "command line utilities to manipulate vari
 set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma" )
 set( CPACK_DEBIAN_PACKAGE_MAINTAINER "vsevolod vlaskine" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
-set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/COPYING" )
+set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/copyright" )
 set( CPACK_GENERATOR "PRM" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
diff --git a/COPYING b/copyright
similarity index 100%
rename from COPYING
rename to copyright

From 1bfaf9d33d261c26ea2a5fe3605806b7964f7cf5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Feb 2021 13:07:09 +1100
Subject: [PATCH 0340/1056] cpack: fixing lintian errors

---
 CMakeLists.txt                                  | 17 +++++++++--------
 system/package/{ => debian}/Dockerfile          |  0
 system/package/debian/changelog                 |  3 +++
 .../{ => debian}/comma-package-docker-build     |  0
 .../{ => debian}/comma-package-docker-run       |  0
 .../{ => debian}/comma-package-docker-test      |  0
 system/package/{ => debian}/comma-package-make  |  1 +
 system/package/{ => debian}/comma-package-test  |  0
 system/package/{ => debian}/readme              |  0
 9 files changed, 13 insertions(+), 8 deletions(-)
 rename system/package/{ => debian}/Dockerfile (100%)
 create mode 100644 system/package/debian/changelog
 rename system/package/{ => debian}/comma-package-docker-build (100%)
 rename system/package/{ => debian}/comma-package-docker-run (100%)
 rename system/package/{ => debian}/comma-package-docker-test (100%)
 rename system/package/{ => debian}/comma-package-make (97%)
 rename system/package/{ => debian}/comma-package-test (100%)
 rename system/package/{ => debian}/readme (100%)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index e16be18fc..e3bb09396 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -327,11 +327,12 @@ add_subdirectory( python )
 #install(FILES "${Boost_LIBRARY_DIRS}/*.dll" DESTINATION bin )
 
 set( CPACK_PACKAGE_NAME "comma" )
-set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "command line utilities to manipulate various structured and unstructured data from offline or realtime data" )
+#set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "command line utilities to manipulate various structured and unstructured data from offline or realtime data" )
 set( CPACK_PACKAGE_VENDOR "orthographic" )
-set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "command line utilities to manipulate various structured and unstructured data from offline or realtime data" ) # lintian gets upset
+set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "command line utilities for structured or fixed-width offline or realtime data" ) # lintian gets upset
 set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma" )
-set( CPACK_DEBIAN_PACKAGE_MAINTAINER "vsevolod vlaskine" )
+set( CPACK_DEBIAN_PACKAGE_MAINTAINER "vsevolod vlaskine <vsevolod.vlaskine@gmail.com>" )
+set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${PROJECT_SOURCE_DIR}/system/package/debian/changelog" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/copyright" )
 set( CPACK_GENERATOR "PRM" CACHE STRING "cpack generator: PRM or DEB" )
@@ -341,11 +342,11 @@ set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1)" )
 
-# this code needs a brush-up
-# If the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
-IF( BUILD_SHARED_LIBS )
-    SET(CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig")
-ENDIF( BUILD_SHARED_LIBS )
+# if the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
+if( BUILD_SHARED_LIBS )
+    set( CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig" )
+    set( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "/sbin/ldconfig" )
+endif( BUILD_SHARED_LIBS )
 IF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET( CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy" )
     SET( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-post-install.sh" )
diff --git a/system/package/Dockerfile b/system/package/debian/Dockerfile
similarity index 100%
rename from system/package/Dockerfile
rename to system/package/debian/Dockerfile
diff --git a/system/package/debian/changelog b/system/package/debian/changelog
new file mode 100644
index 000000000..5b745da7e
--- /dev/null
+++ b/system/package/debian/changelog
@@ -0,0 +1,3 @@
+comma (1.0.0); urgency=medium
+
+  * initial release
diff --git a/system/package/comma-package-docker-build b/system/package/debian/comma-package-docker-build
similarity index 100%
rename from system/package/comma-package-docker-build
rename to system/package/debian/comma-package-docker-build
diff --git a/system/package/comma-package-docker-run b/system/package/debian/comma-package-docker-run
similarity index 100%
rename from system/package/comma-package-docker-run
rename to system/package/debian/comma-package-docker-run
diff --git a/system/package/comma-package-docker-test b/system/package/debian/comma-package-docker-test
similarity index 100%
rename from system/package/comma-package-docker-test
rename to system/package/debian/comma-package-docker-test
diff --git a/system/package/comma-package-make b/system/package/debian/comma-package-make
similarity index 97%
rename from system/package/comma-package-make
rename to system/package/debian/comma-package-make
index dffe1da22..8f7a69761 100755
--- a/system/package/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -29,6 +29,7 @@ esac
             -DBUILD_SHARED_LIBS=ON \
             -DBUILD_TESTS=OFF \
             -DBUILD_TESTS=OFF \
+            -DCMAKE_BUILD_TYPE=Release \
             -DCMAKE_INSTALL_PREFIX=/usr \
             -DINSTALL_BASH_COMPLETION=OFF \
             -DINSTALL_TESTS=OFF \
diff --git a/system/package/comma-package-test b/system/package/debian/comma-package-test
similarity index 100%
rename from system/package/comma-package-test
rename to system/package/debian/comma-package-test
diff --git a/system/package/readme b/system/package/debian/readme
similarity index 100%
rename from system/package/readme
rename to system/package/debian/readme

From 4d6ba8cb6b852bbbdecfca7c770798cbcc36370c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Feb 2021 13:45:50 +1100
Subject: [PATCH 0341/1056] packaging: fixing lintian errors...

---
 CMakeLists.txt                           |  19 +++++++++++++------
 io/applications/CMakeLists.txt           |   5 ++++-
 system/package/debian/changelog          |   3 ---
 system/package/debian/changelog.gz       | Bin 0 -> 81 bytes
 system/package/debian/comma-package-make |   3 ++-
 5 files changed, 19 insertions(+), 11 deletions(-)
 delete mode 100644 system/package/debian/changelog
 create mode 100644 system/package/debian/changelog.gz

diff --git a/CMakeLists.txt b/CMakeLists.txt
index e3bb09396..1f6555359 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -106,8 +106,8 @@ IF(CMAKE_BUILD_TOOL MATCHES "make")
 ENDIF(CMAKE_BUILD_TOOL MATCHES "make")
 
 if( UNIX )
-INCLUDE( CMakeFiles/check.c++.standard.cmake REQUIRED )
-endif()
+    include( CMakeFiles/check.c++.standard.cmake REQUIRED )
+endif( UNIX )
 
 SET( SOURCE_CODE_BASE_DIR ${CMAKE_CURRENT_SOURCE_DIR} )
 SET( LIBRARY_OUTPUT_PATH ${CMAKE_BINARY_DIR}/lib )
@@ -326,16 +326,23 @@ add_subdirectory( python )
 #if we set them up to install to bin they might be packaged through, e.g. roughly (using GLOB):
 #install(FILES "${Boost_LIBRARY_DIRS}/*.dll" DESTINATION bin )
 
+if( CMAKE_COMPILER_IS_GNUCXX )
+    if( CMAKE_BUILD_TYPE STREQUAL "Release" )
+        set( CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} -s" )
+    endif( CMAKE_BUILD_TYPE STREQUAL "Release" )
+endif( CMAKE_COMPILER_IS_GNUCXX )
+install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma )
+
 set( CPACK_PACKAGE_NAME "comma" )
 #set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "command line utilities to manipulate various structured and unstructured data from offline or realtime data" )
 set( CPACK_PACKAGE_VENDOR "orthographic" )
-set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "command line utilities for structured or fixed-width offline or realtime data" ) # lintian gets upset
-set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma" )
+set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
+set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma/-/wikis/home" )
 set( CPACK_DEBIAN_PACKAGE_MAINTAINER "vsevolod vlaskine <vsevolod.vlaskine@gmail.com>" )
 set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${PROJECT_SOURCE_DIR}/system/package/debian/changelog" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/copyright" )
-set( CPACK_GENERATOR "PRM" CACHE STRING "cpack generator: PRM or DEB" )
+set( CPACK_GENERATOR "DEB" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
@@ -345,7 +352,7 @@ set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS
 # if the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
 if( BUILD_SHARED_LIBS )
     set( CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig" )
-    set( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "/sbin/ldconfig" )
+    set( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "%posttrans -p /sbin/ldconfig" )
 endif( BUILD_SHARED_LIBS )
 IF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET( CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy" )
diff --git a/io/applications/CMakeLists.txt b/io/applications/CMakeLists.txt
index da59b5f07..955307c8e 100644
--- a/io/applications/CMakeLists.txt
+++ b/io/applications/CMakeLists.txt
@@ -50,6 +50,9 @@ if( NOT WIN32 )
 endif( NOT WIN32 )
 
 install( PROGRAMS io-topics DESTINATION ${comma_INSTALL_BIN_DIR})
-install( PROGRAMS rabbit-cat DESTINATION ${comma_INSTALL_BIN_DIR})
+option( comma_build_io_rabbit_cat "build rabbit-cat" ON )
+if( comma_build_io_rabbit_cat )
+    install( PROGRAMS rabbit-cat DESTINATION ${comma_INSTALL_BIN_DIR})
+endif( comma_build_io_rabbit_cat )
 install( PROGRAMS zero-publish DESTINATION ${comma_INSTALL_BIN_DIR})
 
diff --git a/system/package/debian/changelog b/system/package/debian/changelog
deleted file mode 100644
index 5b745da7e..000000000
--- a/system/package/debian/changelog
+++ /dev/null
@@ -1,3 +0,0 @@
-comma (1.0.0); urgency=medium
-
-  * initial release
diff --git a/system/package/debian/changelog.gz b/system/package/debian/changelog.gz
new file mode 100644
index 0000000000000000000000000000000000000000..82cf0602f4746ae8aae6e4450818fd5553f043a7
GIT binary patch
literal 81
zcmV-X0IvTZiwFovd?a8317m1mZf9j|Z)X5Y&d<$FRM0TgGte{8v{ooBN>9y8uC&cf
nP01|H<>FFM&{D|E%Ph%E%uy&x%}GrxPUQjsa6$pAGXMYpS>7Rv

literal 0
HcmV?d00001

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index 8f7a69761..11f0e8519 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -36,7 +36,8 @@ esac
             -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
             -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \
             -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \
-            -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  || die "failed"
+            -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  \
+            -Dcomma_build_io_rabbit_cat=OFF || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
     cpack || die "failed"
     # todo: optionally run full regression test

From c604d3bca9d30bf65b7fc0599eb195043b3c6fab Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Feb 2021 15:43:09 +1100
Subject: [PATCH 0342/1056] packaging: fixing lintian errors...

---
 CMakeLists.txt                          |  1 +
 application/CMakeLists.txt              | 11 ++++---
 application/applications/CMakeLists.txt |  2 ++
 base/CMakeLists.txt                     |  3 +-
 csv/CMakeLists.txt                      |  1 +
 csv/applications/CMakeLists.txt         | 40 ++++++++++++++++++++++++-
 io/CMakeLists.txt                       |  1 +
 io/applications/CMakeLists.txt          | 10 +++++++
 name_value/CMakeLists.txt               |  1 +
 name_value/applications/CMakeLists.txt  |  7 +++++
 string/CMakeLists.txt                   |  1 +
 util/applications/CMakeLists.txt        | 21 +++++++------
 xpath/CMakeLists.txt                    |  1 +
 13 files changed, 83 insertions(+), 17 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 1f6555359..39bfd3c42 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -329,6 +329,7 @@ add_subdirectory( python )
 if( CMAKE_COMPILER_IS_GNUCXX )
     if( CMAKE_BUILD_TYPE STREQUAL "Release" )
         set( CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} -s" )
+        set( CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -s" )
     endif( CMAKE_BUILD_TYPE STREQUAL "Release" )
 endif( CMAKE_COMPILER_IS_GNUCXX )
 install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma )
diff --git a/application/CMakeLists.txt b/application/CMakeLists.txt
index 9fddc5e03..a2fd116cb 100644
--- a/application/CMakeLists.txt
+++ b/application/CMakeLists.txt
@@ -8,15 +8,14 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
+set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${comma_ALL_EXTERNAL_LIBRARIES} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
-INSTALL(
-    TARGETS ${TARGET_NAME}
-    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
-    LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
-    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
-)
+INSTALL( TARGETS ${TARGET_NAME}
+         RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime       # .exe, .dll
+         LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime       # .so, mod.dll
+         ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development ) # .a, .lib
 
 if( comma_BUILD_APPLICATIONS )
     add_subdirectory( applications )
diff --git a/application/applications/CMakeLists.txt b/application/applications/CMakeLists.txt
index 2bf923a04..b5d69d45e 100644
--- a/application/applications/CMakeLists.txt
+++ b/application/applications/CMakeLists.txt
@@ -4,8 +4,10 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 
 ADD_EXECUTABLE( comma-options-to-name-value comma-options-to-name-value.cpp )
 TARGET_LINK_LIBRARIES ( comma-options-to-name-value comma_application comma_string ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( comma-options-to-name-value PROPERTIES LINK_FLAGS_RELEASE -s )
 INSTALL( TARGETS comma-options-to-name-value RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 ADD_EXECUTABLE( comma-options-validate comma-options-validate.cpp )
 TARGET_LINK_LIBRARIES ( comma-options-validate comma_application comma_string ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( comma-options-validate PROPERTIES LINK_FLAGS_RELEASE -s )
 INSTALL( TARGETS comma-options-validate RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/base/CMakeLists.txt b/base/CMakeLists.txt
index edc0331da..104ee42b9 100644
--- a/base/CMakeLists.txt
+++ b/base/CMakeLists.txt
@@ -6,6 +6,7 @@ FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
 SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
+set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL(
@@ -14,4 +15,4 @@ INSTALL(
     LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
     ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
 )
-     
\ No newline at end of file
+     
diff --git a/csv/CMakeLists.txt b/csv/CMakeLists.txt
index 3de46ff97..55d6561c0 100644
--- a/csv/CMakeLists.txt
+++ b/csv/CMakeLists.txt
@@ -12,6 +12,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_source} ${impl_includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index f615f4c5c..a7073d5e1 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -7,9 +7,14 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${play_source} ${play_includes} ${source} ${i
 
 add_executable( csv-quote csv-quote.cpp )
 target_link_libraries( csv-quote ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
+set_target_properties( csv-quote PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-quote RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-fields ${dir}/csv-fields.cpp )
+target_link_libraries ( csv-fields ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
+set_target_properties( csv-fields PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS csv-fields RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
 add_executable( csv-format ${dir}/csv-format.cpp )
 add_executable( csv-size ${dir}/csv-size.cpp )
 add_executable( csv-select ${dir}/csv-select.cpp )
@@ -35,7 +40,6 @@ add_executable( csv-thin ${dir}/csv-thin.cpp )
 add_executable( csv-analyse ${dir}/csv-analyse.cpp )
 add_executable( csv-to-sql ${dir}/csv-to-sql.cpp )
 
-target_link_libraries ( csv-fields ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-format ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-size ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-bin-cut ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv comma_xpath )
@@ -61,6 +65,30 @@ target_link_libraries ( csv-thin ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma
 target_link_libraries ( csv-analyse ${comma_ALL_EXTERNAL_LIBRARIES} comma_application )
 target_link_libraries ( csv-to-sql ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 
+set_target_properties( csv-bin-cut PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-format PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-join PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-sort PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-from-columns PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-paste PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-split PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-time PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-time-delay PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-time-join PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-time-stamp PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-to-bin PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-from-bin PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-size PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-calc PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-play PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-shape PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-shuffle PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-crc PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-select PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-thin PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-analyse PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-to-sql PROPERTIES LINK_FLAGS_RELEASE -s )
+
 install( TARGETS csv-bin-cut
                  csv-fields
                  csv-format
@@ -92,42 +120,52 @@ install ( PROGRAMS csv-gate DESTINATION ${comma_INSTALL_BIN_DIR} )
 
 add_executable( csv-blocks ${dir}/csv-blocks.cpp )
 target_link_libraries ( csv-blocks ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-blocks PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-blocks RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-cast ${dir}/csv-cast.cpp )
 target_link_libraries ( csv-cast ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv )
+set_target_properties( csv-cast PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-cast RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-enumerate ${dir}/csv-enumerate.cpp )
 target_link_libraries ( csv-enumerate ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-enumerate PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-enumerate RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-intervals ${dir}/csv-intervals.cpp )
 target_link_libraries ( csv-intervals ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath )
+set_target_properties( csv-intervals PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-intervals RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
          
 add_executable( csv-units ${dir}/csv-units.cpp )
 target_link_libraries ( csv-units ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
+set_target_properties( csv-units PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-units RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-random ${dir}/csv-random.cpp )
 target_link_libraries ( csv-random ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-random PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-random RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-strings ${dir}/csv-strings.cpp )
 target_link_libraries ( csv-strings ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-strings PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-strings RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-update ${dir}/csv-update.cpp )
 target_link_libraries ( csv-update ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-update PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-update RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 if( NOT WIN32 )
     add_executable( csv-repeat ${dir}/csv-repeat.cpp )
     target_link_libraries ( csv-repeat comma_application comma_csv comma_io )
+    set_target_properties( csv-repeat PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS csv-repeat RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 endif()
 
 add_executable( csv-bin-reverse ${dir}/csv-bin-reverse.cpp )
 target_link_libraries ( csv-bin-reverse ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_xpath comma_csv )
+set_target_properties( csv-bin-reverse PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-bin-reverse RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/io/CMakeLists.txt b/io/CMakeLists.txt
index 26997da0b..b0f0acb86 100644
--- a/io/CMakeLists.txt
+++ b/io/CMakeLists.txt
@@ -17,6 +17,7 @@ ELSE( comma_BUILD_ZEROMQ )
 ENDIF( comma_BUILD_ZEROMQ )
 
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
+set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
diff --git a/io/applications/CMakeLists.txt b/io/applications/CMakeLists.txt
index 955307c8e..98f71f174 100644
--- a/io/applications/CMakeLists.txt
+++ b/io/applications/CMakeLists.txt
@@ -6,6 +6,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 IF( comma_BUILD_ZEROMQ )
 ADD_EXECUTABLE( zero-cat ${dir}/zero-cat.cpp )
 TARGET_LINK_LIBRARIES ( zero-cat ${ZeroMQ_LIBRARY} comma_io comma_application ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( zero-cat PROPERTIES LINK_FLAGS_RELEASE -s )
 INSTALL( TARGETS zero-cat
          RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR}
          COMPONENT Runtime )
@@ -13,39 +14,48 @@ ENDIF( comma_BUILD_ZEROMQ )
 
 add_executable( io-buffer ${dir}/io-buffer.cpp )
 target_link_libraries( io-buffer comma_application comma_io comma_csv comma_base ) # profiler )
+set_target_properties( io-buffer PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS io-buffer RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 if( NOT WIN32 )
     add_executable( io-bandwidth ${dir}/io-bandwidth.cpp )
     target_link_libraries( io-bandwidth comma_application comma_io )
+    set_target_properties( io-bandwidth PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-bandwidth RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
     add_executable( io-cat ${dir}/io-cat.cpp )
     target_link_libraries( io-cat comma_application comma_io comma_csv comma_base ) # profiler )
+    set_target_properties( io-cat PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-cat RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
     add_executable( io-line io-line.cpp )
     target_link_libraries ( io-line comma_application )
+    set_target_properties( io-line PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-line RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
     add_executable( io-ls ${dir}/io-ls.cpp )
     target_link_libraries( io-ls comma_application comma_csv comma_xpath )
+    set_target_properties( io-ls PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-ls RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
     add_executable( io-publish ${dir}/io-publish.cpp )
     target_link_libraries( io-publish comma_base comma_io comma_application ) # profiler )
+    set_target_properties( io-publish PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-publish RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
     add_executable( io-tee ${dir}/io-tee.cpp )
     target_link_libraries( io-tee comma_application comma_io comma_csv comma_base ) # profiler )
+    set_target_properties( io-tee PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-tee RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
     add_executable( udp-client ${dir}/udp-client.cpp )
     target_link_libraries( udp-client comma_application comma_io comma_csv comma_base ) # profiler )
+    set_target_properties( udp-client PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS udp-client RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
     add_executable( io-console ${dir}/io-console.cpp )
     target_link_libraries( io-console comma_base comma_io comma_application ) # profiler )
+    set_target_properties( io-console PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-console RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 endif( NOT WIN32 )
 
diff --git a/name_value/CMakeLists.txt b/name_value/CMakeLists.txt
index b1b30b945..741e2301a 100644
--- a/name_value/CMakeLists.txt
+++ b/name_value/CMakeLists.txt
@@ -13,6 +13,7 @@ INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJE
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
 INSTALL(
     TARGETS ${TARGET_NAME}
     RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
diff --git a/name_value/applications/CMakeLists.txt b/name_value/applications/CMakeLists.txt
index 48ec29ad5..c1b94c309 100644
--- a/name_value/applications/CMakeLists.txt
+++ b/name_value/applications/CMakeLists.txt
@@ -12,6 +12,11 @@ TARGET_LINK_LIBRARIES( name-value-get comma_application comma_string comma_xpath
 TARGET_LINK_LIBRARIES( name-value-eval-preparse comma_application comma_name_value )
 TARGET_LINK_LIBRARIES( name-value-permute comma_application comma_string comma_xpath comma_name_value )
 
+set_target_properties( name-value-convert PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( name-value-get PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( name-value-eval-preparse PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( name-value-permute PROPERTIES LINK_FLAGS_RELEASE -s )
+
 INSTALL( TARGETS name-value-convert name-value-get name-value-eval-preparse name-value-permute
          RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR}
          COMPONENT Runtime )
@@ -20,8 +25,10 @@ install( PROGRAMS name-value-eval name-value-calc name-value-apply DESTINATION $
          
 add_executable( name-value-from-csv ${dir}/name-value-from-csv.cpp )
 target_link_libraries( name-value-from-csv comma_application comma_string )
+set_target_properties( name-value-from-csv PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS name-value-from-csv RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( name-value-to-csv ${dir}/name-value-to-csv.cpp )
 target_link_libraries( name-value-to-csv comma_application comma_string )
+set_target_properties( name-value-to-csv PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS name-value-to-csv RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/string/CMakeLists.txt b/string/CMakeLists.txt
index 57b62efda..3c7c5cb79 100644
--- a/string/CMakeLists.txt
+++ b/string/CMakeLists.txt
@@ -6,6 +6,7 @@ FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
 SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
+set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL(
diff --git a/util/applications/CMakeLists.txt b/util/applications/CMakeLists.txt
index 3b5519214..263cb70f9 100644
--- a/util/applications/CMakeLists.txt
+++ b/util/applications/CMakeLists.txt
@@ -1,6 +1,7 @@
 add_executable( comma-progress comma-progress.cpp )
 target_link_libraries(comma-progress ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_name_value )
-INSTALL( TARGETS comma-progress RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+set_target_properties( comma-progress PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS comma-progress RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 if( NOT WIN32 )
     # It is too troublesome to cross compile PROCPS
@@ -21,18 +22,20 @@ if( NOT WIN32 )
             # unset the cached result, so that we check again next time, in case the library is installed
             unset( HAVE_PROCPS_DEV CACHE )
         endif( HAVE_PROCPS_DEV )
-        target_link_libraries(comma-timeout-group ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_name_value ${LIBPROCPS} )
-        INSTALL( TARGETS comma-timeout-group RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+        target_link_libraries( comma-timeout-group ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_name_value ${LIBPROCPS} )
+        set_target_properties( comma-timeout-group PROPERTIES LINK_FLAGS_RELEASE -s )
+        install( TARGETS comma-timeout-group RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     endif( NOT NO_PROCPS )
 endif( NOT WIN32 )
 
-add_executable(comma-nap comma-nap.cpp )
-target_link_libraries(comma-nap ${comma_ALL_EXTERNAL_LIBRARIES} )
-INSTALL( TARGETS comma-nap RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+add_executable( comma-nap comma-nap.cpp )
+target_link_libraries( comma-nap ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( comma-nap PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS comma-nap RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
-INSTALL( PROGRAMS comma-build DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-profile-graph DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-repeat DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-build DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-profile-graph DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-repeat DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-enforce DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-match DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-run DESTINATION ${comma_INSTALL_BIN_DIR} )
diff --git a/xpath/CMakeLists.txt b/xpath/CMakeLists.txt
index 1886d4819..75f11d119 100644
--- a/xpath/CMakeLists.txt
+++ b/xpath/CMakeLists.txt
@@ -8,6 +8,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
+set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )

From 9eed280cfb25878ef17129698a205c1ed31e1466 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Feb 2021 16:08:57 +1100
Subject: [PATCH 0343/1056] packaging: fixing lintian errors...

---
 CMakeLists.txt | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 39bfd3c42..991e81e51 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -335,9 +335,10 @@ endif( CMAKE_COMPILER_IS_GNUCXX )
 install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma )
 
 set( CPACK_PACKAGE_NAME "comma" )
-#set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "command line utilities to manipulate various structured and unstructured data from offline or realtime data" )
+#set( CPACK_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
+set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "cli utilities for structured or fixed-width offline or realtime data" )
 set( CPACK_PACKAGE_VENDOR "orthographic" )
-set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
+set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "command line utilities for processing structured or fixed-width data offline or in realtime" )
 set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma/-/wikis/home" )
 set( CPACK_DEBIAN_PACKAGE_MAINTAINER "vsevolod vlaskine <vsevolod.vlaskine@gmail.com>" )
 set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${PROJECT_SOURCE_DIR}/system/package/debian/changelog" )
@@ -348,7 +349,7 @@ set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1)" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 
 # if the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
 if( BUILD_SHARED_LIBS )

From c37aaaa9fb36682babacd1208648dad49d239b70 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Feb 2021 16:25:49 +1100
Subject: [PATCH 0344/1056] packaging: fixing lintian errors...

---
 CMakeLists.txt | 7 +++----
 1 file changed, 3 insertions(+), 4 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 991e81e51..8f6ebca0f 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -126,9 +126,7 @@ IF( NOT comma_INSTALL_INCLUDE_DIR )
     SET( comma_INSTALL_INCLUDE_DIR include/${PROJECT_NAME} )
 ENDIF( NOT comma_INSTALL_INCLUDE_DIR )
 
-IF( NOT comma_INSTALL_LIB_DIR)
-  SET( comma_INSTALL_LIB_DIR lib )
-ENDIF( NOT comma_INSTALL_LIB_DIR )
+set( comma_INSTALL_LIB_DIR lib CACHE PATH "library install directory" )
 
 IF( NOT comma_INSTALL_PACKAGE_DIR )
   SET( comma_INSTALL_PACKAGE_DIR CMakeFiles )
@@ -143,7 +141,7 @@ ENDIF( APPLE )
 OPTION( BUILD_TESTS "build unit tests" OFF )
 SET( comma_BUILD_TESTS ${BUILD_TESTS} )
 
-OPTION( BUILD_PYTHON_PACKAGES "install comma python packages" ON )
+option( BUILD_PYTHON_PACKAGES "install comma python packages" ON )
 
 INCLUDE( CMakeDependentOption )
 CMAKE_DEPENDENT_OPTION( ADD_PYTHON_PACKAGES_TO_RPM "add comma python packages to rpm" OFF "BUILD_PYTHON_PACKAGES" ON )
@@ -350,6 +348,7 @@ set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
+#set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
 
 # if the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
 if( BUILD_SHARED_LIBS )

From 8a446cf6e91da64184cc0dd3170128a42e13d315 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Feb 2021 16:58:56 +1100
Subject: [PATCH 0345/1056] packaging: fixing lintian errors...

---
 CMakeLists.txt                           | 1 +
 system/package/debian/comma-package-make | 3 +++
 2 files changed, 4 insertions(+)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 8f6ebca0f..6a535cbbc 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -348,6 +348,7 @@ set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor
 set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
+set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
 #set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
 
 # if the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index 11f0e8519..a2aa477fc 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -23,6 +23,9 @@ esac
     python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
+    
+    # todo? -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu
+    
     cmake . -DCPACK_GENERATOR=DEB \
             -DBUILD_PYTHON_PACKAGES=ON \
             -DADD_PYTHON_PACKAGES_TO_RPM=OFF \

From 9a25cbe039b85c80cc38cfe1541dc75eff9a3553 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Feb 2021 22:45:53 +1100
Subject: [PATCH 0346/1056] packaging: c++ package: lintian errors fixed

---
 CMakeLists.txt             | 30 ++++++++++++++++++++++++++----
 application/CMakeLists.txt |  1 +
 base/CMakeLists.txt        | 14 ++++++--------
 csv/CMakeLists.txt         |  1 +
 io/CMakeLists.txt          |  1 +
 name_value/CMakeLists.txt  |  1 +
 string/CMakeLists.txt      |  1 +
 xpath/CMakeLists.txt       |  1 +
 8 files changed, 38 insertions(+), 12 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 6a535cbbc..fd2c15a53 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -344,17 +344,39 @@ set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/copyright" )
 set( CPACK_GENERATOR "DEB" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
-set( CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE} CACHE STRING "cpack version minor" )
-set( CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH} CACHE STRING "cpack version patch" )
+set( CPACK_PACKAGE_VERSION_MINOR "0" CACHE STRING "cpack version minor" )
+set( CPACK_PACKAGE_VERSION_PATCH "0" CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
-#set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
+set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
+set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS_POLICY ON )
 
 # if the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
 if( BUILD_SHARED_LIBS )
-    set( CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig" )
+    #set( CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig" )
     set( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "%posttrans -p /sbin/ldconfig" )
+    #set( SHLIBS_FILE "${CMAKE_CURRENT_BINARY_DIR}/shlibs" )
+    # witchcraft from here: https://github.com/roboception/rcdiscover/blob/master/cmake/package_debian.cmake
+    set( TRIGGERS_FILE "${CMAKE_CURRENT_BINARY_DIR}/triggers" )
+    file( WRITE "${TRIGGERS_FILE}" "activate-noawait ldconfig\n" )
+    #file( WRITE "${SHLIBS_FILE}" "" )
+    #foreach ( libname ${sharedlibs} )
+    #    get_target_property( so_abiversion ${libname} SOVERSION )
+    #    if(NOT ${so_abiversion})
+    #      set(so_abiversion ${abiversion})
+    #      message(STATUS "SOVERSION of shared lib \"${libname}\" not set explicitly. Using <Major.Minor> of latest tag: ${so_abiversion}")
+    #      set_target_properties(${libname} PROPERTIES SOVERSION ${so_abiversion})
+    #    endif()
+    #    file(APPEND "${SHLIBS_FILE}" "lib${libname} ${so_abiversion} ${CPACK_PACKAGE_NAME}\n")
+    #endforeach (libname)
+    #execute_process( COMMAND chmod 644 "${SHLIBS_FILE}" "${TRIGGERS_FILE}" )
+    execute_process( COMMAND chmod 644 "${TRIGGERS_FILE}" )
+    if( CPACK_DEB_COMPONENT_INSTALL )
+        set( CPACK_DEBIAN_BIN_PACKAGE_CONTROL_EXTRA "${CPACK_DEBIAN_BIN_PACKAGE_CONTROL_EXTRA};${SHLIBS_FILE};${TRIGGERS_FILE}" )
+    else ( CPACK_DEB_COMPONENT_INSTALL )
+        set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA};${SHLIBS_FILE};${TRIGGERS_FILE}" )
+    endif ( CPACK_DEB_COMPONENT_INSTALL )
 endif( BUILD_SHARED_LIBS )
 IF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET( CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy" )
diff --git a/application/CMakeLists.txt b/application/CMakeLists.txt
index a2fd116cb..34dc6450c 100644
--- a/application/CMakeLists.txt
+++ b/application/CMakeLists.txt
@@ -9,6 +9,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${comma_ALL_EXTERNAL_LIBRARIES} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
diff --git a/base/CMakeLists.txt b/base/CMakeLists.txt
index 104ee42b9..24a821c9c 100644
--- a/base/CMakeLists.txt
+++ b/base/CMakeLists.txt
@@ -7,12 +7,10 @@ SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
 
-INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
-INSTALL(
-    TARGETS ${TARGET_NAME}
-    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
-    LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
-    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
-)
-     
+install( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+install( TARGETS ${TARGET_NAME}
+         RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime       # .exe, .dll
+         LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime       # .so, mod.dll
+         ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development ) # .a, .lib
diff --git a/csv/CMakeLists.txt b/csv/CMakeLists.txt
index 55d6561c0..e7224c25e 100644
--- a/csv/CMakeLists.txt
+++ b/csv/CMakeLists.txt
@@ -13,6 +13,7 @@ ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_source} ${impl_includes
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
diff --git a/io/CMakeLists.txt b/io/CMakeLists.txt
index b0f0acb86..45bf14547 100644
--- a/io/CMakeLists.txt
+++ b/io/CMakeLists.txt
@@ -18,6 +18,7 @@ ENDIF( comma_BUILD_ZEROMQ )
 
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
diff --git a/name_value/CMakeLists.txt b/name_value/CMakeLists.txt
index 741e2301a..2818652e1 100644
--- a/name_value/CMakeLists.txt
+++ b/name_value/CMakeLists.txt
@@ -14,6 +14,7 @@ ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
 INSTALL(
     TARGETS ${TARGET_NAME}
     RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
diff --git a/string/CMakeLists.txt b/string/CMakeLists.txt
index 3c7c5cb79..471778c05 100644
--- a/string/CMakeLists.txt
+++ b/string/CMakeLists.txt
@@ -7,6 +7,7 @@ SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL(
diff --git a/xpath/CMakeLists.txt b/xpath/CMakeLists.txt
index 75f11d119..c2ee2f62f 100644
--- a/xpath/CMakeLists.txt
+++ b/xpath/CMakeLists.txt
@@ -9,6 +9,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )

From 51673cff9e3c3f7c0e7247d3e6b68a681677478f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Feb 2021 22:46:29 +1100
Subject: [PATCH 0347/1056] packaging: c++ package: csv-eval dependency removed

---
 CMakeLists.txt | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index fd2c15a53..80ee85ab4 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -347,7 +347,8 @@ set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR "0" CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH "0" CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS_POLICY ON )

From cc1d1cf7ffd86e77f9ba88154b6f2fc3ba27909e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Feb 2021 23:26:47 +1100
Subject: [PATCH 0348/1056] packaging: python: fixing lintian errors: README
 added

---
 python/README | 24 ++++++++++++++++++++++++
 1 file changed, 24 insertions(+)
 create mode 100644 python/README

diff --git a/python/README b/python/README
new file mode 100644
index 000000000..5dbc6e10a
--- /dev/null
+++ b/python/README
@@ -0,0 +1,24 @@
+comma, generic python components and command-line
+utilities for quick and efficient data manipulation, especially streams
+of CSV and binary data, protocol packets, structured data (e.g. JSON), etc
+
+# installation from source
+
+Quickest way (works on Ubuntu 18.04 or higher with ansible playbook version 2.5 or higher):
+
+> mkdir src
+> cd src
+> git clone <repo>
+> ansible-playbook comma/system/ansible/install.yml --ask-become-pass
+
+Manual way:
+
+> mkdir -p src build/comma
+> cd src
+> git clone https://gitlab.com/orthographic/comma
+> cd ../build/comma
+> cmake ../../src/comma
+> make
+> sudo make install
+
+Read install.yml, if interested in tweaking build configuration.

From 0d62de1b2d835526e562409e710bbb5b3d3d40d2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Feb 2021 12:28:28 +1100
Subject: [PATCH 0349/1056] packaging... maddening...

---
 CMakeLists.txt                           |  1 +
 system/package/debian/Dockerfile         |  2 +-
 system/package/debian/comma-package-make | 13 ++++++++++---
 3 files changed, 12 insertions(+), 4 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 80ee85ab4..6d7e6303c 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -331,6 +331,7 @@ if( CMAKE_COMPILER_IS_GNUCXX )
     endif( CMAKE_BUILD_TYPE STREQUAL "Release" )
 endif( CMAKE_COMPILER_IS_GNUCXX )
 install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma )
+install( FILES "${PROJECT_SOURCE_DIR}/copyright" DESTINATION share/doc/comma )
 
 set( CPACK_PACKAGE_NAME "comma" )
 #set( CPACK_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
diff --git a/system/package/debian/Dockerfile b/system/package/debian/Dockerfile
index 8139bd50b..a3290cdc4 100644
--- a/system/package/debian/Dockerfile
+++ b/system/package/debian/Dockerfile
@@ -4,7 +4,7 @@ ENV DEBIAN_FRONTEND="noninteractive"
 RUN apt update \
     && apt install --yes apt-utils \
     && apt install --yes software-properties-common \
-    && apt install --yes ansible git build-essential cmake cmake-curses-gui python3-pip
+    && apt install --yes ansible git build-essential cmake cmake-curses-gui python3-pip devscripts
 RUN apt install --yes python3-stdeb
 RUN apt install --yes python3-all
 RUN apt install --yes dh-python
diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index a2aa477fc..3d6f55e1b 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -21,11 +21,17 @@ esac
     cd ~/src/comma/python
     echo "$0: setting up python in $( pwd )" >&2
     python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
-    cd ~/build/comma
-    echo "$0: running cmake in $( pwd )" >&2
     
-    # todo? -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu
     
+    #https://shallowsky.com/blog/programming/packaging-launchpad-ppas.html
+    # todo: python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright
+    # todo: optionally gpg key
+    # todo? add lintian check?
+    # todo? or do all above outside of this script?
+    
+    
+    cd ~/build/comma
+    echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB \
             -DBUILD_PYTHON_PACKAGES=ON \
             -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
@@ -40,6 +46,7 @@ esac
             -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \
             -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \
             -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  \
+            -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
             -Dcomma_build_io_rabbit_cat=OFF || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
     cpack || die "failed"

From b04c766136a012975339ef95b33cee45edb31e31 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Feb 2021 13:24:21 +1100
Subject: [PATCH 0350/1056] packaging: fixed lintian errors, todo: new error to
 fix after gpg-signing the package: misplaced-extra-member-in-deb

---
 system/package/debian/comma-package-make | 17 +++++++++--------
 system/package/debian/readme             |  6 ++++++
 2 files changed, 15 insertions(+), 8 deletions(-)

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index 3d6f55e1b..ffad1b966 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -20,16 +20,17 @@ esac
 (
     cd ~/src/comma/python
     echo "$0: setting up python in $( pwd )" >&2
-    python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
-    
-    
+    #python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
+    echo "$0: running python3 setup.py ..." >&2
+    python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright || die "failed"
+    echo "$0: building package..." >&2
+    cd deb_dist/comma-$version_major.$version_minor.$version_patch || die "failed"
+    dpkg-buildpackage -rfakeroot -uc -us || die "failed"
     #https://shallowsky.com/blog/programming/packaging-launchpad-ppas.html
-    # todo: python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright
-    # todo: optionally gpg key
+    # todo? optionally gpg key
     # todo? add lintian check?
-    # todo? or do all above outside of this script?
-    
-    
+    # todo? or do all above outside of this script using:
+    #       debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-1.0.0-Linux.deb
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB \
diff --git a/system/package/debian/readme b/system/package/debian/readme
index 9fda7985a..aa4ebd980 100644
--- a/system/package/debian/readme
+++ b/system/package/debian/readme
@@ -19,3 +19,9 @@ test that package is ok, e.g:
 
 > ./comma-package-docker-test 20.04 comma-1.2.3-Linux.deb python3-comma_1.2.3-1_all.deb
 
+sign packages, e.g:
+
+> debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-1.0.0-Linux.deb
+> debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 python3-comma_1.0.0-1_all.deb
+
+todo: fix lintian misplaced-extra-member-in-deb, which happens after gpg-signing

From 29e16933ea9a5c15fadac533544b79673c2dc075 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Feb 2021 18:31:58 +1100
Subject: [PATCH 0351/1056] system/package/debian/examples/package-python
 added; it still does not quite work

---
 python/requirements.txt                       |  1 +
 python/setup.py                               |  7 ++++---
 system/package/debian/comma-package-make      | 17 +++++++++++++----
 system/package/debian/examples/package-python | 11 +++++++++++
 4 files changed, 29 insertions(+), 7 deletions(-)
 create mode 100644 python/requirements.txt
 create mode 100755 system/package/debian/examples/package-python

diff --git a/python/requirements.txt b/python/requirements.txt
new file mode 100644
index 000000000..24ce15ab7
--- /dev/null
+++ b/python/requirements.txt
@@ -0,0 +1 @@
+numpy
diff --git a/python/setup.py b/python/setup.py
index 8e69a4204..08cddec68 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -1,10 +1,11 @@
 #!/usr/bin/env python
 
-from distutils.core import setup # from setuptools import setup
+from distutils.core import setup
+#from setuptools import setup
 import comma.version
 
 setup(
-        name                = 'comma',
+        name                = 'python3-comma', # quick and dirty to make python packaging work
         version             = comma.version.__version__,
         classifiers = [
           'Environment :: Console',
@@ -18,7 +19,7 @@
           'Topic :: Communications :: Email'
         ],
         description         = 'comma python utilities',
-        install_requires    = [ 'numpy' ],
+        #install_requires    = [ 'numpy' ],
         url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
         long_description    = 'comma python utilities for offline and streamed csv and fixed width data',
diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index ffad1b966..fc4df215c 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -22,14 +22,23 @@ esac
     echo "$0: setting up python in $( pwd )" >&2
     #python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
     echo "$0: running python3 setup.py ..." >&2
-    python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright || die "failed"
+    python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright --suite focal  || die "failed"
+    # todo: mount gpg key
+    # debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/python3-comma_1.0.0-1.dsc
+    # mkdir tmp
+    # cd tmp
+    # dpkg-source -x ../deb_dist/python3-comma_1.0.0-1.dsc
+    # cd python3-comma-1.0.0
+    # debuild -S -sa
+    # dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes
+    # ? debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 ../../deb_dist/python3-comma_1.0.0-1_source.changes
+    # 
+    # ...
     echo "$0: building package..." >&2
     cd deb_dist/comma-$version_major.$version_minor.$version_patch || die "failed"
     dpkg-buildpackage -rfakeroot -uc -us || die "failed"
     #https://shallowsky.com/blog/programming/packaging-launchpad-ppas.html
-    # todo? optionally gpg key
-    # todo? add lintian check?
-    # todo? or do all above outside of this script using:
+    # todo? or do all above outside of this script using something like (but also see above):
     #       debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-1.0.0-Linux.deb
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
diff --git a/system/package/debian/examples/package-python b/system/package/debian/examples/package-python
new file mode 100755
index 000000000..7f27ffb45
--- /dev/null
+++ b/system/package/debian/examples/package-python
@@ -0,0 +1,11 @@
+#!/bin/bash
+
+cd ~/src/comma/python
+rm -rf deb_disc tmp
+python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright --suite focal --package python3-comma
+debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/python3-comma_1.0.0-1.dsc
+mkdir tmp
+dpkg-source -x ../deb_dist/python3-comma_1.0.0-1.dsc
+cd python3-comma-1.0.0
+debuild -S -sa
+dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes

From 3a92da3a900fad46c4b50145b54a6d2dc6505770 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Feb 2021 18:37:12 +1100
Subject: [PATCH 0352/1056] system/package/debian/examples/package-python: typo
 fixed

---
 system/package/debian/examples/package-python | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/system/package/debian/examples/package-python b/system/package/debian/examples/package-python
index 7f27ffb45..f9fbc84d4 100755
--- a/system/package/debian/examples/package-python
+++ b/system/package/debian/examples/package-python
@@ -1,10 +1,11 @@
 #!/bin/bash
 
 cd ~/src/comma/python
-rm -rf deb_disc tmp
+rm -rf deb_dist dist tmp
 python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright --suite focal --package python3-comma
 debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/python3-comma_1.0.0-1.dsc
 mkdir tmp
+cd tmp
 dpkg-source -x ../deb_dist/python3-comma_1.0.0-1.dsc
 cd python3-comma-1.0.0
 debuild -S -sa

From 6a64ac5219e047f71880e68d63876156ce83814a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Feb 2021 18:59:33 +1100
Subject: [PATCH 0353/1056] system/package/debian/examples/package-python:
 testing...

---
 system/package/debian/examples/package-python | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/system/package/debian/examples/package-python b/system/package/debian/examples/package-python
index f9fbc84d4..27b569d14 100755
--- a/system/package/debian/examples/package-python
+++ b/system/package/debian/examples/package-python
@@ -2,11 +2,11 @@
 
 cd ~/src/comma/python
 rm -rf deb_dist dist tmp
-python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright --suite focal --package python3-comma
+python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright --suite focal --package python3-comma --build-depends python3-numpy
 debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/python3-comma_1.0.0-1.dsc
 mkdir tmp
 cd tmp
 dpkg-source -x ../deb_dist/python3-comma_1.0.0-1.dsc
 cd python3-comma-1.0.0
 debuild -S -sa
-dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes
+dput ppa:orthographic/test-ppa ../python3-comma_1.0.0-1_source.changes #dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes

From 1d66175b23dde9c6101c6561dfb20d5c5cf11f1b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 13 Feb 2021 11:17:23 +1100
Subject: [PATCH 0354/1056] cmake: improving for building with shared
 libraries...

---
 CMakeLists.txt             | 18 ++++++++++++------
 application/CMakeLists.txt |  2 +-
 base/CMakeLists.txt        |  2 +-
 csv/CMakeLists.txt         |  2 +-
 io/CMakeLists.txt          |  2 +-
 name_value/CMakeLists.txt  |  2 +-
 string/CMakeLists.txt      |  2 +-
 xpath/CMakeLists.txt       |  2 +-
 8 files changed, 19 insertions(+), 13 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 6d7e6303c..cf2f199e2 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -116,6 +116,10 @@ SET( EXECUTABLE_OUTPUT_PATH
      ${PROJECT_BINARY_DIR}/bin CACHE PATH
      "Single output directory for building all executables." )
 
+set( comma_version_major "1" ) # quick and dirty
+set( comma_version_minor "0" ) # quick and dirty
+set( comma_version_patch "0" ) # quick and dirty
+     
 SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" )
 
 IF( NOT comma_INSTALL_BIN_DIR )
@@ -126,7 +130,9 @@ IF( NOT comma_INSTALL_INCLUDE_DIR )
     SET( comma_INSTALL_INCLUDE_DIR include/${PROJECT_NAME} )
 ENDIF( NOT comma_INSTALL_INCLUDE_DIR )
 
-set( comma_INSTALL_LIB_DIR lib CACHE PATH "library install directory" )
+if( NOT comma_INSTALL_LIB_DIR ) # voodoo
+  set( comma_INSTALL_LIB_DIR lib )
+endif( NOT comma_INSTALL_LIB_DIR )
 
 IF( NOT comma_INSTALL_PACKAGE_DIR )
   SET( comma_INSTALL_PACKAGE_DIR CMakeFiles )
@@ -330,8 +336,8 @@ if( CMAKE_COMPILER_IS_GNUCXX )
         set( CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -s" )
     endif( CMAKE_BUILD_TYPE STREQUAL "Release" )
 endif( CMAKE_COMPILER_IS_GNUCXX )
-install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma )
-install( FILES "${PROJECT_SOURCE_DIR}/copyright" DESTINATION share/doc/comma )
+install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
+install( FILES "${PROJECT_SOURCE_DIR}/copyright" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
 
 set( CPACK_PACKAGE_NAME "comma" )
 #set( CPACK_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
@@ -344,9 +350,9 @@ set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${PROJECT_SOURCE_DIR}/system/package/de
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/copyright" )
 set( CPACK_GENERATOR "DEB" CACHE STRING "cpack generator: PRM or DEB" )
-set( CPACK_PACKAGE_VERSION_MAJOR "1" CACHE STRING "cpack version major" )
-set( CPACK_PACKAGE_VERSION_MINOR "0" CACHE STRING "cpack version minor" )
-set( CPACK_PACKAGE_VERSION_PATCH "0" CACHE STRING "cpack version patch" )
+set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} CACHE STRING "cpack version major" )
+set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} CACHE STRING "cpack version minor" )
+set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
diff --git a/application/CMakeLists.txt b/application/CMakeLists.txt
index 34dc6450c..fe718a5d2 100644
--- a/application/CMakeLists.txt
+++ b/application/CMakeLists.txt
@@ -9,7 +9,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${comma_ALL_EXTERNAL_LIBRARIES} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
diff --git a/base/CMakeLists.txt b/base/CMakeLists.txt
index 24a821c9c..4c4d6dc08 100644
--- a/base/CMakeLists.txt
+++ b/base/CMakeLists.txt
@@ -7,7 +7,7 @@ SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 
 install( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 install( TARGETS ${TARGET_NAME}
diff --git a/csv/CMakeLists.txt b/csv/CMakeLists.txt
index e7224c25e..a607236b7 100644
--- a/csv/CMakeLists.txt
+++ b/csv/CMakeLists.txt
@@ -13,7 +13,7 @@ ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_source} ${impl_includes
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
diff --git a/io/CMakeLists.txt b/io/CMakeLists.txt
index 45bf14547..e4d3a4fdf 100644
--- a/io/CMakeLists.txt
+++ b/io/CMakeLists.txt
@@ -18,7 +18,7 @@ ENDIF( comma_BUILD_ZEROMQ )
 
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
diff --git a/name_value/CMakeLists.txt b/name_value/CMakeLists.txt
index 2818652e1..9c2a3048e 100644
--- a/name_value/CMakeLists.txt
+++ b/name_value/CMakeLists.txt
@@ -14,7 +14,7 @@ ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 INSTALL(
     TARGETS ${TARGET_NAME}
     RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
diff --git a/string/CMakeLists.txt b/string/CMakeLists.txt
index 471778c05..8b24fab83 100644
--- a/string/CMakeLists.txt
+++ b/string/CMakeLists.txt
@@ -7,7 +7,7 @@ SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL(
diff --git a/xpath/CMakeLists.txt b/xpath/CMakeLists.txt
index c2ee2f62f..2053921d4 100644
--- a/xpath/CMakeLists.txt
+++ b/xpath/CMakeLists.txt
@@ -9,7 +9,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${CPACK_PACKAGE_VERSION_MAJOR} ${CPACK_PACKAGE_VERSION_MINOR} ${CPACK_PACKAGE_VERSION_PATCH} )
+set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )

From 4054b96b1fe00700417587a93aa75347398f2c20 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 13 Feb 2021 11:30:18 +1100
Subject: [PATCH 0355/1056] copyright renamed back to copying

---
 CMakeLists.txt       | 21 ++++++++-------------
 copyright => COPYING |  0
 2 files changed, 8 insertions(+), 13 deletions(-)
 rename copyright => COPYING (100%)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index cf2f199e2..fdacfb36c 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -54,14 +54,9 @@ ELSE() # Probably windows; gets hardcoded patch version
 	SET ( COMMITHASH "abc" )
 ENDIF()
 
-# ---------------------------------------------------------------------------
-# set compiler and linker flags and variables
-
-IF(NOT CMAKE_BUILD_TYPE)
-  SET(CMAKE_BUILD_TYPE RelWithDebInfo CACHE STRING
-      "Choose the type of build, options are: None Debug Release RelWithDebInfo MinSizeRel."
-      FORCE)
-ENDIF(NOT CMAKE_BUILD_TYPE)
+if( NOT CMAKE_BUILD_TYPE )
+  set( CMAKE_BUILD_TYPE Release CACHE STRING "Choose the type of build, options are: None Debug Release RelWithDebInfo MinSizeRel." FORCE )
+endif( NOT CMAKE_BUILD_TYPE )
 
 IF(WIN32)
   SET(CMAKE_CXX_WARNING_LEVEL 4)
@@ -158,7 +153,7 @@ SET( comma_BUILD_APPLICATIONS ${BUILD_APPLICATIONS} )
 
 OPTION( comma_BUILD_ZEROMQ "build io with zeromq support" OFF )
 
-OPTION(BUILD_SHARED_LIBS "build with shared libraries" OFF)
+option( BUILD_SHARED_LIBS "build with shared libraries" ON ) # option( BUILD_SHARED_LIBS "build with shared libraries" OFF )
 
 OPTION( comma_BUILD_XML "build xml" OFF )
 
@@ -293,7 +288,7 @@ CONFIGURE_FILE( ${PROJECT_SOURCE_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake.in
 
 set( comma_PACKAGE_CMAKEFILES ${comma_PACKAGE_CMAKEFILES} ${PROJECT_BINARY_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake )
 install( FILES ${comma_PACKAGE_CMAKEFILES} DESTINATION ${comma_INSTALL_PACKAGE_DIR} )
-install( FILES ${PROJECT_SOURCE_DIR}/copyright DESTINATION share/doc/comma ) # quick and dirty
+#install( FILES ${PROJECT_SOURCE_DIR}/copyright DESTINATION share/doc/comma ) # quick and dirty
 
 #-----------------------------------------------------------------------------
 # add sources
@@ -336,8 +331,8 @@ if( CMAKE_COMPILER_IS_GNUCXX )
         set( CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -s" )
     endif( CMAKE_BUILD_TYPE STREQUAL "Release" )
 endif( CMAKE_COMPILER_IS_GNUCXX )
-install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
-install( FILES "${PROJECT_SOURCE_DIR}/copyright" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
+#install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
+#install( FILES "${PROJECT_SOURCE_DIR}/copyright" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
 
 set( CPACK_PACKAGE_NAME "comma" )
 #set( CPACK_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
@@ -348,7 +343,7 @@ set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma/-/wiki
 set( CPACK_DEBIAN_PACKAGE_MAINTAINER "vsevolod vlaskine <vsevolod.vlaskine@gmail.com>" )
 set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${PROJECT_SOURCE_DIR}/system/package/debian/changelog" )
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
-set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/copyright" )
+set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/COPYING" )
 set( CPACK_GENERATOR "DEB" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} CACHE STRING "cpack version minor" )
diff --git a/copyright b/COPYING
similarity index 100%
rename from copyright
rename to COPYING

From 4daa6167d6355a7325d9fa4aebb020d173d5a77a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 14 Feb 2021 11:51:26 +1100
Subject: [PATCH 0356/1056] cmake: run ldconfig when installing shared libs

---
 CMakeLists.txt | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index fdacfb36c..cf0fe8b66 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -331,6 +331,9 @@ if( CMAKE_COMPILER_IS_GNUCXX )
         set( CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -s" )
     endif( CMAKE_BUILD_TYPE STREQUAL "Release" )
 endif( CMAKE_COMPILER_IS_GNUCXX )
+if( BUILD_SHARED_LIBS )
+    install( CODE "execute_process( COMMAND \"/sbin/ldconfig\" )" ) # is it the right way? does it run at the right time?
+endif( BUILD_SHARED_LIBS )
 #install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
 #install( FILES "${PROJECT_SOURCE_DIR}/copyright" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
 

From 138c5b5bbfd4befe320c42a89f3b70ddabdccac5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 14 Feb 2021 12:25:14 +1100
Subject: [PATCH 0357/1056] cmake: run ldconfig when installing shared libs:
 (hopefully) made sure it runs last

---
 CMakeFiles/post_install/CMakeLists.txt | 4 ++++
 CMakeLists.txt                         | 9 ++-------
 2 files changed, 6 insertions(+), 7 deletions(-)
 create mode 100644 CMakeFiles/post_install/CMakeLists.txt

diff --git a/CMakeFiles/post_install/CMakeLists.txt b/CMakeFiles/post_install/CMakeLists.txt
new file mode 100644
index 000000000..65acf3bd4
--- /dev/null
+++ b/CMakeFiles/post_install/CMakeLists.txt
@@ -0,0 +1,4 @@
+if( BUILD_SHARED_LIBS )
+    install( CODE "execute_process( COMMAND /sbin/ldconfig )" )
+endif( BUILD_SHARED_LIBS )
+
diff --git a/CMakeLists.txt b/CMakeLists.txt
index cf0fe8b66..fe09015fd 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -331,11 +331,8 @@ if( CMAKE_COMPILER_IS_GNUCXX )
         set( CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -s" )
     endif( CMAKE_BUILD_TYPE STREQUAL "Release" )
 endif( CMAKE_COMPILER_IS_GNUCXX )
-if( BUILD_SHARED_LIBS )
-    install( CODE "execute_process( COMMAND \"/sbin/ldconfig\" )" ) # is it the right way? does it run at the right time?
-endif( BUILD_SHARED_LIBS )
-#install( FILES "${PROJECT_SOURCE_DIR}/system/package/debian/changelog.gz" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
-#install( FILES "${PROJECT_SOURCE_DIR}/copyright" DESTINATION share/doc/comma ) # todo: remove - cannot use cpack for ubuntu ppa anyway
+
+add_subdirectory( CMakeFiles/post_install ) # uber-quick and dirty
 
 set( CPACK_PACKAGE_NAME "comma" )
 #set( CPACK_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
@@ -398,5 +395,3 @@ INCLUDE( InstallRequiredSystemLibraries )
 
 #this line does all the work. Actually, even if this is the only line, you get all but the dlls...
 INCLUDE( CPack )
-
-

From abb5a0e11291aa6facc2893b3acbeec2c67df152 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 14 Feb 2021 12:30:40 +1100
Subject: [PATCH 0358/1056] cmake: run ldconfig when installing shared libs:
 made more verbose

---
 CMakeFiles/post_install/CMakeLists.txt | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/CMakeFiles/post_install/CMakeLists.txt b/CMakeFiles/post_install/CMakeLists.txt
index 65acf3bd4..cf00749b3 100644
--- a/CMakeFiles/post_install/CMakeLists.txt
+++ b/CMakeFiles/post_install/CMakeLists.txt
@@ -1,4 +1,6 @@
 if( BUILD_SHARED_LIBS )
+    install( CODE "message( \"ldconfig: running...\" )" )
     install( CODE "execute_process( COMMAND /sbin/ldconfig )" )
+    install( CODE "message( \"ldconfig: done\" )" )
 endif( BUILD_SHARED_LIBS )
 

From 369d443c28c8c545f55d2f6a94fb76b42b858a67 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 24 Feb 2021 15:28:47 +1100
Subject: [PATCH 0359/1056] io-cat,io-publish: demote a couple of messages to
 verbose only

---
 io/applications/io-cat.cpp     | 2 +-
 io/applications/io-publish.cpp | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index ad2e13d68..03a6a6dd4 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -336,7 +336,7 @@ int main( int argc, char** argv )
         unsigned int round_robin_count = unnamed.size() > 1 ? options.value( "--round-robin", 0 ) : 0;
         for( bool done = false; !done; )
         {
-            if( is_shutdown ) { std::cerr << "io-cat: received signal" << std::endl; break; }
+            if( is_shutdown ) { if( verbose ) { std::cerr << "io-cat: received signal" << std::endl; }; break; }
             bool connected_all_we_could = try_connect( streams, select );
             if( !ready( streams, select, connected_all_we_could ) ) { continue; }
             done = true;
diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 36b3c8a80..703fa2320 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -241,7 +241,7 @@ class publish
             if( update_no_clients_ )
             {
                 if( total > 0 ) { got_first_client_ever_ = true; }
-                else if( got_first_client_ever_ ) { std::cerr << "io-publish: the last client exited" << std::endl; return false; }
+                else if( got_first_client_ever_ ) { comma::verbose << "the last client exited" << std::endl; return false; }
             }
             return true;
         }

From 49e77aaaf037d8da489fc9e6d4985e0d62f1017f Mon Sep 17 00:00:00 2001
From: Navid P <navidp@acfr.usyd.edu.au>
Date: Fri, 22 Mar 2019 12:37:51 +1100
Subject: [PATCH 0360/1056] csv-repeat: added append field repeat_count

---
 csv/applications/csv-repeat.cpp | 23 +++++++++++++++++------
 1 file changed, 17 insertions(+), 6 deletions(-)

diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index 910d112da..08e61ed79 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -86,6 +86,7 @@ void usage( bool verbose = false )
     std::cerr << "    --append fields are appended to output; supported fields are:" << std::endl;
     std::cerr << "        time: append timestamp" << std::endl;
     std::cerr << "        repeating: 1 if currently repeating" << std::endl;
+    std::cerr << "        repeat_count: 0 if not repeated, otherwise counts up for consecutive repeating records" << std::endl;
     std::cerr << std::endl;
     if( verbose )
     {
@@ -120,8 +121,9 @@ struct output_t
 {
     boost::posix_time::ptime time;
     bool repeating;
-    output_t() : repeating( false ) {}
-    output_t( const boost::posix_time::ptime& time, bool repeating ) : time( time ), repeating( repeating ) {}
+    unsigned repeat_count;
+    output_t() : repeating( false ), repeat_count(0) {}
+    output_t( const boost::posix_time::ptime& time, bool repeating, unsigned repeat_count=0 ) : time( time ), repeating( repeating ), repeat_count(repeat_count) {}
 };
 
 namespace comma { namespace visiting {
@@ -138,11 +140,13 @@ template <> struct traits< output_t >
     {
         v.apply( "time", p.time );
         v.apply( "repeating", p.repeating );
+        v.apply( "repeat_count", p.repeat_count );
     }
     template < typename K, typename V > static void visit( const K&, output_t& p, V& v )
     {
         v.apply( "time", p.time );
         v.apply( "repeating", p.repeating );
+        v.apply( "repeat_count", p.repeat_count );
     }
 };
     
@@ -321,6 +325,9 @@ int main( int ac, char** av )
         std::string last_line;
         std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
         bool repeating = false;
+        unsigned int repeat_count = 0;
+        bool pace = options.exists( "--pace" );
+        if( pace && !period ) { std::cerr << "csv-repeat: for --pace, please specify --period" << std::endl; return 1; }
         while( is->good() && !end_of_stream )
         {
             select.wait( repeating ? *period : timeout );
@@ -362,11 +369,14 @@ int main( int ac, char** av )
                     else { std::cout << std::endl; }
                 }
                 end_of_stream = repeating = false;
+                repeat_count = 0;
+                if( pace ) { boost::this_thread::sleep( *period ); } // todo: quick and dirty; fix it properly for --pace, to make sure sleep happens after each record only once
             }
             if( !is->good() || end_of_stream ) { break; }
             if( repeating )
             {
                 if( !period ) { std::cerr << "csv-repeat: input data timed out" << std::endl; return 1; }
+                repeat_count++;
                 if( csv.binary() )
                 {
                     if( last_record )
@@ -374,7 +384,7 @@ int main( int ac, char** av )
                         std::cout.write( last_record, record_size );
                         /// do not do it! see the note inside csv::stream.h, search for passed<> class template
                         /// ::write( 1, last_record, record_size );
-                        if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true ) ); }
+                        if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, repeat_count ) ); }
                     }
                 }
                 else
@@ -385,7 +395,7 @@ int main( int ac, char** av )
                         if( ostream )
                         {
                             std::cout << csv.delimiter;
-                            ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true ) );
+                            ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, repeat_count ) );
                         }
                         else { std::cout << std::endl; }
                     }
@@ -400,19 +410,20 @@ int main( int ac, char** av )
             {
                 boost::this_thread::sleep( *period ); // quick and dirty
                 if( is_shutdown ) { break; }
+                repeat_count++;
                 if( csv.binary() )
                 {
                     if( !last_record ) { break; }
                     std::cout.write( last_record, record_size );
                     /// do not do it! see the note inside csv::stream.h, search for passed<> class template
                     /// ::write( 1, last_record, record_size );
-                    if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true ) ); }
+                    if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, repeat_count ) ); }
                 }
                 else
                 {
                     if( last_line.empty() ) { break; }
                     std::cout << last_line;
-                    if( ostream ) { std::cout << csv.delimiter; ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true ) ); }
+                    if( ostream ) { std::cout << csv.delimiter; ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, repeat_count ) ); }
                     else { std::cout << std::endl; }
                 }
                 std::cout.flush();

From 62d941559cd5be7e590b0822aa4b09c5bd59370d Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Fri, 3 May 2019 12:45:10 +1000
Subject: [PATCH 0361/1056] csv-calc: added example to help

---
 csv/applications/csv-calc.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 630e6fc10..82f7979fc 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -142,6 +142,7 @@ static void usage( bool verbose )
     }
     std::cerr << "examples" << std::endl;
     std::cerr << "    seq 1 1000 | " << comma::verbose.app_name() << " percentile=0.9" << std::endl;
+    std::cerr << "    seq 1 1000 | " << comma::verbose.app_name() << " percentile=0.1,percentile=0.9" << std::endl;
     std::cerr << "    seq 1 1000 | " << comma::verbose.app_name() << " percentile=0.9:interpolate --verbose" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | " << comma::verbose.app_name() << " --fields=a,block percentile=0.9" << std::endl;

From 058ed9725796eaea8d2e1d22ed1eb7ba14f28fa6 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 28 Mar 2019 14:43:44 +1100
Subject: [PATCH 0362/1056] name-value-to-csv: fix application name in help
 examples

---
 name_value/applications/name-value-to-csv.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index cadd823e4..104f08f1f 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -32,7 +32,7 @@ static void usage( bool )
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    indexed data" << std::endl;
-    std::cerr << "        cat <<EOF | $scriptname --fields=name,value,status --prefix=my/test" << std::endl;
+    std::cerr << "        cat <<EOF | name-value-to-csv --fields=name,value,status --prefix=my/test" << std::endl;
     std::cerr << "        my/test[0]/name=a" << std::endl;
     std::cerr << "        my/test[0]/value=10" << std::endl;
     std::cerr << "        my/test[0]/status=0" << std::endl;

From 89a1bb48d87fb612547d30f30a5451c80c92ce10 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Wed, 15 May 2019 11:53:14 +1000
Subject: [PATCH 0363/1056] bash_completion.d/comma: fixed copyright year

---
 etc/bash_completion.d/comma | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/etc/bash_completion.d/comma b/etc/bash_completion.d/comma
index 0911896ae..332b588da 100644
--- a/etc/bash_completion.d/comma
+++ b/etc/bash_completion.d/comma
@@ -1,5 +1,5 @@
 # This file is part of comma, a generic and flexible library
-# Copyright (c) 2011 The University of Sydney
+# Copyright (c) 2015 The University of Sydney
 # All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without

From a198971c02b1835b9159ba5f701707263eb71ace Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Fri, 24 May 2019 16:26:38 +1000
Subject: [PATCH 0364/1056] csv-thin: fixed app name in error message

---
 csv/applications/csv-thin.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index 9637d3d64..e9ce3d778 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -251,7 +251,7 @@ int main( int ac, char** av )
         }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << "csv-size: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-size: unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "csv-thin: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-thin: unknown exception" << std::endl; }
     return 1;
 }

From e2cc85f1838e7d6b534a260ab40ae492e6dccc41 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Wed, 17 Jul 2019 09:45:37 +1000
Subject: [PATCH 0365/1056] CMakeLists.txt: changed hint line so it will fit in
 80 columns

---
 CMakeLists.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index fe09015fd..eec526472 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -55,7 +55,7 @@ ELSE() # Probably windows; gets hardcoded patch version
 ENDIF()
 
 if( NOT CMAKE_BUILD_TYPE )
-  set( CMAKE_BUILD_TYPE Release CACHE STRING "Choose the type of build, options are: None Debug Release RelWithDebInfo MinSizeRel." FORCE )
+  set( CMAKE_BUILD_TYPE Release CACHE STRING "options are: None Debug Release RelWithDebInfo MinSizeRel." FORCE )
 endif( NOT CMAKE_BUILD_TYPE )
 
 IF(WIN32)

From 5fdaaa28b56490bd233231547f8c8321bec72b69 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 11 Mar 2021 11:16:56 +1100
Subject: [PATCH 0366/1056] csv-repeat: rename append field from repeat_count
 to count

---
 csv/applications/csv-repeat.cpp | 29 +++++++++++++++--------------
 1 file changed, 15 insertions(+), 14 deletions(-)

diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index 08e61ed79..6cef51af5 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -86,7 +86,7 @@ void usage( bool verbose = false )
     std::cerr << "    --append fields are appended to output; supported fields are:" << std::endl;
     std::cerr << "        time: append timestamp" << std::endl;
     std::cerr << "        repeating: 1 if currently repeating" << std::endl;
-    std::cerr << "        repeat_count: 0 if not repeated, otherwise counts up for consecutive repeating records" << std::endl;
+    std::cerr << "        count: counts up from zero for consecutive repeating records" << std::endl;
     std::cerr << std::endl;
     if( verbose )
     {
@@ -121,9 +121,9 @@ struct output_t
 {
     boost::posix_time::ptime time;
     bool repeating;
-    unsigned repeat_count;
-    output_t() : repeating( false ), repeat_count(0) {}
-    output_t( const boost::posix_time::ptime& time, bool repeating, unsigned repeat_count=0 ) : time( time ), repeating( repeating ), repeat_count(repeat_count) {}
+    unsigned count;
+    output_t() : repeating( false ), count( 0 ) {}
+    output_t( const boost::posix_time::ptime& time, bool repeating, unsigned count=0 ) : time( time ), repeating( repeating ), count( count ) {}
 };
 
 namespace comma { namespace visiting {
@@ -140,13 +140,13 @@ template <> struct traits< output_t >
     {
         v.apply( "time", p.time );
         v.apply( "repeating", p.repeating );
-        v.apply( "repeat_count", p.repeat_count );
+        v.apply( "count", p.count );
     }
     template < typename K, typename V > static void visit( const K&, output_t& p, V& v )
     {
         v.apply( "time", p.time );
         v.apply( "repeating", p.repeating );
-        v.apply( "repeat_count", p.repeat_count );
+        v.apply( "count", p.count );
     }
 };
     
@@ -184,6 +184,7 @@ int main( int ac, char** av )
                     {
                         if( v[i] == "repeating" ) { format += comma + 'b'; }
                         else if( v[i] == "time" ) { format += comma + 't'; }
+                        else if( v[i] == "count" ) { format += comma + "ui"; }
                         else { std::cerr << "csv-repeat: expected one of: " << comma::join( comma::csv::names< output_t >( false ), ',' ) << "; got: \"" << v[i] << "\"" << std::endl; return 1; }
                         comma = ",";
                     }
@@ -325,7 +326,7 @@ int main( int ac, char** av )
         std::string last_line;
         std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
         bool repeating = false;
-        unsigned int repeat_count = 0;
+        unsigned int count = 0;
         bool pace = options.exists( "--pace" );
         if( pace && !period ) { std::cerr << "csv-repeat: for --pace, please specify --period" << std::endl; return 1; }
         while( is->good() && !end_of_stream )
@@ -369,14 +370,14 @@ int main( int ac, char** av )
                     else { std::cout << std::endl; }
                 }
                 end_of_stream = repeating = false;
-                repeat_count = 0;
+                count = 0;
                 if( pace ) { boost::this_thread::sleep( *period ); } // todo: quick and dirty; fix it properly for --pace, to make sure sleep happens after each record only once
             }
             if( !is->good() || end_of_stream ) { break; }
             if( repeating )
             {
                 if( !period ) { std::cerr << "csv-repeat: input data timed out" << std::endl; return 1; }
-                repeat_count++;
+                count++;
                 if( csv.binary() )
                 {
                     if( last_record )
@@ -384,7 +385,7 @@ int main( int ac, char** av )
                         std::cout.write( last_record, record_size );
                         /// do not do it! see the note inside csv::stream.h, search for passed<> class template
                         /// ::write( 1, last_record, record_size );
-                        if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, repeat_count ) ); }
+                        if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, count ) ); }
                     }
                 }
                 else
@@ -395,7 +396,7 @@ int main( int ac, char** av )
                         if( ostream )
                         {
                             std::cout << csv.delimiter;
-                            ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, repeat_count ) );
+                            ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, count ) );
                         }
                         else { std::cout << std::endl; }
                     }
@@ -410,20 +411,20 @@ int main( int ac, char** av )
             {
                 boost::this_thread::sleep( *period ); // quick and dirty
                 if( is_shutdown ) { break; }
-                repeat_count++;
+                count++;
                 if( csv.binary() )
                 {
                     if( !last_record ) { break; }
                     std::cout.write( last_record, record_size );
                     /// do not do it! see the note inside csv::stream.h, search for passed<> class template
                     /// ::write( 1, last_record, record_size );
-                    if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, repeat_count ) ); }
+                    if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, count ) ); }
                 }
                 else
                 {
                     if( last_line.empty() ) { break; }
                     std::cout << last_line;
-                    if( ostream ) { std::cout << csv.delimiter; ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, repeat_count ) ); }
+                    if( ostream ) { std::cout << csv.delimiter; ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, count ) ); }
                     else { std::cout << std::endl; }
                 }
                 std::cout.flush();

From d5974a6de898c92936bdab637014a7df37bda491 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 11 Mar 2021 11:17:48 +1100
Subject: [PATCH 0367/1056] csv-repeat: added tests for --append=count

---
 csv/test/csv-repeat/append/all/expected   | 22 +++++++++++
 csv/test/csv-repeat/append/all/input      |  2 +-
 csv/test/csv-repeat/append/count/expected | 45 +++++++++++++++++++++++
 csv/test/csv-repeat/append/count/input    | 12 ++++++
 4 files changed, 80 insertions(+), 1 deletion(-)
 create mode 100644 csv/test/csv-repeat/append/count/expected
 create mode 100644 csv/test/csv-repeat/append/count/input

diff --git a/csv/test/csv-repeat/append/all/expected b/csv/test/csv-repeat/append/all/expected
index 1f5958aeb..607742fc2 100644
--- a/csv/test/csv-repeat/append/all/expected
+++ b/csv/test/csv-repeat/append/all/expected
@@ -1,67 +1,89 @@
 ascii[0]/data=123
 ascii[0]/repeating=0
 ascii[0]/time=ascii[0]/timestamp +/- 0.01
+ascii[0]/count=0
 ascii[1]/data=456
 ascii[1]/repeating=0
 ascii[1]/time=ascii[1]/timestamp +/- 0.01
+ascii[1]/count=0
 ascii[2]/data=789
 ascii[2]/repeating=0
 ascii[2]/time=ascii[2]/timestamp +/- 0.01
+ascii[2]/count=0
 ascii[3]/data=789
 ascii[3]/repeating=1
 ascii[3]/time=ascii[3]/timestamp +/- 0.01
+ascii[3]/count=1
 ascii[4]/data=789
 ascii[4]/repeating=1
 ascii[4]/time=ascii[4]/timestamp +/- 0.01
+ascii[4]/count=2
 ascii[5]/data=789
 ascii[5]/repeating=1
 ascii[5]/time=ascii[5]/timestamp +/- 0.01
+ascii[5]/count=3
 ascii[6]/data=123
 ascii[6]/repeating=0
 ascii[6]/time=ascii[6]/timestamp +/- 0.01
+ascii[6]/count=0
 ascii[7]/data=456
 ascii[7]/repeating=0
 ascii[7]/time=ascii[7]/timestamp +/- 0.01
+ascii[7]/count=0
 ascii[8]/data=456
 ascii[8]/repeating=1
 ascii[8]/time=ascii[8]/timestamp +/- 0.01
+ascii[8]/count=1
 ascii[9]/data=456
 ascii[9]/repeating=1
 ascii[9]/time=ascii[9]/timestamp +/- 0.01
+ascii[9]/count=2
 ascii[10]/data=456
 ascii[10]/repeating=1
 ascii[10]/time=ascii[10]/timestamp +/- 0.01
+ascii[10]/count=3
 
 binary[0]/data=123
 binary[0]/repeating=0
 binary[0]/time=binary[0]/timestamp +/- 0.01
+binary[0]/count=0
 binary[1]/data=456
 binary[1]/repeating=0
 binary[1]/time=binary[1]/timestamp +/- 0.01
+binary[1]/count=0
 binary[2]/data=789
 binary[2]/repeating=0
 binary[2]/time=binary[2]/timestamp +/- 0.01
+binary[2]/count=0
 binary[3]/data=789
 binary[3]/repeating=1
 binary[3]/time=binary[3]/timestamp +/- 0.01
+binary[3]/count=1
 binary[4]/data=789
 binary[4]/repeating=1
 binary[4]/time=binary[4]/timestamp +/- 0.01
+binary[4]/count=2
 binary[5]/data=789
 binary[5]/repeating=1
 binary[5]/time=binary[5]/timestamp +/- 0.01
+binary[5]/count=3
 binary[6]/data=123
 binary[6]/repeating=0
 binary[6]/time=binary[6]/timestamp +/- 0.01
+binary[6]/count=0
 binary[7]/data=456
 binary[7]/repeating=0
 binary[7]/time=binary[7]/timestamp +/- 0.01
+binary[7]/count=0
 binary[8]/data=456
 binary[8]/repeating=1
 binary[8]/time=binary[8]/timestamp +/- 0.01
+binary[8]/count=1
 binary[9]/data=456
 binary[9]/repeating=1
 binary[9]/time=binary[9]/timestamp +/- 0.01
+binary[9]/count=2
 binary[10]/data=456
 binary[10]/repeating=1
 binary[10]/time=binary[10]/timestamp +/- 0.01
+binary[10]/count=3
diff --git a/csv/test/csv-repeat/append/all/input b/csv/test/csv-repeat/append/all/input
index 04a7f90fe..68fb9eadb 100644
--- a/csv/test/csv-repeat/append/all/input
+++ b/csv/test/csv-repeat/append/all/input
@@ -1,6 +1,6 @@
 timeout=0.3
 period=0.1
-append="repeating,time"
+append="repeating,time,count"
 format=ui
 data="
 0.20,123
diff --git a/csv/test/csv-repeat/append/count/expected b/csv/test/csv-repeat/append/count/expected
new file mode 100644
index 000000000..35c6c3704
--- /dev/null
+++ b/csv/test/csv-repeat/append/count/expected
@@ -0,0 +1,45 @@
+ascii[0]/data=123
+ascii[0]/count=0
+ascii[1]/data=456
+ascii[1]/count=0
+ascii[2]/data=789
+ascii[2]/count=0
+ascii[3]/data=789
+ascii[3]/count=1
+ascii[4]/data=789
+ascii[4]/count=2
+ascii[5]/data=789
+ascii[5]/count=3
+ascii[6]/data=123
+ascii[6]/count=0
+ascii[7]/data=456
+ascii[7]/count=0
+ascii[8]/data=456
+ascii[8]/count=1
+ascii[9]/data=456
+ascii[9]/count=2
+ascii[10]/data=456
+ascii[10]/count=3
+
+binary[0]/data=123
+binary[0]/count=0
+binary[1]/data=456
+binary[1]/count=0
+binary[2]/data=789
+binary[2]/count=0
+binary[3]/data=789
+binary[3]/count=1
+binary[4]/data=789
+binary[4]/count=2
+binary[5]/data=789
+binary[5]/count=3
+binary[6]/data=123
+binary[6]/count=0
+binary[7]/data=456
+binary[7]/count=0
+binary[8]/data=456
+binary[8]/count=1
+binary[9]/data=456
+binary[9]/count=2
+binary[10]/data=456
+binary[10]/count=3
diff --git a/csv/test/csv-repeat/append/count/input b/csv/test/csv-repeat/append/count/input
new file mode 100644
index 000000000..35be3cee9
--- /dev/null
+++ b/csv/test/csv-repeat/append/count/input
@@ -0,0 +1,12 @@
+timeout=0.3
+period=0.1
+append="count"
+format=ui
+data="
+0.20,123
+0.01,456
+0.01,789
+0.55,123
+0.01,456
+0.55,999
+"

From 381a20e61cd0ac6f7e6adb29a53e503972fcf5b3 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 12:05:19 +1000
Subject: [PATCH 0368/1056] csv-play.cpp: minor re-layout for clarity

---
 csv/applications/csv-play.cpp | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index ebaa2d151..58a6cab84 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -130,7 +130,13 @@ class key_press_handler_t
 public:
     enum states { running, paused, read_once, read_block };
     
-    key_press_handler_t( bool interactive, bool paused_at_start ): key_press_( interactive ), paused_( paused_at_start ), state_( paused_ ? paused : running ) { if( paused_at_start ) { std::cerr << "csv-play: paused at start" << std::endl; } }
+    key_press_handler_t( bool interactive, bool paused_at_start )
+        : key_press_( interactive )
+        , paused_( paused_at_start )
+        , state_( paused_ ? paused : running )
+    {
+        if( paused_at_start ) { std::cerr << "csv-play: paused at start" << std::endl; }
+    }
     
     void update( boost::posix_time::ptime t )
     {

From c8b721a009f45d5e3c5d725188387e20c1cb7139 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 12:12:01 +1000
Subject: [PATCH 0369/1056] csv-play: just have spacebar for pause/resume

---
 csv/applications/csv-play.cpp | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 58a6cab84..c4b7c9a1d 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -79,7 +79,7 @@ static void usage( bool )
     std::cerr << "               can be specified individually for each client, e.g." << std::endl;
     std::cerr << "               csv-play file1;pipe;clients=1 file2;tcp:1234;clients=3" << std::endl;
     std::cerr << "    --interactive,-i: react to key presses:" << std::endl;
-    std::cerr << "                      <whitespace>: pause, resume" << std::endl;
+    std::cerr << "                      <space>: pause, resume" << std::endl;
     std::cerr << "                      left or down arrow key: output one record at a time" << std::endl;
     std::cerr << "                      shift left or down arrow key: TODO: output one block at a time" << std::endl;
     std::cerr << "    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )" << std::endl;
@@ -144,7 +144,6 @@ class key_press_handler_t
         if( !c ) { return; }
         switch( *c )
         {
-            case 10:
             case ' ':
                 switch( state_ )
                 {
@@ -215,7 +214,7 @@ class key_press_handler_t
             new_termios.c_iflag &= ~( BRKINT | ICRNL | INPCK | ISTRIP | IXON );
             if( ::tcsetattr( fd_, TCSANOW, &new_termios ) < 0 ) { COMMA_THROW( comma::exception, "failed to set '" << tty << "'" ); }
             std::cerr << "csv-play: running in interactive mode" << std::endl;
-            std::cerr << "          press <whitespace> to pause or resume" << std::endl;
+            std::cerr << "          press <space> to pause or resume" << std::endl;
             std::cerr << "          press left or down arrow key: output one record at a time" << std::endl;
         }
         

From c7d68d312aaea53280d57439959f41fd8f00f849 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 12:23:05 +1000
Subject: [PATCH 0370/1056] csv-play: fixed help to correctly describe keys in
 interactive mode

---
 csv/applications/csv-play.cpp | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index c4b7c9a1d..7134dc40c 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -80,8 +80,8 @@ static void usage( bool )
     std::cerr << "               csv-play file1;pipe;clients=1 file2;tcp:1234;clients=3" << std::endl;
     std::cerr << "    --interactive,-i: react to key presses:" << std::endl;
     std::cerr << "                      <space>: pause, resume" << std::endl;
-    std::cerr << "                      left or down arrow key: output one record at a time" << std::endl;
-    std::cerr << "                      shift left or down arrow key: TODO: output one block at a time" << std::endl;
+    std::cerr << "                      right or down arrow key: output one record at a time" << std::endl;
+    std::cerr << "                      shift right or down arrow key: TODO: output one block at a time" << std::endl;
     std::cerr << "    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )" << std::endl;
     std::cerr << "    --paused-at-start,--paused; if --interactive, then start playback as paused" << std::endl;
     std::cerr << "    --resolution=<second>: timestamp resolution; timestamps closer than this value will be" << std::endl;
@@ -163,15 +163,15 @@ class key_press_handler_t
                         break;
                 };
                 break;
-            case 27:
+            case 27:                    // escape sequence for arrows: ESC-[
                 c = key_press_.read();
                 if( !c || *c != 91 ) { return; }
                 c = key_press_.read();
                 if( !c ) { return; }
                 switch( *c )
                 {
-                    case 66:
-                    case 67:
+                    case 66:            // down
+                    case 67:            // right
                         state_ = read_once;
                         break;  
                     default:
@@ -215,7 +215,7 @@ class key_press_handler_t
             if( ::tcsetattr( fd_, TCSANOW, &new_termios ) < 0 ) { COMMA_THROW( comma::exception, "failed to set '" << tty << "'" ); }
             std::cerr << "csv-play: running in interactive mode" << std::endl;
             std::cerr << "          press <space> to pause or resume" << std::endl;
-            std::cerr << "          press left or down arrow key: output one record at a time" << std::endl;
+            std::cerr << "          press right or down arrow key: output one record at a time" << std::endl;
         }
         
         ~key_press_t_()

From d75e234f2205dc5b0ef6d687f1198f8d37b08e0e Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 12:28:00 +1000
Subject: [PATCH 0371/1056] csv-play: added example for --interactive to help

---
 csv/applications/csv-play.cpp | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 7134dc40c..6b14f6c9f 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -122,6 +122,10 @@ static void usage( bool )
     std::cerr << "        > #in another shell, run" << std::endl;
     std::cerr << "        > socat tcp:localhost:8888 - | csv-from-bin t,2ui" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "    pause and step through output:" << std::endl;
+    std::cerr << "        echo 0 | csv-repeat --period 0.1 --yes | csv-paste - line-number \\" << std::endl;
+    std::cerr << "            | csv-time-stamp | csv-play --interactive" << std::endl;
+    std::cerr << std::endl;
     exit( 0 );
 }
 

From cdc8ba570b78e315e02e88e495a2695bafbc45a0 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 12:35:51 +1000
Subject: [PATCH 0372/1056] csv-play: added <t> key to interactive to output
 current timestamp

---
 csv/applications/csv-play.cpp | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 6b14f6c9f..587ad7b36 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -82,6 +82,7 @@ static void usage( bool )
     std::cerr << "                      <space>: pause, resume" << std::endl;
     std::cerr << "                      right or down arrow key: output one record at a time" << std::endl;
     std::cerr << "                      shift right or down arrow key: TODO: output one block at a time" << std::endl;
+    std::cerr << "                      <t>: output current timestamp to stderr" << std::endl;
     std::cerr << "    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )" << std::endl;
     std::cerr << "    --paused-at-start,--paused; if --interactive, then start playback as paused" << std::endl;
     std::cerr << "    --resolution=<second>: timestamp resolution; timestamps closer than this value will be" << std::endl;
@@ -181,6 +182,10 @@ class key_press_handler_t
                     default:
                         return;
                 }
+                break;
+            case 't':
+                std::cerr << boost::posix_time::to_iso_string( t ) << std::endl;
+                break;
             default:
                 break;
         }
@@ -219,7 +224,8 @@ class key_press_handler_t
             if( ::tcsetattr( fd_, TCSANOW, &new_termios ) < 0 ) { COMMA_THROW( comma::exception, "failed to set '" << tty << "'" ); }
             std::cerr << "csv-play: running in interactive mode" << std::endl;
             std::cerr << "          press <space> to pause or resume" << std::endl;
-            std::cerr << "          press right or down arrow key: output one record at a time" << std::endl;
+            std::cerr << "          press right or down arrow key to output one record at a time" << std::endl;
+            std::cerr << "          press <t> to output current timestamp to stderr" << std::endl;
         }
         
         ~key_press_t_()

From 0deb6d5b104aef618f123d007dd4df038682e000 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 15:42:30 +1000
Subject: [PATCH 0373/1056] csv-play: --paused implies --interactive

---
 csv/applications/csv-play.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 587ad7b36..24efdcd7d 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -84,7 +84,7 @@ static void usage( bool )
     std::cerr << "                      shift right or down arrow key: TODO: output one block at a time" << std::endl;
     std::cerr << "                      <t>: output current timestamp to stderr" << std::endl;
     std::cerr << "    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )" << std::endl;
-    std::cerr << "    --paused-at-start,--paused; if --interactive, then start playback as paused" << std::endl;
+    std::cerr << "    --paused-at-start,--paused: start playback as paused, implies --interactive" << std::endl;
     std::cerr << "    --resolution=<second>: timestamp resolution; timestamps closer than this value will be" << std::endl;
     std::cerr << "                           played without delay; the rationale is that microsleep used in csv-play" << std::endl;
     std::cerr << "                           (boost::this_thread::sleep()) is essentially imprecise and may create" << std::endl;
@@ -136,7 +136,7 @@ class key_press_handler_t
     enum states { running, paused, read_once, read_block };
     
     key_press_handler_t( bool interactive, bool paused_at_start )
-        : key_press_( interactive )
+        : key_press_( interactive || paused_at_start )
         , paused_( paused_at_start )
         , state_( paused_ ? paused : running )
     {

From 23ab7924e1bcf2594418a53d07e171ee34b913fe Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 15:46:55 +1000
Subject: [PATCH 0374/1056] etc/bash_completion.d/comma: updated TODO

---
 etc/bash_completion.d/comma | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/etc/bash_completion.d/comma b/etc/bash_completion.d/comma
index 332b588da..fde7d559b 100644
--- a/etc/bash_completion.d/comma
+++ b/etc/bash_completion.d/comma
@@ -113,7 +113,7 @@ complete -F _csv_time csv-time
 complete -F _csv_update csv-update
 
 # todo
-#     - add --bash-completion to csv-units, csv-update, comma-test-_comma_test_run
+#     - add --bash-completion to csv-update
 #     - install in the installation directory, if possible (if not, /etc is OK)
 
 _comma_bash_completion()

From 1cfd47bcaf2d7cf6035a756825a2371ffec7c12b Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 16:37:25 +1000
Subject: [PATCH 0375/1056] csv-play: added bash completion

---
 csv/applications/csv-play.cpp | 19 +++++++++++++++++++
 etc/bash_completion.d/comma   |  1 +
 2 files changed, 20 insertions(+)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 24efdcd7d..50864f951 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -58,6 +58,24 @@
 #include "../../csv/applications/play/play.h"
 #include "../../csv/applications/play/multiplay.h"
 
+static void bash_completion( unsigned const ac, char const* const* av )
+{
+    static const char* completion_options =
+        " --help -h"
+        " --speed --slowdown --slow"
+        " --quiet"
+        " --fields --binary"
+        " --clients"
+        " --interactive -i"
+        " --no-flush "
+        " --paused-at-start --paused"
+        " --resolution"
+        " --from --to"
+        ;
+    std::cout << completion_options << std::endl;
+    exit( 0 );
+}
+
 static void usage( bool )
 {
     std::cerr << std::endl;
@@ -262,6 +280,7 @@ int main( int argc, char** argv )
         const boost::array< comma::signal_flag::signals, 2 > signals = { { comma::signal_flag::sigint, comma::signal_flag::sigterm } };
         comma::signal_flag shutdown_flag( signals );
         comma::command_line_options options( argc, argv, usage );
+        if( options.exists( "--bash-completion" ) ) bash_completion( argc, argv );
         options.assert_mutually_exclusive( "--speed,--slow,--slowdown" );
         double speed = options.value( "--speed", 1.0 / options.value< double >( "--slow,--slowdown", 1.0 ) );
         double resolution = options.value< double >( "--resolution", 0.01 );
diff --git a/etc/bash_completion.d/comma b/etc/bash_completion.d/comma
index fde7d559b..55fdd5d91 100644
--- a/etc/bash_completion.d/comma
+++ b/etc/bash_completion.d/comma
@@ -136,6 +136,7 @@ _comma_bash_completion()
 complete -F _comma_bash_completion comma-test-enforce
 complete -F _comma_bash_completion comma-test-run
 complete -F _comma_bash_completion csv-calc
+complete -F _comma_bash_completion csv-play
 complete -F _comma_bash_completion csv-repeat
 complete -F _comma_bash_completion csv-time-join
 complete -F _comma_bash_completion csv-units

From dd3582cbfc6d4e1257f90f7290a9d3a40a6b92cb Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 16:44:20 +1000
Subject: [PATCH 0376/1056] csv-play.cpp: move playback state to a separate
 class

---
 csv/applications/csv-play.cpp | 105 +++++++++++++++++-----------------
 1 file changed, 51 insertions(+), 54 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 50864f951..e2b5dca96 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -148,18 +148,53 @@ static void usage( bool )
     exit( 0 );
 }
 
-class key_press_handler_t
+class playback_state_t
 {
 public:
-    enum states { running, paused, read_once, read_block };
-    
-    key_press_handler_t( bool interactive, bool paused_at_start )
-        : key_press_( interactive || paused_at_start )
-        , paused_( paused_at_start )
-        , state_( paused_ ? paused : running )
+    playback_state_t() : state_( state::running ) {}
+
+    bool is_running() const { return state_ == state::running; }
+    bool is_paused() const { return state_ == state::paused; }
+
+    void pause( const boost::posix_time::ptime& t = boost::posix_time::not_a_date_time )
+    {
+        if( state_ != state::paused )
+        {
+            state_ = state::paused;
+            std::cerr << "csv-play: paused";
+            if( ! t.is_not_a_date_time() ) { std::cerr << " at " << boost::posix_time::to_iso_string( t ); }
+            std::cerr << std::endl;
+        }
+    }
+
+    void run()
+    {
+        if( state_ != state::running )
+        {
+            state_ = state::running;
+            std::cerr << "csv-play: resumed" << std::endl;
+        }
+    }
+
+    void read_once() { state_ = state::read_once; }
+
+    void has_read_once()
     {
-        if( paused_at_start ) { std::cerr << "csv-play: paused at start" << std::endl; }
+        if( state_ == state::read_once ) { state_ = state::paused; }
     }
+
+private:
+    enum class state { running, paused, read_once, read_block };
+
+    state state_;
+};
+
+static playback_state_t playback;
+
+class key_press_handler_t
+{
+public:
+    key_press_handler_t( bool interactive ) : key_press_( interactive ) {}
     
     void update( boost::posix_time::ptime t )
     {
@@ -168,38 +203,15 @@ class key_press_handler_t
         switch( *c )
         {
             case ' ':
-                switch( state_ )
-                {
-                    case running:
-                        std::cerr << "csv-play: paused at " << boost::posix_time::to_iso_string( t ) << std::endl;
-                        state_ = paused;
-                        break;
-                    case paused:
-                        std::cerr << "csv-play: resumed" << std::endl;
-                        state_ = running;
-                        break;
-                    case read_block:
-                        return; // never here, todo
-                    case read_once:
-                        std::cerr << "csv-play: resumed" << std::endl;
-                        state_ = running;
-                        break;
-                };
+                if( playback.is_running() ) { playback.pause( t ); }
+                else { playback.run(); }
                 break;
             case 27:                    // escape sequence for arrows: ESC-[
                 c = key_press_.read();
                 if( !c || *c != 91 ) { return; }
                 c = key_press_.read();
                 if( !c ) { return; }
-                switch( *c )
-                {
-                    case 66:            // down
-                    case 67:            // right
-                        state_ = read_once;
-                        break;  
-                    default:
-                        return;
-                }
+                if( *c == 66 || *c == 67 ) { playback.read_once(); } // down or right arrow
                 break;
             case 't':
                 std::cerr << boost::posix_time::to_iso_string( t ) << std::endl;
@@ -209,21 +221,6 @@ class key_press_handler_t
         }
     }
     
-    states state() const { return state_; }
-    
-    void has_read_once() 
-    {
-        switch( state_ )
-        {
-            case running:
-            case paused:
-            case read_block:
-                return;
-            case read_once:
-                state_ = paused;
-        };
-    }
-    
 private:
     class key_press_t_
     {
@@ -267,9 +264,8 @@ class key_press_handler_t
         int fd_;
         struct termios old_termios_;
     };
+
     key_press_t_ key_press_;
-    bool paused_;
-    states state_;
 };
 
 int main( int argc, char** argv )
@@ -301,13 +297,14 @@ int main( int argc, char** argv )
         boost::posix_time::ptime totime;
         if( !to.empty() ) { totime = boost::posix_time::from_iso_string( to ); }
         multiplay.reset( new comma::Multiplay( sourceConfigs, 1.0 / speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int> (resolution * 1000000) ), fromtime, totime, flush ) );
-        key_press_handler_t key_press_handler( options.exists( "--interactive,-i" ), options.exists( "--paused,--paused-at-start" ) );
+        if( options.exists( "--paused,--paused-at-start" )) { playback.pause(); }
+        key_press_handler_t key_press_handler( options.exists( "--interactive,-i" ) || options.exists( "--paused,--paused-at-start" ));
         while( !shutdown_flag && std::cout.good() && !std::cout.bad() && !std::cout.eof() )
         {
             key_press_handler.update( multiplay->now() );
-            if( key_press_handler.state() == key_press_handler_t::paused ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); continue; }
+            if( playback.is_paused() ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); continue; }
             if( !multiplay->read() ) { break; }
-            key_press_handler.has_read_once();
+            playback.has_read_once();
         }
         multiplay->close();
         multiplay.reset();

From 5f113a62f7942837895e73fd363e9ff5c53668c7 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 17:27:48 +1000
Subject: [PATCH 0377/1056] play.h,play.cpp: removed unused constructor

---
 csv/applications/play/play.cpp | 20 +-------------------
 csv/applications/play/play.h   |  1 -
 2 files changed, 1 insertion(+), 20 deletions(-)

diff --git a/csv/applications/play/play.cpp b/csv/applications/play/play.cpp
index 69566cd90..3e71fcde9 100644
--- a/csv/applications/play/play.cpp
+++ b/csv/applications/play/play.cpp
@@ -37,36 +37,18 @@
 namespace comma { namespace csv { namespace impl {
     
 /// constructor    
-play::play( double speed, bool quiet, const boost::posix_time::time_duration& resolution ):
-    m_speed( speed ),
-    m_resolution( resolution ),
-    m_lag( false ),
-    m_lagCounter( 0U ),
-    m_quiet( quiet )
-{
-}
-
-/// constructor
-/// @param first first timestamp
 /// @param speed slow-down factor: 1.0 = real time, 2.0 = twice as slow etc...
 /// @param quiet if true, do not output warnings if we can not keep up with the desired playback speed
 /// @param resolution expected resolution from the sleep function
-play::play( const boost::posix_time::ptime& first, double speed, bool quiet, const boost::posix_time::time_duration& resolution ):
-
-    m_systemFirst( boost::get_system_time() ),
-    m_offset( m_systemFirst - first ),
-    m_first( first ),
-    m_last( first ),
+play::play( double speed, bool quiet, const boost::posix_time::time_duration& resolution ):
     m_speed( speed ),
     m_resolution( resolution ),
     m_lag( false ),
     m_lagCounter( 0U ),
     m_quiet( quiet )
 {
-    
 }
 
-
 /// wait until a timestamp
 /// @param time timestamp as ptime
 void play::wait( const boost::posix_time::ptime& time )
diff --git a/csv/applications/play/play.h b/csv/applications/play/play.h
index 9ae95c6eb..4fda2fc06 100644
--- a/csv/applications/play/play.h
+++ b/csv/applications/play/play.h
@@ -43,7 +43,6 @@ class play
 {
 public:
     play( double speed = 1.0, bool quiet = false, const boost::posix_time::time_duration& resolution = boost::posix_time::milliseconds(1) );
-    play( const boost::posix_time::ptime& first, double speed = 1.0, bool quiet = false, const boost::posix_time::time_duration& resolution = boost::posix_time::milliseconds(1) );
 
     void wait( const boost::posix_time::ptime& time );
 

From b2e4c4fc1d27e1a7f53358acca952968f9025b6a Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 17:32:56 +1000
Subject: [PATCH 0378/1056] play.h,play.cpp: replaced m_offset with a boolean

it was only being used in that fashion
---
 csv/applications/play/play.cpp | 17 +++++++++--------
 csv/applications/play/play.h   |  2 +-
 2 files changed, 10 insertions(+), 9 deletions(-)

diff --git a/csv/applications/play/play.cpp b/csv/applications/play/play.cpp
index 3e71fcde9..8065a6e9e 100644
--- a/csv/applications/play/play.cpp
+++ b/csv/applications/play/play.cpp
@@ -40,12 +40,13 @@ namespace comma { namespace csv { namespace impl {
 /// @param speed slow-down factor: 1.0 = real time, 2.0 = twice as slow etc...
 /// @param quiet if true, do not output warnings if we can not keep up with the desired playback speed
 /// @param resolution expected resolution from the sleep function
-play::play( double speed, bool quiet, const boost::posix_time::time_duration& resolution ):
-    m_speed( speed ),
-    m_resolution( resolution ),
-    m_lag( false ),
-    m_lagCounter( 0U ),
-    m_quiet( quiet )
+play::play( double speed, bool quiet, const boost::posix_time::time_duration& resolution )
+    : m_times_initialized( false )
+    , m_speed( speed )
+    , m_resolution( resolution )
+    , m_lag( false )
+    , m_lagCounter( 0U )
+    , m_quiet( quiet )
 {
 }
 
@@ -54,13 +55,13 @@ play::play( double speed, bool quiet, const boost::posix_time::time_duration& re
 void play::wait( const boost::posix_time::ptime& time )
 {
 
-    if ( !m_offset )
+    if ( !m_times_initialized )
     {
         boost::posix_time::ptime systemTime = boost::get_system_time();
-        m_offset = systemTime - time;
         m_systemFirst = systemTime;
         m_first = time;
         m_last = time;
+        m_times_initialized = true;
     }
     else
     {        
diff --git a/csv/applications/play/play.h b/csv/applications/play/play.h
index 4fda2fc06..bcc820cd9 100644
--- a/csv/applications/play/play.h
+++ b/csv/applications/play/play.h
@@ -49,8 +49,8 @@ class play
     void wait( const std::string& isoTime );
 
 private:
+    bool m_times_initialized;
     boost::posix_time::ptime m_systemFirst; /// system time at first timestamp
-    boost::optional< boost::posix_time::time_duration > m_offset; /// offset between timestamps and system time
     boost::posix_time::ptime m_first; /// first timestamp
     boost::posix_time::ptime m_last; /// last timestamp received
     const double m_speed;

From 7b017a3adcc61f47e9ba29bb70074863aaaca88a Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Thu, 11 Jul 2019 19:02:08 +1000
Subject: [PATCH 0379/1056] csv-play: correctly handle pausing in interactive
 mode

---
 csv/applications/csv-play.cpp     | 23 +++++++++++++++++------
 csv/applications/play/multiplay.h |  2 ++
 csv/applications/play/play.cpp    |  9 ++++++++-
 csv/applications/play/play.h      |  2 ++
 4 files changed, 29 insertions(+), 7 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index e2b5dca96..c45d84168 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -148,6 +148,8 @@ static void usage( bool )
     exit( 0 );
 }
 
+static boost::scoped_ptr< comma::Multiplay > multiplay;
+
 class playback_state_t
 {
 public:
@@ -161,32 +163,42 @@ class playback_state_t
         if( state_ != state::paused )
         {
             state_ = state::paused;
-            std::cerr << "csv-play: paused";
-            if( ! t.is_not_a_date_time() ) { std::cerr << " at " << boost::posix_time::to_iso_string( t ); }
-            std::cerr << std::endl;
+            paused_time_ = boost::posix_time::microsec_clock::universal_time();
+            if( ! t.is_not_a_date_time() ) { std::cerr << "csv-play: paused at " << boost::posix_time::to_iso_string( t ) << std::endl; }
         }
     }
 
+    void unpause()
+    {
+        multiplay->paused_for( boost::posix_time::microsec_clock::universal_time() - paused_time_ );
+    }
+
     void run()
     {
         if( state_ != state::running )
         {
+            if( state_ == state::paused ) { unpause(); }
             state_ = state::running;
             std::cerr << "csv-play: resumed" << std::endl;
         }
     }
 
-    void read_once() { state_ = state::read_once; }
+    void read_once()
+    {
+        if( state_ == state::paused ) { unpause(); }
+        state_ = state::read_once;
+    }
 
     void has_read_once()
     {
-        if( state_ == state::read_once ) { state_ = state::paused; }
+        if( state_ == state::read_once ) { pause(); }
     }
 
 private:
     enum class state { running, paused, read_once, read_block };
 
     state state_;
+    boost::posix_time::ptime paused_time_;
 };
 
 static playback_state_t playback;
@@ -270,7 +282,6 @@ class key_press_handler_t
 
 int main( int argc, char** argv )
 {
-    boost::scoped_ptr< comma::Multiplay > multiplay;
     try
     {
         const boost::array< comma::signal_flag::signals, 2 > signals = { { comma::signal_flag::sigint, comma::signal_flag::sigterm } };
diff --git a/csv/applications/play/multiplay.h b/csv/applications/play/multiplay.h
index c10c35d0f..040db7bcd 100644
--- a/csv/applications/play/multiplay.h
+++ b/csv/applications/play/multiplay.h
@@ -81,6 +81,8 @@ class Multiplay
         
         boost::posix_time::ptime now() const { return now_; }
 
+        void paused_for( const boost::posix_time::time_duration& pause_duration ) { m_play.paused_for( pause_duration ); }
+
     private:
         std::vector<SourceConfig> m_configs;
         std::vector< boost::shared_ptr< comma::io::istream > > istreams_;
diff --git a/csv/applications/play/play.cpp b/csv/applications/play/play.cpp
index 8065a6e9e..071693f13 100644
--- a/csv/applications/play/play.cpp
+++ b/csv/applications/play/play.cpp
@@ -108,5 +108,12 @@ void play::wait( const std::string& isoTime )
     wait( boost::posix_time::from_iso_string( isoTime ) );
 }
 
+/// allow for a pause in playback
+/// @param pause_duration duration of pause
+void play::paused_for( const boost::posix_time::time_duration& pause_duration )
+{
+    if( m_times_initialized ) { m_systemFirst += pause_duration; }
+}
+
+
 } } } // namespace comma { namespace csv { namespace impl {
-    
\ No newline at end of file
diff --git a/csv/applications/play/play.h b/csv/applications/play/play.h
index bcc820cd9..fa9acccbf 100644
--- a/csv/applications/play/play.h
+++ b/csv/applications/play/play.h
@@ -48,6 +48,8 @@ class play
 
     void wait( const std::string& isoTime );
 
+    void paused_for( const boost::posix_time::time_duration& pause_duration );
+
 private:
     bool m_times_initialized;
     boost::posix_time::ptime m_systemFirst; /// system time at first timestamp

From 95c28977dfa727121f62c6bf81eb8104534ee349 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Fri, 12 Jul 2019 10:41:07 +1000
Subject: [PATCH 0380/1056] csv-play.cpp: removed unrequired includes (and
 added one)

---
 csv/applications/csv-play.cpp | 7 +------
 1 file changed, 1 insertion(+), 6 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index c45d84168..7c73eebd8 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -32,30 +32,25 @@
 #include <fcntl.h>
 #include <stdio.h>
 #ifdef WIN32
-#include <stdio.h>
 #include <io.h>
 #else
 #include <errno.h>
 #include <sys/ioctl.h>
 #include <sys/types.h>
-#include <termios.h>
 #include <unistd.h>
-#include <sys/types.h>
 #include <sys/stat.h>
 #endif
 #include <termios.h>
 
 #include <iostream>
-#include <fstream>
+#include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/thread.hpp>
 #include "../../application/command_line_options.h"
 #include "../../application/signal_flag.h"
 #include "../../base/exception.h"
 #include "../../csv/options.h"
-#include "../../csv/stream.h"
 #include "../../csv/traits.h"
 #include "../../name_value/parser.h"
-#include "../../csv/applications/play/play.h"
 #include "../../csv/applications/play/multiplay.h"
 
 static void bash_completion( unsigned const ac, char const* const* av )

From b9277644c85c865f3026d781012ce0b4eeadebd5 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Fri, 12 Jul 2019 11:47:54 +1000
Subject: [PATCH 0381/1056] play/play.cpp: refactor m_speed to mean speed-up
 factor, rather than slowdown

This matches the meaning of speed in csv-play, which now passes speed to
Multiplay directly instead of 1.0 / speed.
---
 csv/applications/csv-play.cpp  | 2 +-
 csv/applications/play/play.cpp | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 7c73eebd8..3b9319845 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -302,7 +302,7 @@ int main( int argc, char** argv )
         if( !from.empty() ) { fromtime = boost::posix_time::from_iso_string( from ); }
         boost::posix_time::ptime totime;
         if( !to.empty() ) { totime = boost::posix_time::from_iso_string( to ); }
-        multiplay.reset( new comma::Multiplay( sourceConfigs, 1.0 / speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int> (resolution * 1000000) ), fromtime, totime, flush ) );
+        multiplay.reset( new comma::Multiplay( sourceConfigs, speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int>( resolution * 1000000 )), fromtime, totime, flush ));
         if( options.exists( "--paused,--paused-at-start" )) { playback.pause(); }
         key_press_handler_t key_press_handler( options.exists( "--interactive,-i" ) || options.exists( "--paused,--paused-at-start" ));
         while( !shutdown_flag && std::cout.good() && !std::cout.bad() && !std::cout.eof() )
diff --git a/csv/applications/play/play.cpp b/csv/applications/play/play.cpp
index 071693f13..3d794e4b6 100644
--- a/csv/applications/play/play.cpp
+++ b/csv/applications/play/play.cpp
@@ -37,7 +37,7 @@
 namespace comma { namespace csv { namespace impl {
     
 /// constructor    
-/// @param speed slow-down factor: 1.0 = real time, 2.0 = twice as slow etc...
+/// @param speed speed-up factor: 1.0 = real time, 0.5 = half speed etc
 /// @param quiet if true, do not output warnings if we can not keep up with the desired playback speed
 /// @param resolution expected resolution from the sleep function
 play::play( double speed, bool quiet, const boost::posix_time::time_duration& resolution )
@@ -68,7 +68,7 @@ void play::wait( const boost::posix_time::ptime& time )
         if ( time > m_last )
         {
             boost::posix_time::ptime systemTime = boost::get_system_time();
-            const boost::posix_time::ptime target = m_systemFirst + boost::posix_time::milliseconds( static_cast<long>(( time - m_first ).total_milliseconds() * m_speed ) );
+            const boost::posix_time::ptime target = m_systemFirst + boost::posix_time::milliseconds( static_cast<long>(( time - m_first ).total_milliseconds() / m_speed ) );
             const boost::posix_time::time_duration lag = systemTime - target;
             if ( !m_quiet && ( lag > m_resolution ) ) // no need to be alarmed for a lag less than the expected accuracy
             {

From 9226fd913cc6e8f45fe20462694fe578b8f56be8 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Tue, 16 Jul 2019 18:49:53 +1000
Subject: [PATCH 0382/1056] csv-play: added <q> (quit) in interactive mode

---
 csv/applications/csv-play.cpp | 24 ++++++++++++++++--------
 1 file changed, 16 insertions(+), 8 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 3b9319845..6534110be 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -71,6 +71,15 @@ static void bash_completion( unsigned const ac, char const* const* av )
     exit( 0 );
 }
 
+static void interactive_help( std::string prefix )
+{
+    prefix.assign( prefix.size(), ' ' );
+    std::cerr << prefix << "<space>: pause or resume" << std::endl;
+    std::cerr << prefix << "right or down arrow key: output one record at a time" << std::endl;
+    std::cerr << prefix << "<t>: output current timestamp to stderr" << std::endl;
+    std::cerr << prefix << "<q>: quit" << std::endl;
+}
+
 static void usage( bool )
 {
     std::cerr << std::endl;
@@ -92,10 +101,7 @@ static void usage( bool )
     std::cerr << "               can be specified individually for each client, e.g." << std::endl;
     std::cerr << "               csv-play file1;pipe;clients=1 file2;tcp:1234;clients=3" << std::endl;
     std::cerr << "    --interactive,-i: react to key presses:" << std::endl;
-    std::cerr << "                      <space>: pause, resume" << std::endl;
-    std::cerr << "                      right or down arrow key: output one record at a time" << std::endl;
-    std::cerr << "                      shift right or down arrow key: TODO: output one block at a time" << std::endl;
-    std::cerr << "                      <t>: output current timestamp to stderr" << std::endl;
+    interactive_help( "    --interactive,-i: " );
     std::cerr << "    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )" << std::endl;
     std::cerr << "    --paused-at-start,--paused: start playback as paused, implies --interactive" << std::endl;
     std::cerr << "    --resolution=<second>: timestamp resolution; timestamps closer than this value will be" << std::endl;
@@ -144,6 +150,7 @@ static void usage( bool )
 }
 
 static boost::scoped_ptr< comma::Multiplay > multiplay;
+static bool quit = false;
 
 class playback_state_t
 {
@@ -220,6 +227,9 @@ class key_press_handler_t
                 if( !c ) { return; }
                 if( *c == 66 || *c == 67 ) { playback.read_once(); } // down or right arrow
                 break;
+            case 'q':
+                quit = true;
+                break;
             case 't':
                 std::cerr << boost::posix_time::to_iso_string( t ) << std::endl;
                 break;
@@ -245,9 +255,7 @@ class key_press_handler_t
             new_termios.c_iflag &= ~( BRKINT | ICRNL | INPCK | ISTRIP | IXON );
             if( ::tcsetattr( fd_, TCSANOW, &new_termios ) < 0 ) { COMMA_THROW( comma::exception, "failed to set '" << tty << "'" ); }
             std::cerr << "csv-play: running in interactive mode" << std::endl;
-            std::cerr << "          press <space> to pause or resume" << std::endl;
-            std::cerr << "          press right or down arrow key to output one record at a time" << std::endl;
-            std::cerr << "          press <t> to output current timestamp to stderr" << std::endl;
+            interactive_help( "csv-play: " );
         }
         
         ~key_press_t_()
@@ -305,7 +313,7 @@ int main( int argc, char** argv )
         multiplay.reset( new comma::Multiplay( sourceConfigs, speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int>( resolution * 1000000 )), fromtime, totime, flush ));
         if( options.exists( "--paused,--paused-at-start" )) { playback.pause(); }
         key_press_handler_t key_press_handler( options.exists( "--interactive,-i" ) || options.exists( "--paused,--paused-at-start" ));
-        while( !shutdown_flag && std::cout.good() && !std::cout.bad() && !std::cout.eof() )
+        while( !shutdown_flag && !quit && std::cout.good() && !std::cout.bad() && !std::cout.eof() )
         {
             key_press_handler.update( multiplay->now() );
             if( playback.is_paused() ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); continue; }

From 8cc920692107f3b0a106e82e4a039ea264d9bfc6 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Tue, 16 Jul 2019 18:50:56 +1000
Subject: [PATCH 0383/1056] csv-play.cpp: removed test for cout.bad and eof;
 good() is sufficient

---
 csv/applications/csv-play.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 6534110be..9574b278d 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -313,7 +313,7 @@ int main( int argc, char** argv )
         multiplay.reset( new comma::Multiplay( sourceConfigs, speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int>( resolution * 1000000 )), fromtime, totime, flush ));
         if( options.exists( "--paused,--paused-at-start" )) { playback.pause(); }
         key_press_handler_t key_press_handler( options.exists( "--interactive,-i" ) || options.exists( "--paused,--paused-at-start" ));
-        while( !shutdown_flag && !quit && std::cout.good() && !std::cout.bad() && !std::cout.eof() )
+        while( !shutdown_flag && !quit && std::cout.good() )
         {
             key_press_handler.update( multiplay->now() );
             if( playback.is_paused() ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); continue; }

From 9672db31e7519441d27b24f0a79dceaceab330dd Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Wed, 24 Jul 2019 14:53:47 +1000
Subject: [PATCH 0384/1056] csv-play: allow --verbose,-v flags

Even though csv-play does not use these flags, it now accepts them on the
command line without any change in behaviour.
---
 csv/applications/csv-play.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 9574b278d..702dde790 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -298,7 +298,7 @@ int main( int argc, char** argv )
         std::string to = options.value< std::string>( "--to", "" );
         bool quiet =  options.exists( "--quiet" );
         bool flush =  !options.exists( "--no-flush" );
-        std::vector< std::string > configstrings = options.unnamed("--interactive,-i,--paused,--paused-at-start,--quiet,--flush,--no-flush","--slow,--slowdown,--speed,--resolution,--binary,--fields,--clients,--from,--to");
+        std::vector< std::string > configstrings = options.unnamed( "--verbose,-v,--interactive,-i,--paused,--paused-at-start,--quiet,--flush,--no-flush","--slow,--slowdown,--speed,--resolution,--binary,--fields,--clients,--from,--to" );
         if( configstrings.empty() ) { configstrings.push_back( "-;-" ); }
         comma::csv::options csv( argc, argv );
         csv.full_xpath = false;

From f9a0ef6f968177d19c62b90927bfba9ebe690ba6 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Wed, 24 Jul 2019 15:16:38 +1000
Subject: [PATCH 0385/1056] csv-play.cpp: split key sequence reading from
 action

---
 csv/applications/csv-play.cpp | 48 +++++++++++++++++++++++++----------
 1 file changed, 34 insertions(+), 14 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 702dde790..f0fc8ac74 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -209,36 +209,56 @@ class key_press_handler_t
 {
 public:
     key_press_handler_t( bool interactive ) : key_press_( interactive ) {}
-    
+
     void update( boost::posix_time::ptime t )
     {
-        boost::optional< char > c = key_press_.read();
-        if( !c ) { return; }
-        switch( *c )
+        key k = get_key();
+        switch( k )
         {
-            case ' ':
+            case key::space:
                 if( playback.is_running() ) { playback.pause( t ); }
                 else { playback.run(); }
                 break;
-            case 27:                    // escape sequence for arrows: ESC-[
-                c = key_press_.read();
-                if( !c || *c != 91 ) { return; }
-                c = key_press_.read();
-                if( !c ) { return; }
-                if( *c == 66 || *c == 67 ) { playback.read_once(); } // down or right arrow
+            case key::down_arrow:
+            case key::right_arrow:
+                playback.read_once();
                 break;
-            case 'q':
+            case key::q:
                 quit = true;
                 break;
-            case 't':
+            case key::t:
                 std::cerr << boost::posix_time::to_iso_string( t ) << std::endl;
                 break;
-            default:
+            case key::none:
+            case key::other:
                 break;
         }
     }
     
 private:
+    enum class key { none, space, right_arrow, down_arrow, q, t, other };
+
+    key get_key()
+    {
+        boost::optional< char > c = key_press_.read();
+        if( !c ) { return key::none; }
+        switch( *c )
+        {
+            case ' ': return key::space;
+            case 'q': return key::q;
+            case 't': return key::t;
+            case 27:                    // escape sequence for arrows: ESC-[
+                c = key_press_.read();
+                if( !c || *c != 91 ) { break; }
+                c = key_press_.read();
+                if( !c ) { break; }
+                if( *c == 66 ) { return key::down_arrow; }
+                if( *c == 67 ) { return key::right_arrow; }
+                break;
+        }
+        return key::other;
+    }
+
     class key_press_t_
     {
     public:

From 14964cd95386e011b019f5bf282d323f650f29c0 Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Mon, 12 Aug 2019 17:13:24 +1000
Subject: [PATCH 0386/1056] csv-play: added --pause-at option

---
 csv/applications/csv-play.cpp | 22 ++++++++++++++++++----
 1 file changed, 18 insertions(+), 4 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index f0fc8ac74..9fce41843 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -104,6 +104,7 @@ static void usage( bool )
     interactive_help( "    --interactive,-i: " );
     std::cerr << "    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )" << std::endl;
     std::cerr << "    --paused-at-start,--paused: start playback as paused, implies --interactive" << std::endl;
+    std::cerr << "    --pause-at=[<timestamp>]; pause when timestamp reached, implies --interactive" << std::endl;
     std::cerr << "    --resolution=<second>: timestamp resolution; timestamps closer than this value will be" << std::endl;
     std::cerr << "                           played without delay; the rationale is that microsleep used in csv-play" << std::endl;
     std::cerr << "                           (boost::this_thread::sleep()) is essentially imprecise and may create" << std::endl;
@@ -318,7 +319,7 @@ int main( int argc, char** argv )
         std::string to = options.value< std::string>( "--to", "" );
         bool quiet =  options.exists( "--quiet" );
         bool flush =  !options.exists( "--no-flush" );
-        std::vector< std::string > configstrings = options.unnamed( "--verbose,-v,--interactive,-i,--paused,--paused-at-start,--quiet,--flush,--no-flush","--slow,--slowdown,--speed,--resolution,--binary,--fields,--clients,--from,--to" );
+        std::vector< std::string > configstrings = options.unnamed( "--verbose,-v,--interactive,-i,--paused,--paused-at-start,--quiet,--flush,--no-flush","--pause-at,--slow,--slowdown,--speed,--resolution,--binary,--fields,--clients,--from,--to" );
         if( configstrings.empty() ) { configstrings.push_back( "-;-" ); }
         comma::csv::options csv( argc, argv );
         csv.full_xpath = false;
@@ -332,11 +333,24 @@ int main( int argc, char** argv )
         if( !to.empty() ) { totime = boost::posix_time::from_iso_string( to ); }
         multiplay.reset( new comma::Multiplay( sourceConfigs, speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int>( resolution * 1000000 )), fromtime, totime, flush ));
         if( options.exists( "--paused,--paused-at-start" )) { playback.pause(); }
-        key_press_handler_t key_press_handler( options.exists( "--interactive,-i" ) || options.exists( "--paused,--paused-at-start" ));
+        boost::optional< boost::posix_time::ptime > pause_at_timestamp = boost::make_optional( options.exists( "--pause-at" ), boost::posix_time::from_iso_string( options.value< std::string >( "--pause-at" )));
+        key_press_handler_t key_press_handler(  options.exists( "--interactive,-i" )
+                                             || options.exists( "--paused,--paused-at-start" )
+                                             || options.exists( "--pause-at" ));
         while( !shutdown_flag && !quit && std::cout.good() )
         {
-            key_press_handler.update( multiplay->now() );
-            if( playback.is_paused() ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); continue; }
+            boost::posix_time::ptime now = multiplay->now();
+            key_press_handler.update( now );
+            if( pause_at_timestamp && !now.is_not_a_date_time() && *pause_at_timestamp < now )
+            {
+                playback.pause( now );
+                pause_at_timestamp = boost::none;
+            }
+            if( playback.is_paused() )
+            {
+                boost::this_thread::sleep( boost::posix_time::millisec( 200 ) );
+                continue;
+            }
             if( !multiplay->read() ) { break; }
             playback.has_read_once();
         }

From 4b190170d5e1edcbb4a8ee35f6cf6979f621569d Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Tue, 13 Aug 2019 16:57:17 +1000
Subject: [PATCH 0387/1056] csv-play: fixed bug with --pause-at option

---
 csv/applications/csv-play.cpp | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 9fce41843..8e9a6542a 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -333,7 +333,9 @@ int main( int argc, char** argv )
         if( !to.empty() ) { totime = boost::posix_time::from_iso_string( to ); }
         multiplay.reset( new comma::Multiplay( sourceConfigs, speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int>( resolution * 1000000 )), fromtime, totime, flush ));
         if( options.exists( "--paused,--paused-at-start" )) { playback.pause(); }
-        boost::optional< boost::posix_time::ptime > pause_at_timestamp = boost::make_optional( options.exists( "--pause-at" ), boost::posix_time::from_iso_string( options.value< std::string >( "--pause-at" )));
+        boost::optional< std::string > pause_at_option = options.optional< std::string >( "--pause-at" );
+        boost::optional< boost::posix_time::ptime > pause_at_timestamp;
+        if( pause_at_option ) { pause_at_timestamp = boost::posix_time::from_iso_string( *pause_at_option ); }
         key_press_handler_t key_press_handler(  options.exists( "--interactive,-i" )
                                              || options.exists( "--paused,--paused-at-start" )
                                              || options.exists( "--pause-at" ));

From b27b1b790f2f407f340598f041eddfec3e8e43dd Mon Sep 17 00:00:00 2001
From: dave <dave@acfr.usyd.edu.au>
Date: Tue, 13 Aug 2019 18:04:14 +1000
Subject: [PATCH 0388/1056] csv-play: remove compilation warning

---
 csv/applications/csv-play.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 8e9a6542a..8e618a287 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -334,7 +334,7 @@ int main( int argc, char** argv )
         multiplay.reset( new comma::Multiplay( sourceConfigs, speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int>( resolution * 1000000 )), fromtime, totime, flush ));
         if( options.exists( "--paused,--paused-at-start" )) { playback.pause(); }
         boost::optional< std::string > pause_at_option = options.optional< std::string >( "--pause-at" );
-        boost::optional< boost::posix_time::ptime > pause_at_timestamp;
+        boost::optional< boost::posix_time::ptime > pause_at_timestamp = boost::make_optional< boost::posix_time::ptime >( false, boost::posix_time::not_a_date_time );
         if( pause_at_option ) { pause_at_timestamp = boost::posix_time::from_iso_string( *pause_at_option ); }
         key_press_handler_t key_press_handler(  options.exists( "--interactive,-i" )
                                              || options.exists( "--paused,--paused-at-start" )

From 590250aedf3acb09155859f22b60149ce6c5e56b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 16 Mar 2021 16:53:33 +1100
Subject: [PATCH 0389/1056] application::command_line_options::assert_exists()
 implemented

---
 application/command_line_options.cpp | 2 ++
 application/command_line_options.h   | 3 +++
 2 files changed, 5 insertions(+)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 42a406177..31872993a 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -177,6 +177,8 @@ void command_line_options::assert_mutually_exclusive( const std::string& names )
     }
 }
 
+void command_line_options::assert_exists( const std::string& names ) const { if( !exists( names ) ) { COMMA_THROW( comma::exception, "please specify one of the following: " << names  ); } }
+
 void command_line_options::assert_mutually_exclusive( const std::string& first, const std::string& second ) const
 {
     const std::vector< std::string >& v = comma::split( first, ',' );
diff --git a/application/command_line_options.h b/application/command_line_options.h
index 8fbdf1dff..10fff8d41 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -124,6 +124,9 @@ class command_line_options
         
         /// throw, if at least one option from each set is present
         void assert_mutually_exclusive( const std::string& first, const std::string& second ) const;
+        
+        /// throw, if not at least one of options in the list exists, trivial convenience method
+        void assert_exists( const std::string& comma_separated_names ) const;
 
         /// description
         struct description

From d4228b49805e4f8e3451fda970d1031e67a4a995 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 20 May 2021 10:57:02 +1000
Subject: [PATCH 0390/1056] io-topics: replaced deprecated csv-size with
 "csv-format size"

---
 io/applications/io-topics | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 3c6a218d6..1229e76f5 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -279,7 +279,7 @@ function set_topic_variables()
     eval "$( ${operation}_topic_fields | comma_path_mangle | sed 's#^#unset topic_#' )" # todo: quick and dirty, watch performance
     eval "$( grep $topic <<< "$config" | grep -v "^$topic/command" | sed "s#^$topic/#topic/#" | comma_path_value_mangle )"
     topic_command="$( grep ^$topic/command <<< "$master_config" | cut -d= -f1 --complement | sed -e 's#^"##' -e 's#"$##'  )" # quick and dirty
-    if [[ -n "$topic_binary" ]]; then size_option="--size $( csv-size $topic_binary )"
+    if [[ -n "$topic_binary" ]]; then size_option="--size $( echo $topic_binary | csv-format size )"
     elif [[ -n "$topic_size" ]]; then size_option="--size $topic_size"
     else unset size_option; fi
 }

From 5e8235e9594bd503fc193fa65f98584717b8b35c Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 24 May 2021 10:13:33 +1000
Subject: [PATCH 0391/1056] csv-thin: minor whitespace cleanup in help

---
 csv/applications/csv-thin.cpp | 2 --
 1 file changed, 2 deletions(-)

diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index e9ce3d778..f65ae9848 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -75,14 +75,12 @@ static void usage( bool verbose = false )
     std::cerr << std::endl;
     std::cerr << "csv options" << std::endl;
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
-    std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    output 70% of data:          cat full.csv | csv-thin 0.7" << std::endl;
     std::cerr << "    output once every 2 seconds: cat full.csv | csv-thin --period 2" << std::endl;
     std::cerr << "    using timestamp from input:  cat full.csv | csv-thin --period 2 --fields t" << std::endl;
     std::cerr << "    binary data:                 cat full.bin | csv-thin 0.1 --binary 3d" << std::endl;
     std::cerr << std::endl;
-    std::cerr << std::endl;
     exit( 1 );
 }
 

From c0eb01c3b592289c2441fc8c257e84b4612c84f9 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 24 May 2021 10:14:14 +1000
Subject: [PATCH 0392/1056] csv-thin: honour --flush option when --fields
 option is used

---
 csv/applications/csv-thin.cpp | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index f65ae9848..a71e24183 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -161,6 +161,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         bool binary = options.exists( "--size,-s,--binary,-b" );
+        bool flush = options.exists( "--flush" );
         deterministic = options.exists( "--deterministic,-d" );
         invert = options.exists( "--invert,-i" );
         seed = options.optional< comma::uint32 >( "--seed" );
@@ -178,8 +179,12 @@ int main( int ac, char** av )
                 const timestamped* p = istream.read();
                 if( !p ) { break; }
                 if( skip_by_timestamp( p->timestamp ) != invert ) { continue; }
-                if( istream.is_binary()) { std::cout.write( istream.binary().last(), istream.binary().size() ); }
-                else { std::cout << comma::join( istream.ascii().last(), istream.ascii().ascii().delimiter() )<< std::endl; }
+                if( istream.is_binary())
+                {
+                    std::cout.write( istream.binary().last(), istream.binary().size() );
+                    if( flush ) { std::cout.flush(); }
+                }
+                else { std::cout << comma::join( istream.ascii().last(), istream.ascii().ascii().delimiter() ) << std::endl; }
             }
             return 0;
         }

From b5fa70a69dbf0a8b5a45d8edcf3f882c8012d425 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 28 May 2021 13:36:27 +1000
Subject: [PATCH 0393/1056] csv-random --seed made unsigned int

---
 csv/applications/csv-random.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 8e7789ee3..f295f55c7 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -20,7 +20,7 @@ static void usage( bool verbose )
     std::cerr << "random operations on input stream" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
-    std::cerr << "    --seed=[<int>]; random seed" << std::endl;
+    std::cerr << "    --seed=[<unsigned int>]; random seed" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
     std::cerr << "    make: output pseudo-random numbers" << std::endl;
@@ -443,7 +443,7 @@ int main( int ac, char** av )
         if( unnamed.empty() ) { std::cerr << "csv-random: please specify operation" << std::endl; return 1; }
         ::csv = comma::csv::options( options );
         std::cout.precision( ::csv.precision );
-        ::seed = options.optional< int >( "--seed" );
+        ::seed = options.optional< comma::uint32 >( "--seed" );
         ::verbose = options.exists( "--verbose,-v" );
         std::string operation = unnamed[0];
         if( operation == "make" ) { return comma::applications::random::make::run( options ); }

From c11c71b9acbd467e85c397e425293ee1f661b352 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 1 Jun 2021 20:34:27 +1000
Subject: [PATCH 0394/1056] io-topics: only show examples with --help --verbose

The examples are a bit overwhelming for a first look at the application.
---
 io/applications/io-topics | 15 +++++++++++++--
 1 file changed, 13 insertions(+), 2 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 1229e76f5..f46cb6aa1 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -52,6 +52,7 @@ EOF
 
 function usage()
 {
+    local verbose=$1
     cat >&2 <<eof
     
 a simple topic publisher supporting tcp, local sockets, and zero-mq (i.e. whatever io-publish supports)
@@ -76,6 +77,9 @@ $( log_options | sed 's/^/            /g' )
 common options
 $( common_options | sed 's/^/    /g' )
 
+eof
+    if (( verbose )); then
+        cat >&2 <<eof
 examples
     publish
         run publisher with topics a and b, with b on demand
@@ -136,8 +140,11 @@ examples
             > io-topics log --dir my-log --config <( echo "a/address=tcp:localhost:12345"; echo 'b/command=socat tcp:localhost:12346 - > log.csv' )
             > ls -al my-log/a
             > head my-log/b/log.csv
-
 eof
+    else
+        echo "use \"$scriptname --help --verbose\" for examples"
+    fi
+    echo
     exit 0
 }
 
@@ -378,7 +385,11 @@ function get_topics()
     verbose "topics: ${topics[@]}"
 }
 
-(( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )) && usage
+if (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )); then
+    (( $( comma_options_has --verbose "$@" ) || $( comma_options_has -v "$@" ) )) && verbose=1 || verbose=0
+    usage $verbose
+fi
+
 operation=$1
 [[ $( type -t ${operation}_topic_fields ) == "function" ]] || die "expected operation, got '$operation'" # quick and dirty
 (( $( comma_options_has --topic-fields "$@" ) )) && { ${operation}_topic_fields; exit 0; }

From 9a685b4e1e503655274d8484ab94c74075c84b8a Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 1 Jun 2021 22:13:46 +1000
Subject: [PATCH 0395/1056] io-topics: reflowed help to fit cleanly on 80
 character terminal

---
 io/applications/io-topics | 147 ++++++++++++++++++++++++--------------
 1 file changed, 94 insertions(+), 53 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index f46cb6aa1..121c2d6c3 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -40,13 +40,19 @@ source $( type -p comma-process-util ) || { echo "io-topics: could not source 'c
 function common_options()
 {
     cat <<EOF
---help,-h; display help and exit
---config=[<config>]; <config>: <dir>[:<path>], where <dir> is path to a json or path-value file specifying topic attributes, <path>: path inside config, multiple --config options allowed, configs will be applied in the reverse order of --config options on command line (see examples)
---dry-run,--dry; print final command and exit
---topics-from-all-configs,--all; take topics from all configs and topic command values, default: take topics and topic command values only from the first config ("master config")
---topic-fields; output topic config fields and exit
+--help,-h;           display help and exit
+--config=[<config>]; <config>: <dir>[:<path>], where <dir> is path to a
+                     json or path-value file specifying topic attributes,
+                     <path>: path inside config, multiple --config options
+                     allowed, configs will be applied in the reverse order
+                     of --config options on command line (see examples)
+--dry-run,--dry;     print final command and exit
+--topics-from-all-configs,--all; take topics from all configs and topic
+                     command values, default: take topics and topic command
+                     values only from the first config ("master config")
+--topic-fields;      output topic config fields and exit
 --topic-fields-help; output topic config fields help and exit
---verbose,-v; print verbose information
+--verbose,-v;        print verbose information
 EOF
 }
 
@@ -55,91 +61,122 @@ function usage()
     local verbose=$1
     cat >&2 <<eof
     
-a simple topic publisher supporting tcp, local sockets, and zero-mq (i.e. whatever io-publish supports)
+a simple topic publisher supporting tcp, local sockets, and zero-mq
+(i.e. whatever io-publish supports)
 
 usage: io-topics <operation> [<topics>] <options>
 
 todo: debug zero-mq support
 
 operations
-    cat: receive and handle data on given topics
-    
-    list: list topics
-    
-    log: log topics (todo)
-        options
-$( log_options | sed 's/^/            /g' )
-
-    play: play back logs, counterpart to log operation (todo)
-    
-    publish: start all the publishers listed on command line or in the config file (todo)
+    cat:     receive and handle data on given topics
+    list:    list topics
+    log:     log topics (todo)
+    play:    play back logs, counterpart to log operation (todo)
+    publish: start all the publishers listed on command line or config file (todo)
 
 common options
 $( common_options | sed 's/^/    /g' )
 
+log operation options
+$( log_options | sed 's/^/    /g' )
+
 eof
     if (( verbose )); then
         cat >&2 <<eof
 examples
-    publish
-        run publisher with topics a and b, with b on demand
-            > io-topics publish --config <( echo "a/command=csv-paste line-number"; echo "a/port=8888"; echo "b/command=csv-paste line-number"; echo "b/port=9999"; echo "b/on_demand=1" )
+    --- publish ---
+        run publisher with topics a and b, with b on demand:
+            $ io-topics publish --config <( sed 's/^ *//' <<EOF
+                  a/command=csv-paste line-number
+                  a/port=8888
+                  b/command=csv-paste line-number
+                  b/port=9999
+                  b/on_demand=1
+EOF
+)
             io-topics: will run 'comma_execute_and_wait --group' with commands:
-            io-topics:     io-publish tcp:8888   -- csv-paste line-number
-            io-topics:     io-publish tcp:9999  --on-demand -- csv-paste line-number
+            io-topics: io-publish tcp:8888   -- csv-paste line-number
+            io-topics: io-publish tcp:9999  --on-demand -- csv-paste line-number
         
-        in a different shell, observe that topic a keeps running even if no-one is listening, whereas topic b runs only if at least one client is connected:
-            > socat tcp:localhost:8888 | head -n5 # will output something like:
+        in a different shell, observe that topic a keeps running even if no-one
+        is listening, whereas topic b runs only if at least one client is
+        connected:
+            $ socat tcp:localhost:8888 - | head -n5    # outputs something like:
             16648534
             16648535
             16648536
             16648537
             16648538
-            
-            > socat tcp:localhost:9999 - | head -n5
+            $ socat tcp:localhost:9999 - | head -n5
             0
             1
             2
             3
             4
             
-        secondary address or port with --dry-run (try it without dry run)
-            > io-topics publish --config <( echo "a/command=csv-paste line-number"; echo "a/port=12345"; echo "b/command=csv-paste line-number"; echo "b/port=12346"; echo "b/secondary/port=8888"; echo "b/on_demand=1" ) --dry-run
-            io-topics: publish: will run 'comma_execute_and_wait --group' with commands:
-            io-topics: publish:     io-publish tcp:12345    -- csv-paste line-number
-            io-topics: publish:     io-publish tcp:12346 tcp:8888;secondary  --on-demand -- csv-paste line-number
-            
-    cat
-        run publisher
-            > io-topics publish --config <( echo "a/command=csv-paste line-number"; echo "a/port=12345"; echo "b/command=csv-paste line-number"; echo "b/port=12346"; echo "b/on_demand=1" )
-        
-        in a different shell, run clients
-            > io-topics cat --config <( echo "a/command=head -n5 | tee a.csv"; echo "a/address=tcp:localhost:12345"; echo "b/command=head -n5 | tee b.csv"; echo "b/address=tcp:localhost:12346" )
+        secondary address or port with --dry-run (try it without dry run):
+            $ io-topics publish --config <( sed 's/^ *//' <<EOF
+                  a/command=csv-paste line-number
+                  a/port=12345
+                  b/command=csv-paste line-number
+                  b/port=12346
+                  b/secondary/port=8888
+                  b/on_demand=1
+EOF
+) --dry-run
+            io-topics: publish: will run 'comma_execute_and_wait --group'
+                                with commands:
+            io-topics: publish: io-publish tcp:12345 -- csv-paste line-number
+            io-topics: publish: io-publish tcp:12346 tcp:8888;secondary
+                                           --on-demand -- csv-paste line-number
             
-        check output
-            > cat a.csv 
+    --- cat ---
+        run publisher:
+            $ io-topics publish --config <( sed 's/^ *//' <<EOF
+                  a/command=csv-paste line-number
+                  a/port=12345
+                  b/command=csv-paste line-number
+                  b/port=12346
+                  b/on_demand=1
+EOF
+)
+        in a different shell, run clients:
+            $ io-topics cat --config <( sed 's/^ *//' <<EOF
+                  a/command=head -n5 | tee a.csv
+                  a/address=tcp:localhost:12345
+                  b/command=head -n5 | tee b.csv
+                  b/address=tcp:localhost:12346
+EOF
+)
+        check output:
+            $ cat a.csv 
             203740462
             203740463
             203740464
             203740465
             203740466
-            > cat b.csv 
+            $ cat b.csv 
             0
             1
             2
             3
             4
             
-    log
-        run publisher as in previous examples and then run logging
-            > io-topics log --dir my-log --config <( echo "a/address=tcp:localhost:8888"; echo "b/address=tcp:localhost:9999" )
-            > ls -al my-log/a
-            > ls -al my-log/b
+    --- log ---
+        run publisher as in first example and then run logging:
+            $ io-topics log --dir my-log --config <(
+                  echo "a/address=tcp:localhost:8888"
+                  echo "b/address=tcp:localhost:9999" )
+            $ ls -al my-log/a
+            $ ls -al my-log/b
             
-        run publisher as in previous examples and then run logging with a custom command
-            > io-topics log --dir my-log --config <( echo "a/address=tcp:localhost:12345"; echo 'b/command=socat tcp:localhost:12346 - > log.csv' )
-            > ls -al my-log/a
-            > head my-log/b/log.csv
+        run publisher as in second example and then log with a custom command:
+            $ io-topics log --dir my-log --config <(
+                  echo "a/address=tcp:localhost:12345"
+                  echo 'b/command=socat tcp:localhost:12346 - > log.csv' )
+            $ ls -al my-log/a
+            $ head my-log/b/log.csv
 eof
     else
         echo "use \"$scriptname --help --verbose\" for examples"
@@ -258,8 +295,12 @@ eof
 function log_options()
 {
     cat <<eof
---log-dir,--dir=[<path>]; log directory, for each topic, actual log directory will be [<path>/]<dir>/<topic>, see io-topics log --topic-fields-help
---period=<seconds>; default=60; the log files will be split based on a given time period, settings for specific topic override this option
+--log-dir,--dir=[<path>]; log directory, for each topic, actual log
+                          directory will be [<path>/]<dir>/<topic>,
+                          see io-topics log --topic-fields-help
+--period=<seconds>;       default=60; the log files will be split based
+                          on a given time period, settings for specific
+                          topic override this option
 eof
 }
 

From 8f499049a19715da9f0c97be83b6ab99b861e15a Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 1 Jun 2021 22:17:38 +1000
Subject: [PATCH 0396/1056] io-topics: remove "todo" note from log and publish
 operations

---
 io/applications/io-topics | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 121c2d6c3..8e595601d 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -71,9 +71,9 @@ todo: debug zero-mq support
 operations
     cat:     receive and handle data on given topics
     list:    list topics
-    log:     log topics (todo)
+    log:     log topics
     play:    play back logs, counterpart to log operation (todo)
-    publish: start all the publishers listed on command line or config file (todo)
+    publish: start all the publishers listed on command line or config file
 
 common options
 $( common_options | sed 's/^/    /g' )

From fbbdc183086ea89bcebd15a7d6734dac20ced332 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 1 Jun 2021 22:26:26 +1000
Subject: [PATCH 0397/1056] io-topics: added bash completion

---
 etc/bash_completion.d/comma |  1 +
 io/applications/io-topics   | 11 +++++++++++
 2 files changed, 12 insertions(+)

diff --git a/etc/bash_completion.d/comma b/etc/bash_completion.d/comma
index 55fdd5d91..349dd15cf 100644
--- a/etc/bash_completion.d/comma
+++ b/etc/bash_completion.d/comma
@@ -141,3 +141,4 @@ complete -F _comma_bash_completion csv-repeat
 complete -F _comma_bash_completion csv-time-join
 complete -F _comma_bash_completion csv-units
 complete -F _comma_bash_completion io-bandwidth
+complete -F _comma_bash_completion io-topics
diff --git a/io/applications/io-topics b/io/applications/io-topics
index 8e595601d..458f60572 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -37,6 +37,15 @@ source $( type -p comma-process-util ) || { echo "io-topics: could not source 'c
 
 # todo: --master-config: default behaviour: first config; --guess-by command: all configs
 
+function bash_completion()
+{
+    echo "cat list log publish"
+    {
+        common_options
+        log_options
+    } | comma_options_to_bash_completion
+}
+
 function common_options()
 {
     cat <<EOF
@@ -426,6 +435,8 @@ function get_topics()
     verbose "topics: ${topics[@]}"
 }
 
+(( $( comma_options_has "--bash-completion" $@ ) )) && { bash_completion; exit 0; }
+
 if (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )); then
     (( $( comma_options_has --verbose "$@" ) || $( comma_options_has -v "$@" ) )) && verbose=1 || verbose=0
     usage $verbose

From fae7eb56d75bd14729e9165cb34ad0df7d338f15 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 1 Jun 2021 22:38:47 +1000
Subject: [PATCH 0398/1056] io-topics: derive topic_fields from
 topic_fields_help

---
 io/applications/io-topics | 45 ++++++---------------------------------
 1 file changed, 6 insertions(+), 39 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 458f60572..7fcaf644a 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -201,19 +201,11 @@ function die() { say "$@"; exit 1; }
 
 function list_topic_fields() { :; }
 
-function publish_topic_fields() # todo: flush field? flush is default behaviour in io-publish, which is inconsistent with log and cat operations and thus introducing flush in publish might be confusing
+# todo: flush field? flush is default behaviour in io-publish, which is inconsistent with
+# log and cat operations and thus introducing flush in publish might be confusing
+function publish_topic_fields()
 {
-    cat <<eof
-address
-binary
-command
-input
-on_demand
-port
-secondary/address
-secondary/port
-size
-eof
+    publish_topic_fields_help | cut -f1 -d';'
 }
 
 function publish_topic_fields_help()
@@ -233,17 +225,7 @@ eof
 
 function cat_topic_fields()
 {
-    cat <<eof
-address
-binary
-command
-connect_attempts
-connect_period
-flush
-host
-port
-size
-eof
+    cat_topic_fields_help | cut -f1 -d';'
 }
 
 function cat_topic_fields_help()
@@ -263,22 +245,7 @@ eof
 
 function log_topic_fields()
 {
-    cat <<eof
-address
-binary
-command
-connect_attempts
-connect_period
-flush
-host
-index
-path
-period
-port
-restart
-size
-suffix
-eof
+    log_topic_fields_help | cut -f1 -d';'
 }
 
 function log_topic_fields_help()

From f9306412e70b4256e1c04e1ae58f60d51a16cc14 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 1 Jun 2021 22:49:22 +1000
Subject: [PATCH 0399/1056] io-topics: laid out field descriptions in clearer
 way

---
 io/applications/io-topics | 69 ++++++++++++++++++++-------------------
 1 file changed, 36 insertions(+), 33 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 7fcaf644a..6991bc5c8 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -205,66 +205,69 @@ function list_topic_fields() { :; }
 # log and cat operations and thus introducing flush in publish might be confusing
 function publish_topic_fields()
 {
-    publish_topic_fields_help | cut -f1 -d';'
+    publish_topic_fields_help | grep -v '^ ' | cut -f1 -d';'
 }
 
 function publish_topic_fields_help()
 {
     cat <<eof
-address; if present, passed verbatim to io-publish, in this case port attribute ignored
-binary; if publisher publishes binary data, the binary format of the data, overrides size
-command; command for the publisher to run
-input; input topic for publish command to read on stdin
-on_demand; if present, same meaning as io-publish --on-demand
-port; tcp port for publishing, unless address field is present
-secondary/address; if present, passed verbatim to io-publish as '<address>;secondary', in this case port attribute ignored
-secondary/port; if present, secondary tcp port for publishing, unless address field is present, io-publish as 'tcp:<port>;secondary'
-size; if publisher publishes binary data, size of the binary record, if no binary attribute given
+address;           passed verbatim to io-publish, port attribute will be ignored
+binary;            for binary data, binary format of data, overrides size
+command;           command for the publisher to run
+input;             input topic for publish command to read on stdin
+on_demand;         same meaning as io-publish --on-demand
+port;              tcp port for publishing, unless address field is present
+secondary/address; passed verbatim to io-publish as '<address>;secondary',
+                   in this case port attribute ignored
+secondary/port;    secondary tcp port for publishing, unless address field is
+                   present, io-publish as 'tcp:<port>;secondary'
+size;              for binary data, size of the binary record
 eof
 }
 
 function cat_topic_fields()
 {
-    cat_topic_fields_help | cut -f1 -d';'
+    cat_topic_fields_help | grep -v '^ ' | cut -f1 -d';'
 }
 
 function cat_topic_fields_help()
 {
     cat <<eof
-address; if present, passed verbatim to io-cat, in this case port attribute ignored
-binary; if data is binary, the binary format of the data, overrides size
-command; command for the client to run
+address;          passed verbatim to io-cat, port attribute will be ignored
+binary;           if data is binary, binary format of data, overrides size
+command;          command for the client to run
 connect_attempts; number of connect attempts
-connect_period; time in seconds between connect attempts
-flush; flush output on each record, default: buffer output
-host; tcp host for publishing, unless address field is present
-port; tcp port for publishing, unless address field is present
-size; if if data is binary, size of the binary record, if no binary attribute given
+connect_period;   time in seconds between connect attempts
+flush;            flush output on each record, default: buffer output
+host;             tcp host for publishing, unless address field is present
+port;             tcp port for publishing, unless address field is present
+size;             if data is binary, size of the binary record
 eof
 }
 
 function log_topic_fields()
 {
-    log_topic_fields_help | cut -f1 -d';'
+    log_topic_fields_help | grep -v '^ ' | cut -f1 -d';'
 }
 
 function log_topic_fields_help()
 {
     cat <<eof
-address; if present, passed verbatim to io-cat, in this case port attribute ignored
-binary; if data is binary, the binary format of the data, overrides size
-command; optional command for the logger to run instead of default logger
+address;          passed verbatim to io-cat, in this case port attribute ignored
+binary;           if data is binary, binary format of data, overrides size
+command;          optional command for logger to run instead of default logger
 connect_attempts; number of connect attempts
-connect_period; time in seconds between connect attempts
-flush; flush output on each record, default: buffer output
-host; tcp host for publishing, unless address field is present
-index; optional command to generate index file, default: fixed-width binary index for each binary record, ascii: no index file
-path; prefix path for log directory (e.g. if logs need to be split across multiple drives)
-period; split log files on a given number of seconds, overrides --period
-port; tcp port for publishing, unless address field is present
-restart; if data stream disconnects keep trying to reconnect
-size; if if data is binary, size of the binary record, if no binary attribute given
-suffix; optional log file suffix, default: bin for binary, csv for ascii
+connect_period;   time in seconds between connect attempts
+flush;            flush output on each record, default: buffer output
+host;             tcp host for publishing, unless address field is present
+index;            optional command to generate index file, default: fixed-width
+                  binary index for each binary record, ascii: no index file
+path;             prefix path for log directory (to split logs across drives)
+period;           split log files at given number of seconds, overrides --period
+port;             tcp port for publishing, unless address field is present
+restart;          if data stream disconnects keep trying to reconnect
+size;             if data is binary, size of the binary record
+suffix;           optional log suffix, default: bin for binary, csv for ascii
 eof
 }
 

From 3d21b3d192a10a208a283a5eb3f69a7712c20e3e Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 1 Jun 2021 23:00:13 +1000
Subject: [PATCH 0400/1056] io-topics: added multiplier field option for publish
 operation

---
 io/applications/io-topics | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 6991bc5c8..b68b86e83 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -215,6 +215,7 @@ address;           passed verbatim to io-publish, port attribute will be ignored
 binary;            for binary data, binary format of data, overrides size
 command;           command for the publisher to run
 input;             input topic for publish command to read on stdin
+multiplier;        passed to io-publish
 on_demand;         same meaning as io-publish --on-demand
 port;              tcp port for publishing, unless address field is present
 secondary/address; passed verbatim to io-publish as '<address>;secondary',
@@ -318,8 +319,9 @@ function publish_command()
     [[ -n "$topic_address" ]] || topic_address="tcp:$topic_port"
     [[ -n "$topic_secondary_address" ]] || { [[ -z "$topic_secondary_port" ]] || topic_secondary_address="tcp:$topic_secondary_port"; }
     [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
+    if [[ -n "$topic_multiplier" ]]; then multiplier="--multiplier $topic_multiplier"; else unset multiplier; fi
     if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
-    local cmd="io-publish $topic_address $topic_secondary_address $size_option $on_demand -- "
+    local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand -- "
     if [[ -z "$topic_input" ]]; then cmd+="$topic_command"
     else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
     verbose "$cmd"

From 75f15f14ddbe42e7b8ff72d247a5ebc7cbcde7e0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 Jul 2021 12:48:16 +1000
Subject: [PATCH 0401/1056] bash/test/examples added

---
 bash/test/examples/expected | 4 ++++
 bash/test/examples/input    | 2 ++
 bash/test/examples/my-util  | 3 +++
 bash/test/examples/test     | 4 ++++
 bash/test/test              | 4 ++--
 5 files changed, 15 insertions(+), 2 deletions(-)
 create mode 100644 bash/test/examples/expected
 create mode 100644 bash/test/examples/input
 create mode 100644 bash/test/examples/my-util
 create mode 100755 bash/test/examples/test

diff --git a/bash/test/examples/expected b/bash/test/examples/expected
new file mode 100644
index 000000000..2027deaff
--- /dev/null
+++ b/bash/test/examples/expected
@@ -0,0 +1,4 @@
+hello/world/output="hello world"
+hello/world/status=0
+hello/jimmy/output="hello jimmy"
+hello/jimmy/status=0
\ No newline at end of file
diff --git a/bash/test/examples/input b/bash/test/examples/input
new file mode 100644
index 000000000..e58f29871
--- /dev/null
+++ b/bash/test/examples/input
@@ -0,0 +1,2 @@
+hello/world="some-function world"
+hello/jimmy="some-function jimmy"
\ No newline at end of file
diff --git a/bash/test/examples/my-util b/bash/test/examples/my-util
new file mode 100644
index 000000000..b27a99881
--- /dev/null
+++ b/bash/test/examples/my-util
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+function some-function() { echo "hello $1"; }
\ No newline at end of file
diff --git a/bash/test/examples/test b/bash/test/examples/test
new file mode 100755
index 000000000..d692563aa
--- /dev/null
+++ b/bash/test/examples/test
@@ -0,0 +1,4 @@
+#!/bin/bash
+source $( type -p comma-test-util ) # test framework stuff
+source my-util # bash utils under test
+comma_test_commands # execute tests defined in file called 'input' and match output agains values in file called 'expected'
diff --git a/bash/test/test b/bash/test/test
index 639918470..bff14d7ad 100755
--- a/bash/test/test
+++ b/bash/test/test
@@ -1,3 +1,3 @@
 #!/bin/bash
-source $( type -p comma-test-util )
-comma_test_commands
+source $( type -p comma-test-util ) # test framework stuff
+comma_test_commands # execute tests defined in file called 'input' and match output agains values in file called 'expected'

From f2346f3ac4dd9d358f38e509f716f6688cb2e1fc Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 8 Jul 2021 13:02:47 +1000
Subject: [PATCH 0402/1056] io-publish: minor tweak to verbose message

---
 io/applications/io-publish.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 703fa2320..33f014d2d 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -334,7 +334,7 @@ class command
 
         ~command()
         {
-            comma::verbose << "killing child pid " << child_pid_ << " for " << command_ << "..." << std::endl;
+            comma::verbose << "sending SIGTERM to " << comma::split( command_ )[0] << " (pid " << child_pid_ << ")..." << std::endl;
             ::kill( -child_pid_, SIGTERM );
             comma::verbose << "waiting for pid " << child_pid_ << "..." << std::endl;
             if( ::waitpid( -child_pid_, NULL, 0 ) < 0 ) { comma::verbose << "warning: waiting for pid " << child_pid_ << " failed" << std::endl; }

From 19fcd0eb9b8b13c93859111c94db51454a682423 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 8 Jul 2021 13:03:18 +1000
Subject: [PATCH 0403/1056] io-publish: explicitly close file descriptor before
 killing child

When the child is a ROS application outputting a high-bandwidth stream, an
issue occurs where the application hangs in the write() call and doesn't
respond to signals. Explicitly closing the file descriptor before killing the
child seems to fix this condition. ROS signal handling is a little weird.
---
 io/applications/io-publish.cpp | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 33f014d2d..1ad5e92c1 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -334,6 +334,8 @@ class command
 
         ~command()
         {
+            comma::verbose << "closing file descriptor " << fd_ << " for " << comma::split( command_ )[0] << "..." << std::endl;
+            ::close( fd_ );
             comma::verbose << "sending SIGTERM to " << comma::split( command_ )[0] << " (pid " << child_pid_ << ")..." << std::endl;
             ::kill( -child_pid_, SIGTERM );
             comma::verbose << "waiting for pid " << child_pid_ << "..." << std::endl;

From 7f77451c0490ec0f10fbd39a460c6d37ba07fae2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 4 Aug 2021 15:59:59 +1000
Subject: [PATCH 0404/1056] csv-eval: installed as entry point (might have
 broken packaging; check later...); pip used for python installation

---
 python/CMakeLists.txt                     | 10 ++++--
 python/comma/csv/applications/__init__.py |  2 ++
 python/comma/csv/applications/csv-eval    | 38 -----------------------
 python/comma/csv/applications/csv_eval.py | 13 +++-----
 python/setup.py                           | 15 +++++----
 5 files changed, 22 insertions(+), 56 deletions(-)
 delete mode 100644 python/comma/csv/applications/csv-eval

diff --git a/python/CMakeLists.txt b/python/CMakeLists.txt
index 2777db060..d1422ee65 100644
--- a/python/CMakeLists.txt
+++ b/python/CMakeLists.txt
@@ -79,11 +79,15 @@ set_python_build_lib_directory()
 ADD_SUBDIRECTORY( comma )
 
 ADD_CUSTOM_TARGET( python_build ALL
-                ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE}
-                WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )
+                   ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE}
+                   WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )
+
+#INSTALL( CODE "EXECUTE_PROCESS(
+#                    COMMAND ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE} install ${INSTALL_PREFIX_OPTION} --force
+#                    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
 
 INSTALL( CODE "EXECUTE_PROCESS(
-                    COMMAND ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE} install ${INSTALL_PREFIX_OPTION} --force
+                    COMMAND ${PYTHON} -m pip install ${CMAKE_CURRENT_SOURCE_DIR} --ignore-installed
                     WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
 
 SET_DIRECTORY_PROPERTIES( PROPERTIES ADDITIONAL_MAKE_CLEAN_FILES build )
diff --git a/python/comma/csv/applications/__init__.py b/python/comma/csv/applications/__init__.py
index 0cff88821..6cf509948 100644
--- a/python/comma/csv/applications/__init__.py
+++ b/python/comma/csv/applications/__init__.py
@@ -26,3 +26,5 @@
 # WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+from . import csv_eval
\ No newline at end of file
diff --git a/python/comma/csv/applications/csv-eval b/python/comma/csv/applications/csv-eval
deleted file mode 100644
index 340655a02..000000000
--- a/python/comma/csv/applications/csv-eval
+++ /dev/null
@@ -1,38 +0,0 @@
-#!/usr/bin/python
-# todo: once fully ported to python3: !/usr/bin/env python
-
-# This file is part of comma, a generic and flexible library
-# Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-from comma.csv.applications import csv_eval
-import sys, signal
-try:
-    csv_eval.main()
-except KeyboardInterrupt:
-    sys.exit( 128 + signal.SIGINT )
diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index 0ca4f909e..06f8f7d6d 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -1,17 +1,10 @@
 # Copyright (c) 2011 The University of Sydney
 
 from __future__ import print_function
-import argparse
-import ast
-import itertools
-import numpy as np
-import os
-import re
-import signal
-import sys
+import argparse, ast, itertools, numpy as np, os, re, signal, sys
 if sys.version_info.major < 3: from itertools import izip
 else: izip = zip # todo! watch performance! it's reported python3 zip is some 30% slower than izip
-import comma
+import comma # should not it be a relative path?
 
 description = """
 evaluate numerical expressions and append computed values to csv stream
@@ -588,6 +581,8 @@ def main():
         name = os.path.basename(sys.argv[0])
         print( "{} error: {}".format(name, e), file = sys.stderr )
         sys.exit(1)
+    except KeyboardInterrupt:
+        sys.exit(128 + signal.SIGINT)
     except Exception as e: #except StandardError as e:
         import traceback
         traceback.print_exc(file=sys.stderr)
diff --git a/python/setup.py b/python/setup.py
index 08cddec68..df6606515 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -1,10 +1,9 @@
 #!/usr/bin/env python
 
-from distutils.core import setup
-#from setuptools import setup
+import setuptools #from distutils.core import setup
 import comma.version
 
-setup(
+setuptools.setup(
         name                = 'python3-comma', # quick and dirty to make python packaging work
         version             = comma.version.__version__,
         classifiers = [
@@ -19,14 +18,18 @@
           'Topic :: Communications :: Email'
         ],
         description         = 'comma python utilities',
-        #install_requires    = [ 'numpy' ],
         url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
         long_description    = 'comma python utilities for offline and streamed csv and fixed width data',
         maintainer          = 'vsevolod vlaskine',
         maintainer_email    = 'vsevolod.vlaskine@gmail.com',
+        python_requires     = '>=3.6',
+        install_requires    = ['numpy'], # todo?
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
-        package_dir         = { 'comma.cpp_bindings': 'comma/cpp_bindings' },
+        package_dir         = { 'comma': 'comma', 'comma.cpp_bindings': 'comma/cpp_bindings' },
         package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] },
-        scripts             = [ "comma/csv/applications/csv-eval" ]
+        entry_points        = { 'console_scripts': ['csv-eval=comma.csv.applications.csv_eval:main'] },
+        #scripts             = [ "comma/csv/applications/csv-eval" ]
      )
+
+# "console_scripts": [ 'sxm-detect=jfab.stm.imaging.scripts.sxm_detect:main'

From 89f2b9aca1267b844dd2a15a18e912881b4e83a6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 9 Sep 2021 19:00:10 +1000
Subject: [PATCH 0405/1056] csv-sort: --help: --last marked as todo

---
 csv/applications/csv-sort.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index d896aedc3..2072328f8 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -68,7 +68,7 @@ static void usage( bool more )
     std::cerr << "           fields" << std::endl;
     std::cerr << "               id: if present, multiple id fields accepted; output first record for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;
     std::cerr << "               block: if present; output minimum for each contiguous block" << std::endl;
-    std::cerr << "    --last: last line matching given keys; last line in the block, if block field present; no sorting will be done; if sorting required, use unique instead" << std::endl;
+    std::cerr << "    --last: to be implemented: last line matching given keys; last line in the block, if block field present; no sorting will be done; if sorting required, use unique instead" << std::endl;
     std::cerr << "    --min: output only record(s) with minimum value for a given field" << std::endl;
     std::cerr << "           fields" << std::endl;
     std::cerr << "               id: if present, multiple id fields accepted; output minimum for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;

From 2675e810c36e3a8e9d0a5157dcc9594feebc7d12 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 9 Sep 2021 19:16:34 +1000
Subject: [PATCH 0406/1056] csv-sort: --last: now exits with todo message

---
 csv/applications/csv-sort.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index 2072328f8..b6a3a8d73 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -759,6 +759,7 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--min,--sliding-window,--window,--unique,--random" );
         options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--max,--sliding-window,--window,--unique,--random" );
+        if( options.exists( "--last" ) ) { std::cerr << "csv-sort: --last: not implemented; todo" << std::endl; return 1; }
         verbose = options.exists( "--verbose,-v" );
         csv = comma::csv::options( options );
         return   options.exists( "--first,--min,--max" )

From 3712698e694460da85a0d2f24b68dc88f8b649f9 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 30 Sep 2021 21:40:23 +1000
Subject: [PATCH 0407/1056] csv-bits: to-csv: implemented; debugging...

---
 csv/applications/csv-bits.cpp | 168 ++++++++++++++++++++++++++++++++++
 1 file changed, 168 insertions(+)
 create mode 100644 csv/applications/csv-bits.cpp

diff --git a/csv/applications/csv-bits.cpp b/csv/applications/csv-bits.cpp
new file mode 100644
index 000000000..4095a58e2
--- /dev/null
+++ b/csv/applications/csv-bits.cpp
@@ -0,0 +1,168 @@
+#include <array>
+#include <memory>
+#include <numeric>
+#include <vector>
+#include "../../application/command_line_options.h"
+#include "../../base/exception.h"
+#include "../../base/types.h"
+#include "../../string/string.h"
+#include "../stream.h"
+#include "../traits.h"
+
+void usage( bool )
+{
+    std::cerr << "converting between bits and csv and other bit operations" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: cat input.bin | csv-bits <operation> <options> > output.bin" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations: from-csv (unpack), to-csv (pack)" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations" << std::endl;
+    std::cerr << "    from-csv (pack): todo; convert csv to packed bits" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --endian=<which>; default=big; endianness of input: big or little" << std::endl;
+    std::cerr << "            --sizes=<sizes>; comma-separated bit field sizes (todo: support multiplier)" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    to-csv (unpack): todo; convert packed bits to csv" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --endian=<which>; default=big; endianness of output: big or little" << std::endl;
+    std::cerr << "            --sizes=<sizes>; comma-separated bit field sizes (todo: support multiplier)" << std::endl;
+    std::cerr << std::endl;
+    exit( 0 );
+}
+
+// todo
+//   - document on gitlab
+//   - to-csv
+//     - unit test
+//     - support uint64
+//   - from-csv
+//   - use constexpr
+
+namespace comma { namespace csv_bits {
+
+struct unpacked
+{
+    std::vector< comma::uint32 > values;
+    unpacked( unsigned int size = 0 ): values( size, 0 ) {}
+};
+
+struct field
+{
+    unsigned int begin;
+    unsigned int begin_byte;
+    char begin_mask;
+    unsigned int size;
+    unsigned int bytes;
+    unsigned int shift;
+    bool little_endian;
+
+    static std::array< comma::uint32, 32 > begin_masks;
+
+    field() = default;
+    field( unsigned int begin, unsigned int size, bool little_endian )
+        : begin( begin )
+        , begin_byte( begin / 8 )
+        , begin_mask( begin_masks[ begin % 8 ] )
+        , size( size )
+        , bytes( size % 8 + int( size % 8 > 0 ) )
+        , shift( 64 - begin % 8 - size )
+        , little_endian( little_endian )
+    {
+        if( size > sizeof( comma::uint32 ) * 8 ) { COMMA_THROW( comma::exception, "expected size up to " << ( sizeof( comma::uint32 ) * 8 ) << " bits; got: " << size ); }
+    }
+
+    comma::uint32 get( const std::vector< char >& buf ) const // todo: quick and dirty, watch performance
+    {
+        comma::uint64 r = 0;
+        char* p = reinterpret_cast< char* >( &r );
+        std::memcpy( p, &buf[ begin_byte ], bytes );
+        p[0] &= begin_mask;
+        r >>= shift;
+        if( !little_endian )
+        {
+            // todo
+        }
+        return r;
+    }
+};
+
+std::array< comma::uint32, 32 > field::begin_masks = { 255, 127, 63, 31, 15, 7, 3, 1 }; // todo: use constexpr
+
+} } // namespace comma { namespace csv_bits {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::csv_bits::unpacked >
+{
+    template < typename K, typename V > static void visit( const K&, const comma::csv_bits::unpacked& p, V& v ) { v.apply( "values", p.values ); }
+    template < typename K, typename V > static void visit( const K&, comma::csv_bits::unpacked& p, V& v ) { v.apply( "values", p.values ); }
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace csv_bits { namespace from_csv {
+
+int run( const comma::command_line_options& options )
+{
+    #ifdef WIN32
+        _setmode( _fileno( stdout ), _O_BINARY );
+    #endif
+    comma::csv::options csv( options );
+    std::cerr << "csv-bits: from-csv: todo" << std::endl;
+    return 1;
+}
+
+} } } // namespace comma { namespace csv_bits { namespace from_csv {
+
+namespace comma { namespace csv_bits { namespace to_csv {
+
+int run( const comma::command_line_options& options )
+{
+    #ifdef WIN32
+        _setmode( _fileno( stdin ), _O_BINARY );
+    #endif
+    comma::csv::options csv( options );
+    if( !csv.flush ) { std::cin.tie( NULL ); }
+    const auto& sizes = comma::split_as< unsigned int >( options.value< std::string >( "--sizes" ), ',' );
+    unsigned int size = std::accumulate( sizes.begin(), sizes.end(), 0 );
+    if( size % 8 > 0 ) { std::cerr << "csv-bits: to-csv: expected input record size in bits divisible by 8; got: " << size << " (oddly-sized record support: todo)" << std::endl; return 1; }
+    size /= 8;
+    bool little_endian = options.value< std::string >( "--endian", "big" ) == "little";
+    std::vector< std::pair< unsigned int, unsigned int > > indices;
+    std::vector< comma::csv_bits::field > fields;
+    unsigned int begin = 0;
+    for( auto s: sizes ) { fields.push_back( comma::csv_bits::field( begin, s, little_endian ) ); begin += s; }
+    std::vector< char > buf( size );
+    comma::csv_bits::unpacked output( sizes.size() );
+    comma::csv::output_stream< comma::csv_bits::unpacked > os( std::cout, csv, output );
+    while( std::cin.good() )
+    {
+        std::cin.read( &buf[0], size );
+        if( std::cin.gcount() <= 0 ) { break; }
+        if( std::cin.gcount() < size ) { std::cerr << "csv-bits: to-csv: expected " << size << " byte(s); got: " << std::cin.gcount() << std::endl; return 1; }
+        for( unsigned int i = 0; i < sizes.size(); ++i ) { output.values[i] = fields[i].get( buf ); }
+        os.write( output );
+    }
+    return 0;
+}
+
+} } } // namespace comma { namespace csv_bits { namespace to_csv {
+
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        const auto& unnamed = options.unnamed( "--flush, --verbose, -v", "-.*" );
+        if( unnamed.empty() ) { std::cerr << "csv-bits: please specify operation" << std::endl; return 1; }
+        if( unnamed.size() > 1 ) { std::cerr << "csv-bits: expected operation; got: " << comma::join( unnamed, ',' ) << std::endl; return 1; }
+        const std::string& operation = unnamed[0];
+        if( operation == "to-csv" || operation == "unpack" ) { return comma::csv_bits::to_csv::run( options ); }
+        if( operation == "from-csv" || operation == "pack" ) { return comma::csv_bits::from_csv::run( options ); }
+        std::cerr << "csv-bits: expected operation; got: \"" << operation << "\"" << std::endl;
+    }
+    catch( std::exception& ex ) { std::cerr << "csv-bits: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-bits: unknown exception" << std::endl; }
+    return 1;
+}

From 4abb34f5944cc29b99a23d1e82199d4970c9714a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 30 Sep 2021 21:56:37 +1000
Subject: [PATCH 0408/1056] csv-bits: to-csv: implemented; debugging...

---
 csv/applications/CMakeLists.txt |  5 +++++
 csv/applications/csv-bits.cpp   | 12 ++++++++----
 csv/applications/csv-cast.cpp   |  6 +++---
 3 files changed, 16 insertions(+), 7 deletions(-)

diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index a7073d5e1..fd2077b72 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -169,3 +169,8 @@ add_executable( csv-bin-reverse ${dir}/csv-bin-reverse.cpp )
 target_link_libraries ( csv-bin-reverse ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_xpath comma_csv )
 set_target_properties( csv-bin-reverse PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-bin-reverse RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
+add_executable( csv-bits ${dir}/csv-bits.cpp )
+target_link_libraries ( csv-bits ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_string )
+set_target_properties( csv-bits PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS csv-bits RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/csv/applications/csv-bits.cpp b/csv/applications/csv-bits.cpp
index 4095a58e2..2d467faa7 100644
--- a/csv/applications/csv-bits.cpp
+++ b/csv/applications/csv-bits.cpp
@@ -51,13 +51,13 @@ struct field
 {
     unsigned int begin;
     unsigned int begin_byte;
-    char begin_mask;
+    unsigned char begin_mask;
     unsigned int size;
     unsigned int bytes;
     unsigned int shift;
     bool little_endian;
 
-    static std::array< comma::uint32, 32 > begin_masks;
+    static std::array< unsigned char, 8 > begin_masks;
 
     field() = default;
     field( unsigned int begin, unsigned int size, bool little_endian )
@@ -65,11 +65,12 @@ struct field
         , begin_byte( begin / 8 )
         , begin_mask( begin_masks[ begin % 8 ] )
         , size( size )
-        , bytes( size % 8 + int( size % 8 > 0 ) )
+        , bytes( size / 8 + int( size % 8 > 0 ) )
         , shift( 64 - begin % 8 - size )
         , little_endian( little_endian )
     {
         if( size > sizeof( comma::uint32 ) * 8 ) { COMMA_THROW( comma::exception, "expected size up to " << ( sizeof( comma::uint32 ) * 8 ) << " bits; got: " << size ); }
+        //std::cerr << "--> a: begin: " << begin << " begin byte: " << begin_byte << " bytes: " << bytes << " size: " << size << " begin mask: " << ( unsigned int )begin_mask << " shift: " << shift << std::endl;
     }
 
     comma::uint32 get( const std::vector< char >& buf ) const // todo: quick and dirty, watch performance
@@ -77,8 +78,11 @@ struct field
         comma::uint64 r = 0;
         char* p = reinterpret_cast< char* >( &r );
         std::memcpy( p, &buf[ begin_byte ], bytes );
+        //std::cerr << "--> b: p[0]: " << int( p[0] ) << " r: " << r << std::endl;
         p[0] &= begin_mask;
+        //std::cerr << "--> c: p[0]: " << int( p[0] ) << " r: " << r << std::endl;
         r >>= shift;
+        //std::cerr << "--> d: r: " << r << std::endl;
         if( !little_endian )
         {
             // todo
@@ -87,7 +91,7 @@ struct field
     }
 };
 
-std::array< comma::uint32, 32 > field::begin_masks = { 255, 127, 63, 31, 15, 7, 3, 1 }; // todo: use constexpr
+std::array< unsigned char, 8 > field::begin_masks = { 255, 127, 63, 31, 15, 7, 3, 1 }; // todo: use constexpr
 
 } } // namespace comma { namespace csv_bits {
 
diff --git a/csv/applications/csv-cast.cpp b/csv/applications/csv-cast.cpp
index fcf3e1b3d..bec891db7 100644
--- a/csv/applications/csv-cast.cpp
+++ b/csv/applications/csv-cast.cpp
@@ -44,7 +44,7 @@
 
 static const std::string app_name = "csv-cast";
 
-static void usage()
+static void usage( bool verbose = false )
 {
     std::cerr << "reads binary in the given input format and writes binary in the given output format" << std::endl;
     std::cerr << std::endl;
@@ -76,6 +76,7 @@ static void usage()
     std::cerr << "        echo {0..9}.2345789,3.1415 | fmt -1 | csv-time-stamp | csv-to-bin s[22],s[10],s[6] | csv-cast s[22],s[10],s[6] t,2d | csv-from-bin t,2d" << std::endl;
     std::cerr << std::endl;
     std::cerr << std::endl;
+    exit(0);
 }
 
 static void check_conversions( const comma::csv::format& iformat, const comma::csv::format& oformat, const bool force )
@@ -255,8 +256,7 @@ int main( int ac, char** av )
 #endif
     try
     {
-        comma::command_line_options options( ac, av );
-        if( options.exists( "--help,-h" ) ) { usage(); return 0; }
+        comma::command_line_options options( ac, av, usage );
         if( ac < 3 ) { usage(); return 1; }
         comma::csv::format iformat( options.value< std::string >( "--binary,-b,--from", av[1] ) );
         comma::csv::format oformat( options.value< std::string >( "--output-binary,--output,-o,--to", av[2] ) );

From d8afdd3781b92dd45e617ec08077359aa157a386 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 30 Sep 2021 22:13:50 +1000
Subject: [PATCH 0409/1056] csv-bits: first cut kind of works; todo: test
 thoroughly...

---
 csv/applications/csv-bits.cpp | 21 ++++++++++-----------
 1 file changed, 10 insertions(+), 11 deletions(-)

diff --git a/csv/applications/csv-bits.cpp b/csv/applications/csv-bits.cpp
index 2d467faa7..009b3e2ac 100644
--- a/csv/applications/csv-bits.cpp
+++ b/csv/applications/csv-bits.cpp
@@ -1,3 +1,4 @@
+#include <endian.h>
 #include <array>
 #include <memory>
 #include <numeric>
@@ -18,14 +19,14 @@ void usage( bool )
     std::cerr << "operations: from-csv (unpack), to-csv (pack)" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
-    std::cerr << "    from-csv (pack): todo; convert csv to packed bits" << std::endl;
+    std::cerr << "    from-csv (pack): todo; convert csv to packed bits in big endian order" << std::endl;
     std::cerr << "        options" << std::endl;
-    std::cerr << "            --endian=<which>; default=big; endianness of input: big or little" << std::endl;
+    std::cerr << "            --endian=<which>; default=big; todo: endianness of input: big or little" << std::endl;
     std::cerr << "            --sizes=<sizes>; comma-separated bit field sizes (todo: support multiplier)" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    to-csv (unpack): todo; convert packed bits to csv" << std::endl;
+    std::cerr << "    to-csv (unpack): convert packed bits to csv; input bits are expected in big endian order" << std::endl;
     std::cerr << "        options" << std::endl;
-    std::cerr << "            --endian=<which>; default=big; endianness of output: big or little" << std::endl;
+    //std::cerr << "            --endian=<which>; default=big; todo: endianness of output: big or little" << std::endl;
     std::cerr << "            --sizes=<sizes>; comma-separated bit field sizes (todo: support multiplier)" << std::endl;
     std::cerr << std::endl;
     exit( 0 );
@@ -34,6 +35,7 @@ void usage( bool )
 // todo
 //   - document on gitlab
 //   - to-csv
+//     - sort out endianness: big endian vs transparent semantic use in the mainstream use case
 //     - unit test
 //     - support uint64
 //   - from-csv
@@ -81,13 +83,10 @@ struct field
         //std::cerr << "--> b: p[0]: " << int( p[0] ) << " r: " << r << std::endl;
         p[0] &= begin_mask;
         //std::cerr << "--> c: p[0]: " << int( p[0] ) << " r: " << r << std::endl;
-        r >>= shift;
-        //std::cerr << "--> d: r: " << r << std::endl;
-        if( !little_endian )
-        {
-            // todo
-        }
-        return r;
+        // todo: something like: r = little_endian ? le64toh( r ) : be64toh( r );
+        comma::uint64 s = htobe64( r ) >> shift;
+        //std::cerr << "--> d: s: " << s << std::endl;
+        return s;
     }
 };
 

From 3ccec0b206fb15a8c048358a7fc01be61a7e4f1e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 2 Oct 2021 00:56:28 +1000
Subject: [PATCH 0410/1056] csv-bits: --help --verbose added

---
 csv/applications/csv-bits.cpp | 20 +++++++++++---------
 1 file changed, 11 insertions(+), 9 deletions(-)

diff --git a/csv/applications/csv-bits.cpp b/csv/applications/csv-bits.cpp
index 009b3e2ac..b4c7edebc 100644
--- a/csv/applications/csv-bits.cpp
+++ b/csv/applications/csv-bits.cpp
@@ -10,7 +10,7 @@
 #include "../stream.h"
 #include "../traits.h"
 
-void usage( bool )
+void usage( bool verbose )
 {
     std::cerr << "converting between bits and csv and other bit operations" << std::endl;
     std::cerr << std::endl;
@@ -19,21 +19,27 @@ void usage( bool )
     std::cerr << "operations: from-csv (unpack), to-csv (pack)" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
-    std::cerr << "    from-csv (pack): todo; convert csv to packed bits in big endian order" << std::endl;
+    std::cerr << "    from-csv (pack): todo; convert input csv as to packed bits in big endian order" << std::endl;
     std::cerr << "        options" << std::endl;
-    std::cerr << "            --endian=<which>; default=big; todo: endianness of input: big or little" << std::endl;
+    //std::cerr << "            --endian=<which>; default=big; todo: endianness of input: big or little" << std::endl;
+    std::cerr << "            --binary,-b=[<format>]; input is binary; see details below" << std::endl;
+    std::cerr << "            --flush; see below" << std::endl;
     std::cerr << "            --sizes=<sizes>; comma-separated bit field sizes (todo: support multiplier)" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    to-csv (unpack): convert packed bits to csv; input bits are expected in big endian order" << std::endl;
+    std::cerr << "    to-csv (unpack): convert packed bits to integers as csv; input bits are expected in big endian order" << std::endl;
     std::cerr << "        options" << std::endl;
     //std::cerr << "            --endian=<which>; default=big; todo: endianness of output: big or little" << std::endl;
+    std::cerr << "            --binary,-b=[<format>]; output is binary; see details below" << std::endl;
+    std::cerr << "            --flush; see below" << std::endl;
     std::cerr << "            --sizes=<sizes>; comma-separated bit field sizes (todo: support multiplier)" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << std::endl;
     exit( 0 );
 }
 
 // todo
-//   - document on gitlab
 //   - to-csv
 //     - sort out endianness: big endian vs transparent semantic use in the mainstream use case
 //     - unit test
@@ -72,7 +78,6 @@ struct field
         , little_endian( little_endian )
     {
         if( size > sizeof( comma::uint32 ) * 8 ) { COMMA_THROW( comma::exception, "expected size up to " << ( sizeof( comma::uint32 ) * 8 ) << " bits; got: " << size ); }
-        //std::cerr << "--> a: begin: " << begin << " begin byte: " << begin_byte << " bytes: " << bytes << " size: " << size << " begin mask: " << ( unsigned int )begin_mask << " shift: " << shift << std::endl;
     }
 
     comma::uint32 get( const std::vector< char >& buf ) const // todo: quick and dirty, watch performance
@@ -80,12 +85,9 @@ struct field
         comma::uint64 r = 0;
         char* p = reinterpret_cast< char* >( &r );
         std::memcpy( p, &buf[ begin_byte ], bytes );
-        //std::cerr << "--> b: p[0]: " << int( p[0] ) << " r: " << r << std::endl;
         p[0] &= begin_mask;
-        //std::cerr << "--> c: p[0]: " << int( p[0] ) << " r: " << r << std::endl;
         // todo: something like: r = little_endian ? le64toh( r ) : be64toh( r );
         comma::uint64 s = htobe64( r ) >> shift;
-        //std::cerr << "--> d: s: " << s << std::endl;
         return s;
     }
 };

From 0fe5c3a5042b4c182ab1cb1646f07647ca7367ff Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 9 Feb 2022 22:06:32 +1100
Subject: [PATCH 0411/1056] io/applications/CMakeLists.txt: add xpath to
 io-publish libraries

fixes debug build failure introduced in commit 708e5688
---
 io/applications/CMakeLists.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/applications/CMakeLists.txt b/io/applications/CMakeLists.txt
index 98f71f174..152b00f28 100644
--- a/io/applications/CMakeLists.txt
+++ b/io/applications/CMakeLists.txt
@@ -39,7 +39,7 @@ if( NOT WIN32 )
     install( TARGETS io-ls RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
     add_executable( io-publish ${dir}/io-publish.cpp )
-    target_link_libraries( io-publish comma_base comma_io comma_application ) # profiler )
+    target_link_libraries( io-publish comma_base comma_io comma_application comma_xpath ) # profiler )
     set_target_properties( io-publish PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-publish RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 

From 89d4c780f424ee2a3029a0b43e5559a5e3ebba76 Mon Sep 17 00:00:00 2001
From: vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 3 Mar 2022 16:04:08 +1100
Subject: [PATCH 0412/1056] system/ansible: python-pip added

---
 system/ansible/install.python3.yml | 1 +
 system/ansible/install.yml         | 1 +
 2 files changed, 2 insertions(+)

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
index fcbe2c851..0076254e9 100644
--- a/system/ansible/install.python3.yml
+++ b/system/ansible/install.python3.yml
@@ -26,6 +26,7 @@
       - libgtest-dev
       - python3-dev
       - python3-numpy
+      - python3-pip
       - libprocps-dev
       - recode
       
diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index eed77cf05..517351dd2 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -26,6 +26,7 @@
       - libgtest-dev
       - python-dev
       - python-numpy
+      - python-pip
       - libprocps-dev
       - recode
 

From 4c1756eb9723b57f9255e758938e8e8756ab3ba1 Mon Sep 17 00:00:00 2001
From: vlaskine <vlaskine@yahoo.com>
Date: Mon, 14 Mar 2022 16:19:56 +1100
Subject: [PATCH 0413/1056] system/package/debian: typo fixed

---
 system/package/debian/comma-package-docker-build | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/system/package/debian/comma-package-docker-build b/system/package/debian/comma-package-docker-build
index 124fa69f3..424175d25 100755
--- a/system/package/debian/comma-package-docker-build
+++ b/system/package/debian/comma-package-docker-build
@@ -5,5 +5,5 @@ comma_dir="$2"
 [[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
 [[ -d "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly (since you seem to either run with sudo or have comma not in '$comma_dir')" >&2; exit 1; }
 echo "$0: running:" >&2
-echo "docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f '$comma_dir/system/package/Dockerfile' ." >&2
-docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/package/Dockerfile" .
+echo "docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f '$comma_dir/system/package/debian/Dockerfile' ." >&2
+docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/package/debian/Dockerfile" .

From ec49ae0c46e89155fbe65ec983e5ca7c00f4ba39 Mon Sep 17 00:00:00 2001
From: vlaskine <vlaskine@yahoo.com>
Date: Mon, 14 Mar 2022 16:37:52 +1100
Subject: [PATCH 0414/1056] system/package/debian: typo fixed

---
 system/package/debian/comma-package-docker-run | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/debian/comma-package-docker-run b/system/package/debian/comma-package-docker-run
index bab3b8d23..2f78a4953 100755
--- a/system/package/debian/comma-package-docker-run
+++ b/system/package/debian/comma-package-docker-run
@@ -13,4 +13,4 @@ docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$( pwd ),target=/root/output" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/package/comma-package-make $ubuntu_version $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
+       /mnt/comma/system/package/debian/comma-package-make $ubuntu_version $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }

From 171d999abfe4a75de81cce36d35c06b28b2113fc Mon Sep 17 00:00:00 2001
From: vlaskine <vlaskine@yahoo.com>
Date: Mon, 14 Mar 2022 16:57:38 +1100
Subject: [PATCH 0415/1056] system/package/debian: typo fixed

---
 system/package/debian/comma-package-make | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index fc4df215c..0fc522b06 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -22,7 +22,7 @@ esac
     echo "$0: setting up python in $( pwd )" >&2
     #python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
     echo "$0: running python3 setup.py ..." >&2
-    python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright --suite focal  || die "failed"
+    python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../COPYING --suite focal  || die "failed"
     # todo: mount gpg key
     # debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/python3-comma_1.0.0-1.dsc
     # mkdir tmp
@@ -32,7 +32,7 @@ esac
     # debuild -S -sa
     # dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes
     # ? debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 ../../deb_dist/python3-comma_1.0.0-1_source.changes
-    # 
+    #
     # ...
     echo "$0: building package..." >&2
     cd deb_dist/comma-$version_major.$version_minor.$version_patch || die "failed"

From 7e735ceaf5e35d5e5badd9754b42814fb8debe4b Mon Sep 17 00:00:00 2001
From: vlaskine <vlaskine@yahoo.com>
Date: Thu, 17 Mar 2022 16:40:07 +1100
Subject: [PATCH 0416/1056] csv-split --timestamps implemented

---
 csv/applications/csv-split.cpp   | 13 +++---
 csv/applications/split/split.cpp | 76 ++++++++++++++++++++++----------
 csv/applications/split/split.h   | 15 ++++++-
 3 files changed, 73 insertions(+), 31 deletions(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index 0372668ff..ca1dada76 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -49,10 +49,11 @@ static unsigned int size = 0;
 static bool passthrough;
 static std::string files;
 static std::string default_filename;
+static std::string timestamps;
 
 template < typename T > static void run()
 {
-    comma::csv::applications::split< T > split( duration, suffix, csv, streams, passthrough, files );
+    comma::csv::applications::split< T > split( duration, suffix, csv, streams, passthrough, files, default_filename, timestamps );
     if( size == 0 )
     {
         std::string line;
@@ -93,7 +94,8 @@ int main( int argc, char** argv )
             ( "size,c", boost::program_options::value< unsigned int >( &size ), "packet size, only full packets will be written" )
             ( "string", "id is string; default: 32-bit integer" )
             ( "suffix,s", boost::program_options::value< std::string >( &extension ), "filename extension; default will be csv or bin, depending whether it is ascii or binary" )
-            ( "time", "id is time; default: 32-bit integer" );
+            ( "time", "id is time; default: 32-bit integer" )
+            ( "timestamps", boost::program_options::value< std::string >( &timestamps ), "<filename>[;<csv options>]: split by timestamps (assuming both input and timestamps are in ascending order)" );
         description.add( comma::csv::program_options::description() );
         boost::program_options::variables_map vm;
         boost::program_options::store( boost::program_options::parse_command_line( argc, argv, description), vm );
@@ -162,17 +164,19 @@ int main( int argc, char** argv )
             return 0;
         }
         csv = comma::csv::program_options::get( vm );
+        if( vm.count( "period" ) && vm.count( "timestamps" ) ) { std::cerr << "csv-split: --period and --timestamps are mutually exclusive (todo? combine them? just ask)" << std::endl; return 1; }
         if( !default_filename.empty() ) { std::cerr << "csv-split: --default-filename: todo, just ask" << std::endl; }
         if( csv.binary() ) { size = csv.format().size(); }
         bool id_is_string = vm.count( "string" );
         bool id_is_time = vm.count( "time" );
-        passthrough = vm.count("passthrough");        
-        if( id_is_string && id_is_time ) { std::cerr << "csv-split: either --string or --time" << std::endl; }
+        passthrough = vm.count("passthrough");
+        if( id_is_string && id_is_time ) { std::cerr << "csv-split: --string and --time are mutually exclusive" << std::endl; return 1; }
         if( period > 0 ) { duration = boost::posix_time::microseconds( static_cast< unsigned int >( period * 1e6 )); }
         if( extension.empty() ) { suffix = csv.binary() || size > 0 ? ".bin" : ".csv"; }
         else { suffix += "."; suffix += extension; }
         streams = boost::program_options::collect_unrecognized( parsed.options, boost::program_options::include_positional );
         if( !streams.empty() && ( csv.has_field( "block" ) || id_is_time ) ) { std::cerr << "publisher streams are not compatible with splitting by block or timestamp." << std::endl; return 1; }
+        if( ( csv.has_field( "t" ) || csv.fields.empty() ) && !period && timestamps.empty() ) { COMMA_THROW( comma::exception, "got fields '" << csv.fields << "' meaning split by time; thus please specify either --period or --timestamps" ); }
         if( id_is_string ) { run< std::string >(); }
         else if( id_is_time ) { run< boost::posix_time::ptime >(); }
         else { run< comma::uint32 >(); }
@@ -182,4 +186,3 @@ int main( int argc, char** argv )
     catch( ... ) { std::cerr << argv[0] << ": unknown exception" << std::endl; }
     return 1;
 }
-
diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 056c82b0c..206e8248c 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -77,6 +77,12 @@ template < typename T > struct traits< comma::csv::applications::filename_record
     }
 };
 
+template <> struct traits< comma::csv::applications::timestamp >
+{
+    template< typename K, typename V > static void visit( const K&, comma::csv::applications::timestamp& t, V& v ) { v.apply( "t", t.t ); }
+    template< typename K, typename V > static void visit( const K&, const comma::csv::applications::timestamp& t, V& v ) { v.apply( "t", t.t ); }
+};
+
 } } // namespace comma { namespace visiting {
 
 namespace comma { namespace csv { namespace applications {
@@ -102,25 +108,53 @@ std::pair< std::unordered_map< comma::uint32, std::string >, bool > static filen
     if( r.first.empty() ) { COMMA_THROW( comma::exception, "got no filenames from '" << csv.filename << "'" ); }
     return r;
 }
-    
+
+template < typename T >
+void split< T >::timestamps_stream_make_( const std::string& timestamps )
+{
+    if( timestamps.empty() ) { return; }
+    auto csv = comma::name_value::parser( "filename", ';', '=', false ).get< comma::csv::options >( timestamps );
+    timestamps_ifstream_.reset( new std::ifstream( csv.filename ) );
+    if( !timestamps_ifstream_->is_open() ) { COMMA_THROW( comma::exception, "could not open --timestamps='" << csv.filename << "'" ); }
+    timestamps_.reset( new comma::csv::input_stream< csv::applications::timestamp >( *timestamps_ifstream_, csv ) );
+    auto p = timestamps_->read();
+    if( !p ) { COMMA_THROW( comma::exception, "could not read from --timestamps='" << csv.filename << "'" ); } // quick and dirty
+    timestamps_last_.second = p->t;
+    //std::cerr << "--> a: interval: " << boost::posix_time::to_iso_string( timestamps_last_.first ) << " - " << boost::posix_time::to_iso_string( timestamps_last_.second ) << std::endl;
+}
+
+template < typename T >
+bool split< T >::timestamps_stream_seek_( boost::posix_time::ptime t )
+{
+    bool changed = false;
+    while( t >= timestamps_last_.second && !timestamps_last_.second.is_pos_infinity() )
+    {
+        auto p = timestamps_->read();
+        timestamps_last_.first = timestamps_last_.second;
+        timestamps_last_.second = p ? p->t : boost::posix_time::pos_infin;
+        changed = true;
+    }
+    return changed;
+}
+
 template < typename T >
 split< T >::split( const boost::optional< boost::posix_time::time_duration >& period
                  , const std::string& suffix
                  , const comma::csv::options& csv
                  , bool pass
                  , const std::string& filenames
-                 , const std::string& default_filename )
+                 , const std::string& default_filename
+                 , const std::string& timestamps )
     : ofstream_( std::bind( &split< T >::ofstream_by_time_, this ) )
     , period_( period )
     , suffix_( suffix )
+    , timestamps_last_( boost::posix_time::neg_infin, boost::posix_time::not_a_date_time )
     , pass_ ( pass )
     , flush_( csv.flush )
     , is_shutdown_( false )
 {
-    if( ( csv.has_field( "t" ) || csv.fields.empty() ) && !period ) { COMMA_THROW( comma::exception, "please specify --period" ); }
     if( csv.fields.empty() ) { return; }
-    if( csv.binary() ) { binary_.reset( new comma::csv::binary< input >( csv ) ); }
-    else { ascii_.reset( new comma::csv::ascii< input >( csv ) ); }
+    if( csv.binary() ) { binary_.reset( new comma::csv::binary< input >( csv ) ); } else { ascii_.reset( new comma::csv::ascii< input >( csv ) ); }
     boost::tie( filenames_, filenames_have_id_ ) = applications::filenames( filenames );
     if( csv.has_field( "block" ) )
     {
@@ -128,15 +162,10 @@ split< T >::split( const boost::optional< boost::posix_time::time_duration >& pe
     }
     else
     {
-        if( csv.has_field( "id" ) )
-        { 
-            ofstream_ = std::bind( &split< T >::ofstream_by_id_, this );
-        }
-        else
-        {    
-            if( !filenames_.empty() ) { COMMA_THROW( comma::exception, "--files given, but no block field specified in --fields" ); }
-        }
+        if( csv.has_field( "id" ) ) { ofstream_ = std::bind( &split< T >::ofstream_by_id_, this ); }
+        else { if( !filenames_.empty() ) { COMMA_THROW( comma::exception, "--files given, but no block field specified in --fields" ); } }
     }
+    timestamps_stream_make_( timestamps );
 }
 
 template < typename T >
@@ -146,8 +175,9 @@ split< T >::split( const boost::optional< boost::posix_time::time_duration >& pe
                  , const std::vector< std::string >& streams //to-do
                  , bool pass
                  , const std::string& filenames
-                 , const std::string& default_filename )
-    : split( period, suffix, csv, pass, filenames, default_filename )
+                 , const std::string& default_filename
+                 , const std::string& timestamps )
+    : split( period, suffix, csv, pass, filenames, default_filename, timestamps )
 {
     if( streams.empty() ) { return; }
     auto const io_mode = csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii;
@@ -186,7 +216,7 @@ split< T >::~split()
     {
         acceptor_thread_.join();
         transaction t( publishers_ );
-        for( auto& ii : *t ) { ii->close(); } 
+        for( auto& ii : *t ) { ii->close(); }
     }
 }
 
@@ -196,7 +226,7 @@ void split< T >::accept_()
     comma::io::select select;
     {
         transaction t( publishers_ );
-        for( auto& ii : *t ) { if( ii->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ii->acceptor_file_descriptor() ); } } 
+        for( auto& ii : *t ) { if( ii->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ii->acceptor_file_descriptor() ); } }
         if( default_publisher_ ) { if( default_publisher_->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( default_publisher_->acceptor_file_descriptor() ); } }
     }
     while( !is_shutdown_ )
@@ -240,7 +270,7 @@ void split< T >::write( const char* data, unsigned int size )
 }
 
 template < typename T >
-void split< T >::write ( std::string line )
+void split< T >::write( std::string line )
 {
     mode_ = std::ofstream::out; // quick and dirty
     if( ascii_ ) { ascii_->get( current_, line ); }
@@ -262,10 +292,11 @@ void split< T >::write ( std::string line )
 template < typename T >
 std::ofstream* split< T >::ofstream_by_time_()
 {
-    if( !last_ || current_.timestamp > ( last_->timestamp + *period_ ) )
+    bool changed = period_ ? !last_ || current_.timestamp > last_->timestamp + *period_ : timestamps_stream_seek_( current_.timestamp );
+    if( !last_ || changed )
     {
         file_.close();
-        std::string time = boost::posix_time::to_iso_string( current_.timestamp );
+        std::string time = boost::posix_time::to_iso_string( period_ || timestamps_last_.first.is_neg_infinity() ? current_.timestamp : timestamps_last_.first );
         if( time.find_first_of( '.' ) == std::string::npos ) { time += ".000000"; }
         file_.open( ( time + suffix_ ).c_str(), mode_ );
         last_ = current_;
@@ -287,10 +318,7 @@ std::ofstream* split< T >::ofstream_by_block_()
             if( it == filenames_.end() ) { return nullptr; }
             filename = it->second;
             const auto& dirname = boost::filesystem::path( filename ).parent_path();
-            if( !( dirname.empty() || boost::filesystem::is_directory( dirname ) || boost::filesystem::create_directories( dirname ) ) )
-            {
-                COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << filename << "'" );
-            }
+            if( !( dirname.empty() || boost::filesystem::is_directory( dirname ) || boost::filesystem::create_directories( dirname ) ) ) { COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << filename << "'" ); }
         }
         if( filename.empty() ) { filename = boost::lexical_cast< std::string >( current_.block ) + suffix_; }
         file_.open( &filename[0], mode_ );
diff --git a/csv/applications/split/split.h b/csv/applications/split/split.h
index 50b0e5c99..5705b04e0 100644
--- a/csv/applications/split/split.h
+++ b/csv/applications/split/split.h
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2022 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -45,6 +46,7 @@
 #include "../../../base/types.h"
 #include "../../../csv/ascii.h"
 #include "../../../csv/binary.h"
+#include "../../../csv/stream.h"
 #include "../../../visiting/traits.h"
 #include "../../../io/publisher.h"
 #include "../../../sync/synchronized.h"
@@ -58,6 +60,8 @@ template < typename T > struct input // quick and dirty
     T id;
 };
 
+struct timestamp { boost::posix_time::ptime t; };
+
 } } } // namespace comma { namespace csv { namespace applications {
 
 namespace comma { namespace visiting {
@@ -123,14 +127,16 @@ class split
              , const comma::csv::options& csv
              , bool passthrough
              , const std::string& filenames
-             , const std::string& default_filename = "" );
+             , const std::string& default_filename = ""
+             , const std::string& timestamps = "" );
         split( const boost::optional< boost::posix_time::time_duration >& period
              , const std::string& suffix
              , const comma::csv::options& csv
              , const std::vector< std::string >& streams
              , bool passthrough
              , const std::string& filenames
-             , const std::string& default_filename = "" );
+             , const std::string& default_filename = ""
+             , const std::string& timestamps = "" );
         ~split();
         void write( const char* data, unsigned int size );
         void write( std::string line );
@@ -142,6 +148,8 @@ class split
         void update_( const char* data, unsigned int size );
         void update_( const std::string& line );
         void accept_();
+        void timestamps_stream_make_( const std::string& timestamps );
+        bool timestamps_stream_seek_( boost::posix_time::ptime t );
 
         std::function< std::ofstream*() > ofstream_;
         std::unique_ptr< comma::csv::ascii< input > > ascii_;
@@ -152,6 +160,9 @@ class split
         boost::optional< input > last_;
         std::ios_base::openmode mode_;
         std::ofstream file_;
+        std::unique_ptr< std::ifstream > timestamps_ifstream_;
+        std::unique_ptr< comma::csv::input_stream< applications::timestamp > > timestamps_;
+        std::pair< boost::posix_time::ptime, boost::posix_time::ptime > timestamps_last_;
 
         using Files = typename traits< T >::map;
         using ids_type_ = typename traits< T >::set;

From 06b168061fa6247ae4dbeb1e3e61db972d4bc4bf Mon Sep 17 00:00:00 2001
From: vlaskine <vlaskine@yahoo.com>
Date: Thu, 24 Mar 2022 13:18:55 +1100
Subject: [PATCH 0417/1056] cmake: gtest (deprecated) replaced with googletest

---
 CMakeLists.txt | 20 ++++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index eec526472..e3ff2ca15 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -16,7 +16,7 @@ cmake_minimum_required( VERSION 3.1 )
 # if( USE_ARM_TOOLCHAIN )
 #     set(CMAKE_TOOLCHAIN_FILE ${SOURCE_CODE_BASE_DIR}/CMakeFiles/arm.toolchain.cmake)
 # endif( USE_ARM_TOOLCHAIN )
-# 
+#
 # option(my_test_option "whatever" OFF)
 # if(my_test_option)
 #     set(my_other_option "is set")
@@ -50,7 +50,7 @@ IF (UNIX AND NOT APPLE)
 		SET ( COMMITHASH "abc" )
 	ENDIF()
 ELSE() # Probably windows; gets hardcoded patch version
-	SET ( COMMITDATE 1 ) 
+	SET ( COMMITDATE 1 )
 	SET ( COMMITHASH "abc" )
 ENDIF()
 
@@ -114,7 +114,7 @@ SET( EXECUTABLE_OUTPUT_PATH
 set( comma_version_major "1" ) # quick and dirty
 set( comma_version_minor "0" ) # quick and dirty
 set( comma_version_patch "0" ) # quick and dirty
-     
+
 SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" )
 
 IF( NOT comma_INSTALL_BIN_DIR )
@@ -181,7 +181,7 @@ IF( comma_BUILD_TESTS )
 
     # todo: maybe else clause is actually the right way to do things
     IF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
-        FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/gtest DOC "source code of gtest" )
+        FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/googletest/googletest DOC "source code of gtest" ) # FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/gtest DOC "source code of gtest" )
         ADD_SUBDIRECTORY( ${GTest_SOURCE_DIR} gtest )
         INCLUDE_DIRECTORIES( src ${GTest_SOURCE_DIR}/include ${GTest_SOURCE_DIR} )
         SET( GTEST_BOTH_LIBRARIES gtest gtest_main )
@@ -189,7 +189,7 @@ IF( comma_BUILD_TESTS )
         FIND_PACKAGE( GTest )
         INCLUDE_DIRECTORIES( ${GTEST_INCLUDE_DIRS} )
     ENDIF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
-	
+
 #TT: Install tests to dir. This allows them to be packed by CPack.
 #Note: if your source tree is dirty (eg you've already run tests there and have output/ directories)
 #those will also be installed too.
@@ -198,13 +198,13 @@ OPTION( INSTALL_TESTS "Install the tests into the nominated directory" OFF )
 IF( INSTALL_TESTS )
     SET ( comma_CPP_TESTS_INSTALL_DIR bin CACHE PATH "Install directory for cpp unit tests" )
     SET ( comma_INSTALL_COMMA_TESTS_DIR share/test )
-	
+
 # Get the list of test directories (using glob).
-FILE ( GLOB_RECURSE all_files 
+FILE ( GLOB_RECURSE all_files
 		# RELATIVE is tricky. When you use it, you need to specify the path you expect the output to be RELATIVE to. (Yes, that path could be considerably non-relative to the file that is found.)
-		RELATIVE ${CMAKE_SOURCE_DIR} 
+		RELATIVE ${CMAKE_SOURCE_DIR}
 		* )
-		
+
 SET ( test_dirs )
 FOREACH ( i ${all_files} )
 	if ( ${i} MATCHES "[\\/]test[\\/]" )
@@ -220,7 +220,7 @@ ENDFOREACH (i)
                         IF( NOT skip )
 			# See that slash there? 		 vvv It's really important.
 			INSTALL ( 	DIRECTORY ${dest_dir}/
-						DESTINATION ${comma_INSTALL_COMMA_TESTS_DIR}/${CMAKE_PROJECT_NAME}/unit/${dest_dir} 
+						DESTINATION ${comma_INSTALL_COMMA_TESTS_DIR}/${CMAKE_PROJECT_NAME}/unit/${dest_dir}
 						USE_SOURCE_PERMISSIONS
                             PATTERN "output" EXCLUDE )
                         ENDIF( NOT skip )

From 8071d8ab57f40e916bbb0148f8d287d3306ce87e Mon Sep 17 00:00:00 2001
From: vlaskine <vlaskine@yahoo.com>
Date: Thu, 24 Mar 2022 14:00:38 +1100
Subject: [PATCH 0418/1056] csv-shuffle: --drop-empty implemented and tested

---
 csv/applications/csv-shuffle.cpp | 42 +++++++++-----------------------
 csv/test/csv-shuffle/expected    |  8 ++++++
 csv/test/csv-shuffle/input       |  4 +++
 3 files changed, 24 insertions(+), 30 deletions(-)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 9df07b8ef..aaf9d0d77 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -1,33 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // Copyright (c) 2020 Vsevolod Vlaskine
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-// Copyright (c) 2011 The University of Sydney
 
 /// @author vsevolod vlaskine
 
@@ -51,9 +23,12 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
+    std::cerr << "    --drop-empty,-e; e.g. csv-shuffle --fields a,b,,,c --drop-empty is equivalent to" << std::endl;
+    std::cerr << "                          csv-shuffle --fields a,b,,,c --output-fields a,b,c" << std::endl;
     std::cerr << "    --fields,-f,--input-fields=<fields>; input fields" << std::endl;
     std::cerr << "    --output-fields,--output,-o=<fields>; output fields, if not specified, will be set" << std::endl;
-    std::cerr << "                                          to --input-fields, which would chops off trailing input fields" << std::endl;
+    std::cerr << "                                          to --input-fields, which would chop off trailing input fields" << std::endl;
+    std::cerr << "                                          see also --drop-empty" << std::endl;
     std::cerr << "    --verbose,-v: more output" << std::endl;
     if( verbose ) { std::cerr << std::endl << comma::csv::options::usage() << std::endl; }
     std::cerr << std::endl;
@@ -80,10 +55,17 @@ int main( int ac, char** av )
         comma::csv::options csv( options, options.value< std::string >( "--fields,-f,--input-fields" ) );
         std::vector< std::string > input_fields = comma::split( csv.fields, ',', true );
         std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o", csv.fields ), ',', true );
+        if( options.exists( "--drop-empty,-e" ) )
+        {
+            std::vector< std::string > v;
+            for( auto s: output_fields ) { if( !s.empty() ) { v.push_back( s ); } }
+            output_fields = v;
+        }
+        if( output_fields.empty() ) { std::cerr << "csv-shuffle: please specify --output-fields or --drop-empty" << std::endl; return 1; }
         if( output_fields.back() == "..." ) { std::cerr << "csv-shuffle: support for trailing fields has been removed for now; please specify input/output fields explicitly" << std::endl; return 1; }
         auto find_ = [&]( const std::string& n )->unsigned int
         {
-            if( n.empty() ) { COMMA_THROW( comma::exception, "got empty fields in output fields '" << comma::join( output_fields, ',' ) << "'" ); }
+            if( n.empty() ) { COMMA_THROW( comma::exception, "got empty fields in output fields '" << comma::join( output_fields, ',' ) << "'; you may need to use --drop-empty" ); }
             unsigned int j = 0;
             for( ; j < input_fields.size(); ++j ) { if( input_fields[j] == n ) { return j; } }
             COMMA_THROW( comma::exception, "output field '" << n << "' not found in input fields '" << csv.fields << "'" );
diff --git a/csv/test/csv-shuffle/expected b/csv/test/csv-shuffle/expected
index ac8eaab3b..baf7b61ad 100644
--- a/csv/test/csv-shuffle/expected
+++ b/csv/test/csv-shuffle/expected
@@ -10,6 +10,12 @@ ascii[4]/output="1,3,1,3"
 ascii[4]/status=0
 ascii[5]/output="0,1,2"
 ascii[5]/status=0
+ascii[6]/output=""
+ascii[6]/status=1
+ascii[7]/output="0,1,2,5"
+ascii[7]/status=0
+ascii[8]/output="0,1,2,5"
+ascii[8]/status=0
 
 binary[0]/output="0"
 binary[0]/status=0
@@ -21,3 +27,5 @@ binary[3]/output="1,2,1,2,1,2"
 binary[3]/status=0
 binary[4]/output="0,1,2"
 binary[4]/status=0
+binary[5]/output="0,1,2,5"
+binary[5]/status=0
diff --git a/csv/test/csv-shuffle/input b/csv/test/csv-shuffle/input
index 444bc6b59..c27c04380 100644
--- a/csv/test/csv-shuffle/input
+++ b/csv/test/csv-shuffle/input
@@ -4,9 +4,13 @@ ascii[2]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 5"
 ascii[3]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 5,4"
 ascii[4]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 1,3,1,3"
 ascii[5]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2"
+ascii[6]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,,,5"
+ascii[7]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,,,5 --drop-empty"
+ascii[8]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,,,5 --output-fields 0,1,2,,,5 --drop-empty"
 
 binary[0]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 0 | csv-from-bin ui"
 binary[1]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 3,4,5,0,1,2 | csv-from-bin 3uw,3ui"
 binary[2]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 4,5,2,3,0,1 | csv-from-bin 2uw,ui,uw,2ui"
 binary[3]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 1,2,1,2,1,2 | csv-from-bin 6ui"
 binary[4]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2 | csv-from-bin 3ui"
+binary[5]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,,,5 --drop-empty | csv-from-bin 3ui,uw"

From 06824637b571dea2b453b8be5a8d3d047e70d2d2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 6 Apr 2022 11:57:59 +1000
Subject: [PATCH 0419/1056] comma-application-util: swiss util: application
 name made global to fix application name in the stderr messages

---
 bash/comma-application-util | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 76db1f92f..998444614 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -44,7 +44,7 @@
 [[ -n "$comma_application_util_include_guard_" ]] && return 0
 readonly comma_application_util_include_guard_=1
 
-source $( type -p comma-name-value-util ) || { echo "$name: cannot source 'comma-name-value-util' from '$BASH_SOURCE'" >&2; exit 1; }
+source $( type -p comma-name-value-util ) || { echo "$comma_application_name: cannot source 'comma-name-value-util' from '$BASH_SOURCE'" >&2; exit 1; }
 
 ## @page comma_options_from_name_value comma_options_from_name_value
 # @section comma_options_from_name_value
@@ -120,7 +120,7 @@ export -f comma_pretty_description
 
 ## @page comma_options_names comma_options_names
 # @description converts a standard comma description to a list of names
-# 
+#
 # example
 #   description | comma_options_names
 function comma_options_names()
@@ -132,7 +132,7 @@ export -f comma_options_names
 ## @page comma_options_to_bash_completion comma_options_to_bash_completion
 # @description converts a standard comma description to input
 # for the comma bash completion function
-# 
+#
 # example
 #   description | comma_options_to_bash_completion
 function comma_options_to_bash_completion()
@@ -144,7 +144,7 @@ export -f comma_options_to_bash_completion
 ## @page comma_options_select comma_options_select
 # @description after a set of options have been retrieved as paths convert to
 # options format for a child script
-# 
+#
 # example
 #   comma-test-run $( comma-test-run --description | comma-options-to-name-value $@ | comma_name_value_to_options )
 function comma_name_value_to_options()
@@ -272,9 +272,9 @@ export -f comma-application-init
 
 function comma-application-swiss-init()
 {
-    local name=$( basename "$0" )
+    comma_application_name=$( basename "$0" )
     local common_options=$( cat )
-    [[ -n "$1" ]] || { echo "$name: please specify operation" >&2; exit 1; }
+    [[ -n "$1" ]] || { echo "$comma_application_name: please specify operation" >&2; exit 1; }
     comma_application_swiss_operation="$1" # todo? quick and dirty, allow --help anywhere on the command line?
     if comma_options_help $@; then
         if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
@@ -287,9 +287,9 @@ function comma-application-swiss-init()
         fi >&2
         exit 0
     fi
-    function say() { echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
-    function saymore() { (( ! options_verbose )) || echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
-    function verbose() { (( ! options_verbose )) || echo "$name: ${comma_application_swiss_operation}: $@" >&2; }
+    function say() { echo "$comma_application_name: ${comma_application_swiss_operation}: $@" >&2; }
+    function saymore() { (( ! options_verbose )) || echo "$comma_application_name: ${comma_application_swiss_operation}: $@" >&2; }
+    function verbose() { (( ! options_verbose )) || echo "$comma_application_name: ${comma_application_swiss_operation}: $@" >&2; }
     function die() { say "$@"; exit 1; }
     [[ $( type -t ${comma_application_swiss_operation}-run ) == "function" ]] || die "expected operation, got '${comma_application_swiss_operation}'" # quick and dirty
     local options; options=$( ( echo "$common_options"; comma-application-common-options ) | comma-options-to-name-value "$@" ) || die "invalid options"

From 04d7ae53a764c3ae09989f16124adb0ce3a26554 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 12 Apr 2022 18:18:50 +1000
Subject: [PATCH 0420/1056] added tests for csv-crc

---
 csv/test/csv-crc/check/ascii-bad/expected     |  2 ++
 csv/test/csv-crc/check/ascii-bad/input        |  4 +++
 csv/test/csv-crc/check/ascii-good/expected    |  4 +++
 csv/test/csv-crc/check/ascii-good/input       |  4 +++
 csv/test/csv-crc/check/binary-bad/expected    |  2 ++
 csv/test/csv-crc/check/binary-bad/input       |  5 ++++
 csv/test/csv-crc/check/binary-good/expected   |  4 +++
 csv/test/csv-crc/check/binary-good/input      |  5 ++++
 csv/test/csv-crc/recover/binary-bad/expected  |  3 +++
 csv/test/csv-crc/recover/binary-bad/input     |  5 ++++
 csv/test/csv-crc/recover/binary-good/expected |  4 +++
 csv/test/csv-crc/recover/binary-good/input    |  5 ++++
 .../csv-crc/recover/give-up-after-21/expected |  3 +++
 .../csv-crc/recover/give-up-after-21/input    |  6 +++++
 .../csv-crc/recover/give-up-after-7/expected  |  2 ++
 .../csv-crc/recover/give-up-after-7/input     |  6 +++++
 csv/test/csv-crc/test                         | 25 +++++++++++++++++++
 csv/test/csv-crc/wrap/ascii/expected          |  3 +++
 csv/test/csv-crc/wrap/ascii/input             |  3 +++
 csv/test/csv-crc/wrap/binary/expected         |  3 +++
 csv/test/csv-crc/wrap/binary/input            |  4 +++
 21 files changed, 102 insertions(+)
 create mode 100644 csv/test/csv-crc/check/ascii-bad/expected
 create mode 100644 csv/test/csv-crc/check/ascii-bad/input
 create mode 100644 csv/test/csv-crc/check/ascii-good/expected
 create mode 100644 csv/test/csv-crc/check/ascii-good/input
 create mode 100644 csv/test/csv-crc/check/binary-bad/expected
 create mode 100644 csv/test/csv-crc/check/binary-bad/input
 create mode 100644 csv/test/csv-crc/check/binary-good/expected
 create mode 100644 csv/test/csv-crc/check/binary-good/input
 create mode 100644 csv/test/csv-crc/recover/binary-bad/expected
 create mode 100644 csv/test/csv-crc/recover/binary-bad/input
 create mode 100644 csv/test/csv-crc/recover/binary-good/expected
 create mode 100644 csv/test/csv-crc/recover/binary-good/input
 create mode 100644 csv/test/csv-crc/recover/give-up-after-21/expected
 create mode 100644 csv/test/csv-crc/recover/give-up-after-21/input
 create mode 100644 csv/test/csv-crc/recover/give-up-after-7/expected
 create mode 100644 csv/test/csv-crc/recover/give-up-after-7/input
 create mode 100755 csv/test/csv-crc/test
 create mode 100644 csv/test/csv-crc/wrap/ascii/expected
 create mode 100644 csv/test/csv-crc/wrap/ascii/input
 create mode 100644 csv/test/csv-crc/wrap/binary/expected
 create mode 100644 csv/test/csv-crc/wrap/binary/input

diff --git a/csv/test/csv-crc/check/ascii-bad/expected b/csv/test/csv-crc/check/ascii-bad/expected
new file mode 100644
index 000000000..2889b5d60
--- /dev/null
+++ b/csv/test/csv-crc/check/ascii-bad/expected
@@ -0,0 +1,2 @@
+output[0]/line="1,2,3,8625"
+count=1
diff --git a/csv/test/csv-crc/check/ascii-bad/input b/csv/test/csv-crc/check/ascii-bad/input
new file mode 100644
index 000000000..e96e98c53
--- /dev/null
+++ b/csv/test/csv-crc/check/ascii-bad/input
@@ -0,0 +1,4 @@
+operation=check
+1,2,3,8625
+1,2,3,8600
+1,2,3,8625
diff --git a/csv/test/csv-crc/check/ascii-good/expected b/csv/test/csv-crc/check/ascii-good/expected
new file mode 100644
index 000000000..1e78e14ac
--- /dev/null
+++ b/csv/test/csv-crc/check/ascii-good/expected
@@ -0,0 +1,4 @@
+output[0]/line="1,2,3,8625"
+output[1]/line="1,2,3,8625"
+output[2]/line="1,2,3,8625"
+count=3
diff --git a/csv/test/csv-crc/check/ascii-good/input b/csv/test/csv-crc/check/ascii-good/input
new file mode 100644
index 000000000..97b8789ac
--- /dev/null
+++ b/csv/test/csv-crc/check/ascii-good/input
@@ -0,0 +1,4 @@
+operation=check
+1,2,3,8625
+1,2,3,8625
+1,2,3,8625
diff --git a/csv/test/csv-crc/check/binary-bad/expected b/csv/test/csv-crc/check/binary-bad/expected
new file mode 100644
index 000000000..cfe99d992
--- /dev/null
+++ b/csv/test/csv-crc/check/binary-bad/expected
@@ -0,0 +1,2 @@
+output[0]/line="1,2,3,37878"
+count=1
diff --git a/csv/test/csv-crc/check/binary-bad/input b/csv/test/csv-crc/check/binary-bad/input
new file mode 100644
index 000000000..ae724b9bc
--- /dev/null
+++ b/csv/test/csv-crc/check/binary-bad/input
@@ -0,0 +1,5 @@
+operation=check
+binary=3ui,uw
+1,2,3,37878
+1,2,3,37777
+1,2,3,37878
diff --git a/csv/test/csv-crc/check/binary-good/expected b/csv/test/csv-crc/check/binary-good/expected
new file mode 100644
index 000000000..6f587e39e
--- /dev/null
+++ b/csv/test/csv-crc/check/binary-good/expected
@@ -0,0 +1,4 @@
+output[0]/line="1,2,3,37878"
+output[1]/line="1,2,3,37878"
+output[2]/line="1,2,3,37878"
+count=3
diff --git a/csv/test/csv-crc/check/binary-good/input b/csv/test/csv-crc/check/binary-good/input
new file mode 100644
index 000000000..74f8fe349
--- /dev/null
+++ b/csv/test/csv-crc/check/binary-good/input
@@ -0,0 +1,5 @@
+operation=check
+binary=3ui,uw
+1,2,3,37878
+1,2,3,37878
+1,2,3,37878
diff --git a/csv/test/csv-crc/recover/binary-bad/expected b/csv/test/csv-crc/recover/binary-bad/expected
new file mode 100644
index 000000000..38d716d3f
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad/expected
@@ -0,0 +1,3 @@
+output[0]/line="1,2,3,37878"
+output[0]/line="1,2,3,37878"
+count=2
diff --git a/csv/test/csv-crc/recover/binary-bad/input b/csv/test/csv-crc/recover/binary-bad/input
new file mode 100644
index 000000000..70c6d00e6
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad/input
@@ -0,0 +1,5 @@
+operation=recover
+binary=3ui,uw
+1,2,3,37878
+1,2,3,37777
+1,2,3,37878
diff --git a/csv/test/csv-crc/recover/binary-good/expected b/csv/test/csv-crc/recover/binary-good/expected
new file mode 100644
index 000000000..6f587e39e
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-good/expected
@@ -0,0 +1,4 @@
+output[0]/line="1,2,3,37878"
+output[1]/line="1,2,3,37878"
+output[2]/line="1,2,3,37878"
+count=3
diff --git a/csv/test/csv-crc/recover/binary-good/input b/csv/test/csv-crc/recover/binary-good/input
new file mode 100644
index 000000000..ecb843c63
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-good/input
@@ -0,0 +1,5 @@
+operation=recover
+binary=3ui,uw
+1,2,3,37878
+1,2,3,37878
+1,2,3,37878
diff --git a/csv/test/csv-crc/recover/give-up-after-21/expected b/csv/test/csv-crc/recover/give-up-after-21/expected
new file mode 100644
index 000000000..95a1d7a99
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-21/expected
@@ -0,0 +1,3 @@
+output[0]/line="1,2,3,37878"
+output[1]/line="1,2,3,37878"
+count=2
diff --git a/csv/test/csv-crc/recover/give-up-after-21/input b/csv/test/csv-crc/recover/give-up-after-21/input
new file mode 100644
index 000000000..8177a2b2f
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-21/input
@@ -0,0 +1,6 @@
+operation=recover
+binary=3ui,uw
+args="--give-up-after 21"
+1,2,3,37878
+1,2,3,37777
+1,2,3,37878
diff --git a/csv/test/csv-crc/recover/give-up-after-7/expected b/csv/test/csv-crc/recover/give-up-after-7/expected
new file mode 100644
index 000000000..cfe99d992
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-7/expected
@@ -0,0 +1,2 @@
+output[0]/line="1,2,3,37878"
+count=1
diff --git a/csv/test/csv-crc/recover/give-up-after-7/input b/csv/test/csv-crc/recover/give-up-after-7/input
new file mode 100644
index 000000000..b5400771b
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-7/input
@@ -0,0 +1,6 @@
+operation=recover
+binary=3ui,uw
+args="--give-up-after 7"
+1,2,3,37878
+1,2,3,37777
+1,2,3,37878
diff --git a/csv/test/csv-crc/test b/csv/test/csv-crc/test
new file mode 100755
index 000000000..0f991b0d5
--- /dev/null
+++ b/csv/test/csv-crc/test
@@ -0,0 +1,25 @@
+#!/bin/bash
+
+# read individual test parameters and data
+input=$( cat )
+eval "$( grep = <<< $input )"
+data=$( grep -v = <<< $input )
+
+[[ $operation ]] || exit 1
+[[ $data ]] || exit 1
+
+function run_test()
+{
+    if [[ $binary ]]; then
+        size=$( echo $binary | csv-format size )
+        output_format=$binary
+        [[ $operation == wrap ]] && output_format=$output_format,uw
+        echo "$data" | csv-to-bin $binary | csv-crc $operation --size $size $args | csv-from-bin $output_format
+    else
+        echo "$data" | csv-crc $operation $args
+    fi
+}
+
+output=$( run_test )
+echo "$output" | name-value-from-csv -f line -d : --line-number -p output
+echo count=$( wc -l <<< $output )
diff --git a/csv/test/csv-crc/wrap/ascii/expected b/csv/test/csv-crc/wrap/ascii/expected
new file mode 100644
index 000000000..dc20e8c6c
--- /dev/null
+++ b/csv/test/csv-crc/wrap/ascii/expected
@@ -0,0 +1,3 @@
+output[0]/line="1,2,3,8625"
+output[1]/line="4,5,6,55251"
+count=2
diff --git a/csv/test/csv-crc/wrap/ascii/input b/csv/test/csv-crc/wrap/ascii/input
new file mode 100644
index 000000000..a6e12e74f
--- /dev/null
+++ b/csv/test/csv-crc/wrap/ascii/input
@@ -0,0 +1,3 @@
+operation=wrap
+1,2,3
+4,5,6
diff --git a/csv/test/csv-crc/wrap/binary/expected b/csv/test/csv-crc/wrap/binary/expected
new file mode 100644
index 000000000..90ff5b1aa
--- /dev/null
+++ b/csv/test/csv-crc/wrap/binary/expected
@@ -0,0 +1,3 @@
+output[0]/line="1,2,3,37878"
+output[1]/line="4,5,6,58890"
+count=2
diff --git a/csv/test/csv-crc/wrap/binary/input b/csv/test/csv-crc/wrap/binary/input
new file mode 100644
index 000000000..d920d3b71
--- /dev/null
+++ b/csv/test/csv-crc/wrap/binary/input
@@ -0,0 +1,4 @@
+operation=wrap
+binary=3ui
+1,2,3
+4,5,6

From 886359a691ef68e929af4cbf7bab0d1dcaeb9476 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 12 Apr 2022 18:32:41 +1000
Subject: [PATCH 0421/1056] csv-crc.cpp: fix check mode to exit on failure with
 binary input

---
 csv/applications/csv-crc.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/csv/applications/csv-crc.cpp b/csv/applications/csv-crc.cpp
index 637bd4775..2c08b8c25 100644
--- a/csv/applications/csv-crc.cpp
+++ b/csv/applications/csv-crc.cpp
@@ -185,6 +185,7 @@ static bool run_()
                     {
                         if( recovered ) { std::cerr << "csv-crc: crc check failed" << ( !give_up_after || *give_up_after > 0 ? "; recovering..." : "" ) << std::endl; }
                         recovered = false;
+                        if( give_up_after && recovered_byte_count >= *give_up_after ) { break; }
                         ++recovered_byte_count;
                     }
                 }

From 39841cc10637e81d0c5e642fc536854f9be59d34 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 14 Apr 2022 10:09:04 +1000
Subject: [PATCH 0422/1056] csv-crc: modify test input values to more clearly
 see behaviour

---
 csv/test/csv-crc/check/ascii-bad/expected          |  2 +-
 csv/test/csv-crc/check/ascii-bad/input             |  7 ++++---
 csv/test/csv-crc/check/ascii-good/expected         |  9 +++++----
 csv/test/csv-crc/check/ascii-good/input            |  7 ++++---
 csv/test/csv-crc/check/binary-bad/expected         |  2 +-
 csv/test/csv-crc/check/binary-bad/input            |  7 ++++---
 csv/test/csv-crc/check/binary-good/expected        |  9 +++++----
 csv/test/csv-crc/check/binary-good/input           |  7 ++++---
 csv/test/csv-crc/recover/binary-bad/expected       |  7 ++++---
 csv/test/csv-crc/recover/binary-bad/input          |  7 ++++---
 csv/test/csv-crc/recover/binary-good/expected      |  9 +++++----
 csv/test/csv-crc/recover/binary-good/input         |  7 ++++---
 csv/test/csv-crc/recover/give-up-after-21/expected |  7 ++++---
 csv/test/csv-crc/recover/give-up-after-21/input    |  7 ++++---
 csv/test/csv-crc/recover/give-up-after-7/expected  |  2 +-
 csv/test/csv-crc/recover/give-up-after-7/input     |  7 ++++---
 csv/test/csv-crc/wrap/ascii/expected               | 14 +++++++++++---
 csv/test/csv-crc/wrap/ascii/input                  | 12 ++++++++++--
 csv/test/csv-crc/wrap/binary/expected              | 14 +++++++++++---
 csv/test/csv-crc/wrap/binary/input                 | 12 ++++++++++--
 20 files changed, 100 insertions(+), 55 deletions(-)

diff --git a/csv/test/csv-crc/check/ascii-bad/expected b/csv/test/csv-crc/check/ascii-bad/expected
index 2889b5d60..efcad8ed9 100644
--- a/csv/test/csv-crc/check/ascii-bad/expected
+++ b/csv/test/csv-crc/check/ascii-bad/expected
@@ -1,2 +1,2 @@
-output[0]/line="1,2,3,8625"
+output[0]/line="0,0,0,54755"
 count=1
diff --git a/csv/test/csv-crc/check/ascii-bad/input b/csv/test/csv-crc/check/ascii-bad/input
index e96e98c53..272285034 100644
--- a/csv/test/csv-crc/check/ascii-bad/input
+++ b/csv/test/csv-crc/check/ascii-bad/input
@@ -1,4 +1,5 @@
 operation=check
-1,2,3,8625
-1,2,3,8600
-1,2,3,8625
+0,0,0,54755
+1,1,1,0
+2,2,2,57154
+3,3,3,20994
diff --git a/csv/test/csv-crc/check/ascii-good/expected b/csv/test/csv-crc/check/ascii-good/expected
index 1e78e14ac..36a88a0d7 100644
--- a/csv/test/csv-crc/check/ascii-good/expected
+++ b/csv/test/csv-crc/check/ascii-good/expected
@@ -1,4 +1,5 @@
-output[0]/line="1,2,3,8625"
-output[1]/line="1,2,3,8625"
-output[2]/line="1,2,3,8625"
-count=3
+output[0]/line="0,0,0,54755"
+output[1]/line="1,1,1,22691"
+output[2]/line="2,2,2,57154"
+output[3]/line="3,3,3,20994"
+count=4
diff --git a/csv/test/csv-crc/check/ascii-good/input b/csv/test/csv-crc/check/ascii-good/input
index 97b8789ac..f64d1713f 100644
--- a/csv/test/csv-crc/check/ascii-good/input
+++ b/csv/test/csv-crc/check/ascii-good/input
@@ -1,4 +1,5 @@
 operation=check
-1,2,3,8625
-1,2,3,8625
-1,2,3,8625
+0,0,0,54755
+1,1,1,22691
+2,2,2,57154
+3,3,3,20994
diff --git a/csv/test/csv-crc/check/binary-bad/expected b/csv/test/csv-crc/check/binary-bad/expected
index cfe99d992..98ac01605 100644
--- a/csv/test/csv-crc/check/binary-bad/expected
+++ b/csv/test/csv-crc/check/binary-bad/expected
@@ -1,2 +1,2 @@
-output[0]/line="1,2,3,37878"
+output[0]/line="0,0,0,34041"
 count=1
diff --git a/csv/test/csv-crc/check/binary-bad/input b/csv/test/csv-crc/check/binary-bad/input
index ae724b9bc..0873c8bc1 100644
--- a/csv/test/csv-crc/check/binary-bad/input
+++ b/csv/test/csv-crc/check/binary-bad/input
@@ -1,5 +1,6 @@
 operation=check
 binary=3ui,uw
-1,2,3,37878
-1,2,3,37777
-1,2,3,37878
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/check/binary-good/expected b/csv/test/csv-crc/check/binary-good/expected
index 6f587e39e..d5a50a50a 100644
--- a/csv/test/csv-crc/check/binary-good/expected
+++ b/csv/test/csv-crc/check/binary-good/expected
@@ -1,4 +1,5 @@
-output[0]/line="1,2,3,37878"
-output[1]/line="1,2,3,37878"
-output[2]/line="1,2,3,37878"
-count=3
+output[0]/line="0,0,0,34041"
+output[1]/line="1,1,1,46827"
+output[2]/line="2,2,2,57565"
+output[3]/line="3,3,3,53967"
+count=4
diff --git a/csv/test/csv-crc/check/binary-good/input b/csv/test/csv-crc/check/binary-good/input
index 74f8fe349..362856496 100644
--- a/csv/test/csv-crc/check/binary-good/input
+++ b/csv/test/csv-crc/check/binary-good/input
@@ -1,5 +1,6 @@
 operation=check
 binary=3ui,uw
-1,2,3,37878
-1,2,3,37878
-1,2,3,37878
+0,0,0,34041
+1,1,1,46827
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/recover/binary-bad/expected b/csv/test/csv-crc/recover/binary-bad/expected
index 38d716d3f..3b497e5a4 100644
--- a/csv/test/csv-crc/recover/binary-bad/expected
+++ b/csv/test/csv-crc/recover/binary-bad/expected
@@ -1,3 +1,4 @@
-output[0]/line="1,2,3,37878"
-output[0]/line="1,2,3,37878"
-count=2
+output[0]/line="0,0,0,34041"
+output[1]/line="2,2,2,57565"
+output[2]/line="3,3,3,53967"
+count=3
diff --git a/csv/test/csv-crc/recover/binary-bad/input b/csv/test/csv-crc/recover/binary-bad/input
index 70c6d00e6..04ed0a7f8 100644
--- a/csv/test/csv-crc/recover/binary-bad/input
+++ b/csv/test/csv-crc/recover/binary-bad/input
@@ -1,5 +1,6 @@
 operation=recover
 binary=3ui,uw
-1,2,3,37878
-1,2,3,37777
-1,2,3,37878
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/recover/binary-good/expected b/csv/test/csv-crc/recover/binary-good/expected
index 6f587e39e..d5a50a50a 100644
--- a/csv/test/csv-crc/recover/binary-good/expected
+++ b/csv/test/csv-crc/recover/binary-good/expected
@@ -1,4 +1,5 @@
-output[0]/line="1,2,3,37878"
-output[1]/line="1,2,3,37878"
-output[2]/line="1,2,3,37878"
-count=3
+output[0]/line="0,0,0,34041"
+output[1]/line="1,1,1,46827"
+output[2]/line="2,2,2,57565"
+output[3]/line="3,3,3,53967"
+count=4
diff --git a/csv/test/csv-crc/recover/binary-good/input b/csv/test/csv-crc/recover/binary-good/input
index ecb843c63..28a29aa1e 100644
--- a/csv/test/csv-crc/recover/binary-good/input
+++ b/csv/test/csv-crc/recover/binary-good/input
@@ -1,5 +1,6 @@
 operation=recover
 binary=3ui,uw
-1,2,3,37878
-1,2,3,37878
-1,2,3,37878
+0,0,0,34041
+1,1,1,46827
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/recover/give-up-after-21/expected b/csv/test/csv-crc/recover/give-up-after-21/expected
index 95a1d7a99..3b497e5a4 100644
--- a/csv/test/csv-crc/recover/give-up-after-21/expected
+++ b/csv/test/csv-crc/recover/give-up-after-21/expected
@@ -1,3 +1,4 @@
-output[0]/line="1,2,3,37878"
-output[1]/line="1,2,3,37878"
-count=2
+output[0]/line="0,0,0,34041"
+output[1]/line="2,2,2,57565"
+output[2]/line="3,3,3,53967"
+count=3
diff --git a/csv/test/csv-crc/recover/give-up-after-21/input b/csv/test/csv-crc/recover/give-up-after-21/input
index 8177a2b2f..0d8b71097 100644
--- a/csv/test/csv-crc/recover/give-up-after-21/input
+++ b/csv/test/csv-crc/recover/give-up-after-21/input
@@ -1,6 +1,7 @@
 operation=recover
 binary=3ui,uw
 args="--give-up-after 21"
-1,2,3,37878
-1,2,3,37777
-1,2,3,37878
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/recover/give-up-after-7/expected b/csv/test/csv-crc/recover/give-up-after-7/expected
index cfe99d992..98ac01605 100644
--- a/csv/test/csv-crc/recover/give-up-after-7/expected
+++ b/csv/test/csv-crc/recover/give-up-after-7/expected
@@ -1,2 +1,2 @@
-output[0]/line="1,2,3,37878"
+output[0]/line="0,0,0,34041"
 count=1
diff --git a/csv/test/csv-crc/recover/give-up-after-7/input b/csv/test/csv-crc/recover/give-up-after-7/input
index b5400771b..798df435b 100644
--- a/csv/test/csv-crc/recover/give-up-after-7/input
+++ b/csv/test/csv-crc/recover/give-up-after-7/input
@@ -1,6 +1,7 @@
 operation=recover
 binary=3ui,uw
 args="--give-up-after 7"
-1,2,3,37878
-1,2,3,37777
-1,2,3,37878
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/wrap/ascii/expected b/csv/test/csv-crc/wrap/ascii/expected
index dc20e8c6c..320309a98 100644
--- a/csv/test/csv-crc/wrap/ascii/expected
+++ b/csv/test/csv-crc/wrap/ascii/expected
@@ -1,3 +1,11 @@
-output[0]/line="1,2,3,8625"
-output[1]/line="4,5,6,55251"
-count=2
+output[0]/line="0,0,0,54755"
+output[1]/line="1,1,1,22691"
+output[2]/line="2,2,2,57154"
+output[3]/line="3,3,3,20994"
+output[4]/line="4,4,4,49313"
+output[5]/line="5,5,5,19937"
+output[6]/line="6,6,6,51712"
+output[7]/line="7,7,7,18240"
+output[8]/line="8,8,8,65383"
+output[9]/line="9,9,9,29223"
+count=10
diff --git a/csv/test/csv-crc/wrap/ascii/input b/csv/test/csv-crc/wrap/ascii/input
index a6e12e74f..82e0e414b 100644
--- a/csv/test/csv-crc/wrap/ascii/input
+++ b/csv/test/csv-crc/wrap/ascii/input
@@ -1,3 +1,11 @@
 operation=wrap
-1,2,3
-4,5,6
+0,0,0
+1,1,1
+2,2,2
+3,3,3
+4,4,4
+5,5,5
+6,6,6
+7,7,7
+8,8,8
+9,9,9
diff --git a/csv/test/csv-crc/wrap/binary/expected b/csv/test/csv-crc/wrap/binary/expected
index 90ff5b1aa..a21ec8d4f 100644
--- a/csv/test/csv-crc/wrap/binary/expected
+++ b/csv/test/csv-crc/wrap/binary/expected
@@ -1,3 +1,11 @@
-output[0]/line="1,2,3,37878"
-output[1]/line="4,5,6,58890"
-count=2
+output[0]/line="0,0,0,34041"
+output[1]/line="1,1,1,46827"
+output[2]/line="2,2,2,57565"
+output[3]/line="3,3,3,53967"
+output[4]/line="4,4,4,19633"
+output[5]/line="5,5,5,32419"
+output[6]/line="6,6,6,10389"
+output[7]/line="7,7,7,6791"
+output[8]/line="8,8,8,1096"
+output[9]/line="9,9,9,13914"
+count=10
diff --git a/csv/test/csv-crc/wrap/binary/input b/csv/test/csv-crc/wrap/binary/input
index d920d3b71..00e305daa 100644
--- a/csv/test/csv-crc/wrap/binary/input
+++ b/csv/test/csv-crc/wrap/binary/input
@@ -1,4 +1,12 @@
 operation=wrap
 binary=3ui
-1,2,3
-4,5,6
+0,0,0
+1,1,1
+2,2,2
+3,3,3
+4,4,4
+5,5,5
+6,6,6
+7,7,7
+8,8,8
+9,9,9

From a499e9fc885defb9e1733e2e975dfa6315d1ce5c Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 14 Apr 2022 16:24:54 +1000
Subject: [PATCH 0423/1056] csv-crc: clarified behaviour in help and added more
 tests

The tests match the behaviour described by help.
Currently some of these tests will fail as the application behaviour does not
match the help in all cases.
---
 csv/applications/csv-crc.cpp                  | 87 ++++++++++---------
 csv/test/csv-crc/check/big-endian/expected    |  5 ++
 csv/test/csv-crc/check/big-endian/input       |  7 ++
 .../csv-crc/recover/binary-bad-1/expected     | 10 +++
 csv/test/csv-crc/recover/binary-bad-1/input   | 12 +++
 .../csv-crc/recover/binary-bad-2/expected     |  9 ++
 csv/test/csv-crc/recover/binary-bad-2/input   | 12 +++
 .../csv-crc/recover/binary-bad-3/expected     |  8 ++
 csv/test/csv-crc/recover/binary-bad-3/input   | 12 +++
 csv/test/csv-crc/recover/binary-bad/expected  |  4 -
 .../csv-crc/recover/discard-after-1/expected  |  9 ++
 .../csv-crc/recover/discard-after-1/input     | 13 +++
 .../csv-crc/recover/discard-after-2/expected  |  6 ++
 .../csv-crc/recover/discard-after-2/input     | 13 +++
 .../csv-crc/recover/give-up-after-0/expected  |  2 +
 .../{binary-bad => give-up-after-0}/input     |  1 +
 .../csv-crc/recover/recover-after-1/expected  | 10 +++
 .../csv-crc/recover/recover-after-1/input     | 13 +++
 .../csv-crc/recover/recover-after-10/expected |  5 ++
 .../csv-crc/recover/recover-after-10/input    | 13 +++
 .../csv-crc/recover/recover-after-2/expected  |  8 ++
 .../csv-crc/recover/recover-after-2/input     | 13 +++
 csv/test/csv-crc/wrap/big-endian/expected     | 11 +++
 csv/test/csv-crc/wrap/big-endian/input        | 13 +++
 24 files changed, 251 insertions(+), 45 deletions(-)
 create mode 100644 csv/test/csv-crc/check/big-endian/expected
 create mode 100644 csv/test/csv-crc/check/big-endian/input
 create mode 100644 csv/test/csv-crc/recover/binary-bad-1/expected
 create mode 100644 csv/test/csv-crc/recover/binary-bad-1/input
 create mode 100644 csv/test/csv-crc/recover/binary-bad-2/expected
 create mode 100644 csv/test/csv-crc/recover/binary-bad-2/input
 create mode 100644 csv/test/csv-crc/recover/binary-bad-3/expected
 create mode 100644 csv/test/csv-crc/recover/binary-bad-3/input
 delete mode 100644 csv/test/csv-crc/recover/binary-bad/expected
 create mode 100644 csv/test/csv-crc/recover/discard-after-1/expected
 create mode 100644 csv/test/csv-crc/recover/discard-after-1/input
 create mode 100644 csv/test/csv-crc/recover/discard-after-2/expected
 create mode 100644 csv/test/csv-crc/recover/discard-after-2/input
 create mode 100644 csv/test/csv-crc/recover/give-up-after-0/expected
 rename csv/test/csv-crc/recover/{binary-bad => give-up-after-0}/input (75%)
 create mode 100644 csv/test/csv-crc/recover/recover-after-1/expected
 create mode 100644 csv/test/csv-crc/recover/recover-after-1/input
 create mode 100644 csv/test/csv-crc/recover/recover-after-10/expected
 create mode 100644 csv/test/csv-crc/recover/recover-after-10/input
 create mode 100644 csv/test/csv-crc/recover/recover-after-2/expected
 create mode 100644 csv/test/csv-crc/recover/recover-after-2/input
 create mode 100644 csv/test/csv-crc/wrap/big-endian/expected
 create mode 100644 csv/test/csv-crc/wrap/big-endian/input

diff --git a/csv/applications/csv-crc.cpp b/csv/applications/csv-crc.cpp
index 2c08b8c25..b998eee7e 100644
--- a/csv/applications/csv-crc.cpp
+++ b/csv/applications/csv-crc.cpp
@@ -45,47 +45,52 @@
 
 static void usage( bool )
 {
-    std::cerr << std::endl;
-    std::cerr << "wrap/check crc on fixed-width input (ascii or binary)" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: csv-crc <commands> [<options>]" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<command>" << std::endl;
-    std::cerr << "    wrap: add crc" << std::endl;
-    std::cerr << "    check: check crc; exit, if check fails" << std::endl;
-    std::cerr << "    recover: recover with given parameters (see below)" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "data options" << std::endl;
-    std::cerr << "    --crc-size; output given crc size to stdout and exit" << std::endl;
-    std::cerr << "    --delimiter,-d=<delimiter>: ascii csv delimiter" << std::endl;
-    std::cerr << "    --size=<size>: binary data size; if absent, expect ascii csv" << std::endl;
-    std::cerr << "                   for wrap: payload size" << std::endl;
-    std::cerr << "                   for check/recover size including crc" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "crc options" << std::endl;
-    std::cerr << "    --crc=<which>:" << std::endl;
-    std::cerr << "        16: 16-bit, generator 0x8805" << std::endl;
-    std::cerr << "        ccitt: 16-bit, generator 0x1021" << std::endl;
-    std::cerr << "        xmodem: 16-bit, generator 0x1021" << std::endl;
-    std::cerr << "        32: 32-bit, generator 0x04C11DB7" << std::endl;
-    //std::cerr << "        checksum16: simple 16-bit checksum (todo)" << std::endl;
-    //std::cerr << "        checksum32: simple 32-bit checksum (todo)" << std::endl;
-    std::cerr << "        default: ccitt" << std::endl;
-    std::cerr << "    --big-endian,--net-byte-order: if binary, crc is big endian" << std::endl;
-    std::cerr << "    --verbose,-v: more output" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    For a definitive list of 16 bits CRC algorithms see:" << std::endl;
-    std::cerr << "    http://reveng.sourceforge.net/crc-catalogue/16.htm" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "recovery options" << std::endl;
-    std::cerr << "    --give-up-after=<n>: if check fails, give up after <n> bytes" << std::endl;
-    std::cerr << "                         if absent and no --recover-after: default 0" << std::endl;
-    std::cerr << "                         if absent and --recover-after: default infinity (don't give up)" << std::endl;
-    std::cerr << "    --recover-after=<n>: if check fails and then new valid crc found" << std::endl;
-    std::cerr << "                         make sure that at least <n> subsequent lines (ascii) or" << std::endl;
-    std::cerr << "                         packets (binary) are valid, before output; default 0, i.e. recover on the next valid" << std::endl;
-    std::cerr << "    --discard-on-recovery,--discard: discard those <n> packets accumulated during the recovery check" << std::endl;
-    std::cerr << std::endl;
+    std::cerr << "\n";
+    std::cerr << "wrap/check crc on fixed-width input (ascii or binary)\n";
+    std::cerr << "\n";
+    std::cerr << "usage: csv-crc <command> [<options>]\n";
+    std::cerr << "\n";
+    std::cerr << "<command>\n";
+    std::cerr << "    wrap:    add crc\n";
+    std::cerr << "    check:   check crc; exit if check fails\n";
+    std::cerr << "    recover: recover with given parameters (see below)\n";
+    std::cerr << "\n";
+    std::cerr << "general options\n";
+    std::cerr << "    --help,-h;    this help\n";
+    std::cerr << "    --verbose,-v: more output\n";
+    std::cerr << "\n";
+    std::cerr << "data options\n";
+    std::cerr << "    --crc-size;      output given crc size to stdout and exit\n";
+    std::cerr << "    --delimiter,-d=[<char>]: ascii csv delimiter\n";
+    std::cerr << "    --size=[<size>]: binary data size; if absent, expect ascii csv\n";
+    std::cerr << "                     for wrap: payload size\n";
+    std::cerr << "                     for check/recover: size including crc\n";
+    std::cerr << "\n";
+    std::cerr << "crc options\n";
+    std::cerr << "    --crc=<which>:\n";
+    std::cerr << "        16:     16-bit, generator 0x8805\n";
+    std::cerr << "        ccitt:  16-bit, generator 0x1021\n";
+    std::cerr << "        xmodem: 16-bit, generator 0x1021\n";
+    std::cerr << "        32:     32-bit, generator 0x04C11DB7\n";
+    //std::cerr << "        checksum16: simple 16-bit checksum (todo)\n";
+    //std::cerr << "        checksum32: simple 32-bit checksum (todo)\n";
+    std::cerr << "        default: ccitt\n";
+    std::cerr << "    --big-endian,--net-byte-order: if binary, crc is big endian\n";
+    std::cerr << "\n";
+    std::cerr << "recover options\n";
+    std::cerr << "    --give-up-after=<n>: if check fails, give up after <n> bytes\n";
+    std::cerr << "                         default: infinity; don't give up\n";
+    std::cerr << "    --recover-after=<n>: if check fails and then new valid crc found\n";
+    std::cerr << "                         make sure that at least <n> subsequent lines (ascii)\n";
+    std::cerr << "                         or packets (binary) are valid, before output;\n";
+    std::cerr << "                         default: 0; recover on the next valid packet\n";
+    std::cerr << "    --discard-on-recovery,--discard: discard packets accumulated when recovering\n";
+    std::cerr << "\n";
+    std::cerr << "    Note that the check command is equivalent to\n";
+    std::cerr << "    csv-crc recover --give-up-after 0\n";
+    std::cerr << "\n";
+    std::cerr << "For a definitive list of 16 bit CRC algorithms see:\n";
+    std::cerr << "http://reveng.sourceforge.net/crc-catalogue/16.htm\n";
     std::cerr << std::endl;
     exit( 1 );
 }
diff --git a/csv/test/csv-crc/check/big-endian/expected b/csv/test/csv-crc/check/big-endian/expected
new file mode 100644
index 000000000..016496f83
--- /dev/null
+++ b/csv/test/csv-crc/check/big-endian/expected
@@ -0,0 +1,5 @@
+output[0]/line="0,0,0,63876"
+output[1]/line="1,1,1,60342"
+output[2]/line="2,2,2,56800"
+output[3]/line="3,3,3,53202"
+count=4
diff --git a/csv/test/csv-crc/check/big-endian/input b/csv/test/csv-crc/check/big-endian/input
new file mode 100644
index 000000000..e9f01c460
--- /dev/null
+++ b/csv/test/csv-crc/check/big-endian/input
@@ -0,0 +1,7 @@
+operation=check
+binary=3ui,uw
+args="--big-endian"
+0,0,0,63876
+1,1,1,60342
+2,2,2,56800
+3,3,3,53202
diff --git a/csv/test/csv-crc/recover/binary-bad-1/expected b/csv/test/csv-crc/recover/binary-bad-1/expected
new file mode 100644
index 000000000..87d9b518d
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-1/expected
@@ -0,0 +1,10 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="2,2,2,57565"
+output[2]/line="3,3,3,53967"
+output[3]/line="4,4,4,19633"
+output[4]/line="5,5,5,32419"
+output[5]/line="6,6,6,10389"
+output[6]/line="7,7,7,6791"
+output[7]/line="8,8,8,1096"
+output[8]/line="9,9,9,13914"
+count=9
diff --git a/csv/test/csv-crc/recover/binary-bad-1/input b/csv/test/csv-crc/recover/binary-bad-1/input
new file mode 100644
index 000000000..e07603006
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-1/input
@@ -0,0 +1,12 @@
+operation=recover
+binary=3ui,uw
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/binary-bad-2/expected b/csv/test/csv-crc/recover/binary-bad-2/expected
new file mode 100644
index 000000000..da2800f25
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-2/expected
@@ -0,0 +1,9 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="3,3,3,53967"
+output[2]/line="4,4,4,19633"
+output[3]/line="5,5,5,32419"
+output[4]/line="6,6,6,10389"
+output[5]/line="7,7,7,6791"
+output[6]/line="8,8,8,1096"
+output[7]/line="9,9,9,13914"
+count=8
diff --git a/csv/test/csv-crc/recover/binary-bad-2/input b/csv/test/csv-crc/recover/binary-bad-2/input
new file mode 100644
index 000000000..98a092270
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-2/input
@@ -0,0 +1,12 @@
+operation=recover
+binary=3ui,uw
+0,0,0,34041
+1,1,1,0
+2,2,2,0
+3,3,3,53967
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/binary-bad-3/expected b/csv/test/csv-crc/recover/binary-bad-3/expected
new file mode 100644
index 000000000..f03fe1cbc
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-3/expected
@@ -0,0 +1,8 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="4,4,4,19633"
+output[2]/line="5,5,5,32419"
+output[3]/line="6,6,6,10389"
+output[4]/line="7,7,7,6791"
+output[5]/line="8,8,8,1096"
+output[6]/line="9,9,9,13914"
+count=7
diff --git a/csv/test/csv-crc/recover/binary-bad-3/input b/csv/test/csv-crc/recover/binary-bad-3/input
new file mode 100644
index 000000000..ed36c0e4a
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-3/input
@@ -0,0 +1,12 @@
+operation=recover
+binary=3ui,uw
+0,0,0,34041
+1,1,1,0
+2,2,2,0
+3,3,3,0
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/binary-bad/expected b/csv/test/csv-crc/recover/binary-bad/expected
deleted file mode 100644
index 3b497e5a4..000000000
--- a/csv/test/csv-crc/recover/binary-bad/expected
+++ /dev/null
@@ -1,4 +0,0 @@
-output[0]/line="0,0,0,34041"
-output[1]/line="2,2,2,57565"
-output[2]/line="3,3,3,53967"
-count=3
diff --git a/csv/test/csv-crc/recover/discard-after-1/expected b/csv/test/csv-crc/recover/discard-after-1/expected
new file mode 100644
index 000000000..da2800f25
--- /dev/null
+++ b/csv/test/csv-crc/recover/discard-after-1/expected
@@ -0,0 +1,9 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="3,3,3,53967"
+output[2]/line="4,4,4,19633"
+output[3]/line="5,5,5,32419"
+output[4]/line="6,6,6,10389"
+output[5]/line="7,7,7,6791"
+output[6]/line="8,8,8,1096"
+output[7]/line="9,9,9,13914"
+count=8
diff --git a/csv/test/csv-crc/recover/discard-after-1/input b/csv/test/csv-crc/recover/discard-after-1/input
new file mode 100644
index 000000000..05462938c
--- /dev/null
+++ b/csv/test/csv-crc/recover/discard-after-1/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 1 --discard"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/discard-after-2/expected b/csv/test/csv-crc/recover/discard-after-2/expected
new file mode 100644
index 000000000..d89a4f109
--- /dev/null
+++ b/csv/test/csv-crc/recover/discard-after-2/expected
@@ -0,0 +1,6 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="6,6,6,10389"
+output[2]/line="7,7,7,6791"
+output[3]/line="8,8,8,1096"
+output[4]/line="9,9,9,13914"
+count=5
diff --git a/csv/test/csv-crc/recover/discard-after-2/input b/csv/test/csv-crc/recover/discard-after-2/input
new file mode 100644
index 000000000..3e55f6cc8
--- /dev/null
+++ b/csv/test/csv-crc/recover/discard-after-2/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 2 --discard"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,0
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/give-up-after-0/expected b/csv/test/csv-crc/recover/give-up-after-0/expected
new file mode 100644
index 000000000..98ac01605
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-0/expected
@@ -0,0 +1,2 @@
+output[0]/line="0,0,0,34041"
+count=1
diff --git a/csv/test/csv-crc/recover/binary-bad/input b/csv/test/csv-crc/recover/give-up-after-0/input
similarity index 75%
rename from csv/test/csv-crc/recover/binary-bad/input
rename to csv/test/csv-crc/recover/give-up-after-0/input
index 04ed0a7f8..981369062 100644
--- a/csv/test/csv-crc/recover/binary-bad/input
+++ b/csv/test/csv-crc/recover/give-up-after-0/input
@@ -1,5 +1,6 @@
 operation=recover
 binary=3ui,uw
+args="--give-up-after 0"
 0,0,0,34041
 1,1,1,0
 2,2,2,57565
diff --git a/csv/test/csv-crc/recover/recover-after-1/expected b/csv/test/csv-crc/recover/recover-after-1/expected
new file mode 100644
index 000000000..87d9b518d
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-1/expected
@@ -0,0 +1,10 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="2,2,2,57565"
+output[2]/line="3,3,3,53967"
+output[3]/line="4,4,4,19633"
+output[4]/line="5,5,5,32419"
+output[5]/line="6,6,6,10389"
+output[6]/line="7,7,7,6791"
+output[7]/line="8,8,8,1096"
+output[8]/line="9,9,9,13914"
+count=9
diff --git a/csv/test/csv-crc/recover/recover-after-1/input b/csv/test/csv-crc/recover/recover-after-1/input
new file mode 100644
index 000000000..988d63176
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-1/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 1"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/recover-after-10/expected b/csv/test/csv-crc/recover/recover-after-10/expected
new file mode 100644
index 000000000..d5a50a50a
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-10/expected
@@ -0,0 +1,5 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="1,1,1,46827"
+output[2]/line="2,2,2,57565"
+output[3]/line="3,3,3,53967"
+count=4
diff --git a/csv/test/csv-crc/recover/recover-after-10/input b/csv/test/csv-crc/recover/recover-after-10/input
new file mode 100644
index 000000000..9cd49614b
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-10/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 10"
+0,0,0,34041
+1,1,1,46827
+2,2,2,57565
+3,3,3,53967
+4,4,4,0
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/recover-after-2/expected b/csv/test/csv-crc/recover/recover-after-2/expected
new file mode 100644
index 000000000..f03fe1cbc
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-2/expected
@@ -0,0 +1,8 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="4,4,4,19633"
+output[2]/line="5,5,5,32419"
+output[3]/line="6,6,6,10389"
+output[4]/line="7,7,7,6791"
+output[5]/line="8,8,8,1096"
+output[6]/line="9,9,9,13914"
+count=7
diff --git a/csv/test/csv-crc/recover/recover-after-2/input b/csv/test/csv-crc/recover/recover-after-2/input
new file mode 100644
index 000000000..687ae2121
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-2/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 2"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,0
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/wrap/big-endian/expected b/csv/test/csv-crc/wrap/big-endian/expected
new file mode 100644
index 000000000..e0e2c23f7
--- /dev/null
+++ b/csv/test/csv-crc/wrap/big-endian/expected
@@ -0,0 +1,11 @@
+output[0]/line="0,0,0,63876"
+output[1]/line="1,1,1,60342"
+output[2]/line="2,2,2,56800"
+output[3]/line="3,3,3,53202"
+output[4]/line="4,4,4,45388"
+output[5]/line="5,5,5,41854"
+output[6]/line="6,6,6,38184"
+output[7]/line="7,7,7,34586"
+output[8]/line="8,8,8,18436"
+output[9]/line="9,9,9,23094"
+count=10
diff --git a/csv/test/csv-crc/wrap/big-endian/input b/csv/test/csv-crc/wrap/big-endian/input
new file mode 100644
index 000000000..3d773dbe0
--- /dev/null
+++ b/csv/test/csv-crc/wrap/big-endian/input
@@ -0,0 +1,13 @@
+operation=wrap
+binary=3ui
+args="--big-endian"
+0,0,0
+1,1,1
+2,2,2
+3,3,3
+4,4,4
+5,5,5
+6,6,6
+7,7,7
+8,8,8
+9,9,9

From 524c5c1b52519260f05ed6adc26a50fc18feaaea Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 14 Apr 2022 16:29:47 +1000
Subject: [PATCH 0424/1056] csv-crc: fix behaviour for --recover-after option

Previously, with --recover-after, csv-crc would output duplicate records,
as well as records that did not meet the --recover-after threshold.
---
 csv/applications/csv-crc.cpp | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-crc.cpp b/csv/applications/csv-crc.cpp
index b998eee7e..735ab5cee 100644
--- a/csv/applications/csv-crc.cpp
+++ b/csv/applications/csv-crc.cpp
@@ -146,6 +146,7 @@ static bool run_()
         bool recovered = true;
         std::size_t recovered_count = 0;
         std::size_t recovered_byte_count = 0;
+        std::size_t current_recovered_byte_count = 0;
         std::vector< char > recovery_buffer( recover_after * size );
         while( std::cin.good() && !std::cin.eof() )
         {
@@ -167,6 +168,7 @@ static bool run_()
                     if( big_endian ) { expected = traits< typename Crc::value_type >::hton( expected ); }
                     if( crc == expected )
                     {
+                        bool output_input_buffer = true;
                         if( !recovered )
                         {
                             if( recovered_count == recover_after )
@@ -176,27 +178,34 @@ static bool run_()
                                 recovered = true;
                                 recovered_count = 0;
                                 recovered_byte_count = 0;
+                                current_recovered_byte_count = 0;
                             }
                             else
                             {
                                 ::memcpy( &recovery_buffer[ recovered_count * size ], p, size );
                                 ++recovered_count;
+                                output_input_buffer = false;        // we're just stashing them until we check
                             }
                         }
-                        std::cout.write( p, size );
+                        if( output_input_buffer ) { std::cout.write( p, size ); }
                         std::cout.flush();
                     }
                     else // quick and dirty: lots of code duplication, but just to make it working
                     {
+                        if( current_recovered_byte_count / size > recovered_count )
+                        {
+                            recovered_count = 0;
+                            current_recovered_byte_count = 0;
+                        }
                         if( recovered ) { std::cerr << "csv-crc: crc check failed" << ( !give_up_after || *give_up_after > 0 ? "; recovering..." : "" ) << std::endl; }
                         recovered = false;
                         if( give_up_after && recovered_byte_count >= *give_up_after ) { break; }
-                        ++recovered_byte_count;
                     }
                 }
                 unsigned int step = recovered ? size : 1;
                 p += step;
                 offset -= step;
+                if( !recovered ) { recovered_byte_count += step; current_recovered_byte_count += step; }
                 if( end - p < int( size ) )
                 {
                     ::memcpy( begin, p, offset ); // todo: quick and dirty, check if works in case of overlapping

From 26e1c830e2a78c1f32734dcbffadca1d208a758c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 22 Apr 2022 12:34:28 +1000
Subject: [PATCH 0425/1056] ansible: python changed to python3

---
 system/ansible/install.python3.yml | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
index 0076254e9..c476c0e42 100644
--- a/system/ansible/install.python3.yml
+++ b/system/ansible/install.python3.yml
@@ -13,13 +13,13 @@
     become: true
     apt: pkg={{ item }} state=present update_cache=yes
     with_items:
-      - build-essential 
+      - build-essential
       - git
       - cmake-curses-gui
       - cmake
       - gawk
       - perl
-      - python
+      - python3
       - libboost-all-dev
       - socat
       - libzmq3-dev
@@ -29,7 +29,7 @@
       - python3-pip
       - libprocps-dev
       - recode
-      
+
   - name: "install comma regressions test dependencies"
     become: true
     apt: pkg={{ item }} state=present update_cache=yes
@@ -37,20 +37,20 @@
       - moreutils
       - net-tools
       - pv
-      
+
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory
     with_items:
         - src
         - build
-    
+
   - name: "comma: clone"
     git:
         repo: "https://gitlab.com/orthographic/comma.git"
         dest: "{{ base }}/src/comma"
         clone: yes
         update: yes
-        
+
   - name: "comma: make build directory at {{ base }}"
     file: dest="{{ base }}/build/comma" state=directory
 

From 99dda7e5042c1944564275104858fa69af92e353 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 22 Apr 2022 12:44:50 +1000
Subject: [PATCH 0426/1056] minor compilation fix

---
 application/test/application_test.cpp |  6 +++---
 csv/applications/csv-units.cpp        | 27 ++++++++++++++-------------
 2 files changed, 17 insertions(+), 16 deletions(-)

diff --git a/application/test/application_test.cpp b/application/test/application_test.cpp
index f3cfd2481..d4ebe5a0c 100644
--- a/application/test/application_test.cpp
+++ b/application/test/application_test.cpp
@@ -63,8 +63,8 @@ TEST( application, command_line_options )
     EXPECT_TRUE( !options.exists( "--d" ) );
     EXPECT_TRUE( options.values< int >( "-x" ).empty() );
     EXPECT_TRUE( options.values< int >( "-x,-y,-z" ).empty() );
-    EXPECT_EQ( options.optional< int >( "-x" ), boost::optional< int >() );
-    EXPECT_EQ( options.optional< int >( "-x,-y,-z" ), boost::optional< int >() );
+    EXPECT_FALSE( bool( options.optional< int >( "-x" ) ) );
+    EXPECT_FALSE( bool( options.optional< int >( "-x,-y,-z" ) ) );
     EXPECT_EQ( options.value< std::string >( "-a" ), "b" );
     EXPECT_EQ( options.value< bool >( "--a" ), true );
     EXPECT_EQ( options.value< int >( "--b" ), 15 );
@@ -290,7 +290,7 @@ TEST( application, command_line_options_description_default_values_double_quotes
     check_default_value( "--filename,-f=[<filename>]; default=\"blah=\\\"$var\\\"\" ; some filename", "blah=\"$var\"" );
     check_default_value( "--filename,-f=[<filename>]; default=\"blah with space \"; some filename", "blah with space " );
 }
-    
+
 int main( int argc, char* argv[] )
 {
     ::testing::InitGoogleTest( &argc, argv );
diff --git a/csv/applications/csv-units.cpp b/csv/applications/csv-units.cpp
index 18f3eb8a4..c46bfd541 100644
--- a/csv/applications/csv-units.cpp
+++ b/csv/applications/csv-units.cpp
@@ -33,6 +33,7 @@
 #include <iostream>
 #include <boost/array.hpp>
 #include <boost/bind.hpp>
+#include <boost/optional.hpp>
 #include <boost/unordered/unordered_map.hpp>
 
 #include <boost/units/systems/si.hpp>
@@ -130,7 +131,7 @@ typedef boost::units::absolute< boost::units::si::temperature > kelvin_t;
 typedef boost::units::absolute< boost::units::celsius::temperature > celsius_t;
 typedef boost::units::absolute< boost::units::fahrenheit::temperature > fahrenheit_t;
 
-/// Converts the given value between the two template measurement units 
+/// Converts the given value between the two template measurement units
 template < typename From, typename To >
 double cast( double input )
 {
@@ -198,7 +199,7 @@ namespace units {
               count,
               invalid
     };
-    
+
     static boost::array< et, count > metric = {{ kelvin
                                                , radians
                                                , kelvin
@@ -251,7 +252,7 @@ namespace units {
     /// returns a name even if the value is invalid
     std::string debug_name( const et val ) { return val < 0 || val > invalid ? "ERROR:" + boost::lexical_cast<std::string>(val) : name( val ); }
 
-    /// Given a canonical name or an alias of a measurement unit 
+    /// Given a canonical name or an alias of a measurement unit
     /// retrieve the canonical enumeration.
     et value( std::string const & str )
     {
@@ -295,18 +296,18 @@ namespace units {
         if( map.cend() != citr ) { return citr->second; }
         COMMA_THROW( comma::exception, "expected unit name, got \"" << str << "\"" );
     }
-    
+
     /// A type to allow a lookup table for converting units
     //typedef double (* cast_function)( double );
     typedef boost::function< double( double ) > cast_function;
-    
+
     /// Retrieve a function that will convert between the two given
     /// measurement units.
     /// @returns NULL if the conversion is not supported.
     cast_function cast_lookup( const et from, const et to ) // quick and dirty
     {
         if ( from < 0 || from >= count ) { COMMA_THROW( comma::exception, "can not cast lookup for invalid unit (from) " << from ); }
-        if ( to < 0 || to >= count ) { COMMA_THROW( comma::exception, "can not cast lookup for invalid unit (to) " << to ); }        
+        if ( to < 0 || to >= count ) { COMMA_THROW( comma::exception, "can not cast lookup for invalid unit (to) " << to ); }
         static cast_function map[count][count] = { { NULL, }, };
         static bool initialised = false;
         if (! initialised )
@@ -348,7 +349,7 @@ namespace units {
         }
         return map[from][to];
     }
-    
+
     /// Test if the conversion between two measurement units is supported.
     bool can_convert( const et from, const et to ) { return NULL != cast_lookup(from, to); }
 }
@@ -376,7 +377,7 @@ struct item_t
 
 struct input_t
 {
-    std::vector< item_t > values;    
+    std::vector< item_t > values;
 };
 
 namespace comma { namespace visiting {
@@ -420,7 +421,7 @@ static std::string init_input_field( const std::string& v )
 {
     const std::string stripped( comma::strip( v, ' ' ) );
     if( stripped.empty() ) { return std::string(); }
-    
+
     const size_t pos = stripped.rfind( '/' );
     std::string head, tail;
     if ( std::string::npos == pos ) // just a
@@ -438,11 +439,11 @@ static std::string init_input_field( const std::string& v )
             tail = "value";
         }
     }
-    
+
     unsigned idx = input_fields.size();
     if ( input_fields.cend() == input_fields.find( head ) ) { input_fields[head] = idx; }
     else { idx = input_fields.at( head ); }
-    
+
     return "values[" + boost::lexical_cast< std::string >( idx ) + "]/" + tail;
 }
 
@@ -483,7 +484,7 @@ static int run( const units::et from, const units::et to )
 
     units::cast_function const default_cast_function = units::cast_lookup( from, to );
     if (NULL == default_cast_function) { COMMA_THROW( comma::exception, "unsupported default conversion from " << debug_name(from) << " to " << debug_name(to) ); }
-    
+
     unsigned line = 0;
     while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
     {
@@ -514,7 +515,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av );
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
-        
+
         if( options.exists( "--help,-h" ) ) usage();
         verbose = options.exists( "--verbose,-v" );
         csv = comma::csv::options( options );

From 688726f27c59bdf697bae0523a3b4ba6a6ecda46 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 22 Apr 2022 12:49:41 +1000
Subject: [PATCH 0427/1056] minor compilation fix

---
 csv/test/ascii_test.cpp | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/csv/test/ascii_test.cpp b/csv/test/ascii_test.cpp
index a6f61643c..cc87283b2 100644
--- a/csv/test/ascii_test.cpp
+++ b/csv/test/ascii_test.cpp
@@ -30,6 +30,9 @@
 
 #include <gtest/gtest.h>
 #include <boost/date_time/posix_time/posix_time.hpp>
+#if ( BOOST_VERSION >= 107400 ) // quick and dirty; fixing trivial compilation error
+#include <boost/optional/optional_io.hpp>
+#endif
 #include "../../csv/ascii.h"
 #include "../../string/string.h"
 

From 2ff5c7cf30a406abc7edfa2dd004045ba28c7149 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 5 May 2022 18:41:41 +1000
Subject: [PATCH 0428/1056] csv-random: trivial refactoring

---
 csv/applications/csv-random.cpp | 61 ++++++++++-----------------------
 1 file changed, 18 insertions(+), 43 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index f295f55c7..ccb339eec 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -111,6 +111,7 @@ struct type_traits< unsigned char >
 };
 
 namespace make {
+
 template < typename T, template < typename > class Distribution, typename Engine >
 static int run_impl( Distribution< T >& distribution, bool append, bool binary, std::size_t count )
 {
@@ -125,11 +126,7 @@ static int run_impl( Distribution< T >& distribution, bool append, bool binary,
             {
                 std::cin.read( &buf[0], buf.size() );
                 if( std::cin.gcount() == 0 ) { break; }
-                if( std::cin.gcount() != static_cast< int >( buf.size() ) )
-                {
-                    std::cerr << "csv-random make: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl;
-                    return 1;
-                }
+                if( std::cin.gcount() != static_cast< int >( buf.size() ) ) { std::cerr << "csv-random make: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
                 std::cout.write( &buf[0], buf.size() );
                 for( std::size_t i = 0; i < count; ++i )
                 {
@@ -213,45 +210,23 @@ static int run( const comma::command_line_options& options ) // quick and dirty
 {
     const auto& distribution = options.value< std::string >( "--distribution", "uniform" );
     const auto& format = comma::csv::format( options.value< std::string >( "--type", "ui" ) );
-    if ( format.collapsed_string().find( ',' ) != std::string::npos )
+    if ( format.collapsed_string().find( ',' ) != std::string::npos ) { std::cerr << "csv-random make: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl; return 1; }
+    if( distribution == "uniform" )
     {
-        std::cerr << "csv-random make: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl;
-        return 1;
-    }
-    switch ( format.offset( 0 ).type ) {
-        case csv::format::int8:
-            if( distribution == "uniform" ) { return run_impl< char, std::uniform_int_distribution >( options ); }
-            break;
-        case csv::format::uint8:
-            if( distribution == "uniform" ) { return run_impl< unsigned char, std::uniform_int_distribution >( options ); }
-            break;
-        case csv::format::int16:
-            if( distribution == "uniform" ) { return run_impl< comma::int16, std::uniform_int_distribution >( options ); }
-            break;
-        case csv::format::uint16:
-            if( distribution == "uniform" ) { return run_impl< comma::uint16, std::uniform_int_distribution >( options ); }
-            break;
-        case csv::format::int32:
-            if( distribution == "uniform" ) { return run_impl< comma::int32, std::uniform_int_distribution >( options ); }
-            break;
-        case csv::format::uint32:
-            if( distribution == "uniform" ) { return run_impl< comma::uint32, std::uniform_int_distribution >( options ); }
-            break;
-        case csv::format::int64:
-            if( distribution == "uniform" ) { return run_impl< comma::int64, std::uniform_int_distribution >( options ); }
-            break;
-        case csv::format::uint64:
-            if( distribution == "uniform" ) { return run_impl< comma::uint64, std::uniform_int_distribution >( options ); }
-            break;
-        case csv::format::float_t:
-            if( distribution == "uniform" ) { return run_impl< float, std::uniform_real_distribution >( options ); }
-            break;
-        case csv::format::double_t:
-            if( distribution == "uniform" ) { return run_impl< double, std::uniform_real_distribution >( options ); }
-            break;
-        default:
-            std::cerr << "csv-random make: expected type; got: '" << format.string() << "'" << std::endl;
-            return 1;
+        switch ( format.offset( 0 ).type )
+        {
+            case csv::format::int8: return run_impl< char, std::uniform_int_distribution >( options );
+            case csv::format::uint8: return run_impl< unsigned char, std::uniform_int_distribution >( options );
+            case csv::format::int16: return run_impl< comma::int16, std::uniform_int_distribution >( options );
+            case csv::format::uint16: return run_impl< comma::uint16, std::uniform_int_distribution >( options );
+            case csv::format::int32: return run_impl< comma::int32, std::uniform_int_distribution >( options );
+            case csv::format::uint32: return run_impl< comma::uint32, std::uniform_int_distribution >( options );
+            case csv::format::int64: return run_impl< comma::int64, std::uniform_int_distribution >( options );
+            case csv::format::uint64: return run_impl< comma::uint64, std::uniform_int_distribution >( options );
+            case csv::format::float_t: return run_impl< float, std::uniform_real_distribution >( options );
+            case csv::format::double_t: return run_impl< double, std::uniform_real_distribution >( options );
+            default: std::cerr << "csv-random make: expected type; got: '" << format.string() << "'" << std::endl; return 1;
+        }
     }
     std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
     return 1;

From 749a7025120aacbbb5e0f2090fc5f837354e548c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 6 May 2022 12:44:45 +1000
Subject: [PATCH 0429/1056] csv-random: sample operation implemented

---
 csv/applications/csv-random.cpp | 203 ++++++++++++++------------------
 1 file changed, 90 insertions(+), 113 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index ccb339eec..658cbc507 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -51,13 +51,28 @@ static void usage( bool verbose )
     std::cerr << "        example" << std::endl;
     std::cerr << "            > csv-random make --seed=$( csv-random true-random --once )" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "    sample: output a uniformly distributed sample of input records of a given size; record order preserved" << std::endl;
+    std::cerr << "            limitation: current implementation accumulates input records before outputting" << std::endl;
+    std::cerr << "                        if records are large, it may be memory-inefficient; can be improved, just ask" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "        usage: cat records.csv | csv-random sample [<options>] > sample.csv" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
+    std::cerr << "            --fields=[<fields>]; if 'block' field present sample each block, otherwise read whole input and then sample" << std::endl;
+    std::cerr << "            --ratio=[<ratio>]; portion of each block to output, if block is too small, nothing will be output for it" << std::endl;
+    std::cerr << "            --size=<n>; default=1; number of records to output in each block, if smaller than block size, output the whole block" << std::endl;
+    std::cerr << "            --sliding-window,--window=[<size>]; todo: sample on sliding window of <size> records" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "    shuffle: output input records in pseudo-random order" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        usage: cat records.csv | csv-random shuffle [<options>] > shuffled.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
-    std::cerr << "            --fields=[<fields>]; if 'block' field present shuffle each block, otherwise read whole input and then shuffle" << std::endl;
+    std::cerr << "            --fields=[<fields>]; if 'block' field present, shuffle each block, otherwise read whole input and then shuffle" << std::endl;
+    std::cerr << "            --ratio=[<ratio>]; portion of each block to output, same as for \"sample\" operation, but shuffled" << std::endl;
+    std::cerr << "            --size=<n>; default=1; number of records to output in each block, same as for \"sample\" operation, but shuffled" << std::endl;
     std::cerr << "            --sliding-window,--window=[<size>]; todo: shuffle on sliding window of <size> records" << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options:" << std::endl;
@@ -92,23 +107,9 @@ template <> struct traits< comma::applications::random::shuffle::input >
 
 namespace comma { namespace applications { namespace random {
 
-template < typename T >
-struct type_traits
-{
-    static T cast( const T t ) { return t; }
-};
-
-template <>
-struct type_traits< char >
-{
-    static int cast( const char t ) { return static_cast< int >( t ); }
-};
-
-template <>
-struct type_traits< unsigned char >
-{
-    static unsigned int cast( const unsigned char t ) { return static_cast< int >( t ); }
-};
+template < typename T > struct type_traits { static T cast( const T t ) { return t; } };
+template <> struct type_traits< char > { static int cast( const char t ) { return static_cast< int >( t ); } };
+template <> struct type_traits< unsigned char > { static unsigned int cast( const unsigned char t ) { return static_cast< int >( t ); } };
 
 namespace make {
 
@@ -135,45 +136,43 @@ static int run_impl( Distribution< T >& distribution, bool append, bool binary,
                 }
                 if( ::csv.flush ) { std::cout.flush(); }
             }
+            return 0;
         }
-        else
+        while( std::cin.good() )
         {
-            while( std::cin.good() )
-            {
-                std::string s;
-                std::getline( std::cin, s );
-                if( s.empty() ) { continue; }
-                std::cout << s;
-                for( std::size_t i = 0; i < count; ++i ) { std::cout << ::csv.delimiter << type_traits< T >::cast( distribution( engine ) ); }
-                std::cout << std::endl;
-                if( ::csv.flush ) { std::cout.flush(); }
-            }
+            std::string s;
+            std::getline( std::cin, s );
+            if( s.empty() ) { continue; }
+            std::cout << s;
+            for( std::size_t i = 0; i < count; ++i ) { std::cout << ::csv.delimiter << type_traits< T >::cast( distribution( engine ) ); }
+            std::cout << std::endl;
+            if( ::csv.flush ) { std::cout.flush(); }
         }
+        return 0;
     }
-    else
+    if( binary )
     {
         while( std::cout.good() )
         {
-            if( binary )
+            for( std::size_t i = 0; i < count; ++i )
             {
-                for( std::size_t i = 0; i < count; ++i )
-                {
-                    T r = distribution( engine );
-                    std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
-                }
-            }
-            else
-            {
-                std::string comma;
-                for( std::size_t i = 0; i < count; ++i )
-                {
-                    std::cout << comma << type_traits< T >::cast( distribution( engine ) );
-                    comma = ::csv.delimiter;
-                }
-                std::cout << std::endl;
+                T r = distribution( engine );
+                std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
             }
             if( ::csv.flush ) { std::cout.flush(); }
         }
+        return 0;
+    }
+    while( std::cout.good() )
+    {
+        std::string comma;
+        for( std::size_t i = 0; i < count; ++i )
+        {
+            std::cout << comma << type_traits< T >::cast( distribution( engine ) );
+            comma = ::csv.delimiter;
+        }
+        std::cout << std::endl;
+        if( ::csv.flush ) { std::cout.flush(); } // todo? remove? std::endl flushes anyway?
     }
     return 0;
 }
@@ -236,97 +235,74 @@ static int run( const comma::command_line_options& options ) // quick and dirty
 
 namespace shuffle {
 
-template < typename Engine >
-static int run_impl( const comma::command_line_options& options )
+template < typename Engine > static int run_impl( const comma::command_line_options& options, bool sample = false )
 {
     auto engine = ::seed ? Engine( *::seed ) : Engine();
     std::deque< std::string > records;
-    auto output = []( std::deque< std::string >& records )
-    {
-        for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
-        records.clear();
-        if( ::csv.flush ) { std::cout.flush(); }
-    };
+    std::vector< unsigned int > indices; // quick and dirty
+    unsigned int size = options.value( "--size", 1 ); // quick and dirty
+    auto ratio = options.optional< float >( "--ratio" ); // quick and dirty
     auto sliding_window = options.optional< unsigned int >( "--sliding-window,--window" );
-    if( ::csv.has_field( "block" ) )
+    if( sliding_window ) { std::cerr << "csv-random shuffle: --sliding-window: todo" << std::endl; return 1; }
+    if( sliding_window ) { std::cerr << "csv-random shuffle: expected either block field or --sliding-window; got both" << std::endl; return 1; }
+    comma::csv::input_stream< input > is( std::cin, ::csv );
+    comma::uint32 block = 0;
+    while( is.ready() || std::cin.good() )
     {
-        if( sliding_window ) { std::cerr << "csv-random shuffle: expected either block field or --sliding-window; got both" << std::endl; return 1; }
-        comma::csv::input_stream< input > is( std::cin, ::csv );
-        comma::uint32 block = 0;
-        while( is.ready() || std::cin.good() )
+        const input* p = is.read();
+        if( !p || p->block != block )
         {
-            const input* p = is.read();
-            if( !p || p->block != block )
-            {
-                std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
-                std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( engine ); } ); // quick and dirty, watch performance
-                output( records );
-                if( p ) { block = p->block; }
-            }
-            if( !p ) { break; }
-            if( ::csv.binary() )
-            {
-                records.emplace_back();
-                records.back().resize( ::csv.format().size() );
-                std::memcpy( &records.back()[0], is.binary().last(), ::csv.format().size() );
-            }
-            else
-            {
-                records.push_back( comma::join( is.ascii().last(), ::csv.delimiter ) + "\n" );
-            }
+            std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
+            indices.resize( records.size() ); // quick and dirty
+            for( unsigned int i = 0; i < indices.size(); ++i ) { indices[i] = i; }
+            std::random_shuffle( indices.begin(), indices.end(), [&]( int ) -> int { return distribution( engine ); } ); // quick and dirty, watch performance
+            unsigned int s = sample ? ( ratio ? int( records.size() * *ratio ) : size ) : records.size();
+            if( sample ) { std::sort( indices.begin(), indices.begin() + s ); } // quick and dirty
+            for( unsigned int i = 0; i < s; ++i ) { std::cout.write( &records[indices[i]][0], records[indices[i]].size() ); }
+            records.clear();
+            if( ::csv.flush ) { std::cout.flush(); }
+            if( p ) { block = p->block; }
         }
-    }
-    else // quick and dirty
-    {
-        if( sliding_window ) { std::cerr << "csv-random shuffle: --sliding-window: todo" << std::endl; return 1; }
+        if( !p ) { break; }
         if( ::csv.binary() )
         {
-            std::string s( ::csv.format().size(), 0 );
-            while( std::cin.good() )
-            {
-                std::cin.read( &s[0], s.size() );
-                if( std::cin.gcount() == 0 ) { break; }
-                if( std::cin.gcount() != int( s.size() ) ) { std::cerr << "csv-random shuffle: expected " << s.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
-                records.emplace_back();
-                records.back().resize( ::csv.format().size() );
-                std::memcpy( &records.back()[0], &s[0], ::csv.format().size() );
-            }
+            records.emplace_back();
+            records.back().resize( ::csv.format().size() );
+            std::memcpy( &records.back()[0], is.binary().last(), ::csv.format().size() );
         }
         else
         {
-            while( std::cin.good() )
-            {
-                std::string s;
-                std::getline( std::cin, s );
-                if( !s.empty() ) { records.push_back( s + "\n" ); }
-            }
+            records.push_back( comma::join( is.ascii().last(), ::csv.delimiter ) + "\n" );
         }
-        std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
-        std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( engine ); } ); // quick and dirty, watch performance
-        output( records );
     }
     return 0;
 }
 
-static int run( const comma::command_line_options& options )
+static int run( const comma::command_line_options& options, bool sample = false )
 {
     const auto& engine = options.value< std::string >( "--engine", "mt19937_64" );
-    if( engine == "minstd_rand0" ) { return run_impl< std::minstd_rand0 >( options ); }
-    if( engine == "minstd_rand" ) { return run_impl< std::minstd_rand >( options ); }
-    if( engine == "mt19937" ) { return run_impl< std::mt19937>( options ); }
-    if( engine == "mt19937_64" ) { return run_impl< std::mt19937_64 >( options ); }
-    if( engine == "ranlux24_base" ) { return run_impl< std::ranlux24_base >( options ); }
-    if( engine == "ranlux48_base" ) { return run_impl< std::ranlux48_base >( options ); }
-    if( engine == "ranlux24" ) { return run_impl< std::ranlux24 >( options ); }
-    if( engine == "ranlux48" ) { return run_impl< std::ranlux48 >( options ); }
-    if( engine == "knuth_b" ) { return run_impl< std::knuth_b >( options ); }
-    if( engine == "default_random_engine" ) { return run_impl< std::default_random_engine >( options ); }
-    std::cerr << "csv-random shuffle: expected engine; got: '" << engine << "'" << std::endl;
+    if( engine == "minstd_rand0" ) { return run_impl< std::minstd_rand0 >( options, sample ); }
+    if( engine == "minstd_rand" ) { return run_impl< std::minstd_rand >( options, sample ); }
+    if( engine == "mt19937" ) { return run_impl< std::mt19937>( options, sample ); }
+    if( engine == "mt19937_64" ) { return run_impl< std::mt19937_64 >( options, sample ); }
+    if( engine == "ranlux24_base" ) { return run_impl< std::ranlux24_base >( options, sample ); }
+    if( engine == "ranlux48_base" ) { return run_impl< std::ranlux48_base >( options, sample ); }
+    if( engine == "ranlux24" ) { return run_impl< std::ranlux24 >( options, sample ); }
+    if( engine == "ranlux48" ) { return run_impl< std::ranlux48 >( options, sample ); }
+    if( engine == "knuth_b" ) { return run_impl< std::knuth_b >( options, sample ); }
+    if( engine == "default_random_engine" ) { return run_impl< std::default_random_engine >( options, sample ); }
+    std::cerr << "csv-random " << ( sample ? "sample" : "shuffle" ) << ": expected engine; got: '" << engine << "'" << std::endl;
     return 1;
 }
 
 } // namespace shuffle {
 
+namespace sample {
+
+static int run( const comma::command_line_options& options ) { return shuffle::run( options, true ); } // quick and relatively dirty for now
+
+} // namespace sample {
+
 namespace true_random {
 
 template < typename T >
@@ -422,6 +398,7 @@ int main( int ac, char** av )
         ::verbose = options.exists( "--verbose,-v" );
         std::string operation = unnamed[0];
         if( operation == "make" ) { return comma::applications::random::make::run( options ); }
+        if( operation == "sample" ) { return comma::applications::random::sample::run( options ); }
         if( operation == "shuffle" ) { return comma::applications::random::shuffle::run( options ); }
         if( operation == "true-random" ) { return comma::applications::random::true_random::run( options ); }
         std::cerr << "csv-random: expected operation; got: '" << operation << "'" << std::endl;

From ecfd716ba3d04513d319741f2b26b41ac3fefb2d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 8 May 2022 15:48:03 +1000
Subject: [PATCH 0430/1056] system/ansible: install.python3.yml renamed to
 install.yml

---
 system/ansible/install.python3.yml | 72 ------------------------------
 system/ansible/install.yml         | 20 ++++-----
 2 files changed, 10 insertions(+), 82 deletions(-)
 delete mode 100644 system/ansible/install.python3.yml

diff --git a/system/ansible/install.python3.yml b/system/ansible/install.python3.yml
deleted file mode 100644
index c476c0e42..000000000
--- a/system/ansible/install.python3.yml
+++ /dev/null
@@ -1,72 +0,0 @@
----
-# sample ansible-playbook script to install comma dependencies and build comma from source; include it as it is or copy to your playbook
-
-- hosts: localhost
-  connection: local
-  vars:
-    - base: "{{ ansible_env.HOME }}"
-    - make_j: 6
-    - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
-
-  tasks:
-  - name: "install comma dependencies"
-    become: true
-    apt: pkg={{ item }} state=present update_cache=yes
-    with_items:
-      - build-essential
-      - git
-      - cmake-curses-gui
-      - cmake
-      - gawk
-      - perl
-      - python3
-      - libboost-all-dev
-      - socat
-      - libzmq3-dev
-      - libgtest-dev
-      - python3-dev
-      - python3-numpy
-      - python3-pip
-      - libprocps-dev
-      - recode
-
-  - name: "install comma regressions test dependencies"
-    become: true
-    apt: pkg={{ item }} state=present update_cache=yes
-    with_items:
-      - moreutils
-      - net-tools
-      - pv
-
-  - name: "comma: make source directory at {{ base }}"
-    file: path={{ base }}/{{ item }} state=directory
-    with_items:
-        - src
-        - build
-
-  - name: "comma: clone"
-    git:
-        repo: "https://gitlab.com/orthographic/comma.git"
-        dest: "{{ base }}/src/comma"
-        clone: yes
-        update: yes
-
-  - name: "comma: make build directory at {{ base }}"
-    file: dest="{{ base }}/build/comma" state=directory
-
-  - name: "comma: cmake"
-    vars:
-        - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -DBUILD_PYTHON_PACKAGES=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
-    shell: "/usr/bin/cmake {{ comma_cmake_options }} {{ base }}/src/comma chdir={{ base }}/build/comma"
-
-  - name: "comma: make"
-    make:
-        chdir: "{{ base }}/build/comma"
-        params:
-            MAKEFLAGS: "-j {{ make_j }}"
-
-  - name: "comma: install"
-    become: true
-    make:
-        chdir: "{{ base }}/build/comma"
-        target: "install"
diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index 517351dd2..c476c0e42 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -6,27 +6,27 @@
   vars:
     - base: "{{ ansible_env.HOME }}"
     - make_j: 6
-    - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF"
+    - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
 
   tasks:
   - name: "install comma dependencies"
     become: true
     apt: pkg={{ item }} state=present update_cache=yes
     with_items:
-      - build-essential 
+      - build-essential
       - git
       - cmake-curses-gui
       - cmake
       - gawk
       - perl
-      - python
+      - python3
       - libboost-all-dev
       - socat
       - libzmq3-dev
       - libgtest-dev
-      - python-dev
-      - python-numpy
-      - python-pip
+      - python3-dev
+      - python3-numpy
+      - python3-pip
       - libprocps-dev
       - recode
 
@@ -37,26 +37,26 @@
       - moreutils
       - net-tools
       - pv
-      
+
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory
     with_items:
         - src
         - build
-    
+
   - name: "comma: clone"
     git:
         repo: "https://gitlab.com/orthographic/comma.git"
         dest: "{{ base }}/src/comma"
         clone: yes
         update: yes
-        
+
   - name: "comma: make build directory at {{ base }}"
     file: dest="{{ base }}/build/comma" state=directory
 
   - name: "comma: cmake"
     vars:
-        - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF"
+        - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -DBUILD_PYTHON_PACKAGES=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
     shell: "/usr/bin/cmake {{ comma_cmake_options }} {{ base }}/src/comma chdir={{ base }}/build/comma"
 
   - name: "comma: make"

From a88e6d82304f07bfe838fd4af74ed117fb23e5f8 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 12:14:32 +1000
Subject: [PATCH 0431/1056] cmake: made building python conditional

---
 CMakeLists.txt | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index e3ff2ca15..59e446a58 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -155,6 +155,8 @@ OPTION( comma_BUILD_ZEROMQ "build io with zeromq support" OFF )
 
 option( BUILD_SHARED_LIBS "build with shared libraries" ON ) # option( BUILD_SHARED_LIBS "build with shared libraries" OFF )
 
+OPTION( comma_BUILD_PYTHON "build python" ON )
+
 OPTION( comma_BUILD_XML "build xml" OFF )
 
 SET(comma_BUILD_SHARED_LIBS ${BUILD_SHARED_LIBS})
@@ -319,7 +321,9 @@ if( INSTALL_BASH_COMPLETION )
     add_subdirectory( etc/bash_completion.d )
 endif( INSTALL_BASH_COMPLETION )
 
-add_subdirectory( python )
+if( comma_BUILD_PYTHON )
+  add_subdirectory( python )
+endif( comma_BUILD_PYTHON )
 
 #in future, may need to add third party dlls somehow, if they are linked as dlls. Not needed for statically linking to boost.
 #if we set them up to install to bin they might be packaged through, e.g. roughly (using GLOB):
@@ -348,7 +352,7 @@ set( CPACK_GENERATOR "DEB" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} CACHE STRING "cpack version major" )
 set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} CACHE STRING "cpack version minor" )
 set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} CACHE STRING "cpack version patch" )
-set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps6 (>= 2:3.3.0)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
+set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )

From b6e2526971be7b83a8964edf7f4eda408fc90a47 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 12:49:33 +1000
Subject: [PATCH 0432/1056] rabbit-cat: python replaced with env python

---
 io/applications/rabbit-cat | 41 +++++++-------------------------------
 1 file changed, 7 insertions(+), 34 deletions(-)

diff --git a/io/applications/rabbit-cat b/io/applications/rabbit-cat
index 89362d50d..0edf99964 100755
--- a/io/applications/rabbit-cat
+++ b/io/applications/rabbit-cat
@@ -1,33 +1,6 @@
-#!/usr/bin/python
+#!/usr/bin/env python
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2018 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 import argparse
 import signal
@@ -44,11 +17,11 @@ import pika
 def command_line_options():
     global application_name
     description="""Rabbit MQ client: send/receive messages to/from rabbit mq server
-    
+
 rabbit-cat <operation> <connection_string> [ <options> ]
 
 operation:
-    send        read messages from stdin and send 
+    send        read messages from stdin and send
     listen      receive messages and write to stdout, or run command with --exec
 """
     #rpc-send    <<NOT IMPLEMENTED>> send request and wait for reply
@@ -58,7 +31,7 @@ operation:
 
     epilog="""
 
-sample connection string:    
+sample connection string:
 # Set the connection parameters to connect to rabbit-server1 on port 5672
 # on the / virtual host using the username "guest" and password "guest"
 "amqp://guest:guest@rabbit-server1:5672/%2F"
@@ -78,7 +51,7 @@ example 2: send message to work queue with multiple receivers (each message is r
 
 
 example 3: publish and subscribe
-    rabbit-cat listen localhost --fanout --exchange="exchange2" 
+    rabbit-cat listen localhost --fanout --exchange="exchange2"
     &
     rabbit-cat listen localhost --fanout --exchange="exchange2"
     &
@@ -110,7 +83,7 @@ example 5: topic
     #rabbit-cat rpc-listen localhost --queue="queue1" --exec="bc"
     #&
     #echo "2+3" | rabbit-cat rpc-send localhost --queue="queue1" --routing-key="queue1"
-    
+
 
     #"""
 
@@ -158,7 +131,7 @@ def run_send( channel, exchange_name ):
             if message: send_message( channel, exchange_name, message )
             return
         if args.end_of_message=='\n':
-            while True:            
+            while True:
                 line = sys.stdin.readline()
                 if not line: break
                 if line.endswith('\n'): send_message( channel, exchange_name, line[:-1] )

From 3a9bc337ec510f2f45c9ea5b7627c83e013831a3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 13:17:11 +1000
Subject: [PATCH 0433/1056] system/package/debian/comma-package-make: minor
 change

---
 system/package/debian/comma-package-make | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index 0fc522b06..d064ced6a 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -15,6 +15,7 @@ ansible-playbook "$comma_dir/system/ansible/install.python3.yml" || die "failed"
 case $ubuntu_version in
     18.04) libproc_version="libprocps6 (>= 2:3.3.0)" ;;
     20.04) libproc_version="libprocps8 (>= 1)" ;;
+    22.04) libproc_version="libprocps8 (>= 1)" ;;
     *) libproc_version="libprocps8 (>= 1)" ;; # for now
 esac
 (
@@ -47,7 +48,6 @@ esac
             -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
             -DBUILD_SHARED_LIBS=ON \
             -DBUILD_TESTS=OFF \
-            -DBUILD_TESTS=OFF \
             -DCMAKE_BUILD_TYPE=Release \
             -DCMAKE_INSTALL_PREFIX=/usr \
             -DINSTALL_BASH_COMPLETION=OFF \
@@ -57,6 +57,7 @@ esac
             -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \
             -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  \
             -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
+            -Dcomma_BUILD_XML=OFF \
             -Dcomma_build_io_rabbit_cat=OFF || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
     cpack || die "failed"

From d3b7e2a0088f0856e2544ecf3b6a78de5d2f4a2b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 13:20:43 +1000
Subject: [PATCH 0434/1056] system/package/debian/Dockerfile: trivial warnings
 fixed

---
 system/package/debian/Dockerfile | 12 +++++-------
 1 file changed, 5 insertions(+), 7 deletions(-)

diff --git a/system/package/debian/Dockerfile b/system/package/debian/Dockerfile
index a3290cdc4..ad580af43 100644
--- a/system/package/debian/Dockerfile
+++ b/system/package/debian/Dockerfile
@@ -1,12 +1,10 @@
 ARG version
 FROM ubuntu:${version}
 ENV DEBIAN_FRONTEND="noninteractive"
-RUN apt update \
-    && apt install --yes apt-utils \
-    && apt install --yes software-properties-common \
-    && apt install --yes ansible git build-essential cmake cmake-curses-gui python3-pip devscripts
-RUN apt install --yes python3-stdeb
-RUN apt install --yes python3-all
-RUN apt install --yes dh-python
+RUN apt-get update \
+    && apt-get install --yes apt-utils \
+    && apt-get install --yes software-properties-common \
+    && apt-get install --yes ansible git build-essential cmake cmake-curses-gui python3-pip devscripts \
+    && apt-get install --yes python3-stdeb python3-all dh-python
 
 # && apt-add-repository --yes --update ppa:ansible/ansible \

From 28af1901ae4fdef1cdd091e022f88de74f880957 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 13:27:29 +1000
Subject: [PATCH 0435/1056] system/package/debian/comma-package-make: typo
 fixed

---
 system/package/debian/comma-package-make | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index d064ced6a..740a58ff3 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -10,8 +10,8 @@ comma_dir="$5"
 [[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
 [[ -n "$version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
 cd ~
-echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.python3.yml' in $( pwd )..." >&2
-ansible-playbook "$comma_dir/system/ansible/install.python3.yml" || die "failed"
+echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.yml' in $( pwd )..." >&2
+ansible-playbook "$comma_dir/system/ansible/install.yml" || die "failed"
 case $ubuntu_version in
     18.04) libproc_version="libprocps6 (>= 2:3.3.0)" ;;
     20.04) libproc_version="libprocps8 (>= 1)" ;;

From 8fea305eb3b2d6440b74888831654c962b323043 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 14:51:31 +1000
Subject: [PATCH 0436/1056] CMakeLists.txt: minor change

---
 CMakeLists.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 59e446a58..e976cf228 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -342,7 +342,7 @@ set( CPACK_PACKAGE_NAME "comma" )
 #set( CPACK_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
 set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "cli utilities for structured or fixed-width offline or realtime data" )
 set( CPACK_PACKAGE_VENDOR "orthographic" )
-set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "command line utilities for processing structured or fixed-width data offline or in realtime" )
+set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "CLI for processing structured or fixed-width data offline or in realtime" )
 set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma/-/wikis/home" )
 set( CPACK_DEBIAN_PACKAGE_MAINTAINER "vsevolod vlaskine <vsevolod.vlaskine@gmail.com>" )
 set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${PROJECT_SOURCE_DIR}/system/package/debian/changelog" )

From ebb8c027746e29221ba15e37a30c5e0e18dbe8b6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 14:51:51 +1000
Subject: [PATCH 0437/1056] system/package/debian/comma-package-docker-test:
 script path fixed

---
 system/package/debian/comma-package-docker-test | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/debian/comma-package-docker-test b/system/package/debian/comma-package-docker-test
index a2212949b..a716ae11f 100755
--- a/system/package/debian/comma-package-docker-test
+++ b/system/package/debian/comma-package-docker-test
@@ -18,4 +18,4 @@ docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$package_dir,target=/mnt/package" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/package/comma-package-test "/mnt/package/$( basename "$package" )" "/mnt/package/$( basename "$python_package" )" || { echo "$0: failed" >&2; exit 1; }
+       /mnt/comma/system/package/debian/comma-package-test "/mnt/package/$( basename "$package" )" "/mnt/package/$( basename "$python_package" )" || { echo "$0: failed" >&2; exit 1; }

From 7076f16094c09c882e482c5a1bef8ecb32d3580d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 17:55:20 +1000
Subject: [PATCH 0438/1056] CMakeLists.txt: cpack: fixing libc dependency...

---
 CMakeLists.txt | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index e976cf228..6b5d9dcb3 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -354,7 +354,8 @@ set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} CACHE STRING "cpack vers
 set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} CACHE STRING "cpack version patch" )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc" )
 set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS_POLICY ON )

From 0b5a28f86a2978c0ada6b3e2cff7cb43654782d7 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 18:15:39 +1000
Subject: [PATCH 0439/1056] CMakeLists.txt: cpack: fixing libc dependency...

---
 CMakeLists.txt | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 6b5d9dcb3..b3fa9b634 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -355,8 +355,10 @@ set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} CACHE STRING "cpack vers
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc" )
-set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc" )
+#set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc-dev" )
+set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc-dev" )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS_POLICY ON )
 

From 39351608a1823f01e342fe43e78033de6e78c275 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 19:40:15 +1000
Subject: [PATCH 0440/1056] CMakeLists.txt: todo comments added

---
 CMakeLists.txt | 33 +++++++++++++++++++++++++++------
 1 file changed, 27 insertions(+), 6 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index b3fa9b634..3d92ffc87 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -111,9 +111,9 @@ SET( EXECUTABLE_OUTPUT_PATH
      ${PROJECT_BINARY_DIR}/bin CACHE PATH
      "Single output directory for building all executables." )
 
-set( comma_version_major "1" ) # quick and dirty
-set( comma_version_minor "0" ) # quick and dirty
-set( comma_version_patch "0" ) # quick and dirty
+set( comma_version_major "1" CACHE STRING "comma version major" ) # quick and dirty
+set( comma_version_minor "0" CACHE STRING "comma version minor" ) # quick and dirty
+set( comma_version_patch "0" CACHE STRING "comma version patch" ) # quick and dirty
 
 SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" )
 
@@ -338,6 +338,27 @@ endif( CMAKE_COMPILER_IS_GNUCXX )
 
 add_subdirectory( CMakeFiles/post_install ) # uber-quick and dirty
 
+# todo
+#     set as cache variables
+#         CMAKE_PROJECT_VERSION
+#         CMAKE_PROJECT_VERSION_MAJOR
+#         CMAKE_PROJECT_VERSION_MINOR
+#         CMAKE_PROJECT_VERSION_PATCH
+#     lintian errors and warnings
+#         fix errors
+#             E: comma: no-changelog usr/share/doc/comma/changelog.gz (native package)
+#             E: comma: no-copyright-file
+#         fix warnings
+#             W: comma: package-name-doesnt-match-sonames: try comma_string -> comma-string, etc?
+#             W: comma: maintscript-calls-ldconfig [postinst]: don't call ldconfig from package?
+#             W: comma: maintscript-calls-ldconfig [postrm]: don't call ldconfig from package?
+#             W: comma: distant-prerequisite-in-shlibs comma (ON 1.0.0): try to add full version to shared libs
+#         investigate
+#             W: comma: non-standard-dir-in-usr usr/CMakeFiles/
+#         ignore for now
+#             W: comma: link-to-shared-library-in-wrong-package: deemed ok for small packages
+#             W: comma: no-manual-page: ok for now, lots of packages don't have man pages
+
 set( CPACK_PACKAGE_NAME "comma" )
 #set( CPACK_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
 set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "cli utilities for structured or fixed-width offline or realtime data" )
@@ -349,9 +370,9 @@ set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${PROJECT_SOURCE_DIR}/system/package/de
 set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
 set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/COPYING" )
 set( CPACK_GENERATOR "DEB" CACHE STRING "cpack generator: PRM or DEB" )
-set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} CACHE STRING "cpack version major" )
-set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} CACHE STRING "cpack version minor" )
-set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} CACHE STRING "cpack version patch" )
+set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} )
+set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} )
+set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )

From 81cfb0ebea1c4f56626bb99547edb950c2b324db Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 19:41:21 +1000
Subject: [PATCH 0441/1056] system/package/debian/comma-package-make: building
 python package commented out for now (will break comma-package-test for now,
 since csv-eval does not get installed)

---
 system/package/debian/comma-package-make | 79 +++++++++++++++++-------
 1 file changed, 55 insertions(+), 24 deletions(-)

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index 740a58ff3..3f395b473 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -18,29 +18,8 @@ case $ubuntu_version in
     22.04) libproc_version="libprocps8 (>= 1)" ;;
     *) libproc_version="libprocps8 (>= 1)" ;; # for now
 esac
+
 (
-    cd ~/src/comma/python
-    echo "$0: setting up python in $( pwd )" >&2
-    #python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
-    echo "$0: running python3 setup.py ..." >&2
-    python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../COPYING --suite focal  || die "failed"
-    # todo: mount gpg key
-    # debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/python3-comma_1.0.0-1.dsc
-    # mkdir tmp
-    # cd tmp
-    # dpkg-source -x ../deb_dist/python3-comma_1.0.0-1.dsc
-    # cd python3-comma-1.0.0
-    # debuild -S -sa
-    # dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes
-    # ? debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 ../../deb_dist/python3-comma_1.0.0-1_source.changes
-    #
-    # ...
-    echo "$0: building package..." >&2
-    cd deb_dist/comma-$version_major.$version_minor.$version_patch || die "failed"
-    dpkg-buildpackage -rfakeroot -uc -us || die "failed"
-    #https://shallowsky.com/blog/programming/packaging-launchpad-ppas.html
-    # todo? or do all above outside of this script using something like (but also see above):
-    #       debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-1.0.0-Linux.deb
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB \
@@ -61,8 +40,60 @@ esac
             -Dcomma_build_io_rabbit_cat=OFF || die "failed"
     echo "$0: running cpack in $( pwd )" >&2
     cpack || die "failed"
+    echo "$0: created package at $( realpath comma-$version_major.$version_minor.$version_patch-Linux.deb )" >&2
     # todo: optionally run full regression test
     echo "$0: done" >&2
 )
-cp ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb output
-cp ~/src/comma/python/deb_dist/python3-comma*.deb output
+if [[ -d output ]]; then
+    cp ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb output
+    echo "$0: copied $( realpath ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb ) to $( realpath output )" >&2
+fi
+
+# (
+#     cd ~/src/comma/python
+#     echo "$0: setting up python in $( pwd )" >&2
+#     #python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
+#     echo "$0: running python3 setup.py ..." >&2
+#     python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../COPYING --suite focal  || die "failed"
+#     # todo: mount gpg key
+#     # debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/python3-comma_1.0.0-1.dsc
+#     # mkdir tmp
+#     # cd tmp
+#     # dpkg-source -x ../deb_dist/python3-comma_1.0.0-1.dsc
+#     # cd python3-comma-1.0.0
+#     # debuild -S -sa
+#     # dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes
+#     # ? debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 ../../deb_dist/python3-comma_1.0.0-1_source.changes
+#     #
+#     # ...
+#     echo "$0: building package..." >&2
+#     cd deb_dist/comma-$version_major.$version_minor.$version_patch || die "failed"
+#     dpkg-buildpackage -rfakeroot -uc -us || die "failed"
+#     #https://shallowsky.com/blog/programming/packaging-launchpad-ppas.html
+#     # todo? or do all above outside of this script using something like (but also see above):
+#     #       debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-1.0.0-Linux.deb
+#     cd ~/build/comma
+#     echo "$0: running cmake in $( pwd )" >&2
+#     cmake . -DCPACK_GENERATOR=DEB \
+#             -DBUILD_PYTHON_PACKAGES=ON \
+#             -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
+#             -DBUILD_SHARED_LIBS=ON \
+#             -DBUILD_TESTS=OFF \
+#             -DCMAKE_BUILD_TYPE=Release \
+#             -DCMAKE_INSTALL_PREFIX=/usr \
+#             -DINSTALL_BASH_COMPLETION=OFF \
+#             -DINSTALL_TESTS=OFF \
+#             -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
+#             -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \
+#             -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \
+#             -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  \
+#             -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
+#             -Dcomma_BUILD_XML=OFF \
+#             -Dcomma_build_io_rabbit_cat=OFF || die "failed"
+#     echo "$0: running cpack in $( pwd )" >&2
+#     cpack || die "failed"
+#     # todo: optionally run full regression test
+#     echo "$0: done" >&2
+# )
+# cp ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb output
+# cp ~/src/comma/python/deb_dist/python3-comma*.deb output

From b8889fed5b3b4957fd671646d1eddf1a3b2930c8 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 20:37:31 +1000
Subject: [PATCH 0442/1056] CMakeLists.txt: versioning improved

---
 CMakeLists.txt | 24 ++++++++++++++----------
 1 file changed, 14 insertions(+), 10 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 3d92ffc87..be600729a 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -8,9 +8,21 @@ if( USE_ARM_TOOLCHAIN )
     include( ${CMAKE_TOOLCHAIN_FILE} REQUIRED )
 endif( USE_ARM_TOOLCHAIN )
 
-PROJECT( "comma" )
-
 cmake_minimum_required( VERSION 3.1 )
+if(POLICY CMP0048)
+    cmake_policy( SET CMP0048 NEW )
+    project( comma VERSION 1.0.0 LANGUAGES CXX )
+else( POLICY CMP0048 )
+    project( comma )
+    set( CMAKE_PROJECT_VERSION_MAJOR "1" CACHE STRING "comma version major" )
+    set( CMAKE_PROJECT_VERSION_MINOR "0" CACHE STRING "comma version minor" )
+    set( CMAKE_PROJECT_VERSION_PATCH "0" CACHE STRING "comma version patch" )
+    set( CMAKE_PROJECT_VERSION "${CMAKE_PROJECT_VERSION_MAJOR}.${CMAKE_PROJECT_VERSION_MINOR}.${CMAKE_PROJECT_VERSION_PATCH}" )
+endif( POLICY CMP0048 )
+
+set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
+set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
+set( comma_version_patch "${CMAKE_PROJECT_VERSION_PATCH}" ) # quick and dirty
 
 # option( USE_ARM_TOOLCHAIN "Cross compile using arm toolchain" OFF )
 # if( USE_ARM_TOOLCHAIN )
@@ -107,14 +119,6 @@ endif( UNIX )
 SET( SOURCE_CODE_BASE_DIR ${CMAKE_CURRENT_SOURCE_DIR} )
 SET( LIBRARY_OUTPUT_PATH ${CMAKE_BINARY_DIR}/lib )
 
-SET( EXECUTABLE_OUTPUT_PATH
-     ${PROJECT_BINARY_DIR}/bin CACHE PATH
-     "Single output directory for building all executables." )
-
-set( comma_version_major "1" CACHE STRING "comma version major" ) # quick and dirty
-set( comma_version_minor "0" CACHE STRING "comma version minor" ) # quick and dirty
-set( comma_version_patch "0" CACHE STRING "comma version patch" ) # quick and dirty
-
 SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" )
 
 IF( NOT comma_INSTALL_BIN_DIR )

From 777f5cd51d6783516957200446a64312087f7b1d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 21:06:09 +1000
Subject: [PATCH 0443/1056] cmake: shared library versioning sorted out

---
 CMakeLists.txt             | 5 +++--
 application/CMakeLists.txt | 4 ++--
 base/CMakeLists.txt        | 2 --
 csv/CMakeLists.txt         | 2 --
 io/CMakeLists.txt          | 6 ++----
 name_value/CMakeLists.txt  | 2 --
 string/CMakeLists.txt      | 2 --
 xpath/CMakeLists.txt       | 2 --
 8 files changed, 7 insertions(+), 18 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index be600729a..66b8627cd 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -9,7 +9,7 @@ if( USE_ARM_TOOLCHAIN )
 endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
-if(POLICY CMP0048)
+if( POLICY CMP0048 )
     cmake_policy( SET CMP0048 NEW )
     project( comma VERSION 1.0.0 LANGUAGES CXX )
 else( POLICY CMP0048 )
@@ -23,6 +23,7 @@ endif( POLICY CMP0048 )
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
 set( comma_version_patch "${CMAKE_PROJECT_VERSION_PATCH}" ) # quick and dirty
+set( comma_version "${CMAKE_PROJECT_VERSION}" ) # quick and dirty
 
 # option( USE_ARM_TOOLCHAIN "Cross compile using arm toolchain" OFF )
 # if( USE_ARM_TOOLCHAIN )
@@ -119,7 +120,7 @@ endif( UNIX )
 SET( SOURCE_CODE_BASE_DIR ${CMAKE_CURRENT_SOURCE_DIR} )
 SET( LIBRARY_OUTPUT_PATH ${CMAKE_BINARY_DIR}/lib )
 
-SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" )
+SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" SOVERSION ${CMAKE_PROJECT_VERSION} LINK_FLAGS_RELEASE -s )
 
 IF( NOT comma_INSTALL_BIN_DIR )
   SET( comma_INSTALL_BIN_DIR bin )
diff --git a/application/CMakeLists.txt b/application/CMakeLists.txt
index fe718a5d2..60b4211da 100644
--- a/application/CMakeLists.txt
+++ b/application/CMakeLists.txt
@@ -8,8 +8,8 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
+#set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
+#set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION "${comma_version}" ) #set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${comma_ALL_EXTERNAL_LIBRARIES} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
diff --git a/base/CMakeLists.txt b/base/CMakeLists.txt
index 4c4d6dc08..772b1e337 100644
--- a/base/CMakeLists.txt
+++ b/base/CMakeLists.txt
@@ -6,8 +6,6 @@ FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
 SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 
 install( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 install( TARGETS ${TARGET_NAME}
diff --git a/csv/CMakeLists.txt b/csv/CMakeLists.txt
index a607236b7..3de46ff97 100644
--- a/csv/CMakeLists.txt
+++ b/csv/CMakeLists.txt
@@ -12,8 +12,6 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_source} ${impl_includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
-set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
diff --git a/io/CMakeLists.txt b/io/CMakeLists.txt
index e4d3a4fdf..19497c98f 100644
--- a/io/CMakeLists.txt
+++ b/io/CMakeLists.txt
@@ -1,7 +1,7 @@
 SET( PROJECT "io" )
 SET( TARGET_NAME comma_${PROJECT} )
 SET( dir ${SOURCE_CODE_BASE_DIR}/${PROJECT} )
-FILE( GLOB source   ${dir}/*.cpp) 
+FILE( GLOB source   ${dir}/*.cpp)
 FILE( GLOB includes ${dir}/*.h)
 FILE( GLOB impl_source   ${dir}/impl/*.cpp)
 FILE( GLOB impl_includes ${dir}/impl/*.h)
@@ -17,8 +17,6 @@ ELSE( comma_BUILD_ZEROMQ )
 ENDIF( comma_BUILD_ZEROMQ )
 
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
@@ -34,7 +32,7 @@ INSTALL(
 if( comma_BUILD_APPLICATIONS )
     add_subdirectory( applications )
 endif( comma_BUILD_APPLICATIONS )
-                                           
+
 IF( comma_BUILD_TESTS )
     ADD_SUBDIRECTORY( test )
 ENDIF( comma_BUILD_TESTS )
diff --git a/name_value/CMakeLists.txt b/name_value/CMakeLists.txt
index 9c2a3048e..b1b30b945 100644
--- a/name_value/CMakeLists.txt
+++ b/name_value/CMakeLists.txt
@@ -13,8 +13,6 @@ INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJE
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
-set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 INSTALL(
     TARGETS ${TARGET_NAME}
     RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
diff --git a/string/CMakeLists.txt b/string/CMakeLists.txt
index 8b24fab83..57b62efda 100644
--- a/string/CMakeLists.txt
+++ b/string/CMakeLists.txt
@@ -6,8 +6,6 @@ FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
 SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL(
diff --git a/xpath/CMakeLists.txt b/xpath/CMakeLists.txt
index 2053921d4..1886d4819 100644
--- a/xpath/CMakeLists.txt
+++ b/xpath/CMakeLists.txt
@@ -8,8 +8,6 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
-set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
 TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_base comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )

From 669ad2f8e9ae45cf3a895977c6f0680b30af4028 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 21:16:36 +1000
Subject: [PATCH 0444/1056] copyright notice updated with the library
 description

---
 COPYING | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/COPYING b/COPYING
index d880d7275..cf71e2b40 100644
--- a/COPYING
+++ b/COPYING
@@ -1,3 +1,5 @@
+comma, a library for efficient streaming and processing of comma-separated (csv)
+and fixed-width binary data
 Copyright (c) 2011 The University of Sydney
 Copyright (c) 2018 Vsevolod Vlaskine
 All rights reserved.

From 9bf446e140b7a6160858255d2837378165cdea4c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 21:31:13 +1000
Subject: [PATCH 0445/1056] CMakeLists.txt: installation of copyright and
 changelog.gz added

---
 CMakeLists.txt | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 66b8627cd..46e153707 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -24,6 +24,8 @@ set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
 set( comma_version_patch "${CMAKE_PROJECT_VERSION_PATCH}" ) # quick and dirty
 set( comma_version "${CMAKE_PROJECT_VERSION}" ) # quick and dirty
+install( FILES COPYING DESTINATION share/doc/comma-${CMAKE_PROJECT_VERSION} RENAME copyright )
+install( FILES system/package/debian/changelog.gz DESTINATION share/doc/comma-${CMAKE_PROJECT_VERSION} )
 
 # option( USE_ARM_TOOLCHAIN "Cross compile using arm toolchain" OFF )
 # if( USE_ARM_TOOLCHAIN )

From b2e4d4c20f070dc12dba63f5d09c705cc0ddcf34 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 21:31:52 +1000
Subject: [PATCH 0446/1056] system/package/debian/comma-package-make: setting
 CMAKE_PROJECT_VERSION instead of CPACK_...

---
 system/package/debian/comma-package-make | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index 3f395b473..8a3cd26d1 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -32,9 +32,9 @@ esac
             -DINSTALL_BASH_COMPLETION=OFF \
             -DINSTALL_TESTS=OFF \
             -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
-            -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \
-            -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \
-            -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  \
+            -DCMAKE_PROJECT_VERSION_MAJOR=$version_major \
+            -DCMAKE_PROJECT_VERSION_MINOR=$version_minor \
+            -DCMAKE_PROJECT_VERSION_PATCH=$version_patch  \
             -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
             -Dcomma_BUILD_XML=OFF \
             -Dcomma_build_io_rabbit_cat=OFF || die "failed"

From f9ce776470982547d2ab6306f300273c627f3e4a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 21:54:33 +1000
Subject: [PATCH 0447/1056] comma-package-make: fixing...

---
 system/package/debian/comma-package-make | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index 8a3cd26d1..aca6d6456 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -23,7 +23,7 @@ esac
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )" >&2
     cmake . -DCPACK_GENERATOR=DEB \
-            -DBUILD_PYTHON_PACKAGES=ON \
+            -DBUILD_PYTHON_PACKAGES=OFF \
             -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
             -DBUILD_SHARED_LIBS=ON \
             -DBUILD_TESTS=OFF \

From 6e5b3b29a57ad5011f69761161d8477b75e14060 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 21:58:13 +1000
Subject: [PATCH 0448/1056] system/ansible/install.yml: deprecation warning
 fixed

---
 system/ansible/install.yml | 25 ++-----------------------
 1 file changed, 2 insertions(+), 23 deletions(-)

diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index c476c0e42..bed895c73 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -11,32 +11,11 @@
   tasks:
   - name: "install comma dependencies"
     become: true
-    apt: pkg={{ item }} state=present update_cache=yes
-    with_items:
-      - build-essential
-      - git
-      - cmake-curses-gui
-      - cmake
-      - gawk
-      - perl
-      - python3
-      - libboost-all-dev
-      - socat
-      - libzmq3-dev
-      - libgtest-dev
-      - python3-dev
-      - python3-numpy
-      - python3-pip
-      - libprocps-dev
-      - recode
+    apt: pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-numpy', 'python3-pip', 'libprocps-dev', 'recode'] state=present update_cache=yes
 
   - name: "install comma regressions test dependencies"
     become: true
-    apt: pkg={{ item }} state=present update_cache=yes
-    with_items:
-      - moreutils
-      - net-tools
-      - pv
+    apt: pkg=['moreutils', 'net-tools', 'pv'] state=present update_cache=yes
 
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory

From c847c22720a3407617a527b3d931a6bb108136ce Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 22:01:13 +1000
Subject: [PATCH 0449/1056] system/ansible/install.yml: deprecation warning:
 fixing...

---
 system/ansible/install.yml | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index bed895c73..9533f9853 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -11,11 +11,17 @@
   tasks:
   - name: "install comma dependencies"
     become: true
-    apt: pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-numpy', 'python3-pip', 'libprocps-dev', 'recode'] state=present update_cache=yes
+    apt:
+        pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-numpy', 'python3-pip', 'libprocps-dev', 'recode']
+        state: present
+        update_cache: yes
 
   - name: "install comma regressions test dependencies"
     become: true
-    apt: pkg=['moreutils', 'net-tools', 'pv'] state=present update_cache=yes
+    apt:
+        pkg: ['moreutils', 'net-tools', 'pv']
+        state: present
+        update_cache: yes
 
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory

From df21590704e1b940443b993f2f952f17052803cc Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 22:16:32 +1000
Subject: [PATCH 0450/1056] system/package/debian/comma-package-make: fixing...

---
 system/package/debian/comma-package-make | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index aca6d6456..16b97f1cc 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -21,7 +21,7 @@ esac
 
 (
     cd ~/build/comma
-    echo "$0: running cmake in $( pwd )" >&2
+    echo "$0: running cmake in $( pwd )..." >&2
     cmake . -DCPACK_GENERATOR=DEB \
             -DBUILD_PYTHON_PACKAGES=OFF \
             -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
@@ -37,9 +37,9 @@ esac
             -DCMAKE_PROJECT_VERSION_PATCH=$version_patch  \
             -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
             -Dcomma_BUILD_XML=OFF \
-            -Dcomma_build_io_rabbit_cat=OFF || die "failed"
-    echo "$0: running cpack in $( pwd )" >&2
-    cpack || die "failed"
+            -Dcomma_build_io_rabbit_cat=OFF || die "cmake failed"
+    echo "$0: running cpack in $( pwd )..." >&2
+    cpack || die "cpack failed"
     echo "$0: created package at $( realpath comma-$version_major.$version_minor.$version_patch-Linux.deb )" >&2
     # todo: optionally run full regression test
     echo "$0: done" >&2

From ff521249ba3e877f56c422f6241c270847c95d32 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 22:28:10 +1000
Subject: [PATCH 0451/1056] system/package/debian/Dockerfile: installation of
 comma dependencies added

---
 system/package/debian/Dockerfile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/package/debian/Dockerfile b/system/package/debian/Dockerfile
index ad580af43..8a729e018 100644
--- a/system/package/debian/Dockerfile
+++ b/system/package/debian/Dockerfile
@@ -6,5 +6,5 @@ RUN apt-get update \
     && apt-get install --yes software-properties-common \
     && apt-get install --yes ansible git build-essential cmake cmake-curses-gui python3-pip devscripts \
     && apt-get install --yes python3-stdeb python3-all dh-python
-
+    && apt-get install --yes libboost-all-dev  libzmq3-dev libprocps-dev libc-dev socat recode
 # && apt-add-repository --yes --update ppa:ansible/ansible \

From c93a877953c5b00c757dbaa9597c0ce38dd0dd09 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 22:29:59 +1000
Subject: [PATCH 0452/1056] CMakeLists.txt: INSTALL_TESTS block re-indented
 (whitespace-only change that hopefully fixes things)

---
 CMakeLists.txt | 29 ++++++++++++++---------------
 1 file changed, 14 insertions(+), 15 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 46e153707..d9bc6d202 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -205,8 +205,8 @@ IF( comma_BUILD_TESTS )
 
 OPTION( INSTALL_TESTS "Install the tests into the nominated directory" OFF )
 IF( INSTALL_TESTS )
-    SET ( comma_CPP_TESTS_INSTALL_DIR bin CACHE PATH "Install directory for cpp unit tests" )
-    SET ( comma_INSTALL_COMMA_TESTS_DIR share/test )
+SET ( comma_CPP_TESTS_INSTALL_DIR bin CACHE PATH "Install directory for cpp unit tests" )
+SET ( comma_INSTALL_COMMA_TESTS_DIR share/test )
 
 # Get the list of test directories (using glob).
 FILE ( GLOB_RECURSE all_files
@@ -222,19 +222,18 @@ FOREACH ( i ${all_files} )
 ENDFOREACH (i)
 
 # Add those directories
-	FOREACH (file ${test_dirs} )
-			# Determine the parent directories for a given file so to prefix the install location (otherwise they just all get installed in the destination root)
-			get_filename_component( dest_dir ${file} DIRECTORY )
-                        STRING( REGEX MATCH ".*\\/output\\/.*" skip ${file} )
-                        IF( NOT skip )
-			# See that slash there? 		 vvv It's really important.
-			INSTALL ( 	DIRECTORY ${dest_dir}/
-						DESTINATION ${comma_INSTALL_COMMA_TESTS_DIR}/${CMAKE_PROJECT_NAME}/unit/${dest_dir}
-						USE_SOURCE_PERMISSIONS
-                            PATTERN "output" EXCLUDE )
-                        ENDIF( NOT skip )
-	ENDFOREACH (file)
-
+FOREACH (file ${test_dirs} )
+		# Determine the parent directories for a given file so to prefix the install location (otherwise they just all get installed in the destination root)
+		get_filename_component( dest_dir ${file} DIRECTORY )
+                    STRING( REGEX MATCH ".*\\/output\\/.*" skip ${file} )
+                    IF( NOT skip )
+		# See that slash there? 		 vvv It's really important.
+		INSTALL ( 	DIRECTORY ${dest_dir}/
+					DESTINATION ${comma_INSTALL_COMMA_TESTS_DIR}/${CMAKE_PROJECT_NAME}/unit/${dest_dir}
+					USE_SOURCE_PERMISSIONS
+                        PATTERN "output" EXCLUDE )
+                    ENDIF( NOT skip )
+ENDFOREACH (file)
 ENDIF( INSTALL_TESTS )
 ENDIF( comma_BUILD_TESTS )
 

From c27cfd426615c52f748e0aa684a380e9bd754ae4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 22:35:10 +1000
Subject: [PATCH 0453/1056] system/package/debian/comma-package-make: fixing...

---
 system/package/debian/comma-package-make | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index 16b97f1cc..c048e54cf 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -11,7 +11,7 @@ comma_dir="$5"
 [[ -n "$version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
 cd ~
 echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.yml' in $( pwd )..." >&2
-ansible-playbook "$comma_dir/system/ansible/install.yml" || die "failed"
+#ansible-playbook "$comma_dir/system/ansible/install.yml" || die "ansible-playbook failed"
 case $ubuntu_version in
     18.04) libproc_version="libprocps6 (>= 2:3.3.0)" ;;
     20.04) libproc_version="libprocps8 (>= 1)" ;;
@@ -20,9 +20,11 @@ case $ubuntu_version in
 esac
 
 (
+    mkdir -p ~/build/comma
     cd ~/build/comma
     echo "$0: running cmake in $( pwd )..." >&2
-    cmake . -DCPACK_GENERATOR=DEB \
+    cmake $comma_dir \
+            -DCPACK_GENERATOR=DEB \
             -DBUILD_PYTHON_PACKAGES=OFF \
             -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
             -DBUILD_SHARED_LIBS=ON \
@@ -39,7 +41,7 @@ esac
             -Dcomma_BUILD_XML=OFF \
             -Dcomma_build_io_rabbit_cat=OFF || die "cmake failed"
     echo "$0: running cpack in $( pwd )..." >&2
-    cpack || die "cpack failed"
+    cpack -j4 || die "cpack failed"
     echo "$0: created package at $( realpath comma-$version_major.$version_minor.$version_patch-Linux.deb )" >&2
     # todo: optionally run full regression test
     echo "$0: done" >&2

From 03e06f113e9860625cfbb3bbfe316f163e3164ba Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 9 May 2022 23:25:36 +1000
Subject: [PATCH 0454/1056] CMakeLists.txt: lintian errors fixed

---
 CMakeLists.txt | 12 ++----------
 1 file changed, 2 insertions(+), 10 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index d9bc6d202..67423f644 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -24,8 +24,8 @@ set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
 set( comma_version_patch "${CMAKE_PROJECT_VERSION_PATCH}" ) # quick and dirty
 set( comma_version "${CMAKE_PROJECT_VERSION}" ) # quick and dirty
-install( FILES COPYING DESTINATION share/doc/comma-${CMAKE_PROJECT_VERSION} RENAME copyright )
-install( FILES system/package/debian/changelog.gz DESTINATION share/doc/comma-${CMAKE_PROJECT_VERSION} )
+install( FILES COPYING DESTINATION share/doc/comma RENAME copyright ) # required by lintian
+install( FILES system/package/debian/changelog.gz DESTINATION share/doc/comma ) # required by lintian
 
 # option( USE_ARM_TOOLCHAIN "Cross compile using arm toolchain" OFF )
 # if( USE_ARM_TOOLCHAIN )
@@ -345,15 +345,7 @@ endif( CMAKE_COMPILER_IS_GNUCXX )
 add_subdirectory( CMakeFiles/post_install ) # uber-quick and dirty
 
 # todo
-#     set as cache variables
-#         CMAKE_PROJECT_VERSION
-#         CMAKE_PROJECT_VERSION_MAJOR
-#         CMAKE_PROJECT_VERSION_MINOR
-#         CMAKE_PROJECT_VERSION_PATCH
 #     lintian errors and warnings
-#         fix errors
-#             E: comma: no-changelog usr/share/doc/comma/changelog.gz (native package)
-#             E: comma: no-copyright-file
 #         fix warnings
 #             W: comma: package-name-doesnt-match-sonames: try comma_string -> comma-string, etc?
 #             W: comma: maintscript-calls-ldconfig [postinst]: don't call ldconfig from package?

From 5ad1c3e95cbc87c9e6111fff42fb374704f5b55c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 10 May 2022 00:09:47 +1000
Subject: [PATCH 0455/1056] system/package: lintian warning fixed:
 changelog.gz: timestamp removed

---
 CMakeLists.txt                     |   5 +++--
 system/package/debian/changelog.gz | Bin 81 -> 71 bytes
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 67423f644..0d911dd3e 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -160,7 +160,7 @@ SET( comma_BUILD_APPLICATIONS ${BUILD_APPLICATIONS} )
 
 OPTION( comma_BUILD_ZEROMQ "build io with zeromq support" OFF )
 
-option( BUILD_SHARED_LIBS "build with shared libraries" ON ) # option( BUILD_SHARED_LIBS "build with shared libraries" OFF )
+option( BUILD_SHARED_LIBS "build with shared libraries" ON )
 
 OPTION( comma_BUILD_PYTHON "build python" ON )
 
@@ -384,7 +384,7 @@ set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS_POLICY ON )
 # if the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
 if( BUILD_SHARED_LIBS )
     #set( CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig" )
-    set( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "%posttrans -p /sbin/ldconfig" )
+    set( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "%posttrans -p /sbin/ldconfig" ) # this line works but commented out to avoid lintian error
     #set( SHLIBS_FILE "${CMAKE_CURRENT_BINARY_DIR}/shlibs" )
     # witchcraft from here: https://github.com/roboception/rcdiscover/blob/master/cmake/package_debian.cmake
     set( TRIGGERS_FILE "${CMAKE_CURRENT_BINARY_DIR}/triggers" )
@@ -407,6 +407,7 @@ if( BUILD_SHARED_LIBS )
         set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA};${SHLIBS_FILE};${TRIGGERS_FILE}" )
     endif ( CPACK_DEB_COMPONENT_INSTALL )
 endif( BUILD_SHARED_LIBS )
+
 IF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET( CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy" )
     SET( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-post-install.sh" )
diff --git a/system/package/debian/changelog.gz b/system/package/debian/changelog.gz
index 82cf0602f4746ae8aae6e4450818fd5553f043a7..185c51ea25005442984b026944438498aa641ef0 100644
GIT binary patch
delta 16
TcmWG^=aTQ{U;qQ=i6XWD6lelE

delta 26
hcmZ<{6p`=d;P9wXNnm15&PdElPtD0sXPC%k3jkV@2Q&Zx


From 5bb953f97d63b553f1186481332e1b346441110a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 10 May 2022 15:13:33 +1000
Subject: [PATCH 0456/1056] CMakeLists.txt, comma-package-make: cpack works
 now, it seems; tested in docker

---
 CMakeLists.txt                           | 5 ++++-
 system/package/debian/comma-package-make | 8 +++++---
 2 files changed, 9 insertions(+), 4 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 0d911dd3e..5d3ef4df6 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -345,6 +345,8 @@ endif( CMAKE_COMPILER_IS_GNUCXX )
 add_subdirectory( CMakeFiles/post_install ) # uber-quick and dirty
 
 # todo
+#     build ppa
+#         see here? http://schneegans.github.io/lessons/2011/11/02/ppa-launchpad-cmake
 #     lintian errors and warnings
 #         fix warnings
 #             W: comma: package-name-doesnt-match-sonames: try comma_string -> comma-string, etc?
@@ -358,6 +360,7 @@ add_subdirectory( CMakeFiles/post_install ) # uber-quick and dirty
 #             W: comma: no-manual-page: ok for now, lots of packages don't have man pages
 
 set( CPACK_PACKAGE_NAME "comma" )
+set( CPACK_PACKAGE_FILE_NAME "${CPACK_PACKAGE_NAME}-${CPACK_PACKAGE_VERSION}-${CPACK_SYSTEM_NAME}" CACHE STRING "package name" )
 #set( CPACK_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
 set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "cli utilities for structured or fixed-width offline or realtime data" )
 set( CPACK_PACKAGE_VENDOR "orthographic" )
@@ -371,7 +374,7 @@ set( CPACK_GENERATOR "DEB" CACHE STRING "cpack generator: PRM or DEB" )
 set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} )
 set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} )
 set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} )
-set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04" )
+set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04 or later" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc" )
diff --git a/system/package/debian/comma-package-make b/system/package/debian/comma-package-make
index c048e54cf..0e0f00890 100755
--- a/system/package/debian/comma-package-make
+++ b/system/package/debian/comma-package-make
@@ -7,6 +7,7 @@ version_major=$2
 version_minor=$3
 version_patch=$4
 comma_dir="$5"
+package_name="comma-$version_major.$version_minor.$version_patch-ubuntu.$ubuntu_version"
 [[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
 [[ -n "$version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
 cd ~
@@ -25,6 +26,7 @@ esac
     echo "$0: running cmake in $( pwd )..." >&2
     cmake $comma_dir \
             -DCPACK_GENERATOR=DEB \
+            -DCPACK_PACKAGE_NAME="$package_name" \
             -DBUILD_PYTHON_PACKAGES=OFF \
             -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
             -DBUILD_SHARED_LIBS=ON \
@@ -42,13 +44,13 @@ esac
             -Dcomma_build_io_rabbit_cat=OFF || die "cmake failed"
     echo "$0: running cpack in $( pwd )..." >&2
     cpack -j4 || die "cpack failed"
-    echo "$0: created package at $( realpath comma-$version_major.$version_minor.$version_patch-Linux.deb )" >&2
+    echo "$0: created package at $( realpath $package_name.deb )" >&2
     # todo: optionally run full regression test
     echo "$0: done" >&2
 )
 if [[ -d output ]]; then
-    cp ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb output
-    echo "$0: copied $( realpath ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb ) to $( realpath output )" >&2
+    cp ~/build/comma/$package_name.deb output
+    echo "$0: copied $( realpath ~/build/comma/$package_name.deb ) to $( realpath output )" >&2
 fi
 
 # (

From e489ce4ffb75f44930e487dfa292b148f5c9e629 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 10 May 2022 15:14:06 +1000
Subject: [PATCH 0457/1056] system/package/debian/examples/package_with_cmake
 added

---
 .../hello-world/CMakeLists.txt                |  14 ++
 .../hello-world/debian/changelog              |   5 +
 .../hello-world/debian/control                |  14 ++
 .../hello-world/debian/copyright              |  18 ++
 .../hello-world/debian/files                  |   1 +
 .../hello-world/debian/rules                  |  28 +++
 .../package_with_cmake/hello-world/main.cpp   |   6 +
 .../package_with_cmake/hello-world/readme     | 212 ++++++++++++++++++
 .../debian/examples/package_with_cmake/readme |   3 +
 .../debian/examples/package_with_cmake/upload |   5 +
 10 files changed, 306 insertions(+)
 create mode 100644 system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt
 create mode 100644 system/package/debian/examples/package_with_cmake/hello-world/debian/changelog
 create mode 100644 system/package/debian/examples/package_with_cmake/hello-world/debian/control
 create mode 100644 system/package/debian/examples/package_with_cmake/hello-world/debian/copyright
 create mode 100644 system/package/debian/examples/package_with_cmake/hello-world/debian/files
 create mode 100755 system/package/debian/examples/package_with_cmake/hello-world/debian/rules
 create mode 100644 system/package/debian/examples/package_with_cmake/hello-world/main.cpp
 create mode 100644 system/package/debian/examples/package_with_cmake/hello-world/readme
 create mode 100644 system/package/debian/examples/package_with_cmake/readme
 create mode 100755 system/package/debian/examples/package_with_cmake/upload

diff --git a/system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt b/system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt
new file mode 100644
index 000000000..c3f4ed367
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt
@@ -0,0 +1,14 @@
+project(greet-the-world)
+
+cmake_minimum_required(VERSION 2.6)
+
+set(EXECUTABLE_OUTPUT_PATH ${greet-the-world_SOURCE_DIR})
+
+add_executable(greet-the-world main.cpp)
+
+install(
+    TARGETS
+        greet-the-world
+    RUNTIME DESTINATION
+        ${CMAKE_INSTALL_PREFIX}/bin
+)
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/changelog b/system/package/debian/examples/package_with_cmake/hello-world/debian/changelog
new file mode 100644
index 000000000..79522505d
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/hello-world/debian/changelog
@@ -0,0 +1,5 @@
+hello-world (0.1-0ppa0) oneiric; urgency=low
+
+  * Initial upload!
+
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Tue, 10 May 2022 00:32:17 +0100
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/control b/system/package/debian/examples/package_with_cmake/hello-world/debian/control
new file mode 100644
index 000000000..8a4e85747
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/hello-world/debian/control
@@ -0,0 +1,14 @@
+Source: hello-worlkd
+Standards-Version: 4.6.0.1
+Section: devel
+Priority: optional
+Maintainer: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
+Build-Depends: cmake
+Homepage: https://gitlab.com/orthographic
+
+Package: hello-world
+Architecture: any
+Depends: 
+Description: First test-package
+ Long description of hello-world.
+ It can span multiple lines!
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/copyright b/system/package/debian/examples/package_with_cmake/hello-world/debian/copyright
new file mode 100644
index 000000000..2d88c5665
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/hello-world/debian/copyright
@@ -0,0 +1,18 @@
+####################################################################
+#                        hello-world                               #
+####################################################################
+
+Copyright (C) 2011 Your Name
+
+This program is free software: you can redistribute it and/or modify
+it under the terms of the GNU General Public License as published by
+the Free Software Foundation, either version 3 of the License, or 
+(at your option) any later version.
+
+This program is distributed in the hope that it will be useful, but
+WITHOUT ANY WARRANTY; without even the implied warranty of 
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program.  If not, see <https://www.gnu.org/licenses/>.
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/files b/system/package/debian/examples/package_with_cmake/hello-world/debian/files
new file mode 100644
index 000000000..322b2dded
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/hello-world/debian/files
@@ -0,0 +1 @@
+hello-world_0.1-0ppa0_source.buildinfo devel optional
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/rules b/system/package/debian/examples/package_with_cmake/hello-world/debian/rules
new file mode 100755
index 000000000..fba617ab4
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/hello-world/debian/rules
@@ -0,0 +1,28 @@
+#!/usr/bin/make -f
+
+BUILDDIR = build_dir
+
+# secondly called by launchpad
+build:
+	mkdir $(BUILDDIR);
+	cd $(BUILDDIR); cmake -DCMAKE_INSTALL_PREFIX=../debian/tmp/usr ..
+	make -C $(BUILDDIR)
+
+# thirdly called by launchpad
+binary: binary-indep binary-arch
+
+binary-indep:
+	# nothing to be done
+
+binary-arch:
+	cd $(BUILDDIR); cmake -P cmake_install.cmake
+	mkdir debian/tmp/DEBIAN
+	dpkg-gencontrol -phello-world
+	dpkg --build debian/tmp ..
+
+# firstly called by launchpad
+clean:
+	rm -f build
+	rm -rf $(BUILDDIR)
+
+.PHONY: binary binary-arch binary-indep clean
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/main.cpp b/system/package/debian/examples/package_with_cmake/hello-world/main.cpp
new file mode 100644
index 000000000..d0660b17c
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/hello-world/main.cpp
@@ -0,0 +1,6 @@
+# include <iostream>
+
+int main() {
+    std::cout << "Hello World!" << std::endl;
+    return 0;
+}
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/readme b/system/package/debian/examples/package_with_cmake/hello-world/readme
new file mode 100644
index 000000000..1ee6a2d41
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/hello-world/readme
@@ -0,0 +1,212 @@
+homeHome PPA with CMake!
+bubble_chartGnome-Pie
+videogame_assetM.A.R.S.
+brushPictures
+play_circle_filledVideos
+learn it with a detailed step-by-step guide.
+
+PPA with CMake!
+When I first wanted to create a PPA for Ubuntu, it was a pain. It was barely documented, unnecessarily complex and — the worst thing of all — if there was a tutorial, it employed rather old build tools and no guide covered code generated with CMake.
+
+Motivation
+The goal was to upload M.A.R.S. to a PPA: M.A.R.S. uses CMake and I did not find any resource on how to create a source package which launchpad would compile. With this tutorial I want to help those who are in a situation similar to the one I was in some months ago. Please note that I don’t have inside knowledge on what is going on here — it is the result of trial and error, but it works as intended! So let’s get started…
+
+1. A short introduction
+So first of all — for those not knowing it — what is a PPA?
+
+A PPA is a Personal Package Archive hosted on launchpad. Developers can upload source code to this archive which will then be built automatically for various releases of Ubuntu in a 32 bit and a 64 bit version. These archives can easily be added to the software sources of any Ubuntu-based Linux distribution, making it very easy to install the software on end-user systems.
+
+This tutorial will show you how to create and upload a source package to launchpad. This source package will contain a minimal application written in C++ which gets configured with CMake.
+
+The tutorial assumes you have knowledge in a programming language supported by CMake and in CMake itself. Even if I will provide copy&paste code snippets, I won't explain how CMake works on a general basis.
+The software requirements are CMake, the GCC and some packaging scripts. You can install them with the following command:
+
+sudo apt-get install build-essential cmake devscripts
+2. A minimal application with CMake
+First create an empty directory called “greet-the-world”. Open a text editor of your choice and paste the following code into it.
+
+#include <iostream>
+
+int main() {
+    std::cout << "Hello World!" << std::endl;
+    return 0;
+}
+Save the file as main.cpp in the newly created directory. This is the program which will serve as a basic example for this tutorial. Now it’s time to create a CMake-script which will generate a makefile for automatic compilation. Save the following file as CMakeLists.txt in the same directory as your main.cpp.
+
+project(greet-the-world)
+
+cmake_minimum_required(VERSION 2.6)
+
+set(EXECUTABLE_OUTPUT_PATH ${greet-the-world_SOURCE_DIR})
+
+add_executable(greet-the-world main.cpp)
+
+install(
+    TARGETS
+        greet-the-world
+    RUNTIME DESTINATION
+        ${CMAKE_INSTALL_PREFIX}/bin
+)
+If you execute the following commands, your program should be built. They create a new directory called “build” inside your source directory. From there CMake is executed, creating a makefile which then is used to compile the source code. When all works according to plan, the last command should print “Hello World!” to your console.
+
+cd greet-the-world
+mkdir build && cd build
+cmake ..
+make
+cd .. && ./greet-the-world
+If everything works as supposed, clean up again:
+
+rm -rf build
+rm greet-the-world
+3. Creating a source package
+This step involves creation of four files which are needed by launchpad. They describe how the debian package should be built, what the dependencies of the package are, and so on. They are all placed in a folder called “debian” in the source directory.
+
+cd greet-the-world
+mkdir debian && cd debian
+3.1 The control file
+Now we will go through each individual file and check what it is for. You can download the file of each section with the given command. Just execute it inside the “debian”-directory and open the downloaded file in an editor of your choice. Or copy & paste the contents from below.
+
+wget https://schneegans.github.io/assets/files/ppa-howto/control
+Source: greet-the-world
+Section: devel
+Priority: optional
+Maintainer: Your Name <your.email@some.where>
+Build-Depends: cmake, build-essential
+Homepage: https://www.yourhomepage.org
+
+Package: greet-the-world
+Architecture: any
+Depends:
+Description: First test-package
+ Long description of greet-the-world.
+ It can span multiple lines!
+This first file is “control”. It specifies which packages are needed for building your package, what it is called and some information on you. The first section of the file describes the source package. The second part is the configuration for the resulting binary package.
+
+You’ll have to write your name and e-mail address to the appropriate fields.
+
+3.2 The rules file
+The second file, “rules”, is very important, too. It tells launchpad how to exactly compile your application. It is basically a normal makefile with some special targets, which are invoked by launchpad.
+
+wget https://schneegans.github.io/assets/files/ppa-howto/rules
+#!/usr/bin/make -f
+
+BUILDDIR = build_dir
+
+# secondly called by launchpad
+build:
+    mkdir $(BUILDDIR);
+    cd $(BUILDDIR); cmake -DCMAKE_INSTALL_PREFIX=../debian/tmp/usr ..
+    make -C $(BUILDDIR)
+
+# thirdly called by launchpad
+binary: binary-indep binary-arch
+
+binary-indep:
+    # nothing to be done
+
+binary-arch:
+    cd $(BUILDDIR); cmake -P cmake_install.cmake
+    mkdir debian/tmp/DEBIAN
+    dpkg-gencontrol -pgreet-the-world
+    dpkg --build debian/tmp ..
+
+# firstly called by launchpad
+clean:
+    rm -f build
+    rm -rf $(BUILDDIR)
+
+.PHONY: binary binary-arch binary-indep clean
+The target “clean” is called first. Then launchpad will execute “build”, which does the same thing as we tested above. It will create a build directory, change to it, execute CMake (with the install prefix set to a directory inside the debian directory) and compile the application. When this succeeds, the package will be built with the target “binary-arch”.
+
+You don’t need to alter the content of this file.
+
+3.3 The changelog file
+The third file is “changelog”. It contains some information on what you have done since the last release.
+
+wget https://schneegans.github.io/assets/files/ppa-howto/changelog
+greet-the-world (0.1-0ppa0) oneiric; urgency=low
+
+  * Initial upload!
+
+ -- Your Name <your.email@some.where>  Tue, 01 Nov 2011 20:32:17 +0100
+The first line specifies for what distribution your package is made and its version. Then there can be multiple lines containing the change log information. The last line has to be exactly like it is shown there. Mind the two spaces after your e-mail address! Without them, your package will be rejected!
+
+Please change the date and the e-mail address accordingly. The date string can be obtained by the terminal command date -R.
+
+3.4 The copyright file
+The last file contains your copyright information. It does not follow any structure and can contain everything you want. Here is a GPL-3 example. Just insert your name.
+
+wget https://schneegans.github.io/assets/files/ppa-howto/copyright
+####################################################################
+#                    greet-the-world                               #
+####################################################################
+
+Copyright (C) 2011 Your Name
+
+This program is free software: you can redistribute it and/or modify
+it under the terms of the GNU General Public License as published by
+the Free Software Foundation, either version 3 of the License, or
+(at your option) any later version.
+
+This program is distributed in the hope that it will be useful, but
+WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program.  If not, see <https://www.gnu.org/licenses/>.
+4. Uploading to launchpad
+Now, all necessary files have been created. The project is ready to be uploaded to launchpad! Therefore you will have to have a launchpad account. If you don’t already have one, please create one now. You will have to do some nasty stuff then — like uploading RSA-keys, signing the Ubuntu Code of Conduct and sharing OpenPGP-keys — but this is well documented at the launchpad help pages. Here are some links which may be useful:
+
+Create and personalise your launchpad account
+Import an OpenPGP key to launchpad
+Import your SSH keys
+Activating your PPA
+4.1 The initial upload
+Now you’re ready to upload your first package to launchpad! Just a few steps are needed to do so. First of all, you need to create a .tar.gz of your original source code and name it greet-the-world_0.1.orig.tar.gz. Then the package is created from within the folder “greet-the-world”. Finally you upload the package with dput to launchpad. Be sure to replace ppa:yourppa/name with your PPA.
+
+tar -acf greet-the-world_0.1.orig.tar.gz greet-the-world
+cd greet-the-world
+debuild -S -sa
+cd ..
+dput ppa:yourppa/name greet-the-world_0.1-0ppa0_source.changes
+That’s all! You’ve done it!
+
+Check your PPA’s website, there you can monitor the build status of your package. When it fails for some reason, launchpad will send you an e-mail containing information on the reason. If all works, you can now add the PPA to your system and install greet-the-world with synaptic!
+
+4.2 Further uploads
+If you want to upload a new version of your software, use the following commands. Beforehand, you have to create a new changelog file: remember to insert the new version number and the current date! In the terminal command below, you’ll have to change the file name accordingly.
+
+cd greet-the-world
+debuild -S -sd
+cd ..
+dput ppa:yourppa/name greet-the-world_0.1-0ppa0_source.changes
+5. Conclusions
+This is how I managed to upload code to launchpad. Once you understand the procedure, it’s quite easy — but I remember many difficulties at the beginning! Maybe a lot can be done more efficiently, maybe some steps are not done as supposed… but it works!
+
+If you got some questions or remarks… use the comment form below!
+
+Comments
+
+
+date_range Published
+02 November 2011
+create Author
+Simon Schneegans
+loyalty Tags
+loyalty tutorial loyalty c++ loyalty cmake loyalty code
+dehaze Contents
+PPA with CMake!
+Motivation
+1. A short introduction
+2. A minimal application with CMake
+3. Creating a source package
+4. Uploading to launchpad
+5. Conclusions
+Comments
+Newer post:
+chevron_left Translate Gnome-Pie!
+code mail rss_feed
+
+© 2022 Design & Content by Simon Schneegans (Impressum) with help from Jekyll and Materialize, inspired by Darkstrap.
+Proudly hosted on github pages. (repository)
diff --git a/system/package/debian/examples/package_with_cmake/readme b/system/package/debian/examples/package_with_cmake/readme
new file mode 100644
index 000000000..2a48ffd59
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/readme
@@ -0,0 +1,3 @@
+courtesy of this generous tutorial: http://schneegans.github.io/lessons/2011/11/02/ppa-launchpad-cmake
+adding gpg-key and setting it in launchpad: https://help.launchpad.net/YourAccount/ImportingYourPGPKey
+debian package policy, all necessary files: https://www.debian.org/doc/debian-policy/ch-controlfields.html
diff --git a/system/package/debian/examples/package_with_cmake/upload b/system/package/debian/examples/package_with_cmake/upload
new file mode 100755
index 000000000..c53d7edbe
--- /dev/null
+++ b/system/package/debian/examples/package_with_cmake/upload
@@ -0,0 +1,5 @@
+tar -acf hello-world_0.1.orig.tar.gz hello-world
+cd hello-world
+debuild -S -sa
+cd ..
+dput ppa:yourppa/name hello-world_0.1-0ppa0_source.changes

From 6004594da8e85ed828743fb12a59e56ccf247fcc Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 10 May 2022 15:22:42 +1000
Subject: [PATCH 0458/1056] system/package/debian/examples/package_with_cmake:
 fixing...

---
 .../examples/package_with_cmake/hello-world/debian/control     | 2 +-
 .../examples/package_with_cmake/hello-world/debian/files       | 1 -
 system/package/debian/examples/package_with_cmake/readme       | 3 +++
 3 files changed, 4 insertions(+), 2 deletions(-)
 delete mode 100644 system/package/debian/examples/package_with_cmake/hello-world/debian/files

diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/control b/system/package/debian/examples/package_with_cmake/hello-world/debian/control
index 8a4e85747..2f9f26630 100644
--- a/system/package/debian/examples/package_with_cmake/hello-world/debian/control
+++ b/system/package/debian/examples/package_with_cmake/hello-world/debian/control
@@ -1,4 +1,4 @@
-Source: hello-worlkd
+Source: hello-world
 Standards-Version: 4.6.0.1
 Section: devel
 Priority: optional
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/files b/system/package/debian/examples/package_with_cmake/hello-world/debian/files
deleted file mode 100644
index 322b2dded..000000000
--- a/system/package/debian/examples/package_with_cmake/hello-world/debian/files
+++ /dev/null
@@ -1 +0,0 @@
-hello-world_0.1-0ppa0_source.buildinfo devel optional
diff --git a/system/package/debian/examples/package_with_cmake/readme b/system/package/debian/examples/package_with_cmake/readme
index 2a48ffd59..249ad0986 100644
--- a/system/package/debian/examples/package_with_cmake/readme
+++ b/system/package/debian/examples/package_with_cmake/readme
@@ -1,3 +1,6 @@
 courtesy of this generous tutorial: http://schneegans.github.io/lessons/2011/11/02/ppa-launchpad-cmake
 adding gpg-key and setting it in launchpad: https://help.launchpad.net/YourAccount/ImportingYourPGPKey
 debian package policy, all necessary files: https://www.debian.org/doc/debian-policy/ch-controlfields.html
+
+to create package, run commands from upload script one by one, except dput (unless
+you want to actually upload your package to ubuntu ppa launchpad)

From 477ffb03bc293249cfdeee8c0b9ea17028c5e673 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 13:08:24 +1000
Subject: [PATCH 0459/1056] system/package/debian renamed to
 system/package/cpack

---
 CMakeLists.txt                                      |   4 ++--
 etc/bash_completion.d/CMakeLists.txt                |   4 +---
 system/package/{debian => cpack}/Dockerfile         |   2 +-
 system/package/{debian => cpack}/changelog.gz       | Bin
 .../{debian => cpack}/comma-package-docker-build    |   4 ++--
 .../{debian => cpack}/comma-package-docker-run      |   2 +-
 .../{debian => cpack}/comma-package-docker-test     |   2 +-
 system/package/{debian => cpack}/comma-package-make |   0
 system/package/{debian => cpack}/comma-package-test |   0
 .../{debian => cpack}/examples/package-python       |   0
 .../package_with_cmake/hello-world/CMakeLists.txt   |   0
 .../package_with_cmake/hello-world/debian/changelog |   0
 .../package_with_cmake/hello-world/debian/control   |   0
 .../package_with_cmake/hello-world/debian/copyright |   0
 .../package_with_cmake/hello-world/debian/rules     |   1 +
 .../package_with_cmake/hello-world/main.cpp         |   0
 .../examples/package_with_cmake/hello-world/readme  |   0
 .../examples/package_with_cmake/readme              |   0
 .../examples/package_with_cmake/upload              |   0
 system/package/{debian => cpack}/readme             |   0
 20 files changed, 9 insertions(+), 10 deletions(-)
 rename system/package/{debian => cpack}/Dockerfile (81%)
 rename system/package/{debian => cpack}/changelog.gz (100%)
 rename system/package/{debian => cpack}/comma-package-docker-build (77%)
 rename system/package/{debian => cpack}/comma-package-docker-run (79%)
 rename system/package/{debian => cpack}/comma-package-docker-test (83%)
 rename system/package/{debian => cpack}/comma-package-make (100%)
 rename system/package/{debian => cpack}/comma-package-test (100%)
 rename system/package/{debian => cpack}/examples/package-python (100%)
 rename system/package/{debian => cpack}/examples/package_with_cmake/hello-world/CMakeLists.txt (100%)
 rename system/package/{debian => cpack}/examples/package_with_cmake/hello-world/debian/changelog (100%)
 rename system/package/{debian => cpack}/examples/package_with_cmake/hello-world/debian/control (100%)
 rename system/package/{debian => cpack}/examples/package_with_cmake/hello-world/debian/copyright (100%)
 rename system/package/{debian => cpack}/examples/package_with_cmake/hello-world/debian/rules (96%)
 rename system/package/{debian => cpack}/examples/package_with_cmake/hello-world/main.cpp (100%)
 rename system/package/{debian => cpack}/examples/package_with_cmake/hello-world/readme (100%)
 rename system/package/{debian => cpack}/examples/package_with_cmake/readme (100%)
 rename system/package/{debian => cpack}/examples/package_with_cmake/upload (100%)
 rename system/package/{debian => cpack}/readme (100%)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 5d3ef4df6..c50a2033f 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -24,8 +24,8 @@ set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
 set( comma_version_patch "${CMAKE_PROJECT_VERSION_PATCH}" ) # quick and dirty
 set( comma_version "${CMAKE_PROJECT_VERSION}" ) # quick and dirty
-install( FILES COPYING DESTINATION share/doc/comma RENAME copyright ) # required by lintian
-install( FILES system/package/debian/changelog.gz DESTINATION share/doc/comma ) # required by lintian
+# install( FILES COPYING DESTINATION share/doc/comma RENAME copyright ) # required by lintian
+# install( FILES system/package/debian/changelog.gz DESTINATION share/doc/comma ) # required by lintian
 
 # option( USE_ARM_TOOLCHAIN "Cross compile using arm toolchain" OFF )
 # if( USE_ARM_TOOLCHAIN )
diff --git a/etc/bash_completion.d/CMakeLists.txt b/etc/bash_completion.d/CMakeLists.txt
index de41cd163..806af761c 100644
--- a/etc/bash_completion.d/CMakeLists.txt
+++ b/etc/bash_completion.d/CMakeLists.txt
@@ -1,8 +1,6 @@
 IF (UNIX)
-    SET( INSTALL_BASH_COMPLETION_DIR /etc/bash_completion.d
-         CACHE PATH "Location in which to install the bash completion scripts.")
+    SET( INSTALL_BASH_COMPLETION_DIR /etc/bash_completion.d CACHE PATH "Location in which to install the bash completion scripts.")
     IF( INSTALL_BASH_COMPLETION )
         INSTALL(FILES comma DESTINATION ${INSTALL_BASH_COMPLETION_DIR} )
     ENDIF()
 ENDIF()
-
diff --git a/system/package/debian/Dockerfile b/system/package/cpack/Dockerfile
similarity index 81%
rename from system/package/debian/Dockerfile
rename to system/package/cpack/Dockerfile
index 8a729e018..4c73eafa0 100644
--- a/system/package/debian/Dockerfile
+++ b/system/package/cpack/Dockerfile
@@ -6,5 +6,5 @@ RUN apt-get update \
     && apt-get install --yes software-properties-common \
     && apt-get install --yes ansible git build-essential cmake cmake-curses-gui python3-pip devscripts \
     && apt-get install --yes python3-stdeb python3-all dh-python
-    && apt-get install --yes libboost-all-dev  libzmq3-dev libprocps-dev libc-dev socat recode
+    && apt-get install --yes libboost-all-dev libzmq3-dev libprocps-dev libc-dev socat recode
 # && apt-add-repository --yes --update ppa:ansible/ansible \
diff --git a/system/package/debian/changelog.gz b/system/package/cpack/changelog.gz
similarity index 100%
rename from system/package/debian/changelog.gz
rename to system/package/cpack/changelog.gz
diff --git a/system/package/debian/comma-package-docker-build b/system/package/cpack/comma-package-docker-build
similarity index 77%
rename from system/package/debian/comma-package-docker-build
rename to system/package/cpack/comma-package-docker-build
index 424175d25..363fd4f54 100755
--- a/system/package/debian/comma-package-docker-build
+++ b/system/package/cpack/comma-package-docker-build
@@ -5,5 +5,5 @@ comma_dir="$2"
 [[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
 [[ -d "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly (since you seem to either run with sudo or have comma not in '$comma_dir')" >&2; exit 1; }
 echo "$0: running:" >&2
-echo "docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f '$comma_dir/system/package/debian/Dockerfile' ." >&2
-docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/package/debian/Dockerfile" .
+echo "docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f '$comma_dir/system/package/cpack/Dockerfile' ." >&2
+docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/package/cpack/Dockerfile" .
diff --git a/system/package/debian/comma-package-docker-run b/system/package/cpack/comma-package-docker-run
similarity index 79%
rename from system/package/debian/comma-package-docker-run
rename to system/package/cpack/comma-package-docker-run
index 2f78a4953..57cd148de 100755
--- a/system/package/debian/comma-package-docker-run
+++ b/system/package/cpack/comma-package-docker-run
@@ -13,4 +13,4 @@ docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$( pwd ),target=/root/output" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/package/debian/comma-package-make $ubuntu_version $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
+       /mnt/comma/system/package/cpack/comma-package-make $ubuntu_version $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
diff --git a/system/package/debian/comma-package-docker-test b/system/package/cpack/comma-package-docker-test
similarity index 83%
rename from system/package/debian/comma-package-docker-test
rename to system/package/cpack/comma-package-docker-test
index a716ae11f..f399e1ed9 100755
--- a/system/package/debian/comma-package-docker-test
+++ b/system/package/cpack/comma-package-docker-test
@@ -18,4 +18,4 @@ docker run \
        --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
        --mount "type=bind,source=$package_dir,target=/mnt/package" \
        ubuntu.$ubuntu_version.build.basics \
-       /mnt/comma/system/package/debian/comma-package-test "/mnt/package/$( basename "$package" )" "/mnt/package/$( basename "$python_package" )" || { echo "$0: failed" >&2; exit 1; }
+       /mnt/comma/system/package/cpack/comma-package-test "/mnt/package/$( basename "$package" )" "/mnt/package/$( basename "$python_package" )" || { echo "$0: failed" >&2; exit 1; }
diff --git a/system/package/debian/comma-package-make b/system/package/cpack/comma-package-make
similarity index 100%
rename from system/package/debian/comma-package-make
rename to system/package/cpack/comma-package-make
diff --git a/system/package/debian/comma-package-test b/system/package/cpack/comma-package-test
similarity index 100%
rename from system/package/debian/comma-package-test
rename to system/package/cpack/comma-package-test
diff --git a/system/package/debian/examples/package-python b/system/package/cpack/examples/package-python
similarity index 100%
rename from system/package/debian/examples/package-python
rename to system/package/cpack/examples/package-python
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt b/system/package/cpack/examples/package_with_cmake/hello-world/CMakeLists.txt
similarity index 100%
rename from system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt
rename to system/package/cpack/examples/package_with_cmake/hello-world/CMakeLists.txt
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/changelog b/system/package/cpack/examples/package_with_cmake/hello-world/debian/changelog
similarity index 100%
rename from system/package/debian/examples/package_with_cmake/hello-world/debian/changelog
rename to system/package/cpack/examples/package_with_cmake/hello-world/debian/changelog
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/control b/system/package/cpack/examples/package_with_cmake/hello-world/debian/control
similarity index 100%
rename from system/package/debian/examples/package_with_cmake/hello-world/debian/control
rename to system/package/cpack/examples/package_with_cmake/hello-world/debian/control
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/copyright b/system/package/cpack/examples/package_with_cmake/hello-world/debian/copyright
similarity index 100%
rename from system/package/debian/examples/package_with_cmake/hello-world/debian/copyright
rename to system/package/cpack/examples/package_with_cmake/hello-world/debian/copyright
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/rules b/system/package/cpack/examples/package_with_cmake/hello-world/debian/rules
similarity index 96%
rename from system/package/debian/examples/package_with_cmake/hello-world/debian/rules
rename to system/package/cpack/examples/package_with_cmake/hello-world/debian/rules
index fba617ab4..fa1cba04e 100755
--- a/system/package/debian/examples/package_with_cmake/hello-world/debian/rules
+++ b/system/package/cpack/examples/package_with_cmake/hello-world/debian/rules
@@ -24,5 +24,6 @@ binary-arch:
 clean:
 	rm -f build
 	rm -rf $(BUILDDIR)
+	rm -f debian/files
 
 .PHONY: binary binary-arch binary-indep clean
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/main.cpp b/system/package/cpack/examples/package_with_cmake/hello-world/main.cpp
similarity index 100%
rename from system/package/debian/examples/package_with_cmake/hello-world/main.cpp
rename to system/package/cpack/examples/package_with_cmake/hello-world/main.cpp
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/readme b/system/package/cpack/examples/package_with_cmake/hello-world/readme
similarity index 100%
rename from system/package/debian/examples/package_with_cmake/hello-world/readme
rename to system/package/cpack/examples/package_with_cmake/hello-world/readme
diff --git a/system/package/debian/examples/package_with_cmake/readme b/system/package/cpack/examples/package_with_cmake/readme
similarity index 100%
rename from system/package/debian/examples/package_with_cmake/readme
rename to system/package/cpack/examples/package_with_cmake/readme
diff --git a/system/package/debian/examples/package_with_cmake/upload b/system/package/cpack/examples/package_with_cmake/upload
similarity index 100%
rename from system/package/debian/examples/package_with_cmake/upload
rename to system/package/cpack/examples/package_with_cmake/upload
diff --git a/system/package/debian/readme b/system/package/cpack/readme
similarity index 100%
rename from system/package/debian/readme
rename to system/package/cpack/readme

From b09c14e5b1b723cf76505e9d5bd3d86ec486b4c1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 14:52:49 +1000
Subject: [PATCH 0460/1056] packaging using debian tools...

---
 CMakeLists.txt                                |  2 +-
 system/package/debian/debian/changelog        |  5 +++
 system/package/debian/debian/control          | 14 +++++++
 system/package/debian/debian/copyright        | 32 +++++++++++++++
 system/package/debian/debian/rules            | 39 +++++++++++++++++++
 .../hello-world/CMakeLists.txt                |  0
 .../hello-world/debian/changelog              |  0
 .../hello-world/debian/control                |  0
 .../hello-world/debian/copyright              |  0
 .../hello-world/debian/rules                  |  0
 .../package_with_cmake/hello-world/main.cpp   |  0
 .../package_with_cmake/hello-world/readme     |  0
 .../examples/package_with_cmake/readme        |  0
 .../examples/package_with_cmake/upload        |  0
 14 files changed, 91 insertions(+), 1 deletion(-)
 create mode 100644 system/package/debian/debian/changelog
 create mode 100644 system/package/debian/debian/control
 create mode 100644 system/package/debian/debian/copyright
 create mode 100755 system/package/debian/debian/rules
 rename system/package/{cpack => debian}/examples/package_with_cmake/hello-world/CMakeLists.txt (100%)
 rename system/package/{cpack => debian}/examples/package_with_cmake/hello-world/debian/changelog (100%)
 rename system/package/{cpack => debian}/examples/package_with_cmake/hello-world/debian/control (100%)
 rename system/package/{cpack => debian}/examples/package_with_cmake/hello-world/debian/copyright (100%)
 rename system/package/{cpack => debian}/examples/package_with_cmake/hello-world/debian/rules (100%)
 rename system/package/{cpack => debian}/examples/package_with_cmake/hello-world/main.cpp (100%)
 rename system/package/{cpack => debian}/examples/package_with_cmake/hello-world/readme (100%)
 rename system/package/{cpack => debian}/examples/package_with_cmake/readme (100%)
 rename system/package/{cpack => debian}/examples/package_with_cmake/upload (100%)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index c50a2033f..81b4d1f72 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -25,7 +25,7 @@ set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
 set( comma_version_patch "${CMAKE_PROJECT_VERSION_PATCH}" ) # quick and dirty
 set( comma_version "${CMAKE_PROJECT_VERSION}" ) # quick and dirty
 # install( FILES COPYING DESTINATION share/doc/comma RENAME copyright ) # required by lintian
-# install( FILES system/package/debian/changelog.gz DESTINATION share/doc/comma ) # required by lintian
+# install( FILES system/package/cpack/changelog.gz DESTINATION share/doc/comma ) # required by lintian
 
 # option( USE_ARM_TOOLCHAIN "Cross compile using arm toolchain" OFF )
 # if( USE_ARM_TOOLCHAIN )
diff --git a/system/package/debian/debian/changelog b/system/package/debian/debian/changelog
new file mode 100644
index 000000000..ed63d8653
--- /dev/null
+++ b/system/package/debian/debian/changelog
@@ -0,0 +1,5 @@
+comma (1.0.0-0ppa0) jammy; urgency=low
+
+  * initial upload
+
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Wed, 11 May 2022 13:12:01 +1000
diff --git a/system/package/debian/debian/control b/system/package/debian/debian/control
new file mode 100644
index 000000000..b48ebb401
--- /dev/null
+++ b/system/package/debian/debian/control
@@ -0,0 +1,14 @@
+Source: comma
+Standards-Version: 4.6.0.1
+Section: devel
+Priority: optional
+Maintainer: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
+Build-Depends: cmake
+Homepage: https://gitlab.com/orthographic/comma/-/wikis/home
+
+Package: comma
+Architecture: any
+Depends: libc-dev, libboost-all-dev (>=1.65), libzmq5 (>= 4.2.5-1), recode (>=3.6), socat
+Description: generic libraries and cli for csv and fixed-width data processing
+  comma, libraries and command line utilitie for efficient streaming and
+  processing of comma-separated (csv) and fixed-width binary data
diff --git a/system/package/debian/debian/copyright b/system/package/debian/debian/copyright
new file mode 100644
index 000000000..b5a12d744
--- /dev/null
+++ b/system/package/debian/debian/copyright
@@ -0,0 +1,32 @@
+####################################################################
+#                              comma                               #
+####################################################################
+
+Copyright (c) 2011 The University of Sydney
+Copyright (c) 2018 Vsevolod Vlaskine
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+1. Redistributions of source code must retain the above copyright
+   notice, this list of conditions and the following disclaimer.
+2. Redistributions in binary form must reproduce the above copyright
+   notice, this list of conditions and the following disclaimer in the
+   documentation and/or other materials provided with the distribution.
+3. Neither the name of the University of Sydney nor the
+   names of its contributors may be used to endorse or promote products
+   derived from this software without specific prior written permission.
+
+NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
diff --git a/system/package/debian/debian/rules b/system/package/debian/debian/rules
new file mode 100755
index 000000000..746b222cc
--- /dev/null
+++ b/system/package/debian/debian/rules
@@ -0,0 +1,39 @@
+#!/usr/bin/make -f
+# debian/rules for comma: configure with cmake, compile, stage into debian/tmp, pack with dpkg
+BUILDDIR = build
+
+# called second by launchpad: configure and compile out-of-source in $(BUILDDIR)
+build:
+	mkdir -p $(BUILDDIR)
+	cd $(BUILDDIR) && cmake .. \
+		-DCMAKE_INSTALL_PREFIX=../debian/tmp/usr \
+		-DCMAKE_BUILD_TYPE=Release \
+		-DBUILD_SHARED_LIBS=ON \
+		-DBUILD_PYTHON_PACKAGES=OFF \
+		-DADD_PYTHON_PACKAGES_TO_RPM=OFF \
+		-DBUILD_TESTS=OFF \
+		-DINSTALL_BASH_COMPLETION=OFF \
+		-DINSTALL_TESTS=OFF \
+		-Dcomma_BUILD_XML=OFF \
+		-Dcomma_build_io_rabbit_cat=OFF
+	$(MAKE) -C $(BUILDDIR)
+
+# called third by launchpad: run the install step, then build the binary package from debian/tmp
+binary: binary-indep binary-arch
+
+binary-indep:
+	# nothing to be done
+
+binary-arch:
+	cd $(BUILDDIR) && cmake -P cmake_install.cmake
+	mkdir -p debian/tmp/DEBIAN
+	dpkg-gencontrol -pcomma
+	dpkg --build debian/tmp ..
+
+# called first by launchpad; $(BUILDDIR) is a directory, so it needs rm -rf (plain rm -f fails on it)
+clean:
+	rm -rf $(BUILDDIR)
+	rm -rf debian/tmp
+	rm -f debian/files
+
+# 'build' must be phony: a directory named $(BUILDDIR) would otherwise make the target look up to date
+.PHONY: build binary binary-arch binary-indep clean
diff --git a/system/package/cpack/examples/package_with_cmake/hello-world/CMakeLists.txt b/system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt
similarity index 100%
rename from system/package/cpack/examples/package_with_cmake/hello-world/CMakeLists.txt
rename to system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt
diff --git a/system/package/cpack/examples/package_with_cmake/hello-world/debian/changelog b/system/package/debian/examples/package_with_cmake/hello-world/debian/changelog
similarity index 100%
rename from system/package/cpack/examples/package_with_cmake/hello-world/debian/changelog
rename to system/package/debian/examples/package_with_cmake/hello-world/debian/changelog
diff --git a/system/package/cpack/examples/package_with_cmake/hello-world/debian/control b/system/package/debian/examples/package_with_cmake/hello-world/debian/control
similarity index 100%
rename from system/package/cpack/examples/package_with_cmake/hello-world/debian/control
rename to system/package/debian/examples/package_with_cmake/hello-world/debian/control
diff --git a/system/package/cpack/examples/package_with_cmake/hello-world/debian/copyright b/system/package/debian/examples/package_with_cmake/hello-world/debian/copyright
similarity index 100%
rename from system/package/cpack/examples/package_with_cmake/hello-world/debian/copyright
rename to system/package/debian/examples/package_with_cmake/hello-world/debian/copyright
diff --git a/system/package/cpack/examples/package_with_cmake/hello-world/debian/rules b/system/package/debian/examples/package_with_cmake/hello-world/debian/rules
similarity index 100%
rename from system/package/cpack/examples/package_with_cmake/hello-world/debian/rules
rename to system/package/debian/examples/package_with_cmake/hello-world/debian/rules
diff --git a/system/package/cpack/examples/package_with_cmake/hello-world/main.cpp b/system/package/debian/examples/package_with_cmake/hello-world/main.cpp
similarity index 100%
rename from system/package/cpack/examples/package_with_cmake/hello-world/main.cpp
rename to system/package/debian/examples/package_with_cmake/hello-world/main.cpp
diff --git a/system/package/cpack/examples/package_with_cmake/hello-world/readme b/system/package/debian/examples/package_with_cmake/hello-world/readme
similarity index 100%
rename from system/package/cpack/examples/package_with_cmake/hello-world/readme
rename to system/package/debian/examples/package_with_cmake/hello-world/readme
diff --git a/system/package/cpack/examples/package_with_cmake/readme b/system/package/debian/examples/package_with_cmake/readme
similarity index 100%
rename from system/package/cpack/examples/package_with_cmake/readme
rename to system/package/debian/examples/package_with_cmake/readme
diff --git a/system/package/cpack/examples/package_with_cmake/upload b/system/package/debian/examples/package_with_cmake/upload
similarity index 100%
rename from system/package/cpack/examples/package_with_cmake/upload
rename to system/package/debian/examples/package_with_cmake/upload

From 968a042439656bbc800aea8719b874590d28d071 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 15:10:16 +1000
Subject: [PATCH 0461/1056] packaging using debian tools...

---
 system/package/debian/debian/control                     | 2 +-
 system/package/debian/examples/package_with_cmake/readme | 1 +
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/system/package/debian/debian/control b/system/package/debian/debian/control
index b48ebb401..ffb0ebfde 100644
--- a/system/package/debian/debian/control
+++ b/system/package/debian/debian/control
@@ -3,7 +3,7 @@ Standards-Version: 4.6.0.1
 Section: devel
 Priority: optional
 Maintainer: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
-Build-Depends: cmake
+Build-Depends: cmake, libc-dev, libboost-all-dev (>=1.65), libzmq5 (>= 4.2.5-1)
 Homepage: https://gitlab.com/orthographic/comma/-/wikis/home
 
 Package: comma
diff --git a/system/package/debian/examples/package_with_cmake/readme b/system/package/debian/examples/package_with_cmake/readme
index 249ad0986..754a9c1c4 100644
--- a/system/package/debian/examples/package_with_cmake/readme
+++ b/system/package/debian/examples/package_with_cmake/readme
@@ -1,6 +1,7 @@
 courtesy of this generous tutorial: http://schneegans.github.io/lessons/2011/11/02/ppa-launchpad-cmake
 adding gpg-key and setting it in launchpad: https://help.launchpad.net/YourAccount/ImportingYourPGPKey
 debian package policy, all necessary files: https://www.debian.org/doc/debian-policy/ch-controlfields.html
+building ppa: https://www.ebower.com/docs/ubuntu-ppa/
 
 to create package, run commands from upload script one by one, except dput (unless
 you want to actually upload your package to ubuntu ppa launchpad)

From 7bc916a16b01ba706dcd723e2de6918de94e545c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 16:09:31 +1000
Subject: [PATCH 0462/1056] CMakeLists.txt: version bumped up to 1.0.1;
 building ppa: works; scripting and documenting...

---
 CMakeLists.txt                                           | 4 ++--
 system/package/debian/examples/package_with_cmake/readme | 1 +
 2 files changed, 3 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 81b4d1f72..48809cfba 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -11,12 +11,12 @@ endif( USE_ARM_TOOLCHAIN )
 cmake_minimum_required( VERSION 3.1 )
 if( POLICY CMP0048 )
     cmake_policy( SET CMP0048 NEW )
-    project( comma VERSION 1.0.0 LANGUAGES CXX )
+    project( comma VERSION 1.0.1 LANGUAGES CXX )
 else( POLICY CMP0048 )
     project( comma )
     set( CMAKE_PROJECT_VERSION_MAJOR "1" CACHE STRING "comma version major" )
     set( CMAKE_PROJECT_VERSION_MINOR "0" CACHE STRING "comma version minor" )
-    set( CMAKE_PROJECT_VERSION_PATCH "0" CACHE STRING "comma version patch" )
+    set( CMAKE_PROJECT_VERSION_PATCH "1" CACHE STRING "comma version patch" )
     set( CMAKE_PROJECT_VERSION "${CMAKE_PROJECT_VERSION_MAJOR}.${CMAKE_PROJECT_VERSION_MINOR}.${CMAKE_PROJECT_VERSION_PATCH}" )
 endif( POLICY CMP0048 )
 
diff --git a/system/package/debian/examples/package_with_cmake/readme b/system/package/debian/examples/package_with_cmake/readme
index 754a9c1c4..a73b97b2c 100644
--- a/system/package/debian/examples/package_with_cmake/readme
+++ b/system/package/debian/examples/package_with_cmake/readme
@@ -2,6 +2,7 @@ courtesy of this generous tutorial: http://schneegans.github.io/lessons/2011/11/
 adding gpg-key and setting it in launchpad: https://help.launchpad.net/YourAccount/ImportingYourPGPKey
 debian package policy, all necessary files: https://www.debian.org/doc/debian-policy/ch-controlfields.html
 building ppa: https://www.ebower.com/docs/ubuntu-ppa/
+using ppa: https://itsfoss.com/ppa-guide/
 
 to create package, run commands from upload script one by one, except dput (unless
 you want to actually upload your package to ubuntu ppa launchpad)

From d344d60d8c41406d7fbf816c10b6e7f0f89897ca Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 17:10:22 +1000
Subject: [PATCH 0463/1056] comma-launchpad-upload: in progress...

---
 ChangeLog                                     |   2 -
 .../debian/debian => debian}/changelog        |   2 +-
 .../package/debian/debian => debian}/control  |   2 +-
 .../debian/debian => debian}/copyright        |   2 +-
 .../package/debian/debian => debian}/rules    |   0
 system/launchpad/comma-launchpad-upload       |  26 +++
 system/launchpad/readme                       |  12 +
 .../hello-world/CMakeLists.txt                |  14 --
 .../hello-world/debian/changelog              |   5 -
 .../hello-world/debian/control                |  14 --
 .../hello-world/debian/copyright              |  18 --
 .../hello-world/debian/rules                  |  29 ---
 .../package_with_cmake/hello-world/main.cpp   |   6 -
 .../package_with_cmake/hello-world/readme     | 212 ------------------
 .../debian/examples/package_with_cmake/readme |   8 -
 .../debian/examples/package_with_cmake/upload |   5 -
 16 files changed, 41 insertions(+), 316 deletions(-)
 delete mode 100644 ChangeLog
 rename {system/package/debian/debian => debian}/changelog (73%)
 rename {system/package/debian/debian => debian}/control (88%)
 rename {system/package/debian/debian => debian}/copyright (97%)
 rename {system/package/debian/debian => debian}/rules (100%)
 create mode 100755 system/launchpad/comma-launchpad-upload
 create mode 100644 system/launchpad/readme
 delete mode 100644 system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt
 delete mode 100644 system/package/debian/examples/package_with_cmake/hello-world/debian/changelog
 delete mode 100644 system/package/debian/examples/package_with_cmake/hello-world/debian/control
 delete mode 100644 system/package/debian/examples/package_with_cmake/hello-world/debian/copyright
 delete mode 100755 system/package/debian/examples/package_with_cmake/hello-world/debian/rules
 delete mode 100644 system/package/debian/examples/package_with_cmake/hello-world/main.cpp
 delete mode 100644 system/package/debian/examples/package_with_cmake/hello-world/readme
 delete mode 100644 system/package/debian/examples/package_with_cmake/readme
 delete mode 100755 system/package/debian/examples/package_with_cmake/upload

diff --git a/ChangeLog b/ChangeLog
deleted file mode 100644
index 722f106cb..000000000
--- a/ChangeLog
+++ /dev/null
@@ -1,2 +0,0 @@
-* v1.0.1
- - fixed bug in csv-joit
diff --git a/system/package/debian/debian/changelog b/debian/changelog
similarity index 73%
rename from system/package/debian/debian/changelog
rename to debian/changelog
index ed63d8653..ebc3828ba 100644
--- a/system/package/debian/debian/changelog
+++ b/debian/changelog
@@ -1,4 +1,4 @@
-comma (1.0.0-0ppa0) jammy; urgency=low
+comma (1.0.1-0ppa0) jammy; urgency=low
 
   * initial upload
 
diff --git a/system/package/debian/debian/control b/debian/control
similarity index 88%
rename from system/package/debian/debian/control
rename to debian/control
index ffb0ebfde..2c30ecb68 100644
--- a/system/package/debian/debian/control
+++ b/debian/control
@@ -10,5 +10,5 @@ Package: comma
 Architecture: any
 Depends: libc-dev, libboost-all-dev (>=1.65), libzmq5 (>= 4.2.5-1), recode (>=3.6), socat
 Description: generic libraries and cli for csv and fixed-width data processing
-  comma, libraries and command line utilitie for efficient streaming and
+  comma, libraries and command line utilities for efficient streaming and
   processing of comma-separated (csv) and fixed-width binary data
diff --git a/system/package/debian/debian/copyright b/debian/copyright
similarity index 97%
rename from system/package/debian/debian/copyright
rename to debian/copyright
index b5a12d744..e21faf1d4 100644
--- a/system/package/debian/debian/copyright
+++ b/debian/copyright
@@ -3,7 +3,7 @@
 ####################################################################
 
 Copyright (c) 2011 The University of Sydney
-Copyright (c) 2018 Vsevolod Vlaskine
+Copyright (c) 2018-2022 Vsevolod Vlaskine
 All rights reserved.
 
 Redistribution and use in source and binary forms, with or without
diff --git a/system/package/debian/debian/rules b/debian/rules
similarity index 100%
rename from system/package/debian/debian/rules
rename to debian/rules
diff --git a/system/launchpad/comma-launchpad-upload b/system/launchpad/comma-launchpad-upload
new file mode 100755
index 000000000..6c898e6ba
--- /dev/null
+++ b/system/launchpad/comma-launchpad-upload
@@ -0,0 +1,26 @@
+#!/bin/bash
+
+# todo
+#   - manual steps (automate if possible)
+#     - update changelog
+#       - version
+#       - changes
+#     - update default version in cmake
+#     - tag repo with version
+#     - commit
+#     - push
+#   ? check current version at launchpad
+
+function say() { echo "usage: $0: $@" >&2; }
+function die() { say "$@"; exit 1; }
+[[ -n "$2" ]] || { echo "usage: $0 <ubuntu-name> <comma-version> [<comma_dir>]" >&2; exit 1; }
+ubuntu_name=$1
+comma_version=$2
+comma_dir=$3
+name=comma_$comma_version
+[[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
+rm -rf comma
+cp -r $comma_dir . || die "copying $comma_dir failed" # quick and dirty; or git clone instead?
+tar -acf $name.orig.tar.gz comma || die "tar failed"
+( cd comma && debuild -S -sa ) || die "debuild failed"
+dput ppa:yourppa/name $name-0ppa0_source.changes || die "dput failed"
diff --git a/system/launchpad/readme b/system/launchpad/readme
new file mode 100644
index 000000000..3fad2d39c
--- /dev/null
+++ b/system/launchpad/readme
@@ -0,0 +1,12 @@
+todo
+  - document
+    - uploading to launchpad
+    - verifying in docker
+  - move docker out of system/package/cpack (can symlink it back)
+
+useful links
+  - generous tutorial: http://schneegans.github.io/lessons/2011/11/02/ppa-launchpad-cmake
+  - adding gpg-key and setting it in launchpad: https://help.launchpad.net/YourAccount/ImportingYourPGPKey
+  - debian package policy, all necessary files: https://www.debian.org/doc/debian-policy/ch-controlfields.html
+  - building ppa: https://www.ebower.com/docs/ubuntu-ppa/
+  - using ppa: https://itsfoss.com/ppa-guide/
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt b/system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt
deleted file mode 100644
index c3f4ed367..000000000
--- a/system/package/debian/examples/package_with_cmake/hello-world/CMakeLists.txt
+++ /dev/null
@@ -1,14 +0,0 @@
-project(greet-the-world)
-
-cmake_minimum_required(VERSION 2.6)
-
-set(EXECUTABLE_OUTPUT_PATH ${greet-the-world_SOURCE_DIR})
-
-add_executable(greet-the-world main.cpp)
-
-install(
-    TARGETS
-        greet-the-world
-    RUNTIME DESTINATION
-        ${CMAKE_INSTALL_PREFIX}/bin
-)
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/changelog b/system/package/debian/examples/package_with_cmake/hello-world/debian/changelog
deleted file mode 100644
index 79522505d..000000000
--- a/system/package/debian/examples/package_with_cmake/hello-world/debian/changelog
+++ /dev/null
@@ -1,5 +0,0 @@
-hello-world (0.1-0ppa0) oneiric; urgency=low
-
-  * Initial upload!
-
- -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Tue, 10 May 2022 00:32:17 +0100
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/control b/system/package/debian/examples/package_with_cmake/hello-world/debian/control
deleted file mode 100644
index 2f9f26630..000000000
--- a/system/package/debian/examples/package_with_cmake/hello-world/debian/control
+++ /dev/null
@@ -1,14 +0,0 @@
-Source: hello-world
-Standards-Version: 4.6.0.1
-Section: devel
-Priority: optional
-Maintainer: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
-Build-Depends: cmake
-Homepage: https://gitlab.com/orthographic
-
-Package: hello-world
-Architecture: any
-Depends: 
-Description: First test-package
- Long description of hello-world.
- It can span multiple lines!
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/copyright b/system/package/debian/examples/package_with_cmake/hello-world/debian/copyright
deleted file mode 100644
index 2d88c5665..000000000
--- a/system/package/debian/examples/package_with_cmake/hello-world/debian/copyright
+++ /dev/null
@@ -1,18 +0,0 @@
-####################################################################
-#                        hello-world                               #
-####################################################################
-
-Copyright (C) 2011 Your Name
-
-This program is free software: you can redistribute it and/or modify
-it under the terms of the GNU General Public License as published by
-the Free Software Foundation, either version 3 of the License, or 
-(at your option) any later version.
-
-This program is distributed in the hope that it will be useful, but
-WITHOUT ANY WARRANTY; without even the implied warranty of 
-MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
-General Public License for more details.
-
-You should have received a copy of the GNU General Public License
-along with this program.  If not, see <https://www.gnu.org/licenses/>.
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/debian/rules b/system/package/debian/examples/package_with_cmake/hello-world/debian/rules
deleted file mode 100755
index fa1cba04e..000000000
--- a/system/package/debian/examples/package_with_cmake/hello-world/debian/rules
+++ /dev/null
@@ -1,29 +0,0 @@
-#!/usr/bin/make -f
-
-BUILDDIR = build_dir
-
-# secondly called by launchpad
-build:
-	mkdir $(BUILDDIR);
-	cd $(BUILDDIR); cmake -DCMAKE_INSTALL_PREFIX=../debian/tmp/usr ..
-	make -C $(BUILDDIR)
-
-# thirdly called by launchpad
-binary: binary-indep binary-arch
-
-binary-indep:
-	# nothing to be done
-
-binary-arch:
-	cd $(BUILDDIR); cmake -P cmake_install.cmake
-	mkdir debian/tmp/DEBIAN
-	dpkg-gencontrol -phello-world
-	dpkg --build debian/tmp ..
-
-# firstly called by launchpad
-clean:
-	rm -f build
-	rm -rf $(BUILDDIR)
-	rm -f debian/files
-
-.PHONY: binary binary-arch binary-indep clean
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/main.cpp b/system/package/debian/examples/package_with_cmake/hello-world/main.cpp
deleted file mode 100644
index d0660b17c..000000000
--- a/system/package/debian/examples/package_with_cmake/hello-world/main.cpp
+++ /dev/null
@@ -1,6 +0,0 @@
-# include <iostream>
-
-int main() {
-    std::cout << "Hello World!" << std::endl;
-    return 0;
-}
diff --git a/system/package/debian/examples/package_with_cmake/hello-world/readme b/system/package/debian/examples/package_with_cmake/hello-world/readme
deleted file mode 100644
index 1ee6a2d41..000000000
--- a/system/package/debian/examples/package_with_cmake/hello-world/readme
+++ /dev/null
@@ -1,212 +0,0 @@
-homeHome PPA with CMake!
-bubble_chartGnome-Pie
-videogame_assetM.A.R.S.
-brushPictures
-play_circle_filledVideos
-learn it with a detailed step-by-step guide.
-
-PPA with CMake!
-When I first wanted to create a PPA for Ubuntu, it was a pain. It was barely documented, unnecessarily complex and — the worst thing of all — if there was a tutorial, it employed rather old build tools and no guide covered code generated with CMake.
-
-Motivation
-The goal was to upload M.A.R.S. to a PPA: M.A.R.S. uses CMake and I did not find any resource how to create a source package which launchpad would compile. With this tutorial I want to help those being in a similar situation I was some months ago. Please remark that I don’t have inside knowledge on what is going on here — it is the result of trial and error, but it works as supposed! So let’s get started…
-
-1. A short inroduction
-So first of all — for those not knowing it — what is a PPA?
-
-A PPA is a Personal Package Archive hosted on launchpad. Developers can upload source code to this archive which then will be build automatically for various releases of Ubuntu in a 32 bit and a 64 bit version. These archives can easily be added to the software sources of any Ubuntu-based Linux distribution, making it very easy to install the software on end-user systems.
-
-This tutorial will show you how to create and upload a source package to launchpad. This source package will contain a minimal application written in C++ which gets configured with CMake.
-
-The tutorial assumes you have knowledge in a programming language supported by CMake and in CMake itself. Even if I will provide copy&paste code snippets, I won't explain how CMake works on a general basis.
-The software requirements are CMake, the GCC and some packaging scripts. You can install them with the following command:
-
-sudo apt-get install build-essential cmake devscripts
-2. A minimal application with CMake
-First create an empty directory called “greet-the-world”. Open a text editor of your choice and paste the following code into it.
-
-## include <iostream>
-
-int main() {
-    std::cout << "Hello World!" << std::endl;
-    return 0;
-}
-Save the file as main.cpp in the newly created directory. This is the program which will serve as a basic example for this tutorial. Now it’s time to create a CMake-script which will generate a makefile for automatic compilation. Save the following file as CMakeLists.txt in the same directory as your main.cpp.
-
-Collapse keyboard_arrow_upproject(greet-the-world)
-
-cmake_minimum_required(VERSION 2.6)
-
-set(EXECUTABLE_OUTPUT_PATH ${greet-the-world_SOURCE_DIR})
-
-add_executable(greet-the-world main.cpp)
-
-install(
-    TARGETS
-        greet-the-world
-    RUNTIME DESTINATION
-        ${CMAKE_INSTALL_PREFIX}/bin
-)
-If you execute the following commands, your program should be build. They create a new directory called “build” inside your source directory. From there CMake is executed, creating a makefile which then is used to compile the source code. When all works according to plan, the last command should print “Hello World!” to your console.
-
-cd greet-the-world
-mkdir build && cd build
-cmake ..
-make
-cd .. && ./greet-the-world
-If everything works as supposed, clean up again:
-
-rm -rf build
-rm greet-the-world
-3. Creating a source package
-This step involves creation of four files which are needed by launchpad. They describe how the debian package should be build, what are the dependencies of the package and so on. They are all placed in a folder called “debian” in the source directory.
-
-cd greet-the-world
-mkdir debian && cd debian
-3.1 The control file
-Now we will go through each individual file and check what it is for. You can download the file of each section with the given command. Just execute it inside the “debian”-directory and open the downloaded file in an editor of your choice. Or copy & paste the contents from below.
-
-wget https://schneegans.github.io/assets/files/ppa-howto/control
-Source: greet-the-world
-Section: devel
-Priority: optional
-Maintainer: Your Name <your.email@some.where>
-Build-Depends: cmake, build-essential
-Homepage: https://www.yourhomepage.org
-
-Package: greet-the-world
-Architecture: any
-Depends:
-Description: First test-package
- Long description of greet-the-world.
- It can span multiple lines!
-This first file is “control”. It specifies which packages are needed for building your package, what it is called and some information on you. The first section of the file describes the source package. The second part is the configuration for the resulting binary package.
-
-You’ll have to write your name and e-mail address to the appropriate fields.
-
-3.2 The rules file
-The second file, “rules”, is very important, too. It tells launchpad how to exactly compile your application. It is basically a normal makefile with some special targets, which are invoked by launchpad.
-
-wget https://schneegans.github.io/assets/files/ppa-howto/rules
-Expand keyboard_arrow_down#!/usr/bin/make -f
-
-BUILDDIR = build_dir
-
-# secondly called by launchpad
-build:
-    mkdir $(BUILDDIR);
-    cd $(BUILDDIR); cmake -DCMAKE_INSTALL_PREFIX=../debian/tmp/usr ..
-    make -C $(BUILDDIR)
-
-# thirdly called by launchpad
-binary: binary-indep binary-arch
-
-binary-indep:
-    # nothing to be done
-
-binary-arch:
-    cd $(BUILDDIR); cmake -P cmake_install.cmake
-    mkdir debian/tmp/DEBIAN
-    dpkg-gencontrol -pgreet-the-world
-    dpkg --build debian/tmp ..
-
-# firstly called by launchpad
-clean:
-    rm -f build
-    rm -rf $(BUILDDIR)
-
-.PHONY: binary binary-arch binary-indep clean
-The target “clean” is called firstly. Then launchpad will execute “build”, which does the same thing as we tested above. It will create a build directory, change to it, execute CMake (with the install prefix set to a directory inside the debian directory) and compile the application. When this succeeds, the package will be build with the target “binary-arch”.
-
-You don’t need to alter the content of this file.
-
-3.3 The changelog file
-The third file is “changelog”. It contains some information on what you have done since the last release.
-
-wget https://schneegans.github.io/assets/files/ppa-howto/changelog
-greet-the-world (0.1-0ppa0) oneiric; urgency=low
-
-  * Initial upload!
-
- -- Your Name <your.email@some.where>  Tue, 01 Nov 2011 20:32:17 +0100
-The first line specifies for what distribution your package is made and its version. Then there can be multiple lines containing the change log information. The last line has to be exactly like it is shown there. Mind the two spaces after your e-mail address! Without them, your package will be rejected!
-
-Please change the date and the e-mail address accordingly. The date string can be obtained by the terminal command date -R.
-
-3.4 The copyright file
-The last file contains your copyright information. It does not follow any structure and can contain everything you want. Here is a GPL-3 example. Just insert your name.
-
-wget https://schneegans.github.io/assets/files/ppa-howto/copyright
-Expand keyboard_arrow_down####################################################################
-#                    greet-the-world                               #
-####################################################################
-
-Copyright (C) 2011 Your Name
-
-This program is free software: you can redistribute it and/or modify
-it under the terms of the GNU General Public License as published by
-the Free Software Foundation, either version 3 of the License, or
-(at your option) any later version.
-
-This program is distributed in the hope that it will be useful, but
-WITHOUT ANY WARRANTY; without even the implied warranty of
-MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
-General Public License for more details.
-
-You should have received a copy of the GNU General Public License
-along with this program.  If not, see <https://www.gnu.org/licenses/>.
-4. Uploading to launchpad
-Now, all necessary files have been created. The project is ready to be uploaded to launchpad! Therefore you will have to have a launchpad account. If you don’t already have one, please create one now. You will have to do some nasty stuff then — like uploading RSA-keys, signing the Ubuntu Code of Conduct and sharing OpenPGP-keys — but this is well documented at the launchpad help pages. Here are some links which may be useful:
-
-Create and personalise your launchpad account
-Import an OpenPGP key to launchpad
-Import your SSH keys
-Activating your PPA
-4.1 The initial upload
-Now you’re ready to upload your first package to launchpad! Just a few steps are needed to do so. First of all, you need to create a .tar.gz of your original source code and name it greet-the-world_0.1.orig.tar.gz. Then the package is created from within the folder “greet-the-world”. Finally you upload the package with dput to launchpad. Be sure to replace ppa:yourppa/name with your PPA.
-
-tar -acf greet-the-world_0.1.orig.tar.gz greet-the-world
-cd greet-the-world
-debuild -S -sa
-cd ..
-dput ppa:yourppa/name greet-the-world_0.1-0ppa0_source.changes
-That’s all! You’ve done it!
-
-Check your PPA’s website, there you can monitor the build status of your package. When it fails for some reason, launchpad will send you an e-mail containing information on the reason. If all works, you can now add the PPA to your system and install greet-the-world with synaptic!
-
-4.2 Further uploads
-If you want to upload a new version of your software, use the following commands. Before you have to create a new changelog file: remember to insert the new version number and the current date! In the terminal command below, you’ll have to change the file name accordingly.
-
-cd greet-the-world
-debuild -S -sd
-cd ..
-dput ppa:yourppa/name greet-the-world_0.1-0ppa0_source.changes
-5. Conclusions
-This is how I managed to upload code to launchpad. Once you understand the procedure, it’s quite easy — but I remember many difficulties at the beginning! Maybe a lot can be done more efficiently, maybe some steps are not done as supposed… but it works!
-
-If you got some questions or remarks… use the comment form below!
-
-Comments
-
-
-date_range Published
-02 November 2011
-create Author
-Simon Schneegans
-loyalty Tags
-loyalty tutorial loyalty c++ loyalty cmake loyalty code
-dehaze Contents
-PPA with CMake!
-Motivation
-1. A short inroduction
-2. A minimal application with CMake
-3. Creating a source package
-4. Uploading to launchpad
-5. Conclusions
-Comments
-Newer post:
-chevron_left Translate Gnome-Pie!
-code mail rss_feed
-
-© 2022 Desgin & Content by Simon Schneegans (Impressum) with help from Jekyll and Materialize, inspired by Darkstrap.
-Proudly hosted on github pages. (repository)
diff --git a/system/package/debian/examples/package_with_cmake/readme b/system/package/debian/examples/package_with_cmake/readme
deleted file mode 100644
index a73b97b2c..000000000
--- a/system/package/debian/examples/package_with_cmake/readme
+++ /dev/null
@@ -1,8 +0,0 @@
-courtesy of this generous tutorial: http://schneegans.github.io/lessons/2011/11/02/ppa-launchpad-cmake
-adding gpg-key and setting it in launchpad: https://help.launchpad.net/YourAccount/ImportingYourPGPKey
-debian package policy, all necessary files: https://www.debian.org/doc/debian-policy/ch-controlfields.html
-building ppa: https://www.ebower.com/docs/ubuntu-ppa/
-using ppa: https://itsfoss.com/ppa-guide/
-
-to create package, run commands from upload script one by one, except dput (unless
-you want to actually upload your package to ubuntu ppa launchpad)
diff --git a/system/package/debian/examples/package_with_cmake/upload b/system/package/debian/examples/package_with_cmake/upload
deleted file mode 100755
index c53d7edbe..000000000
--- a/system/package/debian/examples/package_with_cmake/upload
+++ /dev/null
@@ -1,5 +0,0 @@
-tar -acf hello-world_0.1.orig.tar.gz hello-world
-cd hello-world
-debuild -S -sa
-cd ..
-dput ppa:yourppa/name hello-world_0.1-0ppa0_source.changes

From d13dc934a6ef6fdc0de3079f28a3862c5302dedf Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 17:12:34 +1000
Subject: [PATCH 0464/1056] comma-launchpad-upload: in progress...

---

Notes:
    Documentation-only change: under the "verifying in docker" todo item of
    system/launchpad/readme, adds the command sequence for installing comma
    from the ppa (add-apt-repository ppa:orthographic/ppa, add-apt-repository
    multiverse, apt-get update after each, apt-get install comma).

    NOTE(review): the subject names comma-launchpad-upload, but the only
    file touched by this patch is system/launchpad/readme.

 system/launchpad/readme | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/system/launchpad/readme b/system/launchpad/readme
index 3fad2d39c..d0fb1ea87 100644
--- a/system/launchpad/readme
+++ b/system/launchpad/readme
@@ -2,6 +2,12 @@ todo
   - document
     - uploading to launchpad
     - verifying in docker
+      add-apt-repository ppa:orthographic/ppa
+      apt-get update
+      add-apt-repository multiverse
+      apt-get update
+      apt-get install comma
+
   - move docker out of system/package/cpack (can symlink it back)
 
 useful links

From 72179d54ab43fba3987815dfa7bd8694d708b82a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 19:09:44 +1000
Subject: [PATCH 0465/1056] system/launchpad/comma-launchpad-test: in
 progress...

---

Notes:
    comma-launchpad-test (new): adds ppa:orthographic/ppa and multiverse,
    installs comma with apt-get, then checks that
    "csv-paste line-number | head | csv-to-bin ui | csv-from-bin ui"
    prints the same as "seq 0 9" and that comma-application-util is found
    by "type -p". The csv-eval checks are present but commented out (todo).

    comma-launchpad-upload: no longer copies a comma directory; it requires
    ./comma to exist in the current directory and takes a <what> argument:
    "orig" removes comma/debian/files, builds the .orig.tar.gz and runs
    "debuild -S -sa"; "update" runs "debuild -S -sd" only. Both then dput
    to ppa:orthographic/ppa (previously the placeholder ppa:yourppa/name).

    readme: adds the manual upload steps; the "verifying ppa in docker"
    heading is added with no content under it yet.

    comma-package-test: the "testing bash utils..." progress line now goes
    to stderr, like the progress lines around it.

    NOTE(review): the new usage string in comma-launchpad-upload lists
    "<what> <ubuntu-name> <comma-version>", but the script reads what=$1
    and comma_version=$2 and only checks that $2 is non-empty; the readme
    added here calls it as "comma-launchpad-upload update 1.2.3". The
    usage string should drop <ubuntu-name> (or the script should read it).

    NOTE(review): say() in both launchpad scripts prints "usage: $0: ..."
    for every message, so progress and error lines such as "tar failed"
    are labelled as usage; presumably the "usage: " prefix is a leftover.

    NOTE(review): comma-launchpad-test calls add-apt-repository and apt-get
    without sudo; presumably it is meant to run as root inside docker -
    confirm and document in the readme section.

 system/launchpad/comma-launchpad-test   | 28 +++++++++++++++++++++++++
 system/launchpad/comma-launchpad-upload | 26 +++++++++++++----------
 system/launchpad/readme                 | 19 +++++++++++++++++
 system/package/cpack/comma-package-test |  2 +-
 4 files changed, 63 insertions(+), 12 deletions(-)
 create mode 100755 system/launchpad/comma-launchpad-test

diff --git a/system/launchpad/comma-launchpad-test b/system/launchpad/comma-launchpad-test
new file mode 100755
index 000000000..389edf734
--- /dev/null
+++ b/system/launchpad/comma-launchpad-test
@@ -0,0 +1,28 @@
+#!/bin/bash
+
+function say() { echo "usage: $0: $@" >&2; }; function die() { say "$@"; exit 1; }
+
+add-apt-repository -y ppa:orthographic/ppa || die "add-apt-repository ppa:orthographic/ppa failed"
+add-apt-repository -y multiverse || die "add-apt-repository multiverse failed"
+apt-get update || die "apt-get update failed"
+apt-get -y install comma || die "apt-get install comma failed"
+
+say "testing basic csv utilities..."
+output=$( csv-paste line-number | head | csv-to-bin ui | csv-from-bin ui ) || die "failed: failed to run"
+expected=$( seq 0 9 )
+[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
+say "testing basic csv utilities: done"
+
+say "testing bash utils..."
+type -p comma-application-util || die "failed: failed"
+say "testing bash utils: done"
+
+say "running csv-eval --help (for reference): todo"
+#csv-eval --help
+
+# todo
+say "testing csv-eval: todo"
+#output=$( seq 0 9 | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"
+#expected=$( seq 1 10 )
+#[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
+#say "testing csv-eval: done"
diff --git a/system/launchpad/comma-launchpad-upload b/system/launchpad/comma-launchpad-upload
index 6c898e6ba..5ec39974e 100755
--- a/system/launchpad/comma-launchpad-upload
+++ b/system/launchpad/comma-launchpad-upload
@@ -11,16 +11,20 @@
 #     - push
 #   ? check current version at launchpad
 
-function say() { echo "usage: $0: $@" >&2; }
-function die() { say "$@"; exit 1; }
-[[ -n "$2" ]] || { echo "usage: $0 <ubuntu-name> <comma-version> [<comma_dir>]" >&2; exit 1; }
-ubuntu_name=$1
+function say() { echo "usage: $0: $@" >&2; }; function die() { say "$@"; exit 1; }
+[[ -n "$2" ]] || { echo "usage: $0 <what> <ubuntu-name> <comma-version>" >&2; exit 1; }
+what=$1
 comma_version=$2
-comma_dir=$3
 name=comma_$comma_version
-[[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
-rm -rf comma
-cp -r $comma_dir . || die "copying $comma_dir failed" # quick and dirty; or git clone instead?
-tar -acf $name.orig.tar.gz comma || die "tar failed"
-( cd comma && debuild -S -sa ) || die "debuild failed"
-dput ppa:yourppa/name $name-0ppa0_source.changes || die "dput failed"
+[[ -d comma ]] || die "comma directory not found; please run in something like ~/src"
+if [[ "$what" == "orig" ]]; then
+    rm -f comma/debian/files
+    tar -acf $name.orig.tar.gz comma || die "tar failed"
+    ( cd comma && debuild -S -sa ) || die "debuild failed"
+    dput ppa:orthographic/ppa $name-0ppa0_source.changes || die "dput failed"
+elif [[ "$what" == "update" ]]; then
+    ( cd comma && debuild -S -sd ) || die "debuild failed"
+    dput ppa:orthographic/ppa $name-0ppa0_source.changes || die "dput failed"
+else
+    die "expected <what>: orig or update; got \"$what\""
+fi
diff --git a/system/launchpad/readme b/system/launchpad/readme
index d0fb1ea87..a2bc7cd57 100644
--- a/system/launchpad/readme
+++ b/system/launchpad/readme
@@ -1,3 +1,22 @@
+uploading to launchpad
+
+- update comma/debian/changelog; see https://www.debian.org/doc/debian-policy/ch-source.html#debian-changelog-debian-changelog
+  - ubuntu version (currently jammy)
+  - version, e.g. 1.2.3
+  - changes
+  - date
+- update default version in comma/CMakeLists.txt
+- run:
+      cd ~/src/comma
+      git tag -a 1.2.3 -m 'your comments for version 1.2.3'
+      cd ..
+      comma/system/launchpad/comma-launchpad-upload update 1.2.3
+- once build in launchpad succeeds, commit and push
+- if there were changes in comma/python, release them into pypi (todo)
+- notify interested parties
+
+verifying ppa in docker
+
 todo
   - document
     - uploading to launchpad
diff --git a/system/package/cpack/comma-package-test b/system/package/cpack/comma-package-test
index 250fe74f9..89e4cf5e1 100755
--- a/system/package/cpack/comma-package-test
+++ b/system/package/cpack/comma-package-test
@@ -15,7 +15,7 @@ expected=$( seq 0 9 )
 [[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
 echo "$0: testing basic csv utilities: done" >&2
 
-echo "$0: testing bash utils..."
+echo "$0: testing bash utils..." >&2
 type -p comma-application-util || die "failed: failed"
 echo "$0: testing bash utils: done" >&2
 

From d0b6775dba613190dc9169844167c6c9bee45002 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 21:18:42 +1000
Subject: [PATCH 0466/1056] python/setup.py: minor brush-up

---

Notes:
    Removes the last two lines of python/setup.py: a blank line and a
    commented-out console_scripts fragment referring to sxm-detect. Only
    a comment and whitespace are deleted; the setuptools.setup() call is
    untouched.

 python/setup.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/python/setup.py b/python/setup.py
index df6606515..01dddb13f 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -31,5 +31,3 @@
         entry_points        = { 'console_scripts': ['csv-eval=comma.csv.applications.csv_eval:main'] },
         #scripts             = [ "comma/csv/applications/csv-eval" ]
      )
-
-# "console_scripts": [ 'sxm-detect=jfab.stm.imaging.scripts.sxm_detect:main'

From 04627cd40c7bf5e347bb58f662082377b65b867a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 21:39:17 +1000
Subject: [PATCH 0467/1056] comma/python: preparing for pypi

---

Notes:
    setup.py: long_description is now read from README.md next to setup.py
    (declared as text/markdown), author/author_email are added, the
    language classifier is narrowed to "Python :: 3", the short
    description is reworded, and the commented-out "scripts" line is
    folded into a trailing comment on the entry_points line.

    python/README (installation-from-source instructions) is deleted and
    python/README.md is created in its place.

    NOTE(review): the new python/README.md contains only the word "todo",
    so the long description passed to setuptools is "todo" until the file
    is filled in; the installation text from the deleted python/README is
    not carried over by this patch.

    NOTE(review): read_text() is called without an explicit encoding, so
    the platform default is used; consider encoding="utf-8" once README.md
    has real content.

    NOTE(review): the classifier 'Topic :: Communications :: Email' is
    left unchanged as context; it looks unrelated to csv and fixed-width
    binary utilities - confirm whether it should stay.

 python/README    | 24 ------------------------
 python/README.md |  1 +
 python/setup.py  | 16 +++++++++-------
 3 files changed, 10 insertions(+), 31 deletions(-)
 delete mode 100644 python/README
 create mode 100644 python/README.md

diff --git a/python/README b/python/README
deleted file mode 100644
index 5dbc6e10a..000000000
--- a/python/README
+++ /dev/null
@@ -1,24 +0,0 @@
-comma, generic python components and command-line
-utilities for quick and efficient data manipulation, especially streams
-of CSV and binary data, protocol packets, structured data (e.g. JSON), etc
-
-# installation from source
-
-Quickest way (works on Ubuntu 18.04 or higher with ansible playbook version 2.5 or higher):
-
-> mkdir src
-> cd src
-> git clone <repo>
-> ansible-playbook comma/system/ansible/install.yml --ask-become-pass
-
-Manual way:
-
-> mkdir -p src build/comma
-> cd src
-> git clone https://gitlab.com/orthographic/comma
-> cd ../build/comma
-> cmake ../../src/comma
-> make
-> sudo make install
-
-Read install.yml, if interested in tweaking build configuration.
diff --git a/python/README.md b/python/README.md
new file mode 100644
index 000000000..258cd5725
--- /dev/null
+++ b/python/README.md
@@ -0,0 +1 @@
+todo
diff --git a/python/setup.py b/python/setup.py
index 01dddb13f..41e7ee121 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -1,6 +1,6 @@
 #!/usr/bin/env python
 
-import setuptools #from distutils.core import setup
+import setuptools, pathlib #from distutils.core import setup
 import comma.version
 
 setuptools.setup(
@@ -14,20 +14,22 @@
           'Operating System :: MacOS :: MacOS X',
           'Operating System :: Microsoft :: Windows',
           'Operating System :: POSIX',
-          'Programming Language :: Python',
+          'Programming Language :: Python :: 3',
           'Topic :: Communications :: Email'
         ],
-        description         = 'comma python utilities',
+        description         = 'csv and fixed-width binary python utilities',
         url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
-        long_description    = 'comma python utilities for offline and streamed csv and fixed width data',
+        long_description    = ( pathlib.Path(__file__).parent / "README.md" ).read_text(),
+        long_description_content_type = "text/markdown",
+        author              = "vsevolod vlaskine",
+        author_email        = "vsevolod.vlaskine@gmail.com",
         maintainer          = 'vsevolod vlaskine',
         maintainer_email    = 'vsevolod.vlaskine@gmail.com',
         python_requires     = '>=3.6',
-        install_requires    = ['numpy'], # todo?
+        install_requires    = [ 'numpy' ], # todo?
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma': 'comma', 'comma.cpp_bindings': 'comma/cpp_bindings' },
         package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] },
-        entry_points        = { 'console_scripts': ['csv-eval=comma.csv.applications.csv_eval:main'] },
-        #scripts             = [ "comma/csv/applications/csv-eval" ]
+        entry_points        = { 'console_scripts': ['csv-eval=comma.csv.applications.csv_eval:main'] } #scripts             = [ "comma/csv/applications/csv-eval" ]
      )

From fe363975a5ce661f0b23d982d2f6b42c5e0bc628 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 22:07:17 +1000
Subject: [PATCH 0468/1056] prepared for pypi; readme: installation updated

---
 CMakeLists.txt                               |  2 +-
 README                                       | 28 --------------------
 python/setup.py                              |  6 +++--
 system/package/cpack/comma-package-make      | 12 ++++-----
 system/package/cpack/examples/package-python | 10 +++----
 system/package/cpack/readme                  |  4 +--
 6 files changed, 18 insertions(+), 44 deletions(-)
 delete mode 100644 README

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 48809cfba..06b1d3ba5 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -375,7 +375,7 @@ set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} )
 set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} )
 set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04 or later" )
-#set( CPACK_DEBIAN_PACKAGE_DEPENDS "python3-comma, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "comma-py, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc" )
 #set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
diff --git a/README b/README
deleted file mode 100644
index e0db4eaec..000000000
--- a/README
+++ /dev/null
@@ -1,28 +0,0 @@
-comma, a generic library of C++ and python components and command-line
-utilities for quick and efficient data manipulation, especially streams
-of CSV and binary data, protocol packets, structured data (e.g. JSON), etc
-
-
-INSTALLATION
-
-Currently only building from source using CMake is available. (After building
-from source, you can generate deb package using CPack, though.)
-
-Quickest way (works on Ubuntu 18.04 or higher with ansible playbook version 2.5 or higher):
-
-> mkdir src
-> cd src
-> git clone <repo>
-> ansible-playbook comma/system/ansible/install.yml --ask-become-pass
-
-Manual way:
-
-> mkdir -p src build/comma
-> cd src
-> git clone <repo>
-> cd ../build/comma
-> cmake ../../src/comma
-> make
-> sudo make install
-
-Read install.yml, if interested in tweaking build configuration.
diff --git a/python/setup.py b/python/setup.py
index 41e7ee121..fe9d03e82 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -3,14 +3,16 @@
 import setuptools, pathlib #from distutils.core import setup
 import comma.version
 
+# https://realpython.com/pypi-publish-python-package/
+
 setuptools.setup(
-        name                = 'python3-comma', # quick and dirty to make python packaging work
+        name                = 'comma-py', # quick and dirty to make python packaging work
         version             = comma.version.__version__,
         classifiers = [
           'Environment :: Console',
           'Intended Audience :: End Users/Desktop',
           'Intended Audience :: Developers',
-          'License :: OSI Approved :: BSD 3-Clause',
+          'License :: OSI Approved :: BSD License',
           'Operating System :: MacOS :: MacOS X',
           'Operating System :: Microsoft :: Windows',
           'Operating System :: POSIX',
diff --git a/system/package/cpack/comma-package-make b/system/package/cpack/comma-package-make
index 0e0f00890..f49068e93 100755
--- a/system/package/cpack/comma-package-make
+++ b/system/package/cpack/comma-package-make
@@ -60,14 +60,14 @@ fi
 #     echo "$0: running python3 setup.py ..." >&2
 #     python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../COPYING --suite focal  || die "failed"
 #     # todo: mount gpg key
-#     # debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/python3-comma_1.0.0-1.dsc
+#     # debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/comma-py_1.0.0-1.dsc
 #     # mkdir tmp
 #     # cd tmp
-#     # dpkg-source -x ../deb_dist/python3-comma_1.0.0-1.dsc
-#     # cd python3-comma-1.0.0
+#     # dpkg-source -x ../deb_dist/comma-py_1.0.0-1.dsc
+#     # cd comma-py-1.0.0
 #     # debuild -S -sa
-#     # dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes
-#     # ? debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 ../../deb_dist/python3-comma_1.0.0-1_source.changes
+#     # dput ppa:orthographic/ppa ../comma-py_1.0.0-1_source.changes
+#     # ? debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 ../../deb_dist/comma-py_1.0.0-1_source.changes
 #     #
 #     # ...
 #     echo "$0: building package..." >&2
@@ -100,4 +100,4 @@ fi
 #     echo "$0: done" >&2
 # )
 # cp ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb output
-# cp ~/src/comma/python/deb_dist/python3-comma*.deb output
+# cp ~/src/comma/python/deb_dist/comma-py*.deb output
diff --git a/system/package/cpack/examples/package-python b/system/package/cpack/examples/package-python
index 27b569d14..2438cfff9 100755
--- a/system/package/cpack/examples/package-python
+++ b/system/package/cpack/examples/package-python
@@ -2,11 +2,11 @@
 
 cd ~/src/comma/python
 rm -rf deb_dist dist tmp
-python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright --suite focal --package python3-comma --build-depends python3-numpy
-debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/python3-comma_1.0.0-1.dsc
+python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright --suite focal --package comma-py --build-depends python3-numpy
+debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/comma-py_1.0.0-1.dsc
 mkdir tmp
 cd tmp
-dpkg-source -x ../deb_dist/python3-comma_1.0.0-1.dsc
-cd python3-comma-1.0.0
+dpkg-source -x ../deb_dist/comma-py_1.0.0-1.dsc
+cd comma-py-1.0.0
 debuild -S -sa
-dput ppa:orthographic/test-ppa ../python3-comma_1.0.0-1_source.changes #dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes
+dput ppa:orthographic/test-ppa ../comma-py_1.0.0-1_source.changes #dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes
diff --git a/system/package/cpack/readme b/system/package/cpack/readme
index aa4ebd980..0d4cc5446 100644
--- a/system/package/cpack/readme
+++ b/system/package/cpack/readme
@@ -17,11 +17,11 @@ debian package will be built in your current directory
 
 test that package is ok, e.g:
 
-> ./comma-package-docker-test 20.04 comma-1.2.3-Linux.deb python3-comma_1.2.3-1_all.deb
+> ./comma-package-docker-test 20.04 comma-1.2.3-Linux.deb comma-py_1.2.3-1_all.deb
 
 sign packages, e.g:
 
 > debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-1.0.0-Linux.deb
-> debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 python3-comma_1.0.0-1_all.deb
+> debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-py_1.0.0-1_all.deb
 
 todo: fix lintian misplaced-extra-member-in-deb, which happens after gpg-signing

From b88750a5061ce10f521081bfb01a081a4a99d66e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 22:08:06 +1000
Subject: [PATCH 0469/1056] README.md added

---
 README.md | 87 +++++++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 87 insertions(+)
 create mode 100644 README.md

diff --git a/README.md b/README.md
new file mode 100644
index 000000000..13f8219b4
--- /dev/null
+++ b/README.md
@@ -0,0 +1,87 @@
+[[_TOC_]]
+
+# overview
+
+**comma** is a generic library for fixed-width (comma-separated or binary) and structured (e.g. json) data processing primarily on Linux. MacOS is supported, but less tested.
+
+**comma** consists of a collection of command line utilities, as well as underlying C++ and python libraries.
+
+**comma** design considerations:
+- high throughput for offline data processing
+- working with latency-sensitive realtime data streams
+- high modularity and separation of concerns
+- ease of rapid prototyping and functionality change
+- ease of mixing with other applications
+
+You can limit yourself to using the **comma** command line utilities. Further, **comma** provides libraries for serialization, binary protocol packet layouts, etc.
+
+This documentation will have no more than a brief description of each command line utility. For details, each utility has elaborate help, e.g. run: **csv-eval --help**.
+
+Instead, this documentation is intended to provide more and more step-by-step tutorials and recipes for **comma** command line applications.
+
+The library code is self-documented. You can generate it with **doxygen**. Use **git grep** or explore code of respective applications for usage examples.
+
+# installation
+
+## latest release
+
+```
+sudo add-apt-repository --yes ppa:orthographic/ppa
+sudo add-apt-repository --yes multiverse
+sudo apt-get update
+sudo apt-get install comma
+pip3 install comma-py==1.0.0
+```
+
+## build from source
+### building with ansible
+
+```
+> sudo apt-get install ansible
+> mkdir src
+> cd src
+> git clone https://gitlab.com/orthographic/comma.git
+> ansible-playbook comma/system/ansible/install.yml --ask-become-pass
+```
+
+### building it manually
+#### install dependencies (ubuntu)
+```
+sudo apt-get install git build-essential cmake cmake-curses-gui perl python3-dev python3-numpy libboost-all-dev socat libzmq3-dev libgtest-dev libprocps-dev recode expat gawk
+```
+#### build
+
+If you build from source, you will get the latest features.
+
+Albeit more tedious, it is safe since **comma** master branch is thoroughly tested and new features are backward-compatible.
+
+```
+> mkdir -p src build/comma
+> cd src
+> git clone https://gitlab.com/orthographic/comma.git
+> cd ../build/comma
+> cmake ../../src/comma && make && sudo make install
+```
+
+Read install.yml, if interested in tweaking build configuration.
+
+# command line applications
+
+- [**csv**: working with comma-separated and fixed-width binary data](csv/overview)
+- [**io**: utilities for input/output manipulations](io/overview)
+- [**name_value**: working with name-value pair data formats](name_value/overview)
+
+# bash scripting: utilities and design recipes
+
+**comma** applications help with complex data processing when they are bootstrapped together in Linux pipelines or bash scripts.
+
+**comma** bash utilities make writing bash scripts quicker and cleaner.
+
+[more...](bash/overview)
+
+# comma-test-run: regression test framework
+
+comma-test-run is a command line utility that runs minimalistic language-agnostic regression test suits.
+
+[more...](comma-test-run/comma-test-run:-a-simple-regression-test-framework)
+

From 281a52ba06cee27dcd4d9e04922a96017fdb5174 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 12:10:54 +0000
Subject: [PATCH 0470/1056] Update README.md

---
 README.md | 21 +--------------------
 1 file changed, 1 insertion(+), 20 deletions(-)

diff --git a/README.md b/README.md
index 13f8219b4..3673318b5 100644
--- a/README.md
+++ b/README.md
@@ -65,23 +65,4 @@ Albeit more tedious, it is safe since **comma** master branch is thoroughly test
 
 Read install.yml, if interested in tweaking build configuration.
 
-# command line applications
-
-- [**csv**: working with comma-separated and fixed-width binary data](csv/overview)
-- [**io**: utilities for input/output manipulations](io/overview)
-- [**name_value**: working with name-value pair data formats](name_value/overview)
-
-# bash scripting: utilities and design recipes
-
-**comma** applications help with complex data processing when they are bootstrapped together in Linux pipelines or bash scripts.
-
-**comma** bash utilities make writing bash scripts quicker and cleaner.
-
-[more...](bash/overview)
-
-# comma-test-run: regression test framework
-
-comma-test-run is a command line utility that runs minimalistic language-agnostic regression test suits.
-
-[more...](comma-test-run/comma-test-run:-a-simple-regression-test-framework)
-
+Documentation: [https://gitlab.com/orthographic/comma/-/wikis/home](https://gitlab.com/orthographic/comma/-/wikis/home)

From bf79ef673d98ba4342a66b93bb0c24ea8ae2f015 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 11 May 2022 22:16:33 +1000
Subject: [PATCH 0471/1056] README.md: minor brush-up

---
 README.md | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/README.md b/README.md
index 3673318b5..ca1730957 100644
--- a/README.md
+++ b/README.md
@@ -65,4 +65,6 @@ Albeit more tedious, it is safe since **comma** master branch is thoroughly test
 
 Read install.yml, if interested in tweaking build configuration.
 
-Documentation: [https://gitlab.com/orthographic/comma/-/wikis/home](https://gitlab.com/orthographic/comma/-/wikis/home)
+# documentation
+
+[https://gitlab.com/orthographic/comma/-/wikis/home](https://gitlab.com/orthographic/comma/-/wikis/home)

From 2bc620094f57ddd3b4dd67f0549d2f6fcf9904c2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 12 May 2022 12:46:29 +1000
Subject: [PATCH 0472/1056] system/launchpad/comma-launchpad-test: basic test
 of python/csv-eval installation added

---
 system/launchpad/comma-launchpad-test | 24 ++++++++++++++++--------
 1 file changed, 16 insertions(+), 8 deletions(-)

diff --git a/system/launchpad/comma-launchpad-test b/system/launchpad/comma-launchpad-test
index 389edf734..ad46ff2e8 100755
--- a/system/launchpad/comma-launchpad-test
+++ b/system/launchpad/comma-launchpad-test
@@ -2,10 +2,13 @@
 
 function say() { echo "usage: $0: $@" >&2; }; function die() { say "$@"; exit 1; }
 
+comma_py_version='1.0.0'
+
 add-apt-repository -y ppa:orthographic/ppa || die "add-apt-repository ppa:orthographic/ppa failed"
 add-apt-repository -y multiverse || die "add-apt-repository multiverse failed"
 apt-get update || die "apt-get update failed"
 apt-get -y install comma || die "apt-get install comma failed"
+pip3 install comma-py==$comma_py_version
 
 say "testing basic csv utilities..."
 output=$( csv-paste line-number | head | csv-to-bin ui | csv-from-bin ui ) || die "failed: failed to run"
@@ -17,12 +20,17 @@ say "testing bash utils..."
 type -p comma-application-util || die "failed: failed"
 say "testing bash utils: done"
 
-say "running csv-eval --help (for reference): todo"
-#csv-eval --help
+say "running csv-eval --help (for reference)"
+csv-eval --help
+
+say "testing comma-pi..."
+output=$( python3 -c "import comma; print( comma.version.__version__ )" ) || die "failed: failed to run"
+expected=$comma_py_version
+[[ "$output" == "$expected" ]] || die "failed: expected: $expected; got: $output"
+say "testing comma-pi: done"
 
-# todo
-say "testing csv-eval: todo"
-#output=$( seq 0 9 | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"
-#expected=$( seq 1 10 )
-#[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
-#say "testing csv-eval: done"
+say "testing csv-eval..."
+output=$( seq 0 9 | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"
+expected=$( seq 1 10 )
+[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
+say "testing csv-eval: done"

From 2111ed596a33d2fbf74398ed9764120a421cc7cb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 12 May 2022 20:26:34 +1000
Subject: [PATCH 0473/1056] comma-launchpad-upload: uploading to
 ppa:orthographic/comma (was orthographic/ppa)

---
 README.md                               | 2 +-
 system/launchpad/comma-launchpad-upload | 6 +++---
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/README.md b/README.md
index ca1730957..9a355ea23 100644
--- a/README.md
+++ b/README.md
@@ -26,7 +26,7 @@ The library code is self-documented. You can generate it with **doxigen**. Use *
 ## latest release
 
 ```
-sudo add-apt-repository --yes ppa:orthographic/ppa
+sudo add-apt-repository --yes ppa:orthographic/comma
 sudo add-apt-repository --yes multiverse
 sudo apt-get update
 sudo apt-get install comma
diff --git a/system/launchpad/comma-launchpad-upload b/system/launchpad/comma-launchpad-upload
index 5ec39974e..a289d41cc 100755
--- a/system/launchpad/comma-launchpad-upload
+++ b/system/launchpad/comma-launchpad-upload
@@ -15,16 +15,16 @@ function say() { echo "usage: $0: $@" >&2; }; function die() { say "$@"; exit 1;
 [[ -n "$2" ]] || { echo "usage: $0 <what> <ubuntu-name> <comma-version>" >&2; exit 1; }
 what=$1
 comma_version=$2
-name=comma_$comma_version
+name=comma_${comma_version}
 [[ -d comma ]] || die "comma directory not found; please run in something like ~/src"
 if [[ "$what" == "orig" ]]; then
     rm -f comma/debian/files
     tar -acf $name.orig.tar.gz comma || die "tar failed"
     ( cd comma && debuild -S -sa ) || die "debuild failed"
-    dput ppa:orthographic/ppa $name-0ppa0_source.changes || die "dput failed"
+    dput ppa:orthographic/comma $name-0ppa0_source.changes || die "dput failed"
 elif [[ "$what" == "update" ]]; then
     ( cd comma && debuild -S -sd ) || die "debuild failed"
-    dput ppa:orthographic/ppa $name-0ppa0_source.changes || die "dput failed"
+    dput ppa:orthographic/comma $name-0ppa0_source.changes || die "dput failed"
 else
     die "expected <what>: orig or update; got \"$what\""
 fi

From eeb8a726ef89c1b1bf4eae1f51d7b28377a06f22 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 13 May 2022 00:46:41 +1000
Subject: [PATCH 0474/1056] system/launchpad/comma-launchpad-test: ppa name
 changed from ppa to comma

---
 system/launchpad/comma-launchpad-test | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/launchpad/comma-launchpad-test b/system/launchpad/comma-launchpad-test
index ad46ff2e8..fd1189770 100755
--- a/system/launchpad/comma-launchpad-test
+++ b/system/launchpad/comma-launchpad-test
@@ -4,7 +4,7 @@ function say() { echo "usage: $0: $@" >&2; }; function die() { say "$@"; exit 1;
 
 comma_py_version='1.0.0'
 
-add-apt-repository -y ppa:orthographic/ppa || die "add-apt-repository ppa:orthographic/ppa failed"
+add-apt-repository -y ppa:orthographic/comma || die "add-apt-repository ppa:orthographic/ppa failed"
 add-apt-repository -y multiverse || die "add-apt-repository multiverse failed"
 apt-get update || die "apt-get update failed"
 apt-get -y install comma || die "apt-get install comma failed"

From 81f8c250b413ac459d90a63abaa40118cd0bbe5e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 13 May 2022 13:28:22 +1000
Subject: [PATCH 0475/1056] trivial typo fixed

---
 system/launchpad/comma-launchpad-test | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/system/launchpad/comma-launchpad-test b/system/launchpad/comma-launchpad-test
index fd1189770..6c7056e0e 100755
--- a/system/launchpad/comma-launchpad-test
+++ b/system/launchpad/comma-launchpad-test
@@ -23,11 +23,11 @@ say "testing bash utils: done"
 say "running csv-eval --help (for reference)"
 csv-eval --help
 
-say "testing comma-pi..."
+say "testing comma-py..."
 output=$( python3 -c "import comma; print( comma.version.__version__ )" ) || die "failed: failed to run"
 expected=$comma_py_version
 [[ "$output" == "$expected" ]] || die "failed: expected: $expected; got: $output"
-say "testing comma-pi: done"
+say "testing comma-py: done"
 
 say "testing csv-eval..."
 output=$( seq 0 9 | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"

From c5861ecf0bdb8cf310839b2331d8be2d73bb025d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 13 May 2022 17:21:47 +1000
Subject: [PATCH 0476/1056] comma-launchpad-test: trivial typo fixed

---
 system/launchpad/comma-launchpad-test | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/launchpad/comma-launchpad-test b/system/launchpad/comma-launchpad-test
index 6c7056e0e..f02be1f81 100755
--- a/system/launchpad/comma-launchpad-test
+++ b/system/launchpad/comma-launchpad-test
@@ -4,7 +4,7 @@ function say() { echo "usage: $0: $@" >&2; }; function die() { say "$@"; exit 1;
 
 comma_py_version='1.0.0'
 
-add-apt-repository -y ppa:orthographic/comma || die "add-apt-repository ppa:orthographic/ppa failed"
+add-apt-repository -y ppa:orthographic/comma || die "add-apt-repository ppa:orthographic/comma failed"
 add-apt-repository -y multiverse || die "add-apt-repository multiverse failed"
 apt-get update || die "apt-get update failed"
 apt-get -y install comma || die "apt-get install comma failed"

From 4dee5d9274fd5e772aeaad36706099f4b32a0b7f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 13 May 2022 20:59:55 +1000
Subject: [PATCH 0477/1056] cmake, debian: lib and cmake installation paths
 fixed

---
 CMakeLists.txt   | 35 +++++++----------------------------
 debian/changelog |  6 +++---
 debian/rules     |  2 ++
 3 files changed, 12 insertions(+), 31 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 06b1d3ba5..d0cc94436 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -9,23 +9,13 @@ if( USE_ARM_TOOLCHAIN )
 endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
-if( POLICY CMP0048 )
-    cmake_policy( SET CMP0048 NEW )
-    project( comma VERSION 1.0.1 LANGUAGES CXX )
-else( POLICY CMP0048 )
-    project( comma )
-    set( CMAKE_PROJECT_VERSION_MAJOR "1" CACHE STRING "comma version major" )
-    set( CMAKE_PROJECT_VERSION_MINOR "0" CACHE STRING "comma version minor" )
-    set( CMAKE_PROJECT_VERSION_PATCH "1" CACHE STRING "comma version patch" )
-    set( CMAKE_PROJECT_VERSION "${CMAKE_PROJECT_VERSION_MAJOR}.${CMAKE_PROJECT_VERSION_MINOR}.${CMAKE_PROJECT_VERSION_PATCH}" )
-endif( POLICY CMP0048 )
+cmake_policy( SET CMP0048 NEW )
+project( comma VERSION 1.0.2 LANGUAGES CXX )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
 set( comma_version_patch "${CMAKE_PROJECT_VERSION_PATCH}" ) # quick and dirty
 set( comma_version "${CMAKE_PROJECT_VERSION}" ) # quick and dirty
-# install( FILES COPYING DESTINATION share/doc/comma RENAME copyright ) # required by lintian
-# install( FILES system/package/cpack/changelog.gz DESTINATION share/doc/comma ) # required by lintian
 
 # option( USE_ARM_TOOLCHAIN "Cross compile using arm toolchain" OFF )
 # if( USE_ARM_TOOLCHAIN )
@@ -122,23 +112,12 @@ endif( UNIX )
 SET( SOURCE_CODE_BASE_DIR ${CMAKE_CURRENT_SOURCE_DIR} )
 SET( LIBRARY_OUTPUT_PATH ${CMAKE_BINARY_DIR}/lib )
 
-SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" SOVERSION ${CMAKE_PROJECT_VERSION} LINK_FLAGS_RELEASE -s )
-
-IF( NOT comma_INSTALL_BIN_DIR )
-  SET( comma_INSTALL_BIN_DIR bin )
-ENDIF( NOT comma_INSTALL_BIN_DIR )
-
-IF( NOT comma_INSTALL_INCLUDE_DIR )
-    SET( comma_INSTALL_INCLUDE_DIR include/${PROJECT_NAME} )
-ENDIF( NOT comma_INSTALL_INCLUDE_DIR )
+set( comma_INSTALL_BIN_DIR "bin" CACHE STRING "installation directory for binaries" )
+set( comma_INSTALL_INCLUDE_DIR "include/comma" CACHE STRING "installation directory for include directories" )
+set( comma_INSTALL_LIB_DIR "lib" CACHE STRING "installation directory for libraries" )
+set( comma_INSTALL_PACKAGE_DIR "CMakeFiles" CACHE STRING "installation directory for cmake files" )
 
-if( NOT comma_INSTALL_LIB_DIR ) # voodoo
-  set( comma_INSTALL_LIB_DIR lib )
-endif( NOT comma_INSTALL_LIB_DIR )
-
-IF( NOT comma_INSTALL_PACKAGE_DIR )
-  SET( comma_INSTALL_PACKAGE_DIR CMakeFiles )
-ENDIF( NOT comma_INSTALL_PACKAGE_DIR )
+SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" SOVERSION ${CMAKE_PROJECT_VERSION} LINK_FLAGS_RELEASE -s )
 
 #INCLUDE_DIRECTORIES( ${comma_INSTALL_INCLUDE_DIR}/../ )
 
diff --git a/debian/changelog b/debian/changelog
index ebc3828ba..dc5ac539c 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,5 +1,5 @@
-comma (1.0.1-0ppa0) jammy; urgency=low
+comma (1.0.2-0ppa0) jammy; urgency=low
 
-  * initial upload
+  * lib and cmake installation paths fixed
 
- -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Wed, 11 May 2022 13:12:01 +1000
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Fri, 13 May 2022 20:56:43 +1000
diff --git a/debian/rules b/debian/rules
index 746b222cc..625d6dfba 100755
--- a/debian/rules
+++ b/debian/rules
@@ -14,6 +14,8 @@ build:
 							 -DBUILD_TESTS=OFF \
 							 -DINSTALL_BASH_COMPLETION=OFF \
 							 -DINSTALL_TESTS=OFF \
+							 -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
+							 -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake \
 							 -Dcomma_BUILD_XML=OFF \
 							 -Dcomma_build_io_rabbit_cat=OFF
 	make -C $(BUILDDIR)

From 4a48e7118fce1fbacf1eeef28f4c2b3d13bb942a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 13 May 2022 21:04:03 +1000
Subject: [PATCH 0478/1056] comma-launchpad-upload: minor fix

---
 system/launchpad/comma-launchpad-upload | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/system/launchpad/comma-launchpad-upload b/system/launchpad/comma-launchpad-upload
index a289d41cc..d6d7832af 100755
--- a/system/launchpad/comma-launchpad-upload
+++ b/system/launchpad/comma-launchpad-upload
@@ -20,10 +20,10 @@ name=comma_${comma_version}
 if [[ "$what" == "orig" ]]; then
     rm -f comma/debian/files
     tar -acf $name.orig.tar.gz comma || die "tar failed"
-    ( cd comma && debuild -S -sa ) || die "debuild failed"
+    ( cd comma && debuild -S -sa -d ) || die "debuild failed"
     dput ppa:orthographic/comma $name-0ppa0_source.changes || die "dput failed"
 elif [[ "$what" == "update" ]]; then
-    ( cd comma && debuild -S -sd ) || die "debuild failed"
+    ( cd comma && debuild -S -sd -d ) || die "debuild failed"
     dput ppa:orthographic/comma $name-0ppa0_source.changes || die "dput failed"
 else
     die "expected <what>: orig or update; got \"$what\""

From f9e94bb3c1ae56b7b572c930b5495209369448e7 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 13 May 2022 21:27:46 +1000
Subject: [PATCH 0479/1056] python/README.md updated

---
 python/README.md | 15 ++++++++++++++-
 1 file changed, 14 insertions(+), 1 deletion(-)

diff --git a/python/README.md b/python/README.md
index 258cd5725..9d61ceb42 100644
--- a/python/README.md
+++ b/python/README.md
@@ -1 +1,14 @@
-todo
+**comma** is a generic library for efficient processing of fixed-width
+(comma-separated or binary) data mostly written in C++
+
+**comma-py** is the part of **comma** written in python; the main part of
+it is **csv-eval** command line utility for efficient **numpy**-style
+conversions on an input stream of comma-separated or fixed-width binary
+data
+
+for more details, run:
+```
+csv-eval --help --verbose
+```
+
+**documentation**: [https://gitlab.com/orthographic/comma/-/wikis/home](https://gitlab.com/orthographic/comma/-/wikis/home)

From ae618ac57a0140302e2c70e9dbbbc29d8777481a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 13 May 2022 21:43:45 +1000
Subject: [PATCH 0480/1056] python: version updated

---
 python/comma/version.py | 2 +-
 system/launchpad/readme | 8 ++++++++
 2 files changed, 9 insertions(+), 1 deletion(-)

diff --git a/python/comma/version.py b/python/comma/version.py
index 92b04f53c..6e9c8afd9 100644
--- a/python/comma/version.py
+++ b/python/comma/version.py
@@ -1,4 +1,4 @@
 # Copyright (c) 2011 The University of Sydney
 
 # if you change this file, check that it still works with ../setup.py, which gets the comma version by reading this file
-__version__ = "1.0.0"
+__version__ = "1.0.1"
diff --git a/system/launchpad/readme b/system/launchpad/readme
index a2bc7cd57..a89b95867 100644
--- a/system/launchpad/readme
+++ b/system/launchpad/readme
@@ -17,6 +17,14 @@ uploading to launchpad
 
 verifying ppa in docker
 
+uploading to pypi (i know, wrong place)
+
+cd comma/python
+# bump up version in version.py
+python setup.py sdist bdist_wheel
+twine upload --repository-url https://test.pypi.org/legacy/ dist/* # test
+twine upload dist/*
+
 todo
   - document
     - uploading to launchpad

From 5209ad911cde671e0e09854a22044e377d210f8e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 13 May 2022 22:05:53 +1000
Subject: [PATCH 0481/1056] version bumped up; fixing launchpad...

---
 CMakeLists.txt   | 2 +-
 debian/changelog | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index d0cc94436..3c341fbd9 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
 cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.2 LANGUAGES CXX )
+project( comma VERSION 1.0.3 LANGUAGES CXX )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
diff --git a/debian/changelog b/debian/changelog
index dc5ac539c..8c48ed861 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,4 +1,4 @@
-comma (1.0.2-0ppa0) jammy; urgency=low
+comma (1.0.3-0ppa0) jammy; urgency=low
 
   * lib and cmake installation paths fixed
 

From 16b058f77af0435bba39bbb555769c4e29c21b6c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 01:14:43 +1000
Subject: [PATCH 0482/1056] cmake: comma version propagated correctly (although
 it is not really used anywhere for now)

---
 CMakeFiles/FindComma.cmake       |  7 +++----
 CMakeFiles/comma-config.cmake.in | 10 +++++++---
 2 files changed, 10 insertions(+), 7 deletions(-)

diff --git a/CMakeFiles/FindComma.cmake b/CMakeFiles/FindComma.cmake
index 599c3f7f9..12ec30316 100644
--- a/CMakeFiles/FindComma.cmake
+++ b/CMakeFiles/FindComma.cmake
@@ -3,10 +3,10 @@
 # The following variables are set if comma is found.
 #  comma_FOUND         - Set to true when comma is found.
 #  comma_USE_FILE      - CMake file to use comma.
-#  comma_MAJOR_VERSION - The comma major version number.
-#  comma_MINOR_VERSION - The comma minor version number
+#  comma_version_major - The comma major version number.
+#  comma_version_minor - The comma minor version number
 #                       (odd non-release).
-#  comma_BUILD_VERSION - The comma patch level
+#  comma_version_patch - The comma patch level
 #                       (meaningless for odd minor).
 #  comma_INCLUDE_DIRS  - Include directories for comma
 #  comma_LIBRARY_DIRS  - Link directories for comma libraries
@@ -85,4 +85,3 @@ ENDIF ( comma_FOUND )
 IF( NOT comma_FOUND )
   MESSAGE(FATAL_ERROR ${comma_DIR_MESSAGE})
 ENDIF( NOT comma_FOUND )
-
diff --git a/CMakeFiles/comma-config.cmake.in b/CMakeFiles/comma-config.cmake.in
index 0b3eda1b6..b9bbcd676 100644
--- a/CMakeFiles/comma-config.cmake.in
+++ b/CMakeFiles/comma-config.cmake.in
@@ -35,9 +35,13 @@ SET(comma_REQUIRED_EXE_LINKER_FLAGS "@comma_REQUIRED_EXE_LINKER_FLAGS@")
 SET(comma_REQUIRED_SHARED_LINKER_FLAGS "@comma_REQUIRED_SHARED_LINKER_FLAGS@")
 SET(comma_REQUIRED_MODULE_LINKER_FLAGS "@comma_REQUIRED_MODULE_LINKER_FLAGS@")
 
-SET(comma_MAJOR_VERSION "@comma_MAJOR_VERSION@")
-SET(comma_MINOR_VERSION "@comma_MINOR_VERSION@")
-SET(comma_BUILD_VERSION "@comma_BUILD_VERSION@")
+SET(comma_version_major "@comma_version_major@")
+SET(comma_version_minor "@comma_version_minor@")
+SET(comma_version_patch "@comma_version_patch@")
+SET(comma_MAJOR_VERSION "@comma_version_major@") # quick and dirty, otherwise comma so library version in dependent packages seem to get messed up
+SET(comma_MINOR_VERSION "@comma_version_minor@") # quick and dirty, otherwise comma so library version in dependent packages seem to get messed up
+SET(comma_BUILD_VERSION "@comma_version_patch@") # quick and dirty, otherwise comma so library version in dependent packages seem to get messed up
+set(comma_version "@comma_version@")
 
 SET(comma_USE_FILE "@comma_USE_FILE@")
 

From 318bcfbed9489a34a1980f1db7a50cede793a188 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 13:11:39 +1000
Subject: [PATCH 0483/1056] debian: fixed cmake installation path

---
 CMakeLists.txt   | 10 +++++-----
 debian/changelog |  6 +++---
 debian/rules     |  2 +-
 3 files changed, 9 insertions(+), 9 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 3c341fbd9..21bf11476 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
 cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.3 LANGUAGES CXX )
+project( comma VERSION 1.0.4 LANGUAGES CXX )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
@@ -112,10 +112,10 @@ endif( UNIX )
 SET( SOURCE_CODE_BASE_DIR ${CMAKE_CURRENT_SOURCE_DIR} )
 SET( LIBRARY_OUTPUT_PATH ${CMAKE_BINARY_DIR}/lib )
 
-set( comma_INSTALL_BIN_DIR "bin" CACHE STRING "installation directory for binaries" )
-set( comma_INSTALL_INCLUDE_DIR "include/comma" CACHE STRING "installation directory for include directories" )
-set( comma_INSTALL_LIB_DIR "lib" CACHE STRING "installation directory for libraries" )
-set( comma_INSTALL_PACKAGE_DIR "CMakeFiles" CACHE STRING "installation directory for cmake files" )
+set( comma_INSTALL_BIN_DIR bin CACHE PATH "installation directory for binaries" )
+set( comma_INSTALL_INCLUDE_DIR include/comma CACHE PATH "installation directory for include directories" )
+set( comma_INSTALL_LIB_DIR lib CACHE PATH "installation directory for libraries" )
+set( comma_INSTALL_PACKAGE_DIR CMakeFiles CACHE PATH "installation directory for cmake files" )
 
 SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" SOVERSION ${CMAKE_PROJECT_VERSION} LINK_FLAGS_RELEASE -s )
 
diff --git a/debian/changelog b/debian/changelog
index 8c48ed861..a6574101d 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,5 +1,5 @@
-comma (1.0.3-0ppa0) jammy; urgency=low
+comma (1.0.4-0ppa0) jammy; urgency=low
 
-  * lib and cmake installation paths fixed
+  * cmake installation path fixed
 
- -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Fri, 13 May 2022 20:56:43 +1000
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 13:07:45 +1000
diff --git a/debian/rules b/debian/rules
index 625d6dfba..344f11d75 100755
--- a/debian/rules
+++ b/debian/rules
@@ -15,7 +15,7 @@ build:
 							 -DINSTALL_BASH_COMPLETION=OFF \
 							 -DINSTALL_TESTS=OFF \
 							 -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
-							 -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake \
+							 -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake/comma \
 							 -Dcomma_BUILD_XML=OFF \
 							 -Dcomma_build_io_rabbit_cat=OFF
 	make -C $(BUILDDIR)

From 05a1c95b04ab42f257954c6d1bf3c1d093e221f6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 16:47:01 +1000
Subject: [PATCH 0484/1056] cmake: install_tests: seems fixed...

---
 application/test/CMakeLists.txt | 29 +++++++++++++----------------
 containers/test/CMakeLists.txt  | 29 +++++++++++++----------------
 csv/test/CMakeLists.txt         | 29 +++++++++++++----------------
 dispatch/test/CMakeLists.txt    | 29 +++++++++++++----------------
 io/test/CMakeLists.txt          | 29 +++++++++++++----------------
 math/test/CMakeLists.txt        | 29 +++++++++++++----------------
 name_value/test/CMakeLists.txt  | 29 +++++++++++++----------------
 packed/test/CMakeLists.txt      | 28 +++++++++++++---------------
 string/test/CMakeLists.txt      | 29 +++++++++++++----------------
 sync/test/CMakeLists.txt        | 28 +++++++++++++---------------
 visiting/test/CMakeLists.txt    | 29 +++++++++++++----------------
 xpath/test/CMakeLists.txt       | 29 +++++++++++++----------------
 12 files changed, 156 insertions(+), 190 deletions(-)

diff --git a/application/test/CMakeLists.txt b/application/test/CMakeLists.txt
index 004a6d1e9..4f56b8487 100644
--- a/application/test/CMakeLists.txt
+++ b/application/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT application )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT application )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/containers/test/CMakeLists.txt b/containers/test/CMakeLists.txt
index bdfd90360..b9b7a7532 100644
--- a/containers/test/CMakeLists.txt
+++ b/containers/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT containers )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base ${GTEST_BOTH_LIBRARIES} )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT containers )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} ${GTEST_BOTH_LIBRARIES} pthread ) # target_link_libraries( ${test_name} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/csv/test/CMakeLists.txt b/csv/test/CMakeLists.txt
index 6e6184332..4bbc487c2 100644
--- a/csv/test/CMakeLists.txt
+++ b/csv/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT csv )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_xpath comma_string comma_csv ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT csv )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/dispatch/test/CMakeLists.txt b/dispatch/test/CMakeLists.txt
index aae4ec058..25f6a18aa 100644
--- a/dispatch/test/CMakeLists.txt
+++ b/dispatch/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT dispatch )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT dispatch )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/io/test/CMakeLists.txt b/io/test/CMakeLists.txt
index eaa86c42b..c14125cbd 100644
--- a/io/test/CMakeLists.txt
+++ b/io/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT io )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base comma_string comma_io ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} pthread rt )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT io )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/math/test/CMakeLists.txt b/math/test/CMakeLists.txt
index 4eed24bae..96c00afbc 100644
--- a/math/test/CMakeLists.txt
+++ b/math/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT math )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT math )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_base ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/name_value/test/CMakeLists.txt b/name_value/test/CMakeLists.txt
index 000281672..e95a9deb3 100644
--- a/name_value/test/CMakeLists.txt
+++ b/name_value/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT name_value )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_xpath comma_string comma_name_value ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT name_value )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_xpath comma_string comma_name_value ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/packed/test/CMakeLists.txt b/packed/test/CMakeLists.txt
index 940b46fd3..ab1f5d597 100644
--- a/packed/test/CMakeLists.txt
+++ b/packed/test/CMakeLists.txt
@@ -1,15 +1,13 @@
-SET( KIT packed )
-SET( DIR ${SOURCE_CODE_BASE_DIR}/${KIT}/test )
-FILE( GLOB source ${DIR}/*_test.cpp )
-FILE( GLOB extras ${DIR}/*.cpp ${DIR}/*.h )
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base comma_string ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT packed )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/string/test/CMakeLists.txt b/string/test/CMakeLists.txt
index 383d8775d..f6a0e1af7 100644
--- a/string/test/CMakeLists.txt
+++ b/string/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET(KIT string)
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT string )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/sync/test/CMakeLists.txt b/sync/test/CMakeLists.txt
index 5e759ecd1..049903f49 100644
--- a/sync/test/CMakeLists.txt
+++ b/sync/test/CMakeLists.txt
@@ -1,15 +1,13 @@
-SET( KIT sync )
-SET( DIR ${SOURCE_CODE_BASE_DIR}/${KIT}/test )
-FILE( GLOB source ${DIR}/*_test.cpp )
-FILE( GLOB extras ${DIR}/*.cpp ${DIR}/*.h )
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT sync )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/visiting/test/CMakeLists.txt b/visiting/test/CMakeLists.txt
index 8483176a1..99dbaad9d 100644
--- a/visiting/test/CMakeLists.txt
+++ b/visiting/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET(KIT visiting)
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT visiting )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/xpath/test/CMakeLists.txt b/xpath/test/CMakeLists.txt
index 10216ab48..d94d2e0d0 100644
--- a/xpath/test/CMakeLists.txt
+++ b/xpath/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET(KIT xpath)
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_xpath comma_string ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT xpath )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_base comma_xpath ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )

From 328954cd1cc517de72415a7b2bf038d0282ee5c9 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 16:55:30 +1000
Subject: [PATCH 0485/1056] launchpad stopped installing so files; trying to
 fix...

---
 CMakeLists.txt   | 2 +-
 debian/changelog | 6 +++---
 debian/rules     | 1 +
 3 files changed, 5 insertions(+), 4 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 21bf11476..51568ae87 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
 cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.4 LANGUAGES CXX )
+project( comma VERSION 1.0.5 LANGUAGES CXX )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
diff --git a/debian/changelog b/debian/changelog
index a6574101d..dc477ae6e 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,5 +1,5 @@
-comma (1.0.4-0ppa0) jammy; urgency=low
+comma (1.0.5-0ppa0) jammy; urgency=low
 
-  * cmake installation path fixed
+  * launchpad stopped installing so files; trying to fix...
 
- -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 13:07:45 +1000
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 16:51:55 +1000
diff --git a/debian/rules b/debian/rules
index 344f11d75..1fcd07d07 100755
--- a/debian/rules
+++ b/debian/rules
@@ -16,6 +16,7 @@ build:
 							 -DINSTALL_TESTS=OFF \
 							 -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
 							 -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake/comma \
+							 -Dcomma_BUILD_ZEROMQ=ON \
 							 -Dcomma_BUILD_XML=OFF \
 							 -Dcomma_build_io_rabbit_cat=OFF
 	make -C $(BUILDDIR)

From d912ec9f2c6cf9fb3a515021a6a604eef7ab3ecc Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 17:54:04 +1000
Subject: [PATCH 0486/1056] launchpad stopped installing so files; trying to
 fix...

---
 CMakeLists.txt   | 2 +-
 debian/changelog | 4 ++--
 debian/control   | 4 ++--
 debian/rules     | 2 +-
 4 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 51568ae87..04653746f 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
 cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.5 LANGUAGES CXX )
+project( comma VERSION 1.0.7 LANGUAGES CXX )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
diff --git a/debian/changelog b/debian/changelog
index dc477ae6e..95d142178 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,5 +1,5 @@
-comma (1.0.5-0ppa0) jammy; urgency=low
+comma (1.0.7-0ppa0) jammy; urgency=low
 
   * launchpad stopped installing so files; trying to fix...
 
- -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 16:51:55 +1000
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 17:52:49 +1000
diff --git a/debian/control b/debian/control
index 2c30ecb68..5a3e13941 100644
--- a/debian/control
+++ b/debian/control
@@ -3,12 +3,12 @@ Standards-Version: 4.6.0.1
 Section: devel
 Priority: optional
 Maintainer: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
-Build-Depends: cmake, libc-dev, libboost-all-dev (>=1.65), libzmq5 (>= 4.2.5-1)
+Build-Depends: cmake, libc-dev, libboost-all-dev (>=1.65)
 Homepage: https://gitlab.com/orthographic/comma/-/wikis/home
 
 Package: comma
 Architecture: any
-Depends: libc-dev, libboost-all-dev (>=1.65), libzmq5 (>= 4.2.5-1), recode (>=3.6), socat
+Depends: libc-dev, libboost-all-dev (>=1.65), gawk, recode, socat
 Description: generic libraries and cli for csv and fixed-width data processing
   comma, libraries and command line utilities for efficient streaming and
   processing of comma-separated (csv) and fixed-width binary data
diff --git a/debian/rules b/debian/rules
index 1fcd07d07..269c80814 100755
--- a/debian/rules
+++ b/debian/rules
@@ -16,8 +16,8 @@ build:
 							 -DINSTALL_TESTS=OFF \
 							 -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
 							 -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake/comma \
-							 -Dcomma_BUILD_ZEROMQ=ON \
 							 -Dcomma_BUILD_XML=OFF \
+							 -Dcomma_BUILD_ZEROMQ=OFF \
 							 -Dcomma_build_io_rabbit_cat=OFF
 	make -C $(BUILDDIR)
 

From 338aa78062439ae1d481575fc52e08a743103f88 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 19:47:04 +1000
Subject: [PATCH 0487/1056] launchpad stopped installing so files; trying to
 fix...

---
 CMakeLists.txt   | 7 +++++--
 debian/changelog | 4 ++--
 debian/rules     | 1 +
 3 files changed, 8 insertions(+), 4 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 04653746f..a64be753c 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
 cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.7 LANGUAGES CXX )
+project( comma VERSION 1.0.8 LANGUAGES CXX )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
@@ -321,7 +321,10 @@ if( CMAKE_COMPILER_IS_GNUCXX )
     endif( CMAKE_BUILD_TYPE STREQUAL "Release" )
 endif( CMAKE_COMPILER_IS_GNUCXX )
 
-add_subdirectory( CMakeFiles/post_install ) # uber-quick and dirty
+option( comma_INSTALL_RUN_POST_INSTALL "run post install step (currently just ldconfig)" ON )
+if( comma_INSTALL_RUN_POST_INSTALL )
+    add_subdirectory( CMakeFiles/post_install ) # uber-quick and dirty
+endif( comma_INSTALL_RUN_POST_INSTALL )
 
 # todo
 #     build ppa
diff --git a/debian/changelog b/debian/changelog
index 95d142178..f55d9ef15 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,5 +1,5 @@
-comma (1.0.7-0ppa0) jammy; urgency=low
+comma (1.0.8-0ppa0) jammy; urgency=low
 
   * launchpad stopped installing so files; trying to fix...
 
- -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 17:52:49 +1000
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 19:30:05 +1000
diff --git a/debian/rules b/debian/rules
index 269c80814..ea7c04522 100755
--- a/debian/rules
+++ b/debian/rules
@@ -16,6 +16,7 @@ build:
 							 -DINSTALL_TESTS=OFF \
 							 -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
 							 -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake/comma \
+							 -Dcomma_INSTALL_RUN_POST_INSTALL=OFF \
 							 -Dcomma_BUILD_XML=OFF \
 							 -Dcomma_BUILD_ZEROMQ=OFF \
 							 -Dcomma_build_io_rabbit_cat=OFF

From 76063bb28b4d454c4acfb459db455f36413d7136 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 21:30:46 +1000
Subject: [PATCH 0488/1056] launchpad stopped installing so files; trying to
 fix...

---
 CMakeLists.txt   |  2 +-
 debian/changelog |  4 ++--
 debian/rules     | 47 +++++++++++++++++++++++++----------------------
 3 files changed, 28 insertions(+), 25 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index a64be753c..63943cbc9 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
 cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.8 LANGUAGES CXX )
+project( comma VERSION 1.0.9 LANGUAGES CXX )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
diff --git a/debian/changelog b/debian/changelog
index f55d9ef15..5c6f3c1cc 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,5 +1,5 @@
-comma (1.0.8-0ppa0) jammy; urgency=low
+comma (1.0.9-0ppa0) jammy; urgency=low
 
   * launchpad stopped installing so files; trying to fix...
 
- -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 19:30:05 +1000
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 21:26:51 +1000
diff --git a/debian/rules b/debian/rules
index ea7c04522..4ecade893 100755
--- a/debian/rules
+++ b/debian/rules
@@ -1,26 +1,24 @@
 #!/usr/bin/make -f
 
-BUILDDIR = build
-
 # secondly called by launchpad
 build:
-	mkdir $(BUILDDIR);
-	cd $(BUILDDIR); cmake .. \
-	                         -DCMAKE_INSTALL_PREFIX=../debian/tmp/usr \
-							 -DCMAKE_BUILD_TYPE=Release \
- 							 -DBUILD_SHARED_LIBS=ON \
- 							 -DBUILD_PYTHON_PACKAGES=OFF \
-							 -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
-							 -DBUILD_TESTS=OFF \
-							 -DINSTALL_BASH_COMPLETION=OFF \
-							 -DINSTALL_TESTS=OFF \
-							 -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
-							 -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake/comma \
-							 -Dcomma_INSTALL_RUN_POST_INSTALL=OFF \
-							 -Dcomma_BUILD_XML=OFF \
-							 -Dcomma_BUILD_ZEROMQ=OFF \
-							 -Dcomma_build_io_rabbit_cat=OFF
-	make -C $(BUILDDIR)
+	mkdir build;
+	cd build; cmake .. \
+                     -DCMAKE_INSTALL_PREFIX=../debian/tmp/usr \
+					 -DCMAKE_BUILD_TYPE=Release \
+					 -DBUILD_SHARED_LIBS=ON \
+					 -DBUILD_PYTHON_PACKAGES=OFF \
+					 -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
+					 -DBUILD_TESTS=OFF \
+					 -DINSTALL_BASH_COMPLETION=OFF \
+					 -DINSTALL_TESTS=OFF \
+					 -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
+					 -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake/comma \
+					 -Dcomma_INSTALL_RUN_POST_INSTALL=OFF \
+					 -Dcomma_BUILD_XML=OFF \
+					 -Dcomma_BUILD_ZEROMQ=OFF \
+					 -Dcomma_build_io_rabbit_cat=OFF
+	make -C build
 
 # thirdly called by launchpad
 binary: binary-indep binary-arch
@@ -28,16 +26,21 @@ binary: binary-indep binary-arch
 binary-indep:
 	# nothing to be done
 
+# super quick and dirty: cp -r build/lib debian/tmp
+# there seems to be a bug, most likely in generate_comma_config.cmake
+# that installs libraries in build instead of debian/tmp
+# (cannot reproduce it locally: locally, installation works,
+# but on launchpad it does not
 binary-arch:
-	cd $(BUILDDIR); cmake -P cmake_install.cmake
+	cp -r build/lib debian/tmp
+	cd build; cmake -P cmake_install.cmake
 	mkdir debian/tmp/DEBIAN
 	dpkg-gencontrol -pcomma
 	dpkg --build debian/tmp ..
 
 # firstly called by launchpad
 clean:
-	rm -f build
-	rm -rf $(BUILDDIR)
+	rm -rf build
 	rm -f debian/files
 
 .PHONY: binary binary-arch binary-indep clean

From ee316c183a5c0a0bda4d735fda440179002bc702 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 21:35:34 +1000
Subject: [PATCH 0489/1056] launchpad stopped installing so files; trying to
 fix...

---
 CMakeLists.txt   | 2 +-
 debian/changelog | 2 +-
 debian/rules     | 3 ++-
 3 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 63943cbc9..d1a0f8436 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
 cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.9 LANGUAGES CXX )
+project( comma VERSION 1.0.10 LANGUAGES CXX )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
diff --git a/debian/changelog b/debian/changelog
index 5c6f3c1cc..eee2b5f9e 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,4 +1,4 @@
-comma (1.0.9-0ppa0) jammy; urgency=low
+comma (1.0.10-0ppa0) jammy; urgency=low
 
   * launchpad stopped installing so files; trying to fix...
 
diff --git a/debian/rules b/debian/rules
index 4ecade893..c17bc32bb 100755
--- a/debian/rules
+++ b/debian/rules
@@ -32,7 +32,8 @@ binary-indep:
 # (cannot reproduce it locally: locally, installation works,
 # but on launchpad it does not
 binary-arch:
-	cp -r build/lib debian/tmp
+	mkdir -p debian/tmp/usr
+	cp -r build/lib debian/tmp/usr
 	cd build; cmake -P cmake_install.cmake
 	mkdir debian/tmp/DEBIAN
 	dpkg-gencontrol -pcomma

From 5d99ae612834329f3f87639f48277e47666a6976 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 22:26:14 +1000
Subject: [PATCH 0490/1056] launchpad stopped installing so files; trying to
 fix...

---
 CMakeLists.txt   |  2 +-
 debian/changelog |  4 ++--
 debian/rules     | 22 +++++++++++++---------
 3 files changed, 16 insertions(+), 12 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index d1a0f8436..e3ce33c8f 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
 cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.10 LANGUAGES CXX )
+project( comma VERSION 1.0.12 LANGUAGES CXX )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty
diff --git a/debian/changelog b/debian/changelog
index eee2b5f9e..d54a10c6e 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,5 +1,5 @@
-comma (1.0.10-0ppa0) jammy; urgency=low
+comma (1.0.12-0ppa0) jammy; urgency=low
 
   * launchpad stopped installing so files; trying to fix...
 
- -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 21:26:51 +1000
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 22:23:49 +1000
diff --git a/debian/rules b/debian/rules
index c17bc32bb..52f80513d 100755
--- a/debian/rules
+++ b/debian/rules
@@ -1,10 +1,12 @@
 #!/usr/bin/make -f
 
+BUILDDIR=build_dir
+
 # secondly called by launchpad
 build:
-	mkdir build;
-	cd build; cmake .. \
-                     -DCMAKE_INSTALL_PREFIX=../debian/tmp/usr \
+	mkdir $(BUILDDIR);
+	cd $(BUILDDIR); cmake .. \
+	                 -DCMAKE_INSTALL_PREFIX=../debian/tmp/usr \
 					 -DCMAKE_BUILD_TYPE=Release \
 					 -DBUILD_SHARED_LIBS=ON \
 					 -DBUILD_PYTHON_PACKAGES=OFF \
@@ -18,7 +20,7 @@ build:
 					 -Dcomma_BUILD_XML=OFF \
 					 -Dcomma_BUILD_ZEROMQ=OFF \
 					 -Dcomma_build_io_rabbit_cat=OFF
-	make -C build
+	cd $(BUILDDIR); make
 
 # thirdly called by launchpad
 binary: binary-indep binary-arch
@@ -26,22 +28,24 @@ binary: binary-indep binary-arch
 binary-indep:
 	# nothing to be done
 
-# super quick and dirty: cp -r build/lib debian/tmp
+# super quick and dirty:
+#     mkdir debian/tmp/usr/lib -p
+#     cp -r $(BUILDDIR)/lib/x86_64-linux-gnu debian/tmp/usr/lib
 # there seems to be a bug, most likely in generate_comma_config.cmake
 # that installs libraries in build instead of debian/tmp
 # (cannot reproduce it locally: locally, installation works,
 # but on launchpad it does not
 binary-arch:
-	mkdir -p debian/tmp/usr
-	cp -r build/lib debian/tmp/usr
-	cd build; cmake -P cmake_install.cmake
+	cd $(BUILDDIR); make install
+	mkdir debian/tmp/usr/lib -p
+	cp -r $(BUILDDIR)/lib/x86_64-linux-gnu debian/tmp/usr/lib
 	mkdir debian/tmp/DEBIAN
 	dpkg-gencontrol -pcomma
 	dpkg --build debian/tmp ..
 
 # firstly called by launchpad
 clean:
-	rm -rf build
+	rm -rf $(BUILDDIR)
 	rm -f debian/files
 
 .PHONY: binary binary-arch binary-indep clean

From 2d1183bdd6bd48c312343b3c947cd91f1cf5d77e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 May 2022 22:47:20 +1000
Subject: [PATCH 0491/1056] comma-launchpad-upload: brushed up; bug fixed

---
 system/launchpad/comma-launchpad-upload | 23 +++++++++--------------
 1 file changed, 9 insertions(+), 14 deletions(-)

diff --git a/system/launchpad/comma-launchpad-upload b/system/launchpad/comma-launchpad-upload
index d6d7832af..342d40d99 100755
--- a/system/launchpad/comma-launchpad-upload
+++ b/system/launchpad/comma-launchpad-upload
@@ -5,11 +5,11 @@
 #     - update changelog
 #       - version
 #       - changes
-#     - update default version in cmake
-#     - tag repo with version
+#       - date
+#     - cmake: update default version
 #     - commit
+#     - tag repo with version
 #     - push
-#   ? check current version at launchpad
 
 function say() { echo "usage: $0: $@" >&2; }; function die() { say "$@"; exit 1; }
 [[ -n "$2" ]] || { echo "usage: $0 <what> <ubuntu-name> <comma-version>" >&2; exit 1; }
@@ -17,14 +17,9 @@ what=$1
 comma_version=$2
 name=comma_${comma_version}
 [[ -d comma ]] || die "comma directory not found; please run in something like ~/src"
-if [[ "$what" == "orig" ]]; then
-    rm -f comma/debian/files
-    tar -acf $name.orig.tar.gz comma || die "tar failed"
-    ( cd comma && debuild -S -sa -d ) || die "debuild failed"
-    dput ppa:orthographic/comma $name-0ppa0_source.changes || die "dput failed"
-elif [[ "$what" == "update" ]]; then
-    ( cd comma && debuild -S -sd -d ) || die "debuild failed"
-    dput ppa:orthographic/comma $name-0ppa0_source.changes || die "dput failed"
-else
-    die "expected <what>: orig or update; got \"$what\""
-fi
+tar -acf $name.orig.tar.gz comma || die "tar failed"
+if [[ "$what" == "orig" ]]; then rm -f comma/debian/files; what_option='a'
+elif [[ "$what" == "update" ]]; then what_option='d'
+else die "expected <what>: orig or update; got \"$what\""; fi
+( cd comma && debuild -S -s$what_option ) || die "debuild failed"
+dput ppa:orthographic/comma $name-0ppa0_source.changes || die "dput failed"

From c576ad9f325908bd9bea302c8c2f27358f73de8a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 15 May 2022 00:10:49 +1000
Subject: [PATCH 0492/1056] debian/rules: todo comments added

---
 debian/rules | 17 ++++++++++-------
 1 file changed, 10 insertions(+), 7 deletions(-)

diff --git a/debian/rules b/debian/rules
index 52f80513d..22df25864 100755
--- a/debian/rules
+++ b/debian/rules
@@ -28,13 +28,16 @@ binary: binary-indep binary-arch
 binary-indep:
 	# nothing to be done
 
-# super quick and dirty:
-#     mkdir debian/tmp/usr/lib -p
-#     cp -r $(BUILDDIR)/lib/x86_64-linux-gnu debian/tmp/usr/lib
-# there seems to be a bug, most likely in generate_comma_config.cmake
-# that installs libraries in build instead of debian/tmp
-# (cannot reproduce it locally: locally, installation works,
-# but on launchpad it does not
+# todo
+#   ! try running rules with make locally
+#   - try cpack (which sucks)
+#   for now super quick and dirty:
+#       mkdir debian/tmp/usr/lib -p
+#       cp -r $(BUILDDIR)/lib/x86_64-linux-gnu debian/tmp/usr/lib
+#   there seems to be a bug, most likely in generate_comma_config.cmake
+#   that installs libraries in build instead of debian/tmp
+#   (cannot reproduce it locally: locally, installation works,
+#   but on launchpad it does not
 binary-arch:
 	cd $(BUILDDIR); make install
 	mkdir debian/tmp/usr/lib -p

From 112f50bb5d349b974276ee8aa8b18570022ef1f8 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 15 May 2022 07:31:10 +1000
Subject: [PATCH 0493/1056] cmake: gtest installation: use plain vanilla
 find_package (otherwise building shared libraries from source does not work
 on ubuntu 22.04)

---
 CMakeLists.txt | 21 ++++++++++++---------
 1 file changed, 12 insertions(+), 9 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index e3ce33c8f..d8bdc54e2 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -167,16 +167,19 @@ LINK_DIRECTORIES( ${Boost_LIBRARY_DIRS} )
 
 IF( comma_BUILD_TESTS )
 
+find_package( GTest REQUIRED )
+include_directories( ${GTEST_INCLUDE_DIRS} )
+
     # todo: maybe else clause is actually the right way to do things
-    IF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
-        FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/googletest/googletest DOC "source code of gtest" ) # FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/gtest DOC "source code of gtest" )
-        ADD_SUBDIRECTORY( ${GTest_SOURCE_DIR} gtest )
-        INCLUDE_DIRECTORIES( src ${GTest_SOURCE_DIR}/include ${GTest_SOURCE_DIR} )
-        SET( GTEST_BOTH_LIBRARIES gtest gtest_main )
-    ELSE( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
-        FIND_PACKAGE( GTest )
-        INCLUDE_DIRECTORIES( ${GTEST_INCLUDE_DIRS} )
-    ENDIF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
+#    IF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
+#        FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/googletest/googletest DOC "source code of gtest" ) # FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/gtest DOC "source code of gtest" )
+#        ADD_SUBDIRECTORY( ${GTest_SOURCE_DIR} gtest )
+#        INCLUDE_DIRECTORIES( src ${GTest_SOURCE_DIR}/include ${GTest_SOURCE_DIR} )
+#        SET( GTEST_BOTH_LIBRARIES gtest gtest_main )
+#    ELSE( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
+#        FIND_PACKAGE( GTest )
+#        INCLUDE_DIRECTORIES( ${GTEST_INCLUDE_DIRS} )
+#    ENDIF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
 
 #TT: Install tests to dir. This allows them to be packed by CPack.
 #Note: if your source tree is dirty (eg you've already run tests there and have output/ directories)

From 7516def6381b83f6676de9e00fd42e5990576bcc Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 May 2022 10:01:54 +1000
Subject: [PATCH 0494/1056] cmake: project version: backward compatibility with
 earlier cmake versions restored

---
 CMakeLists.txt | 11 +++++++++--
 1 file changed, 9 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index d8bdc54e2..3ef873cea 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -9,8 +9,15 @@ if( USE_ARM_TOOLCHAIN )
 endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
-cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.12 LANGUAGES CXX )
+if( POLICY CMP0048 )
+    cmake_policy( SET CMP0048 NEW )
+    project( comma VERSION 1.0.12 LANGUAGES CXX )
+else( POLICY CMP0048 )
+    project( comma )
+    set( CMAKE_PROJECT_VERSION_MAJOR 1 )
+    set( CMAKE_PROJECT_VERSION_MINOR 0 )
+    set( CMAKE_PROJECT_VERSION_PATCH 12 )
+endif( POLICY CMP0048 )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty

From 629bc249002ff58a234a4c7f09758db09c737ae7 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 May 2022 13:40:55 +1000
Subject: [PATCH 0495/1056] cmake: project version: backward compatibility with
 earlier cmake versions restored

---
 CMakeLists.txt | 17 ++++++++---------
 1 file changed, 8 insertions(+), 9 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 3ef873cea..632a74010 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -9,15 +9,14 @@ if( USE_ARM_TOOLCHAIN )
 endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
-if( POLICY CMP0048 )
-    cmake_policy( SET CMP0048 NEW )
-    project( comma VERSION 1.0.12 LANGUAGES CXX )
-else( POLICY CMP0048 )
-    project( comma )
-    set( CMAKE_PROJECT_VERSION_MAJOR 1 )
-    set( CMAKE_PROJECT_VERSION_MINOR 0 )
-    set( CMAKE_PROJECT_VERSION_PATCH 12 )
-endif( POLICY CMP0048 )
+cmake_policy( SET CMP0048 NEW )
+project( comma VERSION 1.0.12 LANGUAGES CXX )
+if( NOT DEFINED CMAKE_PROJECT_VERSION )
+    set( CMAKE_PROJECT_VERSION ${PROJECT_VERSION} )
+    set( CMAKE_PROJECT_VERSION_MAJOR ${PROJECT_VERSION_MAJOR} )
+    set( CMAKE_PROJECT_VERSION_MINOR ${PROJECT_VERSION_MINOR} )
+    set( CMAKE_PROJECT_VERSION_PATCH ${PROJECT_VERSION_PATCH} )
+endif( NOT DEFINED CMAKE_PROJECT_VERSION )
 
 set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty
 set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty

From 7b884308b421aafcb30edd4f4e0727551b164ffb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 May 2022 14:02:36 +1000
Subject: [PATCH 0496/1056] python/setup.py: backward compatibility with
 earlier cmake versions restored

---
 python/setup.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/python/setup.py b/python/setup.py
index fe9d03e82..60e6b5e69 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -1,6 +1,6 @@
 #!/usr/bin/env python
 
-import setuptools, pathlib #from distutils.core import setup
+import setuptools #from distutils.core import setup
 import comma.version
 
 # https://realpython.com/pypi-publish-python-package/
@@ -22,7 +22,7 @@
         description         = 'csv and fixed-width binary python utilities',
         url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
-        long_description    = ( pathlib.Path(__file__).parent / "README.md" ).read_text(),
+        long_description    =  open( '/'.join( __file__.split( '/' )[:-1] ) + '/README.md' ).read(), #long_description    = ( pathlib.Path(__file__).parent / "README.md" ).read_text(),
         long_description_content_type = "text/markdown",
         author              = "vsevolod vlaskine",
         author_email        = "vsevolod.vlaskine@gmail.com",

From fa65bd1fd2d7a0275d5baa6ec27bda5be057da9f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 May 2022 17:54:07 +1000
Subject: [PATCH 0497/1056] numpy installation changed to pip (was apt install
 python3-numpy)

---
 system/ansible/install.yml | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index 9533f9853..3be479b03 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -12,7 +12,7 @@
   - name: "install comma dependencies"
     become: true
     apt:
-        pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-numpy', 'python3-pip', 'libprocps-dev', 'recode']
+        pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-pip', 'libprocps-dev', 'recode']
         state: present
         update_cache: yes
 
@@ -23,6 +23,11 @@
         state: present
         update_cache: yes
 
+  - name: "install python dependencies using pip"
+    become: true
+    pip:
+        name: numpy
+
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory
     with_items:

From 100e5df76bd847e1605b1f1af0e40f9935a62310 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 May 2022 18:24:10 +1000
Subject: [PATCH 0498/1056] python: removed unnecessary #!.../python directives

---
 CMakeLists.txt                           |  2 +-
 python/comma/application/command_line.py |  2 --
 python/comma/io/windows_binary.py        | 29 ------------------------
 3 files changed, 1 insertion(+), 32 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 632a74010..311da286a 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -370,7 +370,7 @@ set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps ve
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc" )
 #set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
-set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc-dev" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev" )
 set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc-dev" )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS_POLICY ON )
diff --git a/python/comma/application/command_line.py b/python/comma/application/command_line.py
index 6f5fbc0b9..e11a2f712 100644
--- a/python/comma/application/command_line.py
+++ b/python/comma/application/command_line.py
@@ -1,5 +1,3 @@
-#!/usr/bin/python
-
 import argparse
 
 class set_dictionary_action( argparse.Action ):
diff --git a/python/comma/io/windows_binary.py b/python/comma/io/windows_binary.py
index 0c56b0883..85249fa0d 100644
--- a/python/comma/io/windows_binary.py
+++ b/python/comma/io/windows_binary.py
@@ -1,33 +1,4 @@
-#!/bin/python
-
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 __author__ = 'j.underwood'
 '''

From ec21d170e90368e096cedafcb5f2402141b43c68 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 May 2022 18:34:43 +1000
Subject: [PATCH 0499/1056] python: cmake: default PYTHON set to python3

---
 python/CMakeLists.txt | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/python/CMakeLists.txt b/python/CMakeLists.txt
index d1422ee65..2fbcd5fbc 100644
--- a/python/CMakeLists.txt
+++ b/python/CMakeLists.txt
@@ -40,16 +40,15 @@ MACRO( set_python_build_lib_directory )
     ENDIF( MODULE_EXIT_CODE MATCHES 0 )
 ENDMACRO( set_python_build_lib_directory )
 
-
 IF( NOT BUILD_PYTHON_PACKAGES )
     disable_python_testing()
     RETURN()
 ENDIF( NOT BUILD_PYTHON_PACKAGES )
 
-FIND_PROGRAM( PYTHON "python" )
+FIND_PROGRAM( PYTHON "python3" )
 
 IF( NOT PYTHON )
-    MESSAGE( WARNING "python not found" )
+    MESSAGE( WARNING "python3 not found" )
     MESSAGE( STATUS "comma/python modules and scripts will not be installed" )
     disable_python_testing()
     RETURN()

From f7073dd9ee15d35fc1858bb424f0cdf6f26c11d4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 May 2022 18:43:02 +1000
Subject: [PATCH 0500/1056] python: python_requires downgraded to 2.7 for now
 for backward compatibility (that will break one day anyway...)

---
 python/setup.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/setup.py b/python/setup.py
index 60e6b5e69..9748152e8 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -28,7 +28,7 @@
         author_email        = "vsevolod.vlaskine@gmail.com",
         maintainer          = 'vsevolod vlaskine',
         maintainer_email    = 'vsevolod.vlaskine@gmail.com',
-        python_requires     = '>=3.6',
+        python_requires     = '>=2.7', # 3.6
         install_requires    = [ 'numpy' ], # todo?
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma': 'comma', 'comma.cpp_bindings': 'comma/cpp_bindings' },

From 46bfa9a8b56ad4a3a48d521e5bd9d51d776aba3b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 17 May 2022 16:41:54 +1000
Subject: [PATCH 0501/1056] python2 phased out from tests and installation
 (python2 compatibility is still preserved in the code, however cmake cannot
 be configured to use python2 anymore)

---
 CMakeLists.txt                                |  8 +++---
 README.md                                     |  3 ++-
 .../comma_background/signature/basic/test     |  2 +-
 csv/format.cpp                                |  6 ++---
 io/applications/rabbit-cat                    |  2 +-
 name_value/applications/name-value-calc       |  2 +-
 name_value/applications/name-value-eval       |  8 +++---
 name_value/test/eval/test                     |  5 ++--
 python/CMakeLists.txt                         |  2 +-
 python/comma-rpm-post-install.sh              |  2 +-
 python/comma/application/test/dict/test       |  3 +--
 python/comma/application/test/remove/test     |  2 +-
 python/comma/csv/test/numpy_format/test       |  2 +-
 python/comma/csv/test/numpy_guess_format/test |  2 +-
 python/comma/csv/test/numpy_time/test         |  2 +-
 python/comma/csv/test/stream/array/test       |  2 +-
 .../stream/ascii_only/blank_lines/size_1/test |  2 +-
 .../ascii_only/blank_lines/size_all/test      |  2 +-
 .../ascii_only/blank_lines/size_default/test  |  2 +-
 .../test/stream/ascii_only/blank_values/test  |  2 +-
 .../ascii_only/default_values/time/test       |  2 +-
 .../csv/test/stream/ascii_only/delimiter/test |  2 +-
 .../csv/test/stream/ascii_only/precision/test |  2 +-
 .../ascii_only/tied/wrong_delimiter/test      |  2 +-
 .../stream/ascii_only/time_converter/test     |  2 +-
 python/comma/csv/test/stream/basic/test       |  2 +-
 .../csv/test/stream/binary_keyword/false/test |  2 +-
 .../binary_keyword/format_via_binary/test     |  2 +-
 .../stream/binary_keyword/ignore/format/test  |  2 +-
 .../binary_keyword/mismatched_with_tied/test  |  2 +-
 .../csv/test/stream/binary_keyword/true/test  |  2 +-
 .../fields/binary_is_true/known_fields/test   |  2 +-
 .../fields/binary_is_true/unknown_fields/test |  2 +-
 .../binary_only/fields/comma_types/test       |  2 +-
 .../fields/inconsistent_format/test           |  2 +-
 .../stream/binary_only/not-a-date-time/test   |  2 +-
 python/comma/csv/test/stream/buffer_size/test |  6 ++---
 .../csv/test/stream/default_values/basic/test |  2 +-
 .../default_values/full_xpath_is_false/test   |  2 +-
 .../ignore/field_in_stream/test               |  2 +-
 .../ignore/field_not_in_struct/test           |  2 +-
 .../default_values/no_missing_fields/test     |  2 +-
 .../csv/test/stream/default_values/size/test  |  2 +-
 .../comma/csv/test/stream/dump/no_mask/test   |  2 +-
 .../comma/csv/test/stream/dump/with_mask/test |  2 +-
 .../stream/duplicates/expected_fields/test    |  2 +-
 .../test/stream/duplicates/other_fields/test  |  2 +-
 python/comma/csv/test/stream/empty_input/test |  2 +-
 .../csv/test/stream/fields/array/test_1d/test |  2 +-
 .../csv/test/stream/fields/array/test_2d/test |  2 +-
 .../csv/test/stream/fields/array/test_3d/test |  2 +-
 .../comma/csv/test/stream/fields/basic/test   |  2 +-
 .../test/stream/fields/extra_field_names/test |  2 +-
 .../stream/fields/missing_fields/one/test     |  2 +-
 .../stream/fields/missing_fields/several/test |  2 +-
 python/comma/csv/test/stream/fields/read/test |  2 +-
 .../csv/test/stream/fields/shorthand/test     |  2 +-
 python/comma/csv/test/stream/fields/size/test |  2 +-
 python/comma/csv/test/stream/files/test       |  2 +-
 python/comma/csv/test/stream/flush/test       |  2 +-
 python/comma/csv/test/stream/iter/test        |  2 +-
 .../csv/test/stream/leaves/ambiguous/test     |  2 +-
 .../comma/csv/test/stream/leaves/basic/test   |  2 +-
 .../comma/csv/test/stream/leaves/slash/test   |  2 +-
 python/comma/csv/test/stream/one_field/test   |  2 +-
 python/comma/csv/test/stream/recarray/test    |  2 +-
 python/comma/csv/test/stream/size/test        |  2 +-
 .../csv/test/stream/standard_field_names/test |  2 +-
 .../stream/stdin/corrupt_input/ascii/test     |  2 +-
 .../stream/stdin/corrupt_input/binary/test    |  2 +-
 .../comma/csv/test/stream/stdin/simple/test   |  2 +-
 python/comma/csv/test/stream/tied/basic/test  |  2 +-
 .../comma/csv/test/stream/tied/mixedup/test   |  2 +-
 python/comma/csv/test/stream/timedelta/test   |  2 +-
 python/comma/csv/test/struct/test             | 26 +++++++++----------
 python/comma/csv/test/unit/test               |  2 +-
 python/comma/csv/time.py                      |  2 +-
 python/comma/numpy/test/test                  |  2 +-
 .../test/performance/csv/calc/max/data/max    |  3 +--
 python/comma/test/performance/csv/calc/test   |  5 ++--
 python/comma/test/performance/csv/stream/test |  2 +-
 python/setup.py                               |  4 +--
 system/launchpad/readme                       |  2 +-
 83 files changed, 110 insertions(+), 111 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 311da286a..b976d08c8 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -366,9 +366,9 @@ set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} )
 set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} )
 set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04 or later" )
-#set( CPACK_DEBIAN_PACKAGE_DEPENDS "comma-py, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
-#set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc (>=6)" )
-#set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, python3-numpy (>=1.14.1), libc" )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "comma-py, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc (>=6)" )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev (>=6)" )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev" )
 #set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev" )
 set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc-dev" )
@@ -403,7 +403,7 @@ if( BUILD_SHARED_LIBS )
 endif( BUILD_SHARED_LIBS )
 
 IF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
-    SET( CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy" )
+    SET( CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python3 numpy" )
     SET( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-post-install.sh" )
     SET( CPACK_RPM_PRE_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-pre-install.sh" )
     SET( CPACK_RPM_EXCLUDE_FROM_AUTO_FILELIST_ADDITION "/tmp" ) # Prevents /tmp from permission change when installing RPM package
diff --git a/README.md b/README.md
index 9a355ea23..b988105ad 100644
--- a/README.md
+++ b/README.md
@@ -47,7 +47,8 @@ pip3 install comma-py==1.0.0
 ### building it manually
 #### install dependencies (ubuntu)
 ```
-sudo apt-get install git build-essential cmake cmake-curses-gui perl python3-dev python3-numpy libboost-all-dev socat libzmq3-dev libgtest-dev libprocps-dev recode expat gawk
+sudo apt-get install git python3-pip build-essential cmake cmake-curses-gui perl python3-dev libboost-all-dev socat libzmq3-dev libgtest-dev libprocps-dev recode expat gawk
+sudo pip3 install numpy
 ```
 #### build
 
diff --git a/bash/test/comma_background/signature/basic/test b/bash/test/comma_background/signature/basic/test
index 7e2f3b335..f7bad1464 100755
--- a/bash/test/comma_background/signature/basic/test
+++ b/bash/test/comma_background/signature/basic/test
@@ -19,7 +19,7 @@ echo "clock_ticks_per_second=$ticks"
 comma_process_exec_and_validate "$fifo" sleep 100 || { echo "$scriptname: fatal system error, wrong background PID" >&2; exit 1; }
 background_pid=$!
 
-now=$( python -c "from __future__ import print_function; import sys; from numpy import int64; a = sys.stdin.readline().split()[0]; print( int64(float(a) * $ticks) )" < /proc/uptime )
+now=$( python3 -c "import sys; from numpy import int64; a = sys.stdin.readline().split()[0]; print( int64(float(a) * $ticks) )" < /proc/uptime )
 echo "time/now=$now"
 
 signature=$( comma_process_signature "$background_pid" )
diff --git a/csv/format.cpp b/csv/format.cpp
index 956e1ceaf..36ca1fac0 100644
--- a/csv/format.cpp
+++ b/csv/format.cpp
@@ -226,8 +226,8 @@ static boost::posix_time::ptime time_from_iso_string( const std::string& s )
     if ( s.empty() || s == "not-a-date-time" ) { return boost::posix_time::not_a_date_time; }
     else if ( s == "+infinity" || s == "+inf" || s == "inf" ) { return boost::posix_time::pos_infin; }
     else if ( s == "-infinity" || s == "-inf" ) { return boost::posix_time::neg_infin; }
-    else 
-    { 
+    else
+    {
         try { return boost::posix_time::from_iso_string( s ); }
         catch ( ... ) { return boost::posix_time::not_a_date_time; }
     }
@@ -459,7 +459,7 @@ std::string format::collapsed_string() const
 
 // formats for not-a-date-time, +infinity, -infinity
 // note: these are not boost representations. in boost, +infinity = int64::max() - 1, -infinity = int64::min(), not-a-date-time = int64::max()
-// not-a-date-time is chosen to matche python numpy.datetime64('NaT') = int64::min()
+// not-a-date-time is chosen to match python numpy.datetime64('NaT') = int64::min()
 static const comma::int64 bin_not_a_date_time = std::numeric_limits< comma::int64 >::min();
 static const comma::int64 bin_time_pos_infin = std::numeric_limits< comma::int64 >::max();
 static const comma::int64 bin_time_neg_infin = std::numeric_limits< comma::int64 >::min() + 1;
diff --git a/io/applications/rabbit-cat b/io/applications/rabbit-cat
index 0edf99964..3a17a0275 100755
--- a/io/applications/rabbit-cat
+++ b/io/applications/rabbit-cat
@@ -1,4 +1,4 @@
-#!/usr/bin/env python
+#!/usr/bin/env python3
 
 # Copyright (c) 2018 The University of Sydney
 
diff --git a/name_value/applications/name-value-calc b/name_value/applications/name-value-calc
index 261d85d78..3db8ce4ab 100755
--- a/name_value/applications/name-value-calc
+++ b/name_value/applications/name-value-calc
@@ -118,7 +118,7 @@ function logical_op()
 function python_converter()
 {
     # todo? python2 -c "import operator...
-    python -c "
+    python3 -c "
 from __future__ import division
 from __future__ import print_function
 import operator
diff --git a/name_value/applications/name-value-eval b/name_value/applications/name-value-eval
index 4fadac7e3..5e190eb6b 100755
--- a/name_value/applications/name-value-eval
+++ b/name_value/applications/name-value-eval
@@ -73,7 +73,7 @@ Options:
 Examples:
 
     $name --variables=vars.pv commands.py
-    
+
     cat commands.py | $name --variables=vars.pv
 
     cat vars.pv | $name commands.py
@@ -134,7 +134,8 @@ output_vars_option=
 input=
 tmpdir="."
 # python_cmd="python2"
-python_cmd="python"
+# python_cmd="python"
+python_cmd="python3"
 
 while [[ $# -gt 0 ]]; do
     arg="${1#*=}"
@@ -195,7 +196,7 @@ if (( test_option )); then preparse_options+=" --test"; fi
   cat "$tmp_vars";
   if [[ -n "$input" ]]; then name-value-eval-preparse $preparse_options "$input"
   else name-value-eval-preparse $preparse_options; fi ) > $python_input
-  
+
 if (( debug )); then cat $python_input | sed 's/^/debug: /g' > /dev/tty; fi
 
 #cat "$python_input" > ./python_input
@@ -215,4 +216,3 @@ else
 fi
 
 exit $exit_code
-
diff --git a/name_value/test/eval/test b/name_value/test/eval/test
index 36189340f..7edada245 100755
--- a/name_value/test/eval/test
+++ b/name_value/test/eval/test
@@ -28,8 +28,9 @@ done
 variables="$data_dir/variable_vals"
 pass_count=0
 total_count=0
-python_version="$( python -c "from __future__ import print_function; import sys; print( sys.version_info.major )" )" # sigh...
-python_prefix="python${python_version}:"
+#python_version="$( python -c "from __future__ import print_function; import sys; print( sys.version_info.major )" )" # sigh...
+#python_prefix="python${python_version}:"
+python_prefix="python3:"
 
 for input in $data_dir/input_*; do # for input in $data_dir/input*; do
     (( ++total_count ))
diff --git a/python/CMakeLists.txt b/python/CMakeLists.txt
index 2fbcd5fbc..ced969491 100644
--- a/python/CMakeLists.txt
+++ b/python/CMakeLists.txt
@@ -85,7 +85,7 @@ ADD_CUSTOM_TARGET( python_build ALL
 #                    COMMAND ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE} install ${INSTALL_PREFIX_OPTION} --force
 #                    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
 
-INSTALL( CODE "EXECUTE_PROCESS(
+install( CODE "EXECUTE_PROCESS(
                     COMMAND ${PYTHON} -m pip install ${CMAKE_CURRENT_SOURCE_DIR} --ignore-installed
                     WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
 
diff --git a/python/comma-rpm-post-install.sh b/python/comma-rpm-post-install.sh
index c123837af..1f82ccfe7 100644
--- a/python/comma-rpm-post-install.sh
+++ b/python/comma-rpm-post-install.sh
@@ -1,3 +1,3 @@
 #!/bin/sh
 
-cd /tmp/comma/python_modules_for_rpm_install && python setup.py install
+cd /tmp/comma/python_modules_for_rpm_install && python3 setup.py install
diff --git a/python/comma/application/test/dict/test b/python/comma/application/test/dict/test
index b5ec5c40c..bf8440ccc 100755
--- a/python/comma/application/test/dict/test
+++ b/python/comma/application/test/dict/test
@@ -10,8 +10,7 @@ function main()
 {
     local value_type
     value_type=${input_value_type:+"value_type=$input_value_type, "}
-    python -c "
-from __future__ import print_function
+    python3 -c "
 import comma.application
 import argparse
 
diff --git a/python/comma/application/test/remove/test b/python/comma/application/test/remove/test
index 9eb261bb5..de0be364a 100755
--- a/python/comma/application/test/remove/test
+++ b/python/comma/application/test/remove/test
@@ -7,7 +7,7 @@ mkdir -p "$output_dir" || exit 1
 
 function main()
 {
-    python -c "
+    python3 -c "
 import comma.application
 import argparse
 
diff --git a/python/comma/csv/test/numpy_format/test b/python/comma/csv/test/numpy_format/test
index 876acea0e..339f99486 100755
--- a/python/comma/csv/test/numpy_format/test
+++ b/python/comma/csv/test/numpy_format/test
@@ -4,7 +4,7 @@ function comma_format_to_numpy
 {
     local compress=$2
     compress=${compress:+", $compress"}
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 from __future__ import print_function
 import comma
 import numpy
diff --git a/python/comma/csv/test/numpy_guess_format/test b/python/comma/csv/test/numpy_guess_format/test
index 29df57222..ce53b3e1b 100755
--- a/python/comma/csv/test/numpy_guess_format/test
+++ b/python/comma/csv/test/numpy_guess_format/test
@@ -2,7 +2,7 @@
 
 function comma_guess_format
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 from __future__ import print_function
 import comma
 import numpy
diff --git a/python/comma/csv/test/numpy_time/test b/python/comma/csv/test/numpy_time/test
index 90a84acb0..c2de5abb6 100755
--- a/python/comma/csv/test/numpy_time/test
+++ b/python/comma/csv/test/numpy_time/test
@@ -1,7 +1,7 @@
 #!/bin/bash
 
 function comma_time_roundabout {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 from __future__ import print_function
 import numpy
 import comma
diff --git a/python/comma/csv/test/stream/array/test b/python/comma/csv/test/stream/array/test
index 9284da636..5810ce637 100755
--- a/python/comma/csv/test/stream/array/test
+++ b/python/comma/csv/test/stream/array/test
@@ -8,7 +8,7 @@ function process_records
 {
     local binary
     if [[ "$1" == "binary" ]]; then binary=True; else binary=False; fi
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/ascii_only/blank_lines/size_1/test b/python/comma/csv/test/stream/ascii_only/blank_lines/size_1/test
index 178f33111..b457fba0e 100755
--- a/python/comma/csv/test/stream/ascii_only/blank_lines/size_1/test
+++ b/python/comma/csv/test/stream/ascii_only/blank_lines/size_1/test
@@ -5,7 +5,7 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 t = comma.csv.struct( 'x', 'u4' )
diff --git a/python/comma/csv/test/stream/ascii_only/blank_lines/size_all/test b/python/comma/csv/test/stream/ascii_only/blank_lines/size_all/test
index 6ad8c3658..93fc9562f 100755
--- a/python/comma/csv/test/stream/ascii_only/blank_lines/size_all/test
+++ b/python/comma/csv/test/stream/ascii_only/blank_lines/size_all/test
@@ -5,7 +5,7 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 t = comma.csv.struct( 'x', 'u4' )
diff --git a/python/comma/csv/test/stream/ascii_only/blank_lines/size_default/test b/python/comma/csv/test/stream/ascii_only/blank_lines/size_default/test
index d3176282f..8d9622e83 100755
--- a/python/comma/csv/test/stream/ascii_only/blank_lines/size_default/test
+++ b/python/comma/csv/test/stream/ascii_only/blank_lines/size_default/test
@@ -5,7 +5,7 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 t = comma.csv.struct( 'x', 'u4' )
diff --git a/python/comma/csv/test/stream/ascii_only/blank_values/test b/python/comma/csv/test/stream/ascii_only/blank_values/test
index f9723eb9c..0ab8038d1 100755
--- a/python/comma/csv/test/stream/ascii_only/blank_values/test
+++ b/python/comma/csv/test/stream/ascii_only/blank_values/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 t = comma.csv.struct( 's1,x,y,t,array,s2,z', 'S2', 'i4', 'f8', 'datetime64[us]', '2u1', 'S4', 'f8' )
diff --git a/python/comma/csv/test/stream/ascii_only/default_values/time/test b/python/comma/csv/test/stream/ascii_only/default_values/time/test
index 4fb6effe3..977b47546 100755
--- a/python/comma/csv/test/stream/ascii_only/default_values/time/test
+++ b/python/comma/csv/test/stream/ascii_only/default_values/time/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function default_values
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy as np
 from datetime import datetime
diff --git a/python/comma/csv/test/stream/ascii_only/delimiter/test b/python/comma/csv/test/stream/ascii_only/delimiter/test
index 7f42025fd..01dc2c941 100755
--- a/python/comma/csv/test/stream/ascii_only/delimiter/test
+++ b/python/comma/csv/test/stream/ascii_only/delimiter/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/ascii_only/precision/test b/python/comma/csv/test/stream/ascii_only/precision/test
index bb09387bf..06f963b26 100755
--- a/python/comma/csv/test/stream/ascii_only/precision/test
+++ b/python/comma/csv/test/stream/ascii_only/precision/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/ascii_only/tied/wrong_delimiter/test b/python/comma/csv/test/stream/ascii_only/tied/wrong_delimiter/test
index cf1b4f506..3c6b5c7cc 100755
--- a/python/comma/csv/test/stream/ascii_only/tied/wrong_delimiter/test
+++ b/python/comma/csv/test/stream/ascii_only/tied/wrong_delimiter/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/ascii_only/time_converter/test b/python/comma/csv/test/stream/ascii_only/time_converter/test
index 018360c9a..2fbaee398 100755
--- a/python/comma/csv/test/stream/ascii_only/time_converter/test
+++ b/python/comma/csv/test/stream/ascii_only/time_converter/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/basic/test b/python/comma/csv/test/stream/basic/test
index 8307292ec..d7200ba5d 100755
--- a/python/comma/csv/test/stream/basic/test
+++ b/python/comma/csv/test/stream/basic/test
@@ -8,7 +8,7 @@ function process_records
 {
     local binary
     if [[ "$1" == "binary" ]]; then binary=True; else binary=False; fi
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_keyword/false/test b/python/comma/csv/test/stream/binary_keyword/false/test
index 4f7fe1b12..ef93e4356 100755
--- a/python/comma/csv/test/stream/binary_keyword/false/test
+++ b/python/comma/csv/test/stream/binary_keyword/false/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_keyword/format_via_binary/test b/python/comma/csv/test/stream/binary_keyword/format_via_binary/test
index 9b4d49327..ada326a60 100755
--- a/python/comma/csv/test/stream/binary_keyword/format_via_binary/test
+++ b/python/comma/csv/test/stream/binary_keyword/format_via_binary/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_keyword/ignore/format/test b/python/comma/csv/test/stream/binary_keyword/ignore/format/test
index 415225f01..cff48145e 100755
--- a/python/comma/csv/test/stream/binary_keyword/ignore/format/test
+++ b/python/comma/csv/test/stream/binary_keyword/ignore/format/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_keyword/mismatched_with_tied/test b/python/comma/csv/test/stream/binary_keyword/mismatched_with_tied/test
index 54e592ef8..6247624b2 100755
--- a/python/comma/csv/test/stream/binary_keyword/mismatched_with_tied/test
+++ b/python/comma/csv/test/stream/binary_keyword/mismatched_with_tied/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function mismatched
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/binary_keyword/true/test b/python/comma/csv/test/stream/binary_keyword/true/test
index 756955a1f..03d0232a5 100755
--- a/python/comma/csv/test/stream/binary_keyword/true/test
+++ b/python/comma/csv/test/stream/binary_keyword/true/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_only/fields/binary_is_true/known_fields/test b/python/comma/csv/test/stream/binary_only/fields/binary_is_true/known_fields/test
index 015830d23..c06dc2427 100755
--- a/python/comma/csv/test/stream/binary_only/fields/binary_is_true/known_fields/test
+++ b/python/comma/csv/test/stream/binary_only/fields/binary_is_true/known_fields/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/binary_only/fields/binary_is_true/unknown_fields/test b/python/comma/csv/test/stream/binary_only/fields/binary_is_true/unknown_fields/test
index a513332e2..5bf2ae78c 100755
--- a/python/comma/csv/test/stream/binary_only/fields/binary_is_true/unknown_fields/test
+++ b/python/comma/csv/test/stream/binary_only/fields/binary_is_true/unknown_fields/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function unknown_fields
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/binary_only/fields/comma_types/test b/python/comma/csv/test/stream/binary_only/fields/comma_types/test
index fdbad741f..d49d5f4f3 100755
--- a/python/comma/csv/test/stream/binary_only/fields/comma_types/test
+++ b/python/comma/csv/test/stream/binary_only/fields/comma_types/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_only/fields/inconsistent_format/test b/python/comma/csv/test/stream/binary_only/fields/inconsistent_format/test
index ced6d026e..c3532302f 100755
--- a/python/comma/csv/test/stream/binary_only/fields/inconsistent_format/test
+++ b/python/comma/csv/test/stream/binary_only/fields/inconsistent_format/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_only/not-a-date-time/test b/python/comma/csv/test/stream/binary_only/not-a-date-time/test
index 418466696..18fd42028 100755
--- a/python/comma/csv/test/stream/binary_only/not-a-date-time/test
+++ b/python/comma/csv/test/stream/binary_only/not-a-date-time/test
@@ -1,7 +1,7 @@
 #!/bin/bash
 
 numpy_int=$(
-python -c "
+python3 -c "
 from comma.csv import *
 t = struct( 'f', *format.to_numpy('t') )
 s = stream( t, binary=True )
diff --git a/python/comma/csv/test/stream/buffer_size/test b/python/comma/csv/test/stream/buffer_size/test
index 5598de759..3a4ae9b61 100755
--- a/python/comma/csv/test/stream/buffer_size/test
+++ b/python/comma/csv/test/stream/buffer_size/test
@@ -1,12 +1,12 @@
 #!/bin/bash
 
-function get_buffer_size_in_bytes { python -c "from __future__ import print_function; import comma; print( comma.csv.stream.buffer_size_in_bytes )"; }
+function get_buffer_size_in_bytes { python3 -c "from __future__ import print_function; import comma; print( comma.csv.stream.buffer_size_in_bytes )"; }
 
 function get_default_size
 {
     local fields=$1
     local type=$2
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 from __future__ import print_function
 import sys
 import comma
@@ -21,6 +21,6 @@ END
 echo "buffer_size_in_bytes=$( get_buffer_size_in_bytes )"
 
 fields="x,y"
-echo "number_of_fields=$( python -c "from __future__ import print_function; s = '$fields'; print( len( s.split(',') ) )" )"
+echo "number_of_fields=$( python3 -c "from __future__ import print_function; s = '$fields'; print( len( s.split(',') ) )" )"
 echo "size/uint8=$( get_default_size $fields uint8 )"
 echo "size/float64=$( get_default_size $fields float64 )"
diff --git a/python/comma/csv/test/stream/default_values/basic/test b/python/comma/csv/test/stream/default_values/basic/test
index 7d41d9288..3c7220d5b 100755
--- a/python/comma/csv/test/stream/default_values/basic/test
+++ b/python/comma/csv/test/stream/default_values/basic/test
@@ -6,7 +6,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/full_xpath_is_false/test b/python/comma/csv/test/stream/default_values/full_xpath_is_false/test
index d036f408e..440db7021 100755
--- a/python/comma/csv/test/stream/default_values/full_xpath_is_false/test
+++ b/python/comma/csv/test/stream/default_values/full_xpath_is_false/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/ignore/field_in_stream/test b/python/comma/csv/test/stream/default_values/ignore/field_in_stream/test
index 01a2cc00d..da3e582b8 100755
--- a/python/comma/csv/test/stream/default_values/ignore/field_in_stream/test
+++ b/python/comma/csv/test/stream/default_values/ignore/field_in_stream/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/ignore/field_not_in_struct/test b/python/comma/csv/test/stream/default_values/ignore/field_not_in_struct/test
index bb7aea2de..5579a152b 100755
--- a/python/comma/csv/test/stream/default_values/ignore/field_not_in_struct/test
+++ b/python/comma/csv/test/stream/default_values/ignore/field_not_in_struct/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/no_missing_fields/test b/python/comma/csv/test/stream/default_values/no_missing_fields/test
index 1429b376a..501aaf4b7 100755
--- a/python/comma/csv/test/stream/default_values/no_missing_fields/test
+++ b/python/comma/csv/test/stream/default_values/no_missing_fields/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/size/test b/python/comma/csv/test/stream/default_values/size/test
index 0b5909c09..bf896ecc4 100755
--- a/python/comma/csv/test/stream/default_values/size/test
+++ b/python/comma/csv/test/stream/default_values/size/test
@@ -8,7 +8,7 @@ function default_values
 {
     local input_format=$1
     local size=$( cat size )
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 comma.csv.time.zone( 'UTC' )
 point_t = comma.csv.struct( 'id,signal,x,y,z', 'uint64', '(2,)float64', 'float64', 'float64', 'int64' )
diff --git a/python/comma/csv/test/stream/dump/no_mask/test b/python/comma/csv/test/stream/dump/no_mask/test
index f9536fe1b..f76a7fc62 100755
--- a/python/comma/csv/test/stream/dump/no_mask/test
+++ b/python/comma/csv/test/stream/dump/no_mask/test
@@ -6,7 +6,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,mask', 'float64', 'float64', 'uint32' )
diff --git a/python/comma/csv/test/stream/dump/with_mask/test b/python/comma/csv/test/stream/dump/with_mask/test
index 7d52d2188..a8e664ddc 100755
--- a/python/comma/csv/test/stream/dump/with_mask/test
+++ b/python/comma/csv/test/stream/dump/with_mask/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,mask', 'float64', 'float64', 'uint32' )
diff --git a/python/comma/csv/test/stream/duplicates/expected_fields/test b/python/comma/csv/test/stream/duplicates/expected_fields/test
index ad2836af7..dacc4a8f3 100755
--- a/python/comma/csv/test/stream/duplicates/expected_fields/test
+++ b/python/comma/csv/test/stream/duplicates/expected_fields/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/duplicates/other_fields/test b/python/comma/csv/test/stream/duplicates/other_fields/test
index 674b0e132..6c24d7eee 100755
--- a/python/comma/csv/test/stream/duplicates/other_fields/test
+++ b/python/comma/csv/test/stream/duplicates/other_fields/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/empty_input/test b/python/comma/csv/test/stream/empty_input/test
index bf4a2ec61..d950ca766 100755
--- a/python/comma/csv/test/stream/empty_input/test
+++ b/python/comma/csv/test/stream/empty_input/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/array/test_1d/test b/python/comma/csv/test/stream/fields/array/test_1d/test
index 5ebce3c24..c24fe2bb9 100755
--- a/python/comma/csv/test/stream/fields/array/test_1d/test
+++ b/python/comma/csv/test/stream/fields/array/test_1d/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/array/test_2d/test b/python/comma/csv/test/stream/fields/array/test_2d/test
index d0f3a4f52..7d4750fed 100755
--- a/python/comma/csv/test/stream/fields/array/test_2d/test
+++ b/python/comma/csv/test/stream/fields/array/test_2d/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/array/test_3d/test b/python/comma/csv/test/stream/fields/array/test_3d/test
index 06e22cda6..98f49489d 100755
--- a/python/comma/csv/test/stream/fields/array/test_3d/test
+++ b/python/comma/csv/test/stream/fields/array/test_3d/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/basic/test b/python/comma/csv/test/stream/fields/basic/test
index b8ff4b082..a36a4d226 100755
--- a/python/comma/csv/test/stream/fields/basic/test
+++ b/python/comma/csv/test/stream/fields/basic/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/extra_field_names/test b/python/comma/csv/test/stream/fields/extra_field_names/test
index d3df29eb5..4773393de 100755
--- a/python/comma/csv/test/stream/fields/extra_field_names/test
+++ b/python/comma/csv/test/stream/fields/extra_field_names/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
    local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/missing_fields/one/test b/python/comma/csv/test/stream/fields/missing_fields/one/test
index 41ea3e7eb..62368ce0d 100755
--- a/python/comma/csv/test/stream/fields/missing_fields/one/test
+++ b/python/comma/csv/test/stream/fields/missing_fields/one/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/fields/missing_fields/several/test b/python/comma/csv/test/stream/fields/missing_fields/several/test
index 12cbca8ba..cd486f230 100755
--- a/python/comma/csv/test/stream/fields/missing_fields/several/test
+++ b/python/comma/csv/test/stream/fields/missing_fields/several/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/fields/read/test b/python/comma/csv/test/stream/fields/read/test
index 008f6cd7e..0143734fc 100755
--- a/python/comma/csv/test/stream/fields/read/test
+++ b/python/comma/csv/test/stream/fields/read/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/shorthand/test b/python/comma/csv/test/stream/fields/shorthand/test
index 9d9f31868..2887bb9f9 100755
--- a/python/comma/csv/test/stream/fields/shorthand/test
+++ b/python/comma/csv/test/stream/fields/shorthand/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/size/test b/python/comma/csv/test/stream/fields/size/test
index 97a65250c..a9e8d756e 100755
--- a/python/comma/csv/test/stream/fields/size/test
+++ b/python/comma/csv/test/stream/fields/size/test
@@ -8,7 +8,7 @@ function process_records
 {
     local size=$1
     local input_format=$2
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/files/test b/python/comma/csv/test/stream/files/test
index e379df890..9eed7373e 100755
--- a/python/comma/csv/test/stream/files/test
+++ b/python/comma/csv/test/stream/files/test
@@ -9,7 +9,7 @@ function process_records
     local input_format=$1
     local in=$2
     local out=$3
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/flush/test b/python/comma/csv/test/stream/flush/test
index 577f6ea49..8f626bf59 100755
--- a/python/comma/csv/test/stream/flush/test
+++ b/python/comma/csv/test/stream/flush/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/iter/test b/python/comma/csv/test/stream/iter/test
index 5e2534a6c..ba8e0c2e0 100755
--- a/python/comma/csv/test/stream/iter/test
+++ b/python/comma/csv/test/stream/iter/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/leaves/ambiguous/test b/python/comma/csv/test/stream/leaves/ambiguous/test
index 6a80007ee..71c44631e 100755
--- a/python/comma/csv/test/stream/leaves/ambiguous/test
+++ b/python/comma/csv/test/stream/leaves/ambiguous/test
@@ -2,7 +2,7 @@
 
 function ambiguous_fields
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/leaves/basic/test b/python/comma/csv/test/stream/leaves/basic/test
index 600a383c9..420d61ae9 100755
--- a/python/comma/csv/test/stream/leaves/basic/test
+++ b/python/comma/csv/test/stream/leaves/basic/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/leaves/slash/test b/python/comma/csv/test/stream/leaves/slash/test
index 2347fec04..869c9f64c 100755
--- a/python/comma/csv/test/stream/leaves/slash/test
+++ b/python/comma/csv/test/stream/leaves/slash/test
@@ -2,7 +2,7 @@
 
 function slash
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/one_field/test b/python/comma/csv/test/stream/one_field/test
index 9a90c9a34..76f9a4c5b 100755
--- a/python/comma/csv/test/stream/one_field/test
+++ b/python/comma/csv/test/stream/one_field/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x', 'float64' )
diff --git a/python/comma/csv/test/stream/recarray/test b/python/comma/csv/test/stream/recarray/test
index c4088d4a9..cc025d9cb 100755
--- a/python/comma/csv/test/stream/recarray/test
+++ b/python/comma/csv/test/stream/recarray/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/size/test b/python/comma/csv/test/stream/size/test
index aa61f9d4a..ee912c968 100755
--- a/python/comma/csv/test/stream/size/test
+++ b/python/comma/csv/test/stream/size/test
@@ -8,7 +8,7 @@ function process_records
 {
     local size=$1
     local input_format=$2
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/standard_field_names/test b/python/comma/csv/test/stream/standard_field_names/test
index c1f2a3d7a..bd49a23bb 100755
--- a/python/comma/csv/test/stream/standard_field_names/test
+++ b/python/comma/csv/test/stream/standard_field_names/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test b/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test
index a4754d1e1..2ad7dfc7a 100755
--- a/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test
+++ b/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 from __future__ import print_function
 import comma
 import numpy
diff --git a/python/comma/csv/test/stream/stdin/corrupt_input/binary/test b/python/comma/csv/test/stream/stdin/corrupt_input/binary/test
index ec1cd6000..81f61352b 100755
--- a/python/comma/csv/test/stream/stdin/corrupt_input/binary/test
+++ b/python/comma/csv/test/stream/stdin/corrupt_input/binary/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 from __future__ import print_function
 import comma
 import numpy
diff --git a/python/comma/csv/test/stream/stdin/simple/test b/python/comma/csv/test/stream/stdin/simple/test
index 311cc7826..04da5b08c 100755
--- a/python/comma/csv/test/stream/stdin/simple/test
+++ b/python/comma/csv/test/stream/stdin/simple/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/tied/basic/test b/python/comma/csv/test/stream/tied/basic/test
index ed2b3f331..ca0f094d4 100755
--- a/python/comma/csv/test/stream/tied/basic/test
+++ b/python/comma/csv/test/stream/tied/basic/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/tied/mixedup/test b/python/comma/csv/test/stream/tied/mixedup/test
index d9a86908b..d3fb26177 100755
--- a/python/comma/csv/test/stream/tied/mixedup/test
+++ b/python/comma/csv/test/stream/tied/mixedup/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/timedelta/test b/python/comma/csv/test/stream/timedelta/test
index 4082f1666..151537abf 100755
--- a/python/comma/csv/test/stream/timedelta/test
+++ b/python/comma/csv/test/stream/timedelta/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/struct/test b/python/comma/csv/test/struct/test
index 2ca45ac28..b2ebab968 100755
--- a/python/comma/csv/test/struct/test
+++ b/python/comma/csv/test/struct/test
@@ -1,14 +1,14 @@
 #!/bin/bash
 
-function types_incorrect_name { python -c "import comma; point_t = comma.csv.struct( 'x', 'invalid' )"; }
-function types_empty_name { python -c "import comma; point_t = comma.csv.struct( 'x', '' )"; }
-function types_insufficient_number { python -c "import comma; point_t = comma.csv.struct( 'x,y', 'float64' )"; }
-function duplicate_field { python -c "import comma; point_t = comma.csv.struct( 'x,x,z', 'float64', 'int32', 'float64' )"; }
-function field_with_slash { python -c "import comma; point_t = comma.csv.struct( 'x,x/y,z', 'float64', 'int32', 'float64' )"; }
+function types_incorrect_name { python3 -c "import comma; point_t = comma.csv.struct( 'x', 'invalid' )"; }
+function types_empty_name { python3 -c "import comma; point_t = comma.csv.struct( 'x', '' )"; }
+function types_insufficient_number { python3 -c "import comma; point_t = comma.csv.struct( 'x,y', 'float64' )"; }
+function duplicate_field { python3 -c "import comma; point_t = comma.csv.struct( 'x,x,z', 'float64', 'int32', 'float64' )"; }
+function field_with_slash { python3 -c "import comma; point_t = comma.csv.struct( 'x,x/y,z', 'float64', 'int32', 'float64' )"; }
 
 function excess_number_of_types
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 point_t = comma.csv.struct( 'x,y', 'float64','float64','uint64' )
@@ -23,7 +23,7 @@ END
 
 function blank_fields
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 point_t = comma.csv.struct( ',,z', 'float64', 'int32', 'float64' )
@@ -36,7 +36,7 @@ END
 
 function basic
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import numpy
 import comma
 
@@ -51,7 +51,7 @@ END
 
 function shorthand
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 from __future__ import print_function
 import comma
 
@@ -67,7 +67,7 @@ END
 
 function leaves
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 from __future__ import print_function
 import comma
 
@@ -84,7 +84,7 @@ END
 function record
 {
     local what=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 from __future__ import print_function
 import comma
 
@@ -99,7 +99,7 @@ END
 function assign()
 {
     local what=$1
-    python -c "
+    python3 -c "
 from __future__ import print_function
 import sys
 import numpy as np
@@ -110,7 +110,7 @@ class test_class:
     class nested:
         def __init__( self ):
             self.a = int( 3 )
-            
+
     def __init__( self ):
         self.a = int( 1 )
         self.b = float( 2 )
diff --git a/python/comma/csv/test/unit/test b/python/comma/csv/test/unit/test
index e4997a032..6724cd089 100755
--- a/python/comma/csv/test/unit/test
+++ b/python/comma/csv/test/unit/test
@@ -3,5 +3,5 @@
 name=$( basename $0 )
 
 for t in test_*.py; do
-    python $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed" >&2; exit 1; }
+    python3 $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed" >&2; exit 1; }
 done
diff --git a/python/comma/csv/time.py b/python/comma/csv/time.py
index 742773092..65000e66b 100644
--- a/python/comma/csv/time.py
+++ b/python/comma/csv/time.py
@@ -39,7 +39,7 @@ def to_numpy(t):
     >>> to_numpy('')
     numpy.datetime64('NaT')
     """
-    if NUMPY_VERSION_MAJOR_ == 1 and NUMPY_VERSION_MAJOR_ < 14 and isinstance( t, bytes ): t = t.decode( 'utf-8' ) # quick and dirty, since ubuntu 18.04 python3-numpy still install numpy 1.13; remove once move on with the version since it's waste of cpu cycles
+    if NUMPY_VERSION_MAJOR_ == 1 and NUMPY_VERSION_MAJOR_ < 14 and isinstance( t, bytes ): t = t.decode( 'utf-8' ) # quick and dirty, since some packages, e.g. ubuntu 18.04 python3-numpy, still install numpy 1.13; remove once move on with the version since it's waste of cpu cycles
     if t in ['', 'not-a-date-time']: return NOT_A_DATE_TIME
     if t in ['+infinity', '+inf', 'infinity', 'inf']: return POSITIVE_INFINITY
     if t in ['-infinity', '-inf']: return NEGATIVE_INFINITY
diff --git a/python/comma/numpy/test/test b/python/comma/numpy/test/test
index e4997a032..6724cd089 100755
--- a/python/comma/numpy/test/test
+++ b/python/comma/numpy/test/test
@@ -3,5 +3,5 @@
 name=$( basename $0 )
 
 for t in test_*.py; do
-    python $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed" >&2; exit 1; }
+    python3 $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed" >&2; exit 1; }
 done
diff --git a/python/comma/test/performance/csv/calc/max/data/max b/python/comma/test/performance/csv/calc/max/data/max
index 43b7f6ca1..d89e0dd60 100755
--- a/python/comma/test/performance/csv/calc/max/data/max
+++ b/python/comma/test/performance/csv/calc/max/data/max
@@ -1,4 +1,4 @@
-#!/usr/bin/python
+#!/usr/bin/env python3
 import numpy as np
 import comma
 t = comma.csv.struct( 'id,value', 'u4', 'f8' )
@@ -11,4 +11,3 @@ for data in s:
             continue
         max[id] = current_max
 s.write(np.array(max.items(), dtype=t))
-
diff --git a/python/comma/test/performance/csv/calc/test b/python/comma/test/performance/csv/calc/test
index 0d1c6cebe..230e6d433 100755
--- a/python/comma/test/performance/csv/calc/test
+++ b/python/comma/test/performance/csv/calc/test
@@ -4,7 +4,7 @@ function generate_uniform_input
 {
     local size=$1
     local number_of_ids=100
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import numpy as np
 import comma
 t = comma.csv.struct('id,value', 'u4', 'f8')
@@ -23,7 +23,7 @@ END
 function generate_random_input
 {
     local size=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import numpy as np
 import comma
 t = comma.csv.struct('id,value', 'u4', 'f8')
@@ -71,4 +71,3 @@ python_script=$( pwd )/$python_script
 
 ( mkdir -p output/random && cd output/random && process random )
 ( mkdir -p output/uniform && cd output/uniform && process uniform )
-
diff --git a/python/comma/test/performance/csv/stream/test b/python/comma/test/performance/csv/stream/test
index 36f0c29d3..36d9494a5 100755
--- a/python/comma/test/performance/csv/stream/test
+++ b/python/comma/test/performance/csv/stream/test
@@ -11,7 +11,7 @@ function output_code
         *) echo "$scriptname: expected --ascii or --binary, got '$1'"; exit 1 ;;
     esac
 cat <<END
-#!/usr/bin/python
+#!/usr/bin/env python3
 
 import comma
 comma.csv.time.zone( 'UTC' )
diff --git a/python/setup.py b/python/setup.py
index 9748152e8..570a46594 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -1,4 +1,4 @@
-#!/usr/bin/env python
+#!/usr/bin/env python3
 
 import setuptools #from distutils.core import setup
 import comma.version
@@ -28,7 +28,7 @@
         author_email        = "vsevolod.vlaskine@gmail.com",
         maintainer          = 'vsevolod vlaskine',
         maintainer_email    = 'vsevolod.vlaskine@gmail.com',
-        python_requires     = '>=2.7', # 3.6
+        python_requires     = '>=3.6',
         install_requires    = [ 'numpy' ], # todo?
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma': 'comma', 'comma.cpp_bindings': 'comma/cpp_bindings' },
diff --git a/system/launchpad/readme b/system/launchpad/readme
index a89b95867..38a9babd7 100644
--- a/system/launchpad/readme
+++ b/system/launchpad/readme
@@ -21,7 +21,7 @@ uploading to pypi (i know, wrong place)
 
 cd comma/python
 # bump up version in version.py
-python setup.py sdist bdist_wheel
+python3 setup.py sdist bdist_wheel
 twine upload --repository-url https://pypi.org/legacy/ dist/* # test
 twine upload dist/*
 

From 3253155a8d61bbf4d25dbb9d77de1dcbd968b926 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 18 May 2022 13:23:24 +1000
Subject: [PATCH 0502/1056] python: cmake: use python setup.py instead of pip
 for now

---
 python/CMakeLists.txt | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/python/CMakeLists.txt b/python/CMakeLists.txt
index ced969491..94d059f5d 100644
--- a/python/CMakeLists.txt
+++ b/python/CMakeLists.txt
@@ -81,14 +81,14 @@ ADD_CUSTOM_TARGET( python_build ALL
                    ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE}
                    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )
 
-#INSTALL( CODE "EXECUTE_PROCESS(
-#                    COMMAND ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE} install ${INSTALL_PREFIX_OPTION} --force
-#                    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
-
-install( CODE "EXECUTE_PROCESS(
-                    COMMAND ${PYTHON} -m pip install ${CMAKE_CURRENT_SOURCE_DIR} --ignore-installed
+INSTALL( CODE "EXECUTE_PROCESS(
+                    COMMAND ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE} install ${INSTALL_PREFIX_OPTION} --force
                     WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
 
+#install( CODE "EXECUTE_PROCESS(
+#                    COMMAND ${PYTHON} -m pip install ${CMAKE_CURRENT_SOURCE_DIR} --ignore-installed
+#                    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
+
 SET_DIRECTORY_PROPERTIES( PROPERTIES ADDITIONAL_MAKE_CLEAN_FILES build )
 
 IF( ADD_PYTHON_PACKAGES_TO_RPM )

From cbb6caf856f86fbeced4413e1e2b12f0905bd07e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 18 May 2022 16:36:33 +1000
Subject: [PATCH 0503/1056] cmake: CPACK_DEPENDENCIES_PYTHON added, OFF by
 default

---
 CMakeLists.txt | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index b976d08c8..fd9ebe140 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -366,11 +366,15 @@ set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} )
 set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} )
 set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} )
 set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04 or later" )
+option( CPACK_DEPENDENCIES_PYTHON "add python dependencies, currently: python3-numpy" OFF )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "comma-py, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc (>=6)" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev (>=6)" )
 #set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev" )
 #set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
 set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev" )
+if( CPACK_DEPENDENCIES_PYTHON )
+    set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEBIAN_PACKAGE_DEPENDS}, python3-numpy" )
+endif( CPACK_DEPENDENCIES_PYTHON )
 set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc-dev" )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
 set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS_POLICY ON )

From 77393e6d8c78e3d12b1824fe410d30d56725cda7 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 31 May 2022 21:35:00 +1000
Subject: [PATCH 0504/1056] name-value-get: trailing new line added to
 path-value output

---
 name_value/applications/name-value-get.cpp | 45 ++++++++++-------
 name_value/ptree.cpp                       | 59 ++++++++--------------
 name_value/test/name-value-get/expected    |  8 +--
 name_value/test/name-value-get/input       |  2 +-
 name_value/test/regex/expected             |  6 +--
 5 files changed, 55 insertions(+), 65 deletions(-)

diff --git a/name_value/applications/name-value-get.cpp b/name_value/applications/name-value-get.cpp
index 060a1300a..239177d99 100644
--- a/name_value/applications/name-value-get.cpp
+++ b/name_value/applications/name-value-get.cpp
@@ -151,7 +151,7 @@ template <> struct traits< path_value > // quick and dirty
         ptree = comma::property_tree::from_path_value_string( line, equal_sign, path_value_delimiter, check_type, true );
     }
     static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const std::string& path )
-    { 
+    {
         static bool first = true; // todo: will not work linewise, fix
         if( !first ) { std::cout << path_value_delimiter; }
         first = false;
@@ -164,30 +164,36 @@ static std::vector< boost::property_tree::ptree::path_type > paths;
 static std::vector< boost::optional< boost::regex > > path_regex;
 static void ( * input )( std::istream& is, boost::property_tree::ptree& ptree );
 static void ( * output )( std::ostream& is, const boost::property_tree::ptree& ptree, const std::string& );
+static bool output_last_line_break = false;
 
 static void match_( std::ostream& os, const boost::property_tree::ptree& ptree )
 {
     static const boost::property_tree::ptree::path_type empty;
+    bool found = false;
     for( std::size_t i = 0; i < paths.size(); ++i )
     {
         boost::optional< const boost::property_tree::ptree& > child = comma::property_tree::get_tree(ptree, path_strings[i]);
         if( !child ) { continue; }
         boost::optional< std::string > value = child->get_optional< std::string >( empty );
-        if( value && !value->empty() )
-        { 
+        if( value && !value->empty() ) // todo! homogenise single values with path-value pairs; currently the following example will output junk: ( echo x/z=0; echo y=1 ) | name-value-get x y
+        {
+            if( found ) { os << path_value_delimiter; }
             if( output_path ) { os << path_strings[i] << equal_sign; }
-            os << *value << std::endl;
+            os << *value;
         }
         else
-        { 
+        {
             output( os, *child, path_strings[i] );
         }
+        found = true;
     }
+    if( found && output_last_line_break ) { os << std::endl; }
 }
 
-static void traverse_( std::ostream& os, const boost::property_tree::ptree& ptree, boost::property_tree::ptree::const_iterator it, comma::xpath& path )
+static bool traverse_( std::ostream& os, const boost::property_tree::ptree& ptree, boost::property_tree::ptree::const_iterator it, comma::xpath& path )
 {
     static const boost::property_tree::ptree::path_type empty;
+    static bool found = false;
     path /= it->first;
     const std::string& s = path.to_string( '/' ); // quick and dirty
     for( std::size_t i = 0; i < paths.size(); ++i ) // todo: quick and dirty: can prune much earlier, i guess...
@@ -197,30 +203,32 @@ static void traverse_( std::ostream& os, const boost::property_tree::ptree& ptre
         boost::optional< const boost::property_tree::ptree& > child = ptree.get_child_optional( path.to_string( '.' ) ); // quick and dirty, watch performance
         if( !child ) { continue; }
         boost::optional< std::string > value = child->get_optional< std::string >( empty );
-        if( value && !value->empty() )
-        { 
+        if( value && !value->empty() ) // todo! homogenise single values with path-value pairs; currently the following example will output junk: ( echo x/z=0; echo y=1 ) | name-value-get x y
+        {
+            if( found ) { os << path_value_delimiter; }
             if( output_path ) { os << s << equal_sign; }
-            os << *value << std::endl;
+            os << *value;
         }
         else
         {
             output( os, *child, s );
         }
+        found = true;
     }
-    for( boost::property_tree::ptree::const_iterator j = it->second.begin(); j != it->second.end(); ++j )
-    {
-        traverse_( os, ptree, j, path );
-    }
-    if( !(it->first.empty()) ) { path = path.head(); }
+    for( boost::property_tree::ptree::const_iterator j = it->second.begin(); j != it->second.end(); ++j ) { traverse_( os, ptree, j, path ); }
+    if( !( it->first.empty() ) ) { path = path.head(); }
+    return found; // todo! aweful!
 }
 
 void match_regex_( std::ostream& os, const boost::property_tree::ptree& ptree )
 {
+    bool found = false;
     for( boost::property_tree::ptree::const_iterator i = ptree.begin(); i != ptree.end(); ++i )
     {
         comma::xpath path;
-        traverse_( os, ptree, i, path );
+        found = traverse_( os, ptree, i, path ) || found;
     }
+    if( found && output_last_line_break ) { os << std::endl; }
 }
 
 static bool is_regex_(const std::string& s)
@@ -228,7 +236,7 @@ static bool is_regex_(const std::string& s)
     std::string regex_characters = regex_characters_;
     if (option_regex) { regex_characters += "[]"; }
     for( unsigned int k = 0; k < regex_characters.size(); ++k )
-    { 
+    {
         if( s.find_first_of( regex_characters[k] ) != std::string::npos ) { return true; }
     }
     return false;
@@ -263,13 +271,14 @@ int main( int ac, char** av )
         boost::optional< char > delimiter = options.optional< char >( "--delimiter,-d" );
         path_value_delimiter = delimiter ? *delimiter : ( linewise ? ',' : '\n' );
         output_path = options.exists( "--output-path" );
+        if( output_path && to != "path-value" ) { std::cerr << "name-value-get: --output-path is compatible only with --to=path-value; got: --to=" << to << std::endl; return 1; }
         if( from )
         {
             if( *from == "ini" ) { input = &traits< ini >::input; }
             else if( *from == "info" ) { input = &traits< info >::input; }
             else if( *from == "json" ) { input = &traits< json >::input; }
             else if( *from == "xml" ) { input = &traits< xml >::input; }
-            else if( *from == "path-value" ) { input = &traits< path_value >::input; }
+            else if( *from == "path-value" ) { input = &traits< path_value >::input; } // super-quick and dirty!
             else { std::cerr << "name-value-get: expected --from format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
         }
         else
@@ -281,7 +290,7 @@ int main( int ac, char** av )
         else if( to == "info" ) { output = &traits< info >::output; }
         else if( to == "json" ) { output = &traits< json >::output; }
         else if( to == "xml" ) { output = &traits< xml >::output; }
-        else if( to == "path-value" ) { output = &traits< path_value >::output; }
+        else if( to == "path-value" ) { output = &traits< path_value >::output; output_last_line_break = true; }
         else { std::cerr << "name-value-get: expected --to format to be ini, info, json, xml, or path-value, got " << to << std::endl; return 1; }
         indices_mode = options.exists( "--no-brackets" ) ? comma::property_tree::without_brackets : comma::property_tree::with_brackets;
         if( linewise )
diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index a42a6c985..78f9454d5 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author cedric wohlleber
 /// @author vsevolod vlaskine
@@ -50,7 +23,7 @@
 #include "ptree.h"
 
 namespace comma {
-    
+
 void property_tree::put( boost::property_tree::ptree& ptree, const xpath& path, const std::string& value, bool use_index )
 {
     boost::property_tree::ptree* t = &ptree;
@@ -132,7 +105,7 @@ boost::optional< std::string > property_tree::get( const boost::property_tree::p
     if( !t ) { return boost::none; }
     return t->get_value_optional< std::string >();
 }
-    
+
 } // namespace comma {
 
 namespace comma { namespace impl {
@@ -145,15 +118,23 @@ static void ptree_output_value_( std::ostream& os, const std::string& value, boo
     os << path.to_string() << equal_sign;
     bool quoted = true;
     if( unquote_numbers )
-    { 
+    {
         if( "true" == value || "false" == value ) { quoted = false; }
         else if( !boost::regex_match( value, number_like_string ) ) { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} }
     }
     if( quoted ) { os << '"' << value << '"'; } else { os << value; }
 }
 
-static void ptree_to_path_value_string_impl( std::ostream& os, boost::property_tree::ptree::const_iterator i, bool is_begin, xpath& path, xpath& display_path, 
-                                                    property_tree::path_mode mode, char equal_sign, char delimiter, const std::string& root, bool const unquote_numbers )
+static void ptree_to_path_value_string_impl( std::ostream& os
+                                           , boost::property_tree::ptree::const_iterator i
+                                           , bool is_begin
+                                           , xpath& path
+                                           , xpath& display_path
+                                           , property_tree::path_mode mode
+                                           , char equal_sign
+                                           , char delimiter
+                                           , const std::string& root
+                                           , bool const unquote_numbers )
 {
     if( i->second.begin() == i->second.end() )
     {
@@ -169,7 +150,7 @@ static void ptree_to_path_value_string_impl( std::ostream& os, boost::property_t
             const std::string& stripped = comma::strip( *v );
             if( !stripped.empty() )  { ptree_output_value_( os, stripped, is_begin, display_path, equal_sign, delimiter, root, unquote_numbers );  }
         }
-        
+
         comma::uint32 index=0;
         for( boost::property_tree::ptree::const_iterator j = i->second.begin(); j != i->second.end(); ++j )
         {
@@ -195,7 +176,7 @@ void property_tree::to_path_value( std::ostream& os, const boost::property_tree:
     {
         // display_path is the modified key path showing array indices, if array exists within e.g abc[0]/xyz[0]
         // But the actual path to the value is many empty keys under abc and abc/xyz
-        // Boost: "JSON arrays are mapped to nodes. Each element is a child node with an empty name. 
+        // Boost: "JSON arrays are mapped to nodes. Each element is a child node with an empty name.
         //         If a node has both named and unnamed child nodes, it cannot be mapped to a JSON representation."
         // http://www.boost.org/doc/libs/1_41_0/doc/html/boost_propertytree/parsers.html#boost_propertytree.parsers.json_parser
         xpath path;
@@ -241,7 +222,7 @@ template <> struct path_filter< property_tree::path_value::no_overwrite >
     bool put_allowed( const std::string& p, bool use_index ) const
     {
         if( use_index )
-        { 
+        {
             if( property_tree::get( ptree_, p, use_index ) ) { COMMA_THROW( comma::exception, "input path '" << p << "' already in the tree" ); }
         }
         else
@@ -328,11 +309,11 @@ bool is_seekable( std::istream& stream ) { return static_cast< bool >( stream.se
 
 void property_tree::from_unknown( std::istream& stream, boost::property_tree::ptree& ptree, property_tree::path_value::check_repeated_paths check_type, char equal_sign, char delimiter, bool use_index )
 {
-    if( is_seekable( stream ) ) 
+    if( is_seekable( stream ) )
     {
-        from_unknown_seekable( stream, ptree, check_type, equal_sign, delimiter, use_index ); 
+        from_unknown_seekable( stream, ptree, check_type, equal_sign, delimiter, use_index );
     }
-    else 
+    else
     {
         std::stringstream buffer;
         buffer << stream.rdbuf();
@@ -396,7 +377,7 @@ static boost::property_tree::ptree xml_to_ptree_( boost::property_tree::ptree& p
 
 void property_tree::read_xml( std::istream& is, boost::property_tree::ptree& ptree )
 {
-        boost::property_tree::read_xml( is, ptree ); 
+        boost::property_tree::read_xml( is, ptree );
         ptree=xml_to_ptree_(ptree);
 }
 
diff --git a/name_value/test/name-value-get/expected b/name_value/test/name-value-get/expected
index bdc7f1975..317e32094 100644
--- a/name_value/test/name-value-get/expected
+++ b/name_value/test/name-value-get/expected
@@ -11,14 +11,14 @@ empty_input[0]/output=''
 non_existant[0]/output=''
 non_existant[1]/output=''
 
-multiple_results[0]/output='c="0";c="1"'
-multiple_results[1]/output='c="0";d="1";e="2"'
+multiple_results[0]/output='c="0";c="1";'
+multiple_results[1]/output='c="0";d="1";e="2";'
 
 indexed_path[0]/output='1'
 indexed_path[1]/output='1'
-indexed_path[2]/output='c="0"'
+indexed_path[2]/output='c="0";'
 indexed_path[3]/output='1'
-indexed_path[4]/output='b[0]/c="0";b[1]/c="1"'
+indexed_path[4]/output='b[0]/c="0";b[1]/c="1";'
 
 regex[0]/output='1'
 regex[1]/output='0;1;'
diff --git a/name_value/test/name-value-get/input b/name_value/test/name-value-get/input
index e17167dda..e1d56b2df 100644
--- a/name_value/test/name-value-get/input
+++ b/name_value/test/name-value-get/input
@@ -11,7 +11,7 @@ non_existant[1]=echo '{ "a": 1, "b": 2, "c": { "d": 3 }}' | name-value-get x/b
 
 empty_input[0]=name-value-get x < /dev/null
 
-multiple_results[0]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-convert --to json | name-value-get a/b | tr \'\\\n\' \';\'"
+multiple_results[0]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-convert --to json | name-value-get a/b | tr '\\n' ';'"
 multiple_results[1]="( echo a/b/c=0; echo a/b/d=1; echo a/b/e=2; ) | name-value-get a/b | tr \'\\\n\' \';\'"
 
 indexed_path[0]="echo a[0]=1 | name-value-get a[0]"
diff --git a/name_value/test/regex/expected b/name_value/test/regex/expected
index bd52695f3..624277f58 100644
--- a/name_value/test/regex/expected
+++ b/name_value/test/regex/expected
@@ -10,13 +10,13 @@ test[4]/output='b'
 test[4]/status=0
 #test[5]/output='a;b;'
 #test[5]/status=0
-test[6]/output='y[0]="a";y[1]="b"'
+test[6]/output='y[0]="a";y[1]="b";'
 test[6]/status=0
-test[7]/output='y[0]="4";y[0]="5"'
+test[7]/output='y[0]="4";y[0]="5";'
 test[7]/status=0
 test[8]/output='4'
 test[8]/status=0
 test[9]/output='5'
 test[9]/status=0
 test[10]/output='6;7;'
-test[10]/status=0
\ No newline at end of file
+test[10]/status=0

From 57766e8805a9a1c4466a1064a93dcb65572d5f26 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 1 Jun 2022 12:04:25 +1000
Subject: [PATCH 0505/1056] name-value-convert: --path implemented and tested

---
Notes (review):
    name-value-convert gains a repeatable --path option and a --strict flag.
    When at least one --path is given, each requested subtree is looked up
    with comma::property_tree::get_tree() and written with the selected
    output function; a path that is not found is skipped, or, with --strict,
    reported on stderr and the program returns 1.
    A path that resolves to a non-empty value is wrapped into a one-element
    tree keyed by the last element of the path, so it is printed as
    name=value (e.g. --path x/y gives y="3").
    --path and --linewise are declared mutually exclusive.
    --to no longer falls back to path-value for an unrecognised format; it
    prints an error and returns 1.
    NOTE(review): that new --to error branch streams *from, not to; `from`
    is only checked for being set inside the --from branch - confirm it
    cannot be dereferenced unset here.
    NOTE(review): a separator between the outputs of successive --path
    values is emitted only when --to is path-value and the delimiter is not
    a newline.
    Licence boilerplate is dropped from name-value-convert.cpp and
    name-value-get.cpp; test cases paths[0]..paths[15] are added.

 .../applications/name-value-convert.cpp       | 65 ++++++++++---------
 name_value/applications/name-value-get.cpp    | 28 --------
 name_value/test/name-value-convert/expected   | 18 +++++
 name_value/test/name-value-convert/input      | 17 +++++
 4 files changed, 71 insertions(+), 57 deletions(-)

diff --git a/name_value/applications/name-value-convert.cpp b/name_value/applications/name-value-convert.cpp
index b228f76d8..ec4f7f5f3 100644
--- a/name_value/applications/name-value-convert.cpp
+++ b/name_value/applications/name-value-convert.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -54,6 +27,10 @@ static void usage( bool verbose = false )
     std::cerr << "data options" << std::endl;
     std::cerr << "    --from <format>: input format; if this options is omitted, input format will be guessed (only for json, xml, and path-value)" << std::endl;
     std::cerr << "    --to <format>: output format; default path-value" << std::endl;
+    std::cerr << "    --path=[<path>]; output data at a given path in the input" << std::endl;
+    std::cerr << "                     multiple instances of --path supported" << std::endl;
+    std::cerr << "                     regex expression support: todo" << std::endl;
+    std::cerr << "    --strict: return error if path specified in --path not found" << std::endl;
     std::cerr << std::endl;
     std::cerr << "formats" << std::endl;
     std::cerr << "    info: info data (see boost::property_tree)" << std::endl;
@@ -167,6 +144,7 @@ int main( int ac, char** av )
         linewise = options.exists( "--linewise,-l" );
         minify_json = options.exists( "--minify" );
         options.assert_mutually_exclusive( "--unquote-numbers,--unquote", "--quote-numbers,--quote" );
+        options.assert_mutually_exclusive( "--path", "--linewise,-l" ); // -l is the short form read by options.exists( "--linewise,-l" ) above
         unquote_numbers = options.exists( "--unquote-numbers,--unquote" );
         quote_numbers = options.exists( "--quote-numbers,--quote" ) && !unquote_numbers; // todo: quick and dirty, combine logic, it sucks now that there is different logic for json and everything else
         if ( options.exists( "--take-last" ) ) check_type = comma::property_tree::path_value::take_last;
@@ -174,6 +152,9 @@ int main( int ac, char** av )
         xml_writer_settings.indent_count = options.value( "--indent", options.exists( "--indented" ) ? 4 : 0 );
         boost::optional< char > delimiter = options.optional< char >( "--delimiter,-d" );
         path_value_delimiter = delimiter ? *delimiter : ( linewise ? ',' : '\n' );
+        const auto& paths = options.values< std::string >( "--path" );
+        bool strict = options.exists( "--strict" );
+        bool output_line_breaks = to == "path-value" && path_value_delimiter != '\n'; // hyper-quick and dirty
         if( from )
         {
             if( *from == "ini" ) { input = &traits< ini >::input; }
@@ -192,7 +173,8 @@ int main( int ac, char** av )
         else if( to == "info" ) { output = &traits< info >::output; }
         else if( to == "json" ) { output = &traits< json >::output; }
         else if( to == "xml" ) { output = &traits< xml >::output; }
-        else { output = &traits< path_value >::output; }
+        else if( to == "path-value" ) { output = &traits< path_value >::output; }
+        else { std::cerr << "name-value-convert: expected --to format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
         if( use_index )
         {
             if( options.exists( "--no-brackets" ) ) { indices_mode = comma::property_tree::without_brackets; }
@@ -233,7 +215,32 @@ int main( int ac, char** av )
         {
             boost::property_tree::ptree ptree;
             input( std::cin, ptree );
-            output( std::cout, ptree, indices_mode );
+            if( paths.empty() )
+            {
+                output( std::cout, ptree, indices_mode );
+            }
+            else
+            {
+                std::string eol;
+                for( const auto& path: paths )
+                {
+                    auto child = comma::property_tree::get_tree( ptree, path ); // paths[i] = boost::property_tree::ptree::path_type( path_strings[i], '/' )
+                    if( !child ) { if( strict ) { std::cerr << "name-value-convert: path \"" << path << "\" not found" << std::endl; return 1; } else { continue; } }
+                    boost::optional< std::string > value = child->get_optional< std::string >( "" );
+                    std::cout << eol;
+                    if( value && !value->empty() ) // todo? output empty values?
+                    {
+                        boost::property_tree::ptree t;
+                        t.add_child( comma::split( path, '/' ).back(), boost::property_tree::ptree() ).put_value( *value ); // quick and dirty; lame...
+                        output( std::cout, t, indices_mode );
+                    }
+                    else
+                    {
+                        output( std::cout, *child, indices_mode );
+                    }
+                    if( output_line_breaks ) { eol = std::string( 1, path_value_delimiter ); } // quick and dirty
+                }
+            }
         }
         return 0;
     }
diff --git a/name_value/applications/name-value-get.cpp b/name_value/applications/name-value-get.cpp
index 239177d99..9991008ff 100644
--- a/name_value/applications/name-value-get.cpp
+++ b/name_value/applications/name-value-get.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
diff --git a/name_value/test/name-value-convert/expected b/name_value/test/name-value-convert/expected
index d8170fca7..14ceb85d1 100644
--- a/name_value/test/name-value-convert/expected
+++ b/name_value/test/name-value-convert/expected
@@ -7,3 +7,21 @@ quoting[6]/output='a=1'
 quoting[4]/output='{"a":"1"}'
 quoting[5]/output='a="1"'
 quoting[6]/output='a=1'
+
+paths[0]/output='a/b="1";a/c="2";x/y="3";x/z="4"'
+paths[1]/output='b="1";c="2"'
+paths[2]/output='b=1;c=2'
+paths[3]/output='y="3";z="4";b="1";c="2"'
+paths[4]/output='y="3"'
+paths[5]/output='y=3'
+paths[6]/output='z="4";y="3"'
+paths[7]/output='y=3;z=4'
+paths[8]/output='z="4";y="3";b="1";c="2"'
+paths[9]/output=''
+paths[9]/status=0
+paths[10]/status=1
+paths[11]/output='b="1";c="2";'
+paths[12]/output='y="3";z="4";b="1";c="2";'
+paths[13]/output='y="3";'
+paths[14]/output='z="4";y="3";'
+paths[15]/output='z="4";y="3";b="1";c="2";'
diff --git a/name_value/test/name-value-convert/input b/name_value/test/name-value-convert/input
index 54cdf54fb..90557b5d0 100644
--- a/name_value/test/name-value-convert/input
+++ b/name_value/test/name-value-convert/input
@@ -7,3 +7,20 @@ quoting[6]="echo a=1 | name-value-convert --to json --minify | name-value-conver
 quoting[4]="echo a=1 | name-value-convert --to json --quote-numbers --minify"
 quoting[5]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert"
 quoting[6]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert --unquote-numbers"
+
+paths[0]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --delimiter=';'"
+paths[1]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path a --delimiter=';'"
+paths[2]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path a --delimiter=';' --unquote-numbers"
+paths[3]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x --path a --delimiter=';'"
+paths[4]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/y --delimiter=';'"
+paths[5]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/y --delimiter=';' --unquote-numbers"
+paths[6]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y --delimiter=';'"
+paths[7]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/y --path x/z --delimiter=';' --unquote-numbers"
+paths[8]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y --path a --delimiter=';'"
+paths[9]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path s/t --delimiter=';'"
+paths[10]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path s/t --strict --delimiter=';'"
+paths[11]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path a | tr '\\n' ';'"
+paths[12]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x --path a | tr '\\n' ';'"
+paths[13]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/y | tr '\\n' ';'"
+paths[14]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y | tr '\\n' ';'"
+paths[15]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y --path a | tr '\\n' ';'"

From 085a239fc2dfc322f3c52126cc3a179b25fa2f7f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 1 Jun 2022 12:15:05 +1000
Subject: [PATCH 0506/1056] name-value-convert: --from/--to: pv as alias for
 path-value added for backward compatibility

---
Notes (review):
    Besides adding the pv alias, this patch corrects the diagnostic for an
    unsupported --to value: it streamed *from (the input format, which the
    surrounding `if( from )` shows may be unset) instead of `to`.
    The blob ids on the index line were recorded before this amendment.
    NOTE(review): output_line_breaks in main() compares `to` with
    "path-value" only - confirm whether --to pv should also enable the
    separator between --path outputs.

 name_value/applications/name-value-convert.cpp | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/name_value/applications/name-value-convert.cpp b/name_value/applications/name-value-convert.cpp
index ec4f7f5f3..f8caf56d2 100644
--- a/name_value/applications/name-value-convert.cpp
+++ b/name_value/applications/name-value-convert.cpp
@@ -25,8 +25,8 @@ static void usage( bool verbose = false )
     std::cerr << "usage: cat data.xml | name-value-convert [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "data options" << std::endl;
-    std::cerr << "    --from <format>: input format; if this options is omitted, input format will be guessed (only for json, xml, and path-value)" << std::endl;
-    std::cerr << "    --to <format>: output format; default path-value" << std::endl;
+    std::cerr << "    --from <format>: input format; if this options is omitted, input format will be guessed; formats: json, xml, path-value/pv" << std::endl;
+    std::cerr << "    --to <format>: output format; formats: ini, json, xml, path-value (pv); default: path-value" << std::endl;
     std::cerr << "    --path=[<path>]; output data at a given path in the input" << std::endl;
     std::cerr << "                     multiple instances of --path supported" << std::endl;
     std::cerr << "                     regex expression support: todo" << std::endl;
@@ -161,7 +161,7 @@ int main( int ac, char** av )
             else if( *from == "info" ) { input = &traits< info >::input; }
             else if( *from == "json" ) { input = &traits< json >::input; }
             else if( *from == "xml" ) { input = &traits< xml >::input; }
-            else if( *from == "path-value" ) { input = &traits< path_value >::input; }
+            else if( *from == "path-value" || *from == "pv" ) { input = &traits< path_value >::input; }
             else { std::cerr << "name-value-convert: expected --from format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
         }
         else
@@ -173,7 +173,7 @@ int main( int ac, char** av )
         else if( to == "info" ) { output = &traits< info >::output; }
         else if( to == "json" ) { output = &traits< json >::output; }
         else if( to == "xml" ) { output = &traits< xml >::output; }
-        else if( to == "path-value" ) { output = &traits< path_value >::output; }
-        else { std::cerr << "name-value-convert: expected --to format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
+        else if( to == "path-value" || to == "pv" ) { output = &traits< path_value >::output; }
+        else { std::cerr << "name-value-convert: expected --to format to be ini, info, json, xml, or path-value, got " << to << std::endl; return 1; }
         if( use_index )
         {

From 9885e3e66595f066953197cbd3149b003a52ae96 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 5 Jun 2022 11:16:33 +1000
Subject: [PATCH 0507/1056] name_value::map: unique constructor flag added

---
Notes (review):
    name_value::map: all three constructors take a trailing
    `bool unique = false`, which is forwarded to init_(); the default keeps
    existing call sites compiling unchanged.
    With unique set, init_() throws comma::exception ("expected unique
    names, got more than one ...") as soon as a name that is already in the
    map is seen again. The check runs before the switch on the number of
    name/value parts, and names without a value count too: "a=1;b;b;c=2"
    throws (covered by the new TEST( name_value, unique )).
    The static as_vector() overloads do not take the flag.
    Private members are renamed m_line/m_map -> _line/_map.
    Licence boilerplate and trailing whitespace are removed from map.h and
    name_value_test.cpp.

 name_value/map.h                    | 77 ++++++++++-------------------
 name_value/test/name_value_test.cpp | 47 +++++-------------
 2 files changed, 38 insertions(+), 86 deletions(-)

diff --git a/name_value/map.h b/name_value/map.h
index 127aa1ae2..802358c1a 100644
--- a/name_value/map.h
+++ b/name_value/map.h
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @authors cedric wohlleber, vsevolod vlaskine
 
@@ -41,23 +13,23 @@
 namespace comma { namespace name_value {
 
 /// constructs a map of name-value pair from an input string
-/// TODO implement full_path_as_name ? 
+/// TODO implement full_path_as_name ?
 class map
 {
     public:
         /// constructor
-        map( const std::string& line, char delimiter = ';', char value_delimiter = '=' );
+        map( const std::string& line, char delimiter = ';', char value_delimiter = '=', bool unique = false );
         /// constructor
-        map( const std::string& line, const std::string& fields, char delimiter = ';', char value_delimiter = '=' );
+        map( const std::string& line, const std::string& fields, char delimiter = ';', char value_delimiter = '=', bool unique = false );
         /// constructor
-        map( const std::string& line, const impl::options& options );
-        
+        map( const std::string& line, const impl::options& options, bool unique = false );
+
         /// return vector of name-value pairs in the given order
         static std::vector< std::pair< std::string, std::string > > as_vector( const std::string& line, char delimiter = ';', char value_delimiter = '=' );
-        
+
         /// return vector of name-value pairs in the given order
         static std::vector< std::pair< std::string, std::string > > as_vector( const std::string& line, const std::string& fields, char delimiter = ';', char value_delimiter = '=' );
-        
+
         /// return vector of name-value pairs in the given order
         static std::vector< std::pair< std::string, std::string > > as_vector( const std::string& line, const impl::options& options );
 
@@ -75,7 +47,7 @@ class map
         /// return first available value, if field exists; otherwise throw
         template < typename T >
         T value( const std::string& name ) const;
-        
+
         /// return first available value, if field exists; otherwise return empty optional
         template < typename T >
         boost::optional< T > optional( const std::string& name ) const;
@@ -84,19 +56,19 @@ class map
         typedef std::multimap< std::string, std::string > map_type;
 
         /// return name-value map
-        const map_type& get() const { return m_map; }
+        const map_type& get() const { return _map; }
 
     private:
-        void init_( const comma::name_value::impl::options& options );
-        const std::string m_line;
-        map_type m_map;
+        void init_( const comma::name_value::impl::options& options, bool unique );
+        const std::string _line;
+        map_type _map;
 };
 
-inline map::map( const std::string& line, char delimiter, char value_delimiter ): m_line( line ) { init_( impl::options( delimiter, value_delimiter ) ); }
+inline map::map( const std::string& line, char delimiter, char value_delimiter, bool unique ): _line( line ) { init_( impl::options( delimiter, value_delimiter ), unique ); }
 
-inline map::map( const std::string& line, const std::string& fields, char delimiter, char value_delimiter ): m_line( line ) { init_( impl::options( fields, delimiter, value_delimiter ) ); }
+inline map::map( const std::string& line, const std::string& fields, char delimiter, char value_delimiter, bool unique ): _line( line ) { init_( impl::options( fields, delimiter, value_delimiter ), unique ); }
 
-inline map::map( const std::string& line, const comma::name_value::impl::options& options ): m_line( line ) { init_( options ); }
+inline map::map( const std::string& line, const comma::name_value::impl::options& options, bool unique ): _line( line ) { init_( options, unique ); }
 
 inline static std::vector< std::string > get_named_values( const std::string& line, const comma::name_value::impl::options& options )
 {
@@ -110,22 +82,23 @@ inline static std::vector< std::string > get_named_values( const std::string& li
     return named_values;
 }
 
-inline void map::init_( const comma::name_value::impl::options& options )
+inline void map::init_( const comma::name_value::impl::options& options, bool unique )
 {
-    const std::vector< std::string >& named_values = get_named_values( m_line, options );
+    const std::vector< std::string >& named_values = get_named_values( _line, options );
     for( std::size_t i = 0; i < named_values.size(); ++i )
     {
-        std::vector< std::string > pair = split_escaped( named_values[i], options.m_value_delimiter, &(options.m_quotes[0]), options.m_escape );
+        std::vector< std::string > pair = split_escaped( named_values[i], options.m_value_delimiter, &( options.m_quotes[0]), options.m_escape );
+        if( unique && pair.size() > 0 && _map.find( pair[0] ) != _map.end() ) { COMMA_THROW_STREAM( comma::exception, "expected unique names, got more than one \"" << pair[0] << "\"" ); }
         switch( pair.size() )
         {
-            case 1: m_map.insert( std::make_pair( pair[0], std::string() ) ); break; // quick and dirty
-            case 2: m_map.insert( std::make_pair( pair[0], pair[1] ) ); break;
+            case 1: _map.insert( std::make_pair( pair[0], std::string() ) ); break; // quick and dirty
+            case 2: _map.insert( std::make_pair( pair[0], pair[1] ) ); break;
             default: { COMMA_THROW_STREAM( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
         }
     }
 }
 
-inline std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( delimiter, value_delimiter ) ); } 
+inline std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( delimiter, value_delimiter ) ); }
 
 inline std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, const std::string& fields, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( fields, delimiter, value_delimiter ) ); }
 
@@ -146,7 +119,7 @@ inline std::vector< std::pair< std::string, std::string > > map::as_vector( cons
     return v;
 }
 
-inline bool map::exists( const std::string& name ) const { return m_map.find( name ) != m_map.end(); }
+inline bool map::exists( const std::string& name ) const { return _map.find( name ) != _map.end(); }
 
 namespace detail {
 
@@ -176,7 +149,7 @@ template < typename T >
 inline std::vector< T > map::values( const std::string& name ) const
 {
     std::vector< T > v;
-    for( typename map_type::const_iterator it = m_map.begin(); it != m_map.end(); ++it )
+    for( typename map_type::const_iterator it = _map.begin(); it != _map.end(); ++it )
     {
         if( it->first == name ) { v.push_back( detail::lexical_cast< T >( it->second ) ); }
     }
@@ -194,7 +167,7 @@ template < typename T >
 inline T map::value( const std::string& name ) const
 {
     const std::vector< T >& v = values< T >( name );
-    if( v.empty() ) { COMMA_THROW_STREAM( comma::exception, "'" << name << "' not found in \"" << m_line << "\"" ); }
+    if( v.empty() ) { COMMA_THROW_STREAM( comma::exception, "'" << name << "' not found in \"" << _line << "\"" ); }
     return v[0];
 }
 
diff --git a/name_value/test/name_value_test.cpp b/name_value/test/name_value_test.cpp
index d166e1390..375b15b6a 100644
--- a/name_value/test/name_value_test.cpp
+++ b/name_value/test/name_value_test.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 #include <gtest/gtest.h>
 #include "../../name_value/parser.h"
@@ -110,12 +82,12 @@ template <> struct traits< nested_with_optional >
         v.apply( "c", t.c );
         v.apply( "d", t.d );
     }
-    
+
     template < typename Key, class Visitor > static void visit( Key, nested_with_optional& t, Visitor& v )
     {
         v.apply( "c", t.c );
         v.apply( "d", t.d );
-    }    
+    }
 };
 
 template <> struct traits< struct_with_optional >
@@ -126,13 +98,13 @@ template <> struct traits< struct_with_optional >
         v.apply( "b", t.b );
         v.apply( "nested", t.nested );
     }
-    
+
     template < typename Key, class Visitor > static void visit( Key, struct_with_optional& t, Visitor& v )
     {
         v.apply( "a", t.a );
         v.apply( "b", t.b );
         v.apply( "nested", t.nested );
-    }    
+    }
 };
 
 } } // namespace comma { namespace visiting {
@@ -174,7 +146,7 @@ template <> struct traits< config >
 
 } } // namespace comma { namespace visiting {
 
-    
+
 namespace comma { namespace name_value { namespace test {
 
 TEST( name_value, get )
@@ -302,7 +274,7 @@ TEST( name_value, serialize_json )
     EXPECT_EQ( "{ \"a\": \"a\", \"b\": \"b\\\"b\" }", json_remove_quotes_wrapper( "{ \"a\": \"a\", \"b\": \"b\\\"b\" }" ) );
     EXPECT_EQ( "{ \"a\": 1, \"b\": \"val\" }", json_remove_quotes_wrapper( "{ \"a\": \"1\", \"b\": \"val\" }" ) );
     EXPECT_EQ( "{ \"a\": [ 4.44, true, \"e\" ] }", json_remove_quotes_wrapper( "{ \"a\": [ \"4.44\", \"true\", \"e\" ] }" ) );
-    
+
     EXPECT_EQ( "{ \"a\": [ { \"b\": { \"c\": [ { \"d\": 1, \"e\": false }, { \"d\":2, \"e\": true } ] } } ], \"p\": { \"q\": { \"r\": 3.9e8, \"s\": \"t\"} }, \"x\": { \"y\": [ \"z\", 0.1e-3 ] } }", json_remove_quotes_wrapper( "{ \"a\": [ { \"b\": { \"c\": [ { \"d\": \"1\", \"e\": \"false\" }, { \"d\":2, \"e\": \"true\" } ] } } ], \"p\": { \"q\": { \"r\": \"3.9e8\", \"s\": \"t\"} }, \"x\": { \"y\": [ \"z\", \"0.1e-3\" ] } }" ) );
 
     //minify
@@ -362,6 +334,13 @@ TEST( name_value, as_vector )
     }
 }
 
+TEST( name_value, unique )
+{
+    void( name_value::map( "a=1;b;c=2", ';', '=', true ) );
+    EXPECT_THROW( name_value::map( "a=1;b;a=2;c=2", ';', '=', true ), comma::exception );
+    EXPECT_THROW( name_value::map( "a=1;b;b;c=2", ';', '=', true ), comma::exception );
+}
+
 } } }
 
 int main( int argc, char* argv[] )

From 2625d60ba9871c8b99c7057f35a7c66bb50366b2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 5 Jun 2022 12:05:02 +1000
Subject: [PATCH 0508/1056] name_value::map: optional allowed_names added

---
 name_value/map.h                    | 27 +++++++++++++----------
 name_value/test/name_value_test.cpp |  7 ++++++
 string/split.h                      | 34 +++--------------------------
 3 files changed, 26 insertions(+), 42 deletions(-)

diff --git a/name_value/map.h b/name_value/map.h
index 802358c1a..c56fc4d4a 100644
--- a/name_value/map.h
+++ b/name_value/map.h
@@ -4,10 +4,12 @@
 
 #pragma once
 
+#include <unordered_set>
 #include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/date_time/posix_time/time_parsers.hpp>
 #include <boost/optional.hpp>
 #include <boost/lexical_cast.hpp>
+#include "../string/string.h"
 #include "impl/options.h"
 
 namespace comma { namespace name_value {
@@ -18,11 +20,11 @@ class map
 {
     public:
         /// constructor
-        map( const std::string& line, char delimiter = ';', char value_delimiter = '=', bool unique = false );
+        map( const std::string& line, char delimiter = ';', char value_delimiter = '=', bool unique = false, const std::string& allowed_names = "" );
         /// constructor
-        map( const std::string& line, const std::string& fields, char delimiter = ';', char value_delimiter = '=', bool unique = false );
+        map( const std::string& line, const std::string& fields, char delimiter = ';', char value_delimiter = '=', bool unique = false, const std::string& allowed_names = "" );
         /// constructor
-        map( const std::string& line, const impl::options& options, bool unique = false );
+        map( const std::string& line, const impl::options& options, bool unique = false, const std::string& allowed_names = "" );
 
         /// return vector of name-value pairs in the given order
         static std::vector< std::pair< std::string, std::string > > as_vector( const std::string& line, char delimiter = ';', char value_delimiter = '=' );
@@ -59,16 +61,16 @@ class map
         const map_type& get() const { return _map; }
 
     private:
-        void init_( const comma::name_value::impl::options& options, bool unique );
+        void init_( const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names );
         const std::string _line;
         map_type _map;
 };
 
-inline map::map( const std::string& line, char delimiter, char value_delimiter, bool unique ): _line( line ) { init_( impl::options( delimiter, value_delimiter ), unique ); }
+inline map::map( const std::string& line, char delimiter, char value_delimiter, bool unique, const std::string& allowed_names ): _line( line ) { init_( impl::options( delimiter, value_delimiter ), unique, allowed_names ); }
 
-inline map::map( const std::string& line, const std::string& fields, char delimiter, char value_delimiter, bool unique ): _line( line ) { init_( impl::options( fields, delimiter, value_delimiter ), unique ); }
+inline map::map( const std::string& line, const std::string& fields, char delimiter, char value_delimiter, bool unique, const std::string& allowed_names ): _line( line ) { init_( impl::options( fields, delimiter, value_delimiter ), unique, allowed_names ); }
 
-inline map::map( const std::string& line, const comma::name_value::impl::options& options, bool unique ): _line( line ) { init_( options, unique ); }
+inline map::map( const std::string& line, const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names ): _line( line ) { init_( options, unique, allowed_names ); }
 
 inline static std::vector< std::string > get_named_values( const std::string& line, const comma::name_value::impl::options& options )
 {
@@ -76,24 +78,27 @@ inline static std::vector< std::string > get_named_values( const std::string& li
     for( std::size_t i = 0; i < options.m_names.size() && i < named_values.size(); ++i )
     {
         if( options.m_names[i].empty() ) { continue; }
-        if( split( named_values[i], options.m_value_delimiter ).size() != 1U ) { COMMA_THROW_STREAM( comma::exception, "expected unnamed value for " << options.m_names[i] << ", got: " << named_values[i] ); }
+        if( split( named_values[i], options.m_value_delimiter ).size() != 1U ) { COMMA_THROW( comma::exception, "expected unnamed value for " << options.m_names[i] << ", got: " << named_values[i] ); }
         named_values[i] = options.m_names[i] + options.m_value_delimiter + named_values[i];
     }
     return named_values;
 }
 
-inline void map::init_( const comma::name_value::impl::options& options, bool unique )
+inline void map::init_( const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names )
 {
+    std::unordered_set< std::string > allowed;
+    for( auto name: comma::split( allowed_names, ',', true ) ) { allowed.insert( name ); }
     const std::vector< std::string >& named_values = get_named_values( _line, options );
     for( std::size_t i = 0; i < named_values.size(); ++i )
     {
         std::vector< std::string > pair = split_escaped( named_values[i], options.m_value_delimiter, &( options.m_quotes[0]), options.m_escape );
-        if( unique && pair.size() > 0 && _map.find( pair[0] ) != _map.end() ) { COMMA_THROW_STREAM( comma::exception, "expected unique names, got more than one \"" << pair[0] << "\"" ); }
+        if( !allowed.empty() && allowed.find( pair[0] ) == allowed.end() ) { COMMA_THROW( comma::exception, "name \"" << pair[0] << "\" is not among allowed names: " << allowed_names ); }
+        if( unique && pair.size() > 0 && _map.find( pair[0] ) != _map.end() ) { COMMA_THROW( comma::exception, "expected unique names, got more than one \"" << pair[0] << "\"" ); }
         switch( pair.size() )
         {
             case 1: _map.insert( std::make_pair( pair[0], std::string() ) ); break; // quick and dirty
             case 2: _map.insert( std::make_pair( pair[0], pair[1] ) ); break;
-            default: { COMMA_THROW_STREAM( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
+            default: { COMMA_THROW( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
         }
     }
 }
diff --git a/name_value/test/name_value_test.cpp b/name_value/test/name_value_test.cpp
index 375b15b6a..5a0912d8c 100644
--- a/name_value/test/name_value_test.cpp
+++ b/name_value/test/name_value_test.cpp
@@ -341,6 +341,13 @@ TEST( name_value, unique )
     EXPECT_THROW( name_value::map( "a=1;b;b;c=2", ';', '=', true ), comma::exception );
 }
 
+TEST( name_value, allowed_names )
+{
+    void( name_value::map( "a=1;b;c=2", ';', '=', false, "a,b,c" ) );
+    EXPECT_THROW( name_value::map( "a=1;b;x;a=2;c=2", ';', '=', false, "a,b,c" ), comma::exception );
+    EXPECT_THROW( name_value::map( "a=1;b;x=5;b;c=2", ';', '=', false, "a,b,c" ), comma::exception );
+}
+
 } } }
 
 int main( int argc, char* argv[] )
diff --git a/string/split.h b/string/split.h
index 3e293a0e6..a21310dbc 100644
--- a/string/split.h
+++ b/string/split.h
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -38,7 +11,7 @@
 namespace comma {
 
 namespace string {
-    
+
 bool is_one_of( char c, const char* characters );
 
 } // namespace string {
@@ -66,7 +39,7 @@ std::vector< T > split_as( const std::string& s, char separator );
 /// An escape character will only escape a delimiter, quote or escape character;
 /// escaping any other character will result in both being kept;
 /// e.g. c:\windows\ will be kept as c:\windows\ with the trailing backslash
-/// e.g. filename;delimiter=\\;fields=a,b will be kept as filename;delimiter=\;fields=a,b 
+/// e.g. filename;delimiter=\\;fields=a,b will be kept as filename;delimiter=\;fields=a,b
 ///
 /// A quote may be anywhere in a string. Quotes must be closed; i.e Each start
 /// quote must be paired with an end quote, or an exception is thrown.
@@ -74,7 +47,7 @@ std::vector< T > split_as( const std::string& s, char separator );
 /// However "'" and '"' are perfectly legal strings of ' and "
 std::vector< std::string > split_escaped( const std::string& s, const char * separators = " ", const char * quotes = "\"\'", char escape = '\\' );
 /// split string into tokens; always contains at least one element;
-/// skips backslash escaped seperator, handle boolean quotes 
+/// skips backslash escaped separator, handle boolean quotes
 std::vector< std::string > split_escaped( const std::string& s, char separator, const char * quotes = "\"\'", char escape = '\\' );
 /// skips bracketed separators
 std::vector< std::string > split_bracketed( const std::string& s, const char * separators = " ", char lbracket = '(', char rbrackets = ')', bool strip_brackets = true );
@@ -97,4 +70,3 @@ template < typename T > inline std::vector< T > split_as( const std::string& s,
 }
 
 } // namespace comma {
-

From 7be8c53ed5d44531e1c5c7209a18e72fdd625b00 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 5 Jun 2022 12:06:02 +1000
Subject: [PATCH 0509/1056] csv-select: option name check added

---
 csv/applications/csv-select.cpp | 110 ++++++++++----------------------
 csv/options.h                   |  39 ++---------
 csv/traits.h                    |  29 +--------
 3 files changed, 39 insertions(+), 139 deletions(-)

diff --git a/csv/applications/csv-select.cpp b/csv/applications/csv-select.cpp
index 66ef2c3fc..dea184bac 100644
--- a/csv/applications/csv-select.cpp
+++ b/csv/applications/csv-select.cpp
@@ -1,37 +1,11 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
 #include <iostream>
-#include <sstream>
 #include <map>
+#include <sstream>
+#include <unordered_set>
 #include <vector>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
@@ -46,7 +20,7 @@
 #include "../../string/string.h"
 #include "../../visiting/traits.h"
 
-void usage()
+void usage( bool verbose )
 {
     std::cerr << std::endl;
     std::cerr << "find in a file or stream by constraints on a given key" << std::endl;
@@ -80,7 +54,7 @@ void usage()
     std::cerr << "fields: any non-empty fields will be treated as keys" << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options" << std::endl;
-    std::cerr << comma::csv::options::usage() << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    cat a.csv | csv-select --fields=,,t --from=20120101T000000" << std::endl;
@@ -89,8 +63,7 @@ void usage()
     std::cerr << "    cat a.csv | csv-select --fields=t,scalar \"t;from=20120101T000000;sorted\" \"scalar;from=-10;to=20.5\"" << std::endl;
     std::cerr << "    echo hello,world | csv-select --fields=h,w \"h;regex=he.*\"" << std::endl;
     std::cerr << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 bool matches( const std::string& value, const boost::regex& r ) { return boost::regex_match( value, r ); }
@@ -135,19 +108,22 @@ struct constraints
 
     constraints( const std::string& options )
     {
-        comma::name_value::map m( options, ';', '=' ); // quick and dirty, since optional is not well-supported (euphymism for 'buggy') in comma::name_value::parser
-        if( m.exists( "equals" ) ) { equals = m.value< T >( "equals" ); }
-        if( m.exists( "not-equal" ) ) { not_equal = m.value< T >( "not-equal" ); }
-        if( m.exists( "less" ) ) { less = m.value< T >( "less" ); }
-        if( m.exists( "greater" ) ) { greater = m.value< T >( "greater" ); } // it was: { equal = m.value< T >( "greater" ); }
-        if( m.exists( "from" ) ) { from = m.value< T >( "from" ); }
-        if( m.exists( "greater-or-equal" ) ) { from = m.value< T >( "greater-or-equal" ); }
-        if( m.exists( "ge" ) ) { from = m.value< T >( "ge" ); }
-        if( m.exists( "to" ) ) { to = m.value< T >( "to" ); }
-        if( m.exists( "less-or-equal" ) ) { to = m.value< T >( "less-or-equal" ); }
-        if( m.exists( "le" ) ) { to = m.value< T >( "le" ); }
-        if( m.exists( "regex" ) ) { regex = boost::regex( m.value< std::string >( "regex" ) ); }
-        sorted = m.exists( "sorted" );
+        comma::name_value::map m( options.substr( options.find_first_of( ';' ) + 1 ), ';', '=', true, "equals,not-equal,less,greater,from,greater-or-equal,ge,to,less-or-equal,le,regex,sorted,fields,f,binary,b,delimiter,d,format" ); // quick and dirty, since optional is not well-supported (euphymism for 'buggy') in comma::name_value::parser
+        for( const auto& v: m.get() ) // super quick and dirty, suboptimal
+        {
+            if( v.first == "equals" ) { equals = m.value< T >( "equals" ); }
+            else if( v.first == "not-equal" ) { not_equal = m.value< T >( "not-equal" ); }
+            else if( v.first == "less" ) { less = m.value< T >( "less" ); }
+            else if( v.first == "greater" ) { greater = m.value< T >( "greater" ); } // it was: { equal = m.value< T >( "greater" ); }
+            else if( v.first == "from" ) { from = m.value< T >( "from" ); }
+            else if( v.first == "greater-or-equal" ) { from = m.value< T >( "greater-or-equal" ); }
+            else if( v.first == "ge" ) { from = m.value< T >( "ge" ); }
+            else if( v.first == "to" ) { to = m.value< T >( "to" ); }
+            else if( v.first == "less-or-equal" ) { to = m.value< T >( "less-or-equal" ); }
+            else if( v.first == "le" ) { to = m.value< T >( "le" ); }
+            else if( v.first == "regex" ) { regex = boost::regex( m.value< std::string >( "regex" ) ); }
+            else if( v.first == "sorted" ) { sorted = true; }
+        }
     }
 
     bool is_a_match( const T& t ) const // quick and dirty, implement a proper expression parser
@@ -216,15 +192,11 @@ struct input_t
 
     bool is_a_match( bool is_or ) const
     {
-//         std::cerr << "==> is_a_match: doubles: ";
-//         for( unsigned int i = 0; i < doubles.size(); ++i ) { std::cerr << doubles[i].value << " "; }
-//         std::cerr << std::endl;
         if( is_or )
         {
             for( unsigned int i = 0; i < time.size(); ++i ) { if( time[i].is_a_match( is_or ) ) { return true; } }
             for( unsigned int i = 0; i < doubles.size(); ++i ) { if( doubles[i].is_a_match( is_or ) ) { return true; } }
             for( unsigned int i = 0; i < strings.size(); ++i ) { if( strings[i].is_a_match( is_or ) ) { return true; } }
-    //        std::cerr << "==> is_a_match: done" << std::endl << std::endl;
             return false;
         }
         else
@@ -232,7 +204,6 @@ struct input_t
             for( unsigned int i = 0; i < time.size(); ++i ) { if( !time[i].is_a_match() ) { return false; } }
             for( unsigned int i = 0; i < doubles.size(); ++i ) { if( !doubles[i].is_a_match() ) { return false; } }
             for( unsigned int i = 0; i < strings.size(); ++i ) { if( !strings[i].is_a_match() ) { return false; } }
-    //        std::cerr << "==> is_a_match: done" << std::endl << std::endl;
             return true;
         }
     }
@@ -260,15 +231,8 @@ namespace comma { namespace visiting {
 
 template < typename T > struct traits< constrained< T > >
 {
-    template < typename K, typename V > static void visit( const K&, const constrained< T >& p, V& v )
-    {
-        v.apply( "value", p.value );
-    }
-
-    template < typename K, typename V > static void visit( const K&, constrained< T >& p, V& v )
-    {
-        v.apply( "value", p.value );
-    }
+    template < typename K, typename V > static void visit( const K&, const constrained< T >& p, V& v ) { v.apply( "value", p.value ); }
+    template < typename K, typename V > static void visit( const K&, constrained< T >& p, V& v ) { v.apply( "value", p.value ); }
 };
 
 template <> struct traits< input_t >
@@ -290,22 +254,17 @@ template <> struct traits< input_t >
 
 } } // namespace comma { namespace visiting {
 
-static bool verbose;
 static comma::csv::options csv;
 static input_t input;
 static std::vector< std::string > fields;
 typedef std::multimap< std::string, std::string > constraints_map_t;
 static constraints_map_t constraints_map;
 
-template < typename T >
-static constrained< T > make_value( unsigned int i, const comma::command_line_options& options )
+template < typename T > static constrained< T > make_value( unsigned int i, const comma::command_line_options& options )
 {
     constrained< T > v;
-    for( std::pair< constraints_map_t::const_iterator, constraints_map_t::const_iterator > r = constraints_map.equal_range( fields[i] ); r.first != r.second; ++r.first )
-    {
-        v.constraints.push_back( constraints< T >( r.first->second ) );
-    }
-    static constraints< T > common_constraints( options );
+    for( auto r = constraints_map.equal_range( fields[i] ); r.first != r.second; ++r.first ) { v.constraints.push_back( constraints< T >( r.first->second ) ); }
+    static constraints< T > common_constraints( options ); // quick and dirty
     if( !common_constraints.empty() ) { v.constraints.push_back( common_constraints ); }
     return v;
 }
@@ -339,16 +298,15 @@ static void init_input( const comma::csv::format& format, const comma::command_l
 
 int main( int ac, char** av )
 {
-        comma::command_line_options options( ac, av );
     try
     {
-        if( options.exists( "--help,-h" ) ) { usage(); }
-        verbose = options.exists( "--verbose,-v" );
+        comma::command_line_options options( ac, av, usage );
         bool is_or = options.exists( "--or" );
         csv = comma::csv::options( options );
         fields = comma::split( csv.fields, ',' );
         if( fields.size() == 1 && fields[0].empty() ) { fields.clear(); }
-        std::vector< std::string > unnamed = options.unnamed( "--first-matching,--or,--sorted,--input-sorted,--not-matching,--output-all,--all,--strict,--verbose,-v", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--first-matching,--or,--sorted,--input-sorted,--not-matching,--output-all,--all,--strict,--verbose,-v,--flush"
+                                                            , "--equals,--not-equal,--less,--greater,--from,--greater-or-equal,--ge,--to,--less-or-equal,--le,--regex,--fields,-f,--binary,-b,--format,--delimiter,-d,--precision" );
         //for( unsigned int i = 0; i < unnamed.size(); constraints_map.insert( std::make_pair( comma::split( unnamed[i], ';' )[0], unnamed[i] ) ), ++i );
         bool strict = options.exists( "--strict" );
         bool first_matching = options.exists( "--first-matching" );
@@ -359,13 +317,9 @@ int main( int ac, char** av )
             std::string field = comma::split( unnamed[i], ';' )[0];
             bool found = false;
             for( unsigned int j = 0; j < fields.size() && !found; found = field == fields[j], ++j );
-            if( !found )
-            {
-                if( strict ) { std::cerr << "csv-select: on constraint: \"" << unnamed[i] << "\" field \"" << field << "\" not found in fields: " << csv.fields << std::endl; return 1; }
-                std::cerr << "csv-select: warning: on constraint: \"" << unnamed[i] << "\" field \"" << field << "\" not found in fields: " << csv.fields << std::endl;
-                continue;
-            }
-            constraints_map.insert( std::make_pair( field, unnamed[i] ) );
+            if( found ) { constraints_map.insert( std::make_pair( field, unnamed[i] ) ); continue; }
+            if( strict ) { std::cerr << "csv-select: on constraint: \"" << unnamed[i] << "\" field \"" << field << "\" not found in fields: " << csv.fields << std::endl; return 1; }
+            std::cerr << "csv-select: warning: on constraint: \"" << unnamed[i] << "\" field \"" << field << "\" not found in fields: " << csv.fields << std::endl;
         }
         if( csv.binary() )
         {
diff --git a/csv/options.h b/csv/options.h
index 12bc7c863..d813587f8 100644
--- a/csv/options.h
+++ b/csv/options.h
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -52,7 +25,7 @@ class options
 
         /// return usage to incorporate into application usage
         static std::string usage( const std::string& default_fields = "", bool verbose = true );
-        
+
         /// return usage to incorporate into application usage
         static std::string usage( bool verbose ) { return usage( "", verbose ); }
 
@@ -71,10 +44,10 @@ class options
 
         /// precision
         unsigned int precision;
-        
+
         /// quote sign for strings
         boost::optional< char > quote;
-        
+
         /// if true, flush output stream after each record
         bool flush;
 
@@ -96,16 +69,16 @@ class options
         /// return true, if fields have all given fields (convenience function, slow)
         /// @param field comma-separated fields, e.g. "x,y,z"
         bool has_field( const std::string& fields_to_check ) const;
-        
+
         /// return true, if fields have some given fields (convenience function, slow)
         /// @param field comma-separated fields, e.g. "x,y,z"
         bool has_some_of_fields( const std::string& fields_to_check ) const;
-        
+
         /// return true, if fields have all given paths (convenience function, slow)
         /// @param field comma-separated fields, e.g. fields "centre/position/x,centre/position/y,centre/position/z,..."
         ///              have paths 'centre/position', 'centre', 'centre/position/x', etc
         bool has_paths( const std::string& paths ) const;
-        
+
         /// return true, if fields have some given paths (convenience function, slow)
         /// @param field comma-separated fields, e.g. fields "centre/position/x,centre/position/y,centre/position/z,..."
         ///              have paths 'centre/position', 'centre', 'centre/position/x', etc
diff --git a/csv/traits.h b/csv/traits.h
index d8ed02bf2..2f444a01e 100644
--- a/csv/traits.h
+++ b/csv/traits.h
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -49,7 +22,7 @@ template <> struct traits< comma::csv::options >
         v.apply( "quote", p.quote ? std::string( 1, *p.quote ) : std::string() );
         v.apply( "flush", p.flush );
         if( p.binary() ) { v.apply( "binary", p.format().string() ); }
-        
+
     }
 
     template < typename Key, class Visitor >

From 07fb9f407d66174d9d9674f1f563905ff887fc45 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 16 Jun 2022 12:06:49 +1000
Subject: [PATCH 0510/1056] python/setup.py: install_requires commented out;
 readme for pypi packaging updated

---
 python/setup.py         | 2 +-
 system/launchpad/readme | 5 +++--
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/python/setup.py b/python/setup.py
index 570a46594..7aa189ff2 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -29,7 +29,7 @@
         maintainer          = 'vsevolod vlaskine',
         maintainer_email    = 'vsevolod.vlaskine@gmail.com',
         python_requires     = '>=3.6',
-        install_requires    = [ 'numpy' ], # todo?
+        #install_requires    = [ 'numpy' ], # todo? does it need to be uncommented for packaging
         packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma': 'comma', 'comma.cpp_bindings': 'comma/cpp_bindings' },
         package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] },
diff --git a/system/launchpad/readme b/system/launchpad/readme
index 38a9babd7..e4f748c65 100644
--- a/system/launchpad/readme
+++ b/system/launchpad/readme
@@ -17,10 +17,11 @@ uploading to launchpad
 
 verifying ppa in docker
 
-uploading to pypi (i know, wrong place)
+uploading to pypi (i know, wrong place; todo: script)
 
 cd comma/python
-# bump up version in version.py
+# version.py: bump up version
+# setup.py: uncomment install_requires (commented since it messes installation for those who use apt to install python3 packages (e.g. numpy)
 python3 setup.py sdist bdist_wheel
 twine upload --repository-url https://pypi.org/legacy/ dist/* # test
 twine upload dist/*

From eb1516dfe3e302238dee90db82edccb3c002ba1d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 16 Jun 2022 14:32:09 +1000
Subject: [PATCH 0511/1056] csv/format: signed byte limits fixed: -128 to 127
 (was: -127 to 128)

---
 csv/format.cpp | 42 ++++--------------------------------------
 1 file changed, 4 insertions(+), 38 deletions(-)

diff --git a/csv/format.cpp b/csv/format.cpp
index 36ca1fac0..2e272e0ec 100644
--- a/csv/format.cpp
+++ b/csv/format.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -243,7 +215,7 @@ static std::size_t csv_to_bin( char* buf, const std::string& s, format::types_en
             case format::int8:
             {
                 int i = boost::lexical_cast< int >( s );
-                if( i < -127 || i > 128 ) { COMMA_THROW( comma::exception, "expected byte, got " << i ); }
+                if( i < -128 || i > 127 ) { COMMA_THROW( comma::exception, "expected byte, got " << i ); }
                 *buf = static_cast< char >( i );
                 return sizeof( char );
             }
@@ -287,14 +259,8 @@ static std::size_t csv_to_bin( char* buf, const std::string& s, format::types_en
             default: COMMA_THROW( comma::exception, "todo: not implemented" );
         }
     }
-    catch( std::exception& ex )
-    {
-        COMMA_THROW( comma::exception, "failed to convert \"" << s << "\" to type \"" << format::to_format(type) << "\": "  << ex.what() );
-    }
-    catch( ... )
-    {
-        throw;
-    }
+    catch( std::exception& ex ) { COMMA_THROW( comma::exception, "failed to convert \"" << s << "\" to type \"" << format::to_format(type) << "\": "  << ex.what() ); }
+    catch( ... ) { throw; }
 }
 
 static std::size_t bin_to_csv( std::ostringstream& oss, const char* buf, format::types_enum type, std::size_t size, const boost::optional< unsigned int >& precision )
@@ -377,7 +343,7 @@ std::string format::csv_to_bin( const std::vector< std::string >& csv ) const
 std::string format::bin_to_csv( const std::string& bin, char delimiter, const boost::optional< unsigned int >& precision ) const
 {
     if( bin.length() != size_ ) { COMMA_THROW( comma::exception, "expected binary string of size " << size_ << ", got " << bin.length() << " bytes" ); }
-    return bin_to_csv( bin.c_str(), delimiter, precision );
+    return bin_to_csv( &bin[0], delimiter, precision );
 }
 
 std::string format::bin_to_csv( const char* buf, char delimiter, const boost::optional< unsigned int >& precision ) const

From 89200f8a2907d4e718b4979b401c6de1f050ae13 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 16 Jun 2022 17:49:13 +1000
Subject: [PATCH 0512/1056] csv: signed char handling added

---
 csv/format.cpp        | 6 +++---
 csv/format.h          | 9 ++++++++-
 csv/impl/from_ascii.h | 5 +++--
 csv/impl/to_ascii.h   | 1 +
 4 files changed, 15 insertions(+), 6 deletions(-)

diff --git a/csv/format.cpp b/csv/format.cpp
index 2e272e0ec..59f238ff8 100644
--- a/csv/format.cpp
+++ b/csv/format.cpp
@@ -104,7 +104,7 @@ static boost::array< unsigned int, 14 > Sizesimpl()
 {
     boost::array< unsigned int, 14 > sizes;
     sizes[ format::char_t ] = sizeof( char );
-    sizes[ format::int8 ] = sizeof( char );
+    sizes[ format::int8 ] = sizeof( signed char );
     sizes[ format::uint8 ] = sizeof( unsigned char );
     sizes[ format::int16 ] = sizeof( int16 );
     sizes[ format::uint16 ] = sizeof( uint16 );
@@ -216,8 +216,8 @@ static std::size_t csv_to_bin( char* buf, const std::string& s, format::types_en
             {
                 int i = boost::lexical_cast< int >( s );
                 if( i < -128 || i > 127 ) { COMMA_THROW( comma::exception, "expected byte, got " << i ); }
-                *buf = static_cast< char >( i );
-                return sizeof( char );
+                *buf = static_cast< signed char >( i );
+                return sizeof( signed char );
             }
             case format::uint8:
             {
diff --git a/csv/format.h b/csv/format.h
index c167ecc49..a1063461b 100644
--- a/csv/format.h
+++ b/csv/format.h
@@ -257,6 +257,7 @@ inline std::string format::value( const std::string& fields, bool full_xpath, co
 
 template <> inline std::string format::value_impl< bool >( const bool& ) { return "b"; }
 template <> inline std::string format::value_impl< char >( const char& ) { return "b"; }
+template <> inline std::string format::value_impl< signed char >( const signed char& ) { return "b"; }
 template <> inline std::string format::value_impl< unsigned char >( const unsigned char& ) { return "ub"; }
 template <> inline std::string format::value_impl< int16 >( const comma::int16& ) { return "w"; }
 template <> inline std::string format::value_impl< comma::uint16 >( const comma::uint16& ) { return "uw"; }
@@ -282,7 +283,13 @@ template <> struct format::type_to_enum< bool >
     static const char* as_string() { return "b"; }
 };
 
-template <> struct format::type_to_enum< char >
+template <> struct format::type_to_enum< char > // ATTENTION: char is unsigned on arm
+{
+    static const format::types_enum value = format::int8;
+    static const char* as_string() { return "b"; }
+};
+
+template <> struct format::type_to_enum< signed char >
 {
     static const format::types_enum value = format::int8;
     static const char* as_string() { return "b"; }
diff --git a/csv/impl/from_ascii.h b/csv/impl/from_ascii.h
index 94dd64296..1b69ebe7c 100644
--- a/csv/impl/from_ascii.h
+++ b/csv/impl/from_ascii.h
@@ -55,8 +55,8 @@ class from_ascii_
     public:
         /// constructor
         from_ascii_( const std::vector< boost::optional< std::size_t > >& indices
-                  , const std::deque< bool >& optional
-                  , const std::vector< std::string >& line );
+                   , const std::deque< bool >& optional
+                   , const std::vector< std::string >& line );
 
         /// apply
         template < typename K, typename T > void apply( const K& name, boost::optional< T >& value );
@@ -83,6 +83,7 @@ class from_ascii_
         std::size_t index_;
         std::size_t optional_index;
         static void lexical_cast_( char& v, const std::string& s ) { v = s.at( 0 ) == '\'' && s.at( 2 ) == '\'' && s.length() == 3 ? s.at( 1 ) : static_cast< char >( boost::lexical_cast< int >( s ) ); }
+        static void lexical_cast_( signed char& v, const std::string& s ) { v = s.at( 0 ) == '\'' && s.at( 2 ) == '\'' && s.length() == 3 ? s.at( 1 ) : static_cast< signed char >( boost::lexical_cast< int >( s ) ); }
         static void lexical_cast_( unsigned char& v, const std::string& s ) { v = s.at( 0 ) == '\'' && s.at( 2 ) == '\'' && s.length() == 3 ? s.at( 1 ) : static_cast< unsigned char >( boost::lexical_cast< unsigned int >( s ) ); }
         static void lexical_cast_( boost::posix_time::ptime& v, const std::string& s )
         { 
diff --git a/csv/impl/to_ascii.h b/csv/impl/to_ascii.h
index 79b7ce91c..936a07412 100644
--- a/csv/impl/to_ascii.h
+++ b/csv/impl/to_ascii.h
@@ -91,6 +91,7 @@ class to_ascii
         std::string as_string_( const std::string& v ) { return quote_ ? *quote_ + v + *quote_ : v; } // todo: escape/unescape
         // todo: better output semantics for char/unsigned char
         std::string as_string_( const char& v ) { std::ostringstream oss; oss << static_cast< int >( v ); return oss.str(); }
+        std::string as_string_( const signed char& v ) { std::ostringstream oss; oss << static_cast< int >( v ); return oss.str(); }
         std::string as_string_( const unsigned char& v ) { std::ostringstream oss; oss << static_cast< unsigned int >( v ); return oss.str(); }
         void set_precision_( std::ostringstream& oss ) const;
 

From 9f53b2ebaccee895d0016568357056a0e3b32e57 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 17 Jun 2022 16:39:52 +1000
Subject: [PATCH 0513/1056] name_value/impl/json_writer: unquoting numbers: bug
 fixed: multiple backslashes in front of quote handled correctly

---
 name_value/impl/json_writer.h       | 5 +++--
 name_value/test/name_value_test.cpp | 3 +++
 2 files changed, 6 insertions(+), 2 deletions(-)

diff --git a/name_value/impl/json_writer.h b/name_value/impl/json_writer.h
index 7308cd8da..eefce886c 100644
--- a/name_value/impl/json_writer.h
+++ b/name_value/impl/json_writer.h
@@ -34,8 +34,9 @@ template< typename C > inline void json_remove_quotes( std::basic_string< C >& j
         while( true )
         {
             value_end = std::find( value_end + 1, json_text.cend(), '"' );
-            auto i = value_end - 1;
-            if( *i != '\\' || *( i - 1 ) == '\\' ) { break; } // hyper quick and dirty fix, sigh
+            unsigned int backslash_count = 0;
+            for( auto i = value_end - 1; *i == '\\'; ++backslash_count, --i );
+            if( backslash_count % 2 == 0 ) { break; } // hyper quick and dirty fix, sigh
         }
         auto next_token = std::find_if_not( value_end + 1, json_text.cend(), []( C ch ) { return ' ' == ch || '\t' == ch || '\n' == ch; } );
         bool quoted = true;
diff --git a/name_value/test/name_value_test.cpp b/name_value/test/name_value_test.cpp
index 5a0912d8c..f4c8b98cb 100644
--- a/name_value/test/name_value_test.cpp
+++ b/name_value/test/name_value_test.cpp
@@ -271,7 +271,10 @@ TEST( name_value, exists )
 
 TEST( name_value, serialize_json )
 {
+    EXPECT_EQ( "{ \"a\": \"a\", \"b\": \"b\\\\\" }", json_remove_quotes_wrapper( "{ \"a\": \"a\", \"b\": \"b\\\\\" }" ) );
     EXPECT_EQ( "{ \"a\": \"a\", \"b\": \"b\\\"b\" }", json_remove_quotes_wrapper( "{ \"a\": \"a\", \"b\": \"b\\\"b\" }" ) );
+    EXPECT_EQ( "{ \"a\": \"a\", \"b\": \"b\\\\c\" }", json_remove_quotes_wrapper( "{ \"a\": \"a\", \"b\": \"b\\\\c\" }" ) );
+    EXPECT_EQ( "{ \"a\": \"a\", \"b\": \"b\\\\\\\"b\" }", json_remove_quotes_wrapper( "{ \"a\": \"a\", \"b\": \"b\\\\\\\"b\" }" ) );
     EXPECT_EQ( "{ \"a\": 1, \"b\": \"val\" }", json_remove_quotes_wrapper( "{ \"a\": \"1\", \"b\": \"val\" }" ) );
     EXPECT_EQ( "{ \"a\": [ 4.44, true, \"e\" ] }", json_remove_quotes_wrapper( "{ \"a\": [ \"4.44\", \"true\", \"e\" ] }" ) );
 

From b6255339ec4e42e51abf41351ee820900984752a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 5 Jul 2022 15:39:45 +1000
Subject: [PATCH 0514/1056] application/test/application_test.cpp: nan test
 made slightly more resilient

---
 application/test/application_test.cpp | 30 ++-------------------------
 1 file changed, 2 insertions(+), 28 deletions(-)

diff --git a/application/test/application_test.cpp b/application/test/application_test.cpp
index d4ebe5a0c..c8d91faea 100644
--- a/application/test/application_test.cpp
+++ b/application/test/application_test.cpp
@@ -1,32 +1,6 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+#include <cmath>
 #include <limits>
 #include <gtest/gtest.h>
 #include "../command_line_options.h"
@@ -198,7 +172,7 @@ TEST( command_line_options, optional )
         EXPECT_FALSE( bool( d ) );
         boost::optional< double > e = options.value< double >( "--d", std::numeric_limits< double >::quiet_NaN() );
         EXPECT_TRUE( bool( e ) );
-        EXPECT_FALSE( *e == *e );
+        EXPECT_TRUE( !std::numeric_limits< double >::has_quiet_NaN || std::isnan( *e ) ); // EXPECT_FALSE( *e == *e );
     }
 }
 

From fbfdba143aab70822d062c5e6998866934325aa5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 5 Jul 2022 15:40:41 +1000
Subject: [PATCH 0515/1056] cmake: ENABLE_FAST_MATH (OFF by default) and
 ENABLE_OPTIMIZATION (ON by default) added

---
 CMakeLists.txt | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index fd9ebe140..fff280f40 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -69,7 +69,7 @@ if( NOT CMAKE_BUILD_TYPE )
   set( CMAKE_BUILD_TYPE Release CACHE STRING "options are: None Debug Release RelWithDebInfo MinSizeRel." FORCE )
 endif( NOT CMAKE_BUILD_TYPE )
 
-IF(WIN32)
+if( WIN32 )
   SET(CMAKE_CXX_WARNING_LEVEL 4)
   IF(CMAKE_CXX_FLAGS MATCHES "/W[0-4]")
     STRING(REGEX REPLACE "/W[0-4]" "/W4" CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS}")
@@ -84,7 +84,16 @@ IF(WIN32)
   SET (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} /D \"NOMINMAX\"")
   ADD_DEFINITIONS(-D_USE_MATH_DEFINES)
   ADD_DEFINITIONS(-DWIN32_LEAN_AND_MEAN) #used to fix winsock redefinition error
-ENDIF(WIN32)
+else( WIN32 )
+    option( ENABLE_FAST_MATH "enable compiler fast-math; experimental, some tests fail on nan and precision" OFF )
+    if( ENABLE_FAST_MATH )
+        set( CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -ffast-math" )
+    endif( ENABLE_FAST_MATH )
+    option( ENABLE_OPTIMIZATION "enable compiler optimisation" ON )
+    if( ENABLE_OPTIMIZATION )
+        set( CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -O3" ) # quick and dirty; make optimisation level configurable
+    endif( ENABLE_OPTIMIZATION )
+endif( WIN32 )
 
 IF( CMAKE_SIZEOF_VOID_P EQUAL 8 )
   SET( IS_64_BIT TRUE )

From 2e6645858268f1ec9d4a5ee164c166c578e00e24 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 18 Jul 2022 23:03:15 +1000
Subject: [PATCH 0516/1056] csv-split: brushed up help to be similar to other
 comma applications

also reflowed to fit on an 80-column-wide terminal
---
 csv/applications/csv-split.cpp | 135 +++++++++++++++++++--------------
 1 file changed, 78 insertions(+), 57 deletions(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index ca1dada76..6294830df 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -103,63 +103,84 @@ int main( int argc, char** argv )
         boost::program_options::notify( vm );
         if ( vm.count( "help" ) || vm.count( "long-help" ) )
         {
-            std::cerr << std::endl;
-            std::cerr << "read from stdin by packet or by line and split into files named by field value or time (if split by time)." << std::endl;
-            std::cerr << "if splitting by id, input can also be splitted into streams" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "usage: csv-split [options] [outputs]*" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "use cases" << std::endl;
-            std::cerr << "    split by id field, output to files" << std::endl;
-            std::cerr << "        if id field present in --fields:" << std::endl;
-            std::cerr << "        for each id value, output records with this id to a separate file, e.g. 0.csv, 1.csv, etc" << std::endl;
-            std::cerr << "        - by id with default filenames, e.g:" << std::endl;
-            std::cerr << "              ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields id" << std::endl;
-            std::cerr << "        - by id with specified filenames" << std::endl;
-            std::cerr << "              ( echo 0; echo 1; echo 2 ) | csv-split --fields id --files <( echo a; echo b; echo c )" << std::endl;
-            std::cerr << "        - by id with filenames mapped to block ids" << std::endl;
-            std::cerr << "              ( echo 0; echo 1; echo 2 ) | csv-split --fields id --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "    split by block field, output to files" << std::endl;
-            std::cerr << "        if block field present in --fields:" << std::endl;
-            std::cerr << "        output records with this block to a separate file, on change of block, open a new file, e.g. 0.csv, 1.csv, etc" << std::endl;
-            std::cerr << "        - by block with default filenames, e.g:" << std::endl;
-            std::cerr << "              ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block" << std::endl;
-            std::cerr << "        - by block with specified filenames" << std::endl;
-            std::cerr << "              ( echo 0; echo 1; echo 2 ) | csv-split --fields block --files <( echo a; echo b; echo c )" << std::endl;
-            std::cerr << "        - by block with filenames mapped to block ids" << std::endl;
-            std::cerr << "              ( echo 0; echo 1; echo 2 ) | csv-split --fields block --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "    split by t field, output to files" << std::endl;
-            std::cerr << "        if t (timestamp) field present in --fields:" << std::endl;
-            std::cerr << "        separate records into different time periods, outputting in separate files" << std::endl;
-            std::cerr << "        example: ( echo 20170101T000001,a; echo 20170101T000003,b; echo 20170101T000007,c ) | csv-split --fields=t --period=4" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "    split by id field, output to streams" << std::endl;
-            std::cerr << "        if output streams (see example below) are present on the command line and id field present in --fields:" << std::endl;
-            std::cerr << "        output records with the given ids to the corresponding streams, while outputing the rest into files" << std::endl;
-            std::cerr << "        records with ids for which output stream is not specified will be discarded, unless ... stream is specified:" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "        outputs: <keys>;<stream>; to send records with a given set of ids to this stream" << std::endl;
-            std::cerr << "            keys:" << std::endl;
-            std::cerr << "                <id>[,<id>]*: comma-separated list of ids, e.g: '5' or '2,5,7', etc" << std::endl;
-            std::cerr << "                ...: three dots mean: send to this stream all the records with ids for which no other stream is specified (see example below)" << std::endl;
-            std::cerr << "            stream:" << std::endl;
-            std::cerr << "                tcp:<port>: e.g. tcp:1234" << std::endl;
-            std::cerr << "                udp:<port>: e.g. udp:1234 (todo)" << std::endl;
-            std::cerr << "                local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket" << std::endl;
-            std::cerr << "                <named pipe name>: named pipe, which will be re-opened, if client reconnects" << std::endl;
-            std::cerr << "                <filename>: a regular file" << std::endl;
-            std::cerr << "        examples" << std::endl;
-            std::cerr << "            ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) | csv-split --fields id \"0,1;tcp:5999\" \"...;local:/tmp/named_fifo\"" << std::endl;
-            std::cerr << "            ( echo 0,a; echo 1,b ) | csv-split --fields id --files <( echo '1,one.csv'; echo '0,zero.csv' )';fields=id,filename'" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << description << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "fields to split by listed in descending precedence" << std::endl;
-            std::cerr << "    block: split on the block number change" << std::endl;
-            std::cerr << "    id: split by id (same as block, except does not have to be contiguous by the price of worse performance)" << std::endl;
-            std::cerr << "    t: if present, use timestamp from the packet; if absent, use system time" << std::endl;
+            std::cerr << "\n";
+            std::cerr << "read from stdin by packet or by line and split into files\n";
+            std::cerr << "files are named by field value or time (if split by time)\n";
+            std::cerr << "if splitting by id, input can also be split into streams\n";
+            std::cerr << "\n";
+            std::cerr << "usage: csv-split [options] [outputs]*\n";
+            std::cerr << "\n";
+            std::cerr << description;
+            std::cerr << "\n";
+            std::cerr << "data is split by one of the following fields (listed in descending precedence)\n";
+            std::cerr << "    block: split on the block number change\n";
+            std::cerr << "    id:    split by id (same as block, except does not have to be contiguous\n";
+            std::cerr << "                        with the price of worse performance)\n";
+            std::cerr << "    t:     if present, use timestamp from the packet; if absent, use system time\n";
+            std::cerr << "\n";
+            std::cerr << "examples:\n";
+            std::cerr << "    --- split by block field, output to files ---\n";
+            std::cerr << "    output records for each block to a separate file\n";
+            std::cerr << "    on change of block, open a new file, e.g. 0.csv, 1.csv, etc\n";
+            std::cerr << "\n";
+            std::cerr << "    with default filenames:\n";
+            std::cerr << "    ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block\n";
+            std::cerr << "\n";
+            std::cerr << "    with specified filenames:\n";
+            std::cerr << "    ( echo 0; echo 1; echo 2 ) \\\n";
+            std::cerr << "        | csv-split --fields block --files <( echo a; echo b; echo c )\n";
+            std::cerr << "\n";
+            std::cerr << "    with filenames mapped to block ids:\n";
+            std::cerr << "    ( echo 0; echo 1; echo 2 ) \\\n";
+            std::cerr << "        | csv-split --fields block \\\n";
+            std::cerr << "              --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'\n";
+            std::cerr << "\n";
+            std::cerr << "    --- split by id field, output to files ---\n";
+            std::cerr << "    for each id value, output records with this id to a separate file,\n";
+            std::cerr << "    e.g. 0.csv, 1.csv, etc\n";
+            std::cerr << "\n";
+            std::cerr << "    with default filenames:\n";
+            std::cerr << "    ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields id\n";
+            std::cerr << "\n";
+            std::cerr << "    with specified filenames:\n";
+            std::cerr << "    ( echo 0; echo 1; echo 2 ) \\\n";
+            std::cerr << "        | csv-split --fields id --files <( echo a; echo b; echo c )\n";
+            std::cerr << "\n";
+            std::cerr << "    with filenames mapped to block ids:\n";
+            std::cerr << "    ( echo 0; echo 1; echo 2 ) \\\n";
+            std::cerr << "        | csv-split --fields id \\\n";
+            std::cerr << "              --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'\n";
+            std::cerr << "\n";
+            std::cerr << "    --- split by t field, output to files ---\n";
+            std::cerr << "    separate records into different time periods, outputting in separate files\n";
+            std::cerr << "    ( echo 20170101T000001,a; echo 20170101T000003,b; echo 20170101T000007,c ) \\\n";
+            std::cerr << "        | csv-split --fields=t --period=4\n";
+            std::cerr << "\n";
+            std::cerr << "    --- split by id field, output to streams ---\n";
+            std::cerr << "    if output streams (see example below) are present on the command line and \n";
+            std::cerr << "    id field present in --fields output records with the given ids to the\n";
+            std::cerr << "    corresponding streams, while outputing the rest into files\n";
+            std::cerr << "\n";
+            std::cerr << "    records with ids for which output stream is not specified will be discarded,\n";
+            std::cerr << "    unless ... stream is specified:\n";
+            std::cerr << "\n";
+            std::cerr << "    outputs: <keys>;<stream>; send records with given set of ids to this stream\n";
+            std::cerr << "        keys:\n";
+            std::cerr << "            <id>[,<id>]*: comma-separated list of ids, e.g: '5' or '2,5,7', etc\n";
+            std::cerr << "            ... (three dots): send to this stream all the records with ids\n";
+            std::cerr << "                for which no other stream is specified (see example below)\n";
+            std::cerr << "        stream:\n";
+            std::cerr << "            tcp:<port>: e.g. tcp:1234\n";
+            std::cerr << "            udp:<port>: e.g. udp:1234 (todo)\n";
+            std::cerr << "            local:<name>: linux/unix local server socket\n";
+            std::cerr << "                          e.g. local:./tmp/my_socket\n";
+            std::cerr << "            <named pipe name>: named pipe, re-opened if client reconnects\n";
+            std::cerr << "            <filename>: a regular file\n";
+            std::cerr << "\n";
+            std::cerr << "        ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) \\\n";
+            std::cerr << "            | csv-split --fields id \"0,1;tcp:5999\" \"...;local:/tmp/named_fifo\"\n";
+            std::cerr << "        ( echo 0,a; echo 1,b ) | csv-split --fields id --files \\\n";
+            std::cerr << "                  <( echo '1,one.csv'; echo '0,zero.csv' )';fields=id,filename'\n";
             std::cerr << std::endl;
             return 0;
         }

From a2d2ba0e8a798da3f7bde232dcda2faea9506db3 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 18 Jul 2022 23:51:06 +1000
Subject: [PATCH 0517/1056] csv-split: move test for required time-splitting
 options deeper in code

previous test erroneously checked for those options even if we were using the
field precedence rules to split by block or id
---
 csv/applications/csv-split.cpp   |  1 -
 csv/applications/split/split.cpp | 10 +++++++---
 2 files changed, 7 insertions(+), 4 deletions(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index 6294830df..aeb731248 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -197,7 +197,6 @@ int main( int argc, char** argv )
         else { suffix += "."; suffix += extension; }
         streams = boost::program_options::collect_unrecognized( parsed.options, boost::program_options::include_positional );
         if( !streams.empty() && ( csv.has_field( "block" ) || id_is_time ) ) { std::cerr << "publisher streams are not compatible with splitting by block or timestamp." << std::endl; return 1; }
-        if( ( csv.has_field( "t" ) || csv.fields.empty() ) && !period && timestamps.empty() ) { COMMA_THROW( comma::exception, "got fields '" << csv.fields << "' meaning split by time; thus please specify either --period or --timestamps" ); }
         if( id_is_string ) { run< std::string >(); }
         else if( id_is_time ) { run< boost::posix_time::ptime >(); }
         else { run< comma::uint32 >(); }
diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 206e8248c..7a8034eed 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -160,10 +160,14 @@ split< T >::split( const boost::optional< boost::posix_time::time_duration >& pe
     {
         ofstream_ = std::bind( &split< T >::ofstream_by_block_, this );
     }
-    else
+    else if( csv.has_field( "id" ) )
     {
-        if( csv.has_field( "id" ) ) { ofstream_ = std::bind( &split< T >::ofstream_by_id_, this ); }
-        else { if( !filenames_.empty() ) { COMMA_THROW( comma::exception, "--files given, but no block field specified in --fields" ); } }
+        ofstream_ = std::bind( &split< T >::ofstream_by_id_, this );
+    }
+    else   // splitting by time
+    {
+        if( !filenames_.empty() ) { COMMA_THROW( comma::exception, "--files given, but no block field specified in --fields" ); }
+        if( !period && timestamps.empty() ) { COMMA_THROW( comma::exception, "splitting by time; please specify either --period or --timestamps" ); }
     }
     timestamps_stream_make_( timestamps );
 }

From b92b44b11a6908c2d959d7f3b8c6e4accd920eb7 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 19 Jul 2022 12:42:53 +1000
Subject: [PATCH 0518/1056] .gitignore: added python/comma_py.egg-info/ and
 python/dist

these directories are build/install artifacts generated by setuptools for the python package
---
 .gitignore | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/.gitignore b/.gitignore
index ebaa5be7f..50b820a33 100644
--- a/.gitignore
+++ b/.gitignore
@@ -12,3 +12,5 @@ doc/generated
 tags
 compile_commands.json
 .ycm_extra_conf.py
+python/comma_py.egg-info/
+python/dist/

From c101cb18485b3cd8f64b02a5424ca71223da8e71 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 29 Jul 2022 15:27:18 +1000
Subject: [PATCH 0519/1056] say(), saymore() implemented

---
 application/command_line_options.cpp | 67 +++++++++++++---------------
 application/command_line_options.h   | 67 +++++++++++-----------------
 application/verbose.h                |  2 +-
 3 files changed, 58 insertions(+), 78 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 31872993a..ef3579fa7 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
@@ -36,31 +9,53 @@
 #include <unordered_map>
 #include <boost/bind.hpp>
 #include <boost/config/warning_disable.hpp>
+#include "boost/filesystem.hpp"
+#include "boost/iostreams/stream.hpp"
+#include "boost/iostreams/device/null.hpp"
 #include <boost/optional.hpp>
 #include <boost/regex.hpp>
 #include <boost/spirit/include/qi.hpp>
 #include "../string/split.h"
-#include "../application/command_line_options.h"
 #include "../base/exception.h"
+#include "command_line_options.h"
 
 namespace comma {
 
+namespace application { namespace detail {
+
+static std::string name;
+static bool verbose = false;
+static boost::iostreams::stream< boost::iostreams::null_sink > null_ostream( ( boost::iostreams::null_sink() ) );
+
+} } // namespace application { namespace detail {
+
+std::ostream& say( std::ostream& os ) { std::cerr << comma::application::detail::name << ": "; return os; }
+
+std::ostream& saymore() { return say( verbose ? std::cerr : comma::application::detail::null_ostream ); }
+
+void command_line_options::_init_verbose( bool v, const std::string& path )
+{
+    comma::verbose.init( v, path ); // todo: deprecate, use comma::say() and comma::saymore() instead
+    comma::application::detail::name = boost::filesystem::basename( path );
+    comma::application::detail::verbose = v;
+}
+
 command_line_options::command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage )
 {
     argv_.resize( argc );
     for( int i = 0; i < argc; ++i ) { argv_[i] = argv[i]; }
-    fill_map_( argv_ );
-    bool v=exists("--verbose,-v");
-    comma::verbose.init(v, argv[0]);
+    _fill_map( argv_ );
+    bool v = exists("--verbose,-v");
+    _init_verbose( v, argv[0] );
     if( usage && exists( "--help,-h" ) ) { usage( v ); exit( 1 ); }
 }
 
 command_line_options::command_line_options( const std::vector< std::string >& argv, boost::function< void( bool ) > usage )
     : argv_( argv )
 {
-    fill_map_( argv_ );
-    bool v=exists("--verbose,-v");
-    comma::verbose.init(v, argv[0]);
+    _fill_map( argv_ );
+    bool v = exists( "--verbose,-v" );
+    _init_verbose( v, argv[0] );
     if( usage && exists( "--help,-h" ) ) { usage( v ); exit( 1 ); }
 }
 
@@ -122,7 +117,7 @@ std::vector< std::string > command_line_options::unnamed( const std::string& val
 
 std::vector< std::string > command_line_options::names() const { return names_; }
 
-void command_line_options::fill_map_( const std::vector< std::string >& v )
+void command_line_options::_fill_map( const std::vector< std::string >& v )
 {
     for( std::size_t i = 1; i < v.size(); ++i )
     {
diff --git a/application/command_line_options.h b/application/command_line_options.h
index 10fff8d41..71ee9746f 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -1,37 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_APPLICATION_COMMAND_LINE_OPTIONS_H_
-#define COMMA_APPLICATION_COMMAND_LINE_OPTIONS_H_
+#pragma once
 
 #include <map>
 #include <string>
@@ -42,10 +14,24 @@
 #include <boost/optional.hpp>
 #include "../base/exception.h"
 #include "../string/string.h"
-#include "verbose.h"
+#include "verbose.h" // todo: deprecate
 
 namespace comma {
 
+/// @example
+///      in my-application:
+///          say() << "some message";
+///      will print on stderr:
+///          my-application: some message
+std::ostream& say( std::ostream& os = std::cerr );
+
+/// @example
+///      in my-application
+///          saymore() << "some debug message";
+///      if run as: my-application --verbose, will print on stderr:
+///          my-application: some debug message
+std::ostream& saymore();
+    
 /// a simple command line options class
 class command_line_options
 {
@@ -161,25 +147,26 @@ class command_line_options
 
     private:
         typedef std::map< std::string, std::vector< std::string > > map_type_;
-
-        void fill_map_( const std::vector< std::string >& v );
-        template < typename T > static T lexical_cast_( const std::string& s );
-
         std::vector< std::string > argv_;
         map_type_ map_;
         std::vector< std::string > names_;
+        void _fill_map( const std::vector< std::string >& v );
+        void _init_verbose( bool v, const std::string& path );
+        template < typename T > static T lexical_cast_( const std::string& s );
+        
 };
 
 template< typename Iterator > inline command_line_options::command_line_options( Iterator begin, Iterator end, boost::function< void( bool ) > usage )
 {
     argv_.resize( std::distance( begin, end ) );
     for ( Iterator i = begin; i < end; ++i ) { argv_[i] = *i; }
-    fill_map_( argv_ );
-    if ( usage && exists( "--help,-h" ) )
+    _fill_map( argv_ );
+    if( usage && exists( "--help,-h" ) )
     {
         bool v = exists( "--verbose,-v" );
-        comma::verbose.init( v, *begin );
-        usage( v ); exit( 1 );
+        _init_verbose( v, *begin );
+        usage( v );
+        exit( 0 );
     }
 }
 
@@ -237,5 +224,3 @@ inline std::vector< T > command_line_options::values( const std::string& name, T
 }
 
 } // namespace comma {
-
-#endif // COMMA_APPLICATION_COMMAND_LINE_OPTIONS_H_
diff --git a/application/verbose.h b/application/verbose.h
index 296cd1709..b220f0730 100644
--- a/application/verbose.h
+++ b/application/verbose.h
@@ -31,7 +31,6 @@
 
 #include <iostream>
 
-//prototype for comma::verbose
 namespace comma {
 
 //a pseudo ostream for outputing information to stderr
@@ -39,6 +38,7 @@ namespace comma {
 //examples: 
 //  comma::verbose << "hello!" << std::endl;
 //  if (comma::verbose) { std::cerr << comma::verbose.app_name() << "info" << std::endl; }
+/// @deprecated
 class verbose_t
 {
     bool enabled_;

From f7347dee5eb8576ffdba0e7fc52f57ecfdab8509 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 29 Jul 2022 15:46:31 +1000
Subject: [PATCH 0520/1056] say(): typos fixed

---
 application/command_line_options.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index ef3579fa7..edf9687f0 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -29,9 +29,9 @@ static boost::iostreams::stream< boost::iostreams::null_sink > null_ostream( ( b
 
 } } // namespace application { namespace detail {
 
-std::ostream& say( std::ostream& os ) { std::cerr << comma::application::detail::name << ": "; return os; }
+std::ostream& say( std::ostream& os ) { os << comma::application::detail::name << ": "; return os; }
 
-std::ostream& saymore() { return say( verbose ? std::cerr : comma::application::detail::null_ostream ); }
+std::ostream& saymore() { return say( comma::application::detail::verbose ? std::cerr : comma::application::detail::null_ostream ); }
 
 void command_line_options::_init_verbose( bool v, const std::string& path )
 {

From f8feacf40dab96e2d408ce001eb0da04ffac5823 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 4 Aug 2022 12:42:07 +1000
Subject: [PATCH 0521/1056] base/none.h added

---
 base/none.h       |  15 +++++
 base/types.h      |  33 +--------
 visiting/traits.h | 166 ++++++++++++----------------------------------
 3 files changed, 59 insertions(+), 155 deletions(-)
 create mode 100644 base/none.h

diff --git a/base/none.h b/base/none.h
new file mode 100644
index 000000000..6752d7de3
--- /dev/null
+++ b/base/none.h
@@ -0,0 +1,15 @@
+// Copyright (c) 2022 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+namespace comma {
+
+/// convenience type to use e.g. as a "tag" type in template definitions
+/// since boost::none_t is not default-constructible as it is designed
+/// to be a singleton type (see boost/none_t.hpp for details) meaning
+/// that it won't compile for some use cases
+struct none {};
+    
+} // namespace comma {
diff --git a/base/types.h b/base/types.h
index fecd5afa9..22f4f1944 100644
--- a/base/types.h
+++ b/base/types.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_BASE_TYPES_H_
-#define COMMA_BASE_TYPES_H_
+#pragma once
 
 #if defined(__linux__) || defined(__APPLE__) || defined(__QNXNTO__)
 #include <arpa/inet.h>
@@ -90,5 +61,3 @@ template <> struct integer< 8, true > { typedef comma::int64 type; };
 template <> struct integer< 8, false > { typedef comma::uint64 type; };
 
 } // namespace comma {
-
-#endif /*COMMA_BASE_TYPES_H_*/
diff --git a/visiting/traits.h b/visiting/traits.h
index 20a8c5146..57ea8baf0 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_VISITING_TRAITS_HEADER_GUARD_
-#define COMMA_VISITING_TRAITS_HEADER_GUARD_
+#pragma once
 
 #ifndef WIN32
 #include <stdlib.h>
@@ -40,8 +11,11 @@
 #include <map>
 #include <set>
 #include <string>
+#include <unordered_map>
+#include <unordered_set>
 #include <vector>
 #include <boost/array.hpp>
+#include "../base/none.h"
 
 namespace comma { namespace visiting {
 
@@ -50,22 +24,25 @@ namespace comma { namespace visiting {
 template < typename T >
 struct traits
 {
-    /// visit arbitrary type
     template < typename K, typename V > static void visit( const K& key, T& t, V& v );
+    template < typename K, typename V > static void visit( const K& key, const T& t, V& v );
+};
+
+template <> struct traits< comma::none >
+{
+    template < typename K, typename V > static void visit( const K& key, comma::none& t, V& v ) {}
+    template < typename K, typename V > static void visit( const K&, const comma::none& t, V& v ) {}
 };
 
-/// std::pair visiting traits; todo: better semantics?
 template < typename T, typename S >
 struct traits< std::pair< T, S > >
 {
-    /// visit
     template < typename K, typename V > static void visit( const K& key, std::pair< T, S >& t, V& v )
     {
         v.apply( "first", t.first );
         v.apply( "second", t.second );
     }
     
-    /// visit const
     template < typename K, typename V > static void visit( const K&, const std::pair< T, S >& t, V& v )
     {
         v.apply( "first", t.first );
@@ -73,26 +50,20 @@ struct traits< std::pair< T, S > >
     }    
 };
 
-namespace Impl {
+namespace impl {
 
 template < typename K, typename V, typename Visitor >
 inline void visit_non_associative_container( const K&, const V& c, Visitor& v )
 {
     std::size_t index = 0;
-    for( typename V::const_iterator it = c.begin(); it != c.end(); ++it, ++index )
-    {
-        v.apply( index, *it );
-    }
+    for( typename V::const_iterator it = c.begin(); it != c.end(); ++it, ++index ) { v.apply( index, *it ); }
 }
 
 template < typename K, typename V, typename Visitor >
 inline void visit_non_associative_container( const K&, V& c, Visitor& v )
 {
     std::size_t index = 0;
-    for( typename V::iterator it = c.begin(); it != c.end(); ++it, ++index )
-    {
-        v.apply( index, *it );
-    }
+    for( typename V::iterator it = c.begin(); it != c.end(); ++it, ++index ) { v.apply( index, *it ); }
 }
 
 template < typename T, typename Visitor >
@@ -110,110 +81,59 @@ inline void visit_associative_container_key( const K& k, const T& t, Visitor& v
 template < typename K, typename M, typename Visitor >
 inline void visit_associative_container( const K&, M& c, Visitor& v )
 {
-    for( typename M::iterator it = c.begin(); it != c.end(); ++it )
-    {
-        visit_associative_container_key( it->first, it->second, v );
-    }
+    for( typename M::iterator it = c.begin(); it != c.end(); ++it ) { visit_associative_container_key( it->first, it->second, v ); }
 }
 
 template < typename K, typename M, typename Visitor >
 inline void visit_associative_container( const K&, const M& c, Visitor& v )
 {
-    for( typename M::const_iterator it = c.begin(); it != c.end(); ++it )
-    {
-        visit_associative_container_key( it->first, it->second, v );
-    }
+    for( typename M::const_iterator it = c.begin(); it != c.end(); ++it ) { visit_associative_container_key( it->first, it->second, v ); }
 }
 
-} // namespace Impl {
+} // namespace impl {
 
-/// vector visiting traits
-template < typename T, typename A >
-struct traits< std::vector< T, A > >
+template < typename T, typename A > struct traits< std::vector< T, A > >
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, std::vector< T, A >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
-    
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const std::vector< T, A >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }    
+    template < typename K, typename V > static void visit( const K& key, std::vector< T, A >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::vector< T, A >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }    
 };
 
-/// set visiting traits
-template < typename T >
-struct traits< std::set< T > >
+template < typename T > struct traits< std::set< T > >
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, std::set< T >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
-    
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const std::set< T >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }    
+    template < typename K, typename V > static void visit( const K& key, std::set< T >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::set< T >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }    
 };
 
-/// std array visiting traits
-template < typename T, std::size_t S >
-struct traits< std::array< T, S > >
+template < typename T > struct traits< std::unordered_set< T > >
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, std::array< T, S >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
+    template < typename K, typename V > static void visit( const K& key, std::unordered_set< T >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::unordered_set< T >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }    
+};
 
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const std::array< T, S >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
+template < typename T, std::size_t S > struct traits< std::array< T, S > >
+{
+    template < typename K, typename V > static void visit( const K& key, std::array< T, S >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::array< T, S >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
 };
 
-/// boost array visiting traits
-template < typename T, std::size_t S >
-struct traits< boost::array< T, S > >
+template < typename T, std::size_t S > struct traits< boost::array< T, S > >
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, boost::array< T, S >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
-    
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const boost::array< T, S >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }    
+    template < typename K, typename V > static void visit( const K& key, boost::array< T, S >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const boost::array< T, S >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }    
 };
 
-/// map visiting traits
-template < typename T, typename S >
-struct traits< std::map< T, S > >
+template < typename T, typename S > struct traits< std::map< T, S > >
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, std::map< T, S >& t, V& v )
-    {
-        Impl::visit_associative_container( key, t, v );
-    }
-    
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const std::map< T, S >& t, V& v )
-    {
-        Impl::visit_associative_container( key, t, v );
-    }    
+    template < typename K, typename V > static void visit( const K& key, std::map< T, S >& t, V& v ) { impl::visit_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::map< T, S >& t, V& v ) { impl::visit_associative_container( key, t, v ); }    
+};
+
+template < typename T, typename S > struct traits< std::unordered_map< T, S > >
+{
+    template < typename K, typename V > static void visit( const K& key, std::unordered_map< T, S >& t, V& v ) { impl::visit_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::unordered_map< T, S >& t, V& v ) { impl::visit_associative_container( key, t, v ); }    
 };
 
 /// @todo add more types as needed
 
 } } // namespace comma { namespace visiting {
-
-#endif // COMMA_VISITING_TRAITS_HEADER_GUARD_

From c92a385b25276e0d83444de272476d9f7f9c6c2c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Aug 2022 15:02:23 +1000
Subject: [PATCH 0522/1056] name-value-to-csv: --map implemented

---
 name_value/applications/name-value-to-csv.cpp | 58 +++++++++++++++----
 .../test/name-value-to-csv/map/expected       |  5 ++
 name_value/test/name-value-to-csv/map/input   |  2 +
 name_value/test/name-value-to-csv/map/test    |  3 +
 4 files changed, 56 insertions(+), 12 deletions(-)
 create mode 100644 name_value/test/name-value-to-csv/map/expected
 create mode 100644 name_value/test/name-value-to-csv/map/input
 create mode 100755 name_value/test/name-value-to-csv/map/test

diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index 104f08f1f..666b6178a 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -24,6 +24,8 @@ static void usage( bool )
     std::cerr << "    --delimiter,-d=<delimiter>; default=','; csv delimiter" << std::endl;
     std::cerr << "    --equal-sign,-e=<equal_sign>; default='='; equal sign" << std::endl;
     std::cerr << "    --fields,-f=<fields>; fields to output" << std::endl;
+    std::cerr << "    --map,--dict; prefixed paths are a map, not list; expects input sorted by path" << std::endl;
+    std::cerr << "                  run example below to make sense of it" << std::endl;
     std::cerr << "    --prefix,--path,-p=[<prefix>]; optional prefix" << std::endl;
     std::cerr << "    --unindexed-fields=<fields>; if no --fields specified, output unindexed fields once, if --fields specified, append given unindexed fields to all records" << std::endl;
     std::cerr << "    --unindexed-stream,--stream; read a stream of key-value pairs, on every input record output csv record with the field value set and other fields empty, see example below" << std::endl;
@@ -42,9 +44,20 @@ static void usage( bool )
     std::cerr << "        EOF" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        yields:" << std::endl;
+    std::cerr << "            a,10,0" << std::endl;
+    std::cerr << "            b,20,1" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "        a,10,0" << std::endl;
-    std::cerr << "        b,20,1" << std::endl;
+    std::cerr << "        cat <<EOF | name-value-to-csv --map --fields=name,value,status --prefix=my/test" << std::endl;
+    std::cerr << "        my/test/x/name=a" << std::endl;
+    std::cerr << "        my/test/x/value=10" << std::endl;
+    std::cerr << "        my/test/x/status=0" << std::endl;
+    std::cerr << "        my/test/y/name=b" << std::endl;
+    std::cerr << "        my/test/y/status=1" << std::endl;
+    std::cerr << "        EOF" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "        yields:" << std::endl;
+    std::cerr << "            x,a,10,0" << std::endl;
+    std::cerr << "            y,b,,1" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    unindexed fields" << std::endl;
     std::cerr << "        todo" << std::endl;
@@ -103,6 +116,9 @@ int main( int ac, char** av )
         values_t values; // quick and dirty; watch performance?
         std::map< unsigned int, values_t > map;
         boost::optional< unsigned int > index;
+        std::string key;
+        bool is_map = options.exists( "--dict,--map" );
+        if( is_map && unsorted ) { comma::say() << "combination of --map and --unsorted: todo, just ask" << std::endl; return 1; }
         while( std::cin.good() && !std::cin.eof() )
         {
             std::string s;
@@ -124,16 +140,30 @@ int main( int ac, char** av )
                 else if( name[ prefix.size() ] == '/' ) { values[ name.substr( prefix.size() + 1 ) ] = s.substr( e + 1 ); }
                 continue;
             }
-            if( name[prefix.size()] != '[' ) { continue; }
-            auto b = s.find_first_of( ']', prefix.size() );
-            if( b == std::string::npos ) { std::cerr << "name-value-to-csv: expected path-value pair with valid indices; got: '" << s << "'" << std::endl; return 1; }
-            if( s[ b + 1 ] != '/' ) { continue; }
-            unsigned int current_index = boost::lexical_cast< unsigned int >( name.substr( prefix.size() + 1, b - prefix.size() - 1 ) );
-            if( unsorted || !unindexed_fields.empty() ) { map[current_index][name.substr( b + 2 )] = s.substr( e + 1 ); continue; }
-            if( index && current_index < *index ) { std::cerr << "name-value-to-csv: expected sorted index, got index " << current_index << " after " << *index << " in line: '" << comma::strip( s ) << "'" << std::endl; return 1; }
-            if( index && current_index > *index ) { std::cout << join( fields, values, delimiter ) << std::endl; }
-            values[name.substr( b + 2 )] = s.substr( e + 1 );
-            index = current_index;
+            if( is_map )
+            {
+                if( name[prefix.size()] != '/' ) { continue; }
+                auto b = s.find_first_of( '/', prefix.size() + 1 );
+                if( b == std::string::npos ) { std::cerr << "name-value-to-csv: with prefix \"" << prefix << "\" expected path-value pair with valid keys; got: '" << s << "'" << std::endl; return 1; }
+                std::string current_key = name.substr( prefix.size() + 1, b - prefix.size() - 1 );
+                if( unsorted ) {} // todo
+                if( !key.empty() && current_key != key ) { std::cout << key << delimiter << join( fields, values, delimiter ) << std::endl; }
+                values[name.substr( b + 1 )] = s.substr( e + 1 );
+                key = current_key;
+            }
+            else
+            {
+                if( name[prefix.size()] != '[' ) { continue; }
+                auto b = s.find_first_of( ']', prefix.size() );
+                if( b == std::string::npos ) { std::cerr << "name-value-to-csv: with prefix \"" << prefix << "\" expected path-value pair with valid indices; got: '" << s << "'" << std::endl; return 1; }
+                if( s[ b + 1 ] != '/' ) { continue; }
+                unsigned int current_index = boost::lexical_cast< unsigned int >( name.substr( prefix.size() + 1, b - prefix.size() - 1 ) );
+                if( unsorted || !unindexed_fields.empty() ) { map[current_index][name.substr( b + 2 )] = s.substr( e + 1 ); continue; }
+                if( index && current_index < *index ) { std::cerr << "name-value-to-csv: expected sorted index, got index " << current_index << " after " << *index << " in line: '" << comma::strip( s ) << "'" << std::endl; return 1; }
+                if( index && current_index > *index ) { std::cout << join( fields, values, delimiter ) << std::endl; }
+                values[name.substr( b + 2 )] = s.substr( e + 1 );
+                index = current_index;
+            }
         }
         if( unindexed && !unindexed_stream )
         { 
@@ -154,6 +184,10 @@ int main( int ac, char** av )
         {
             std::cout << join( fields, values, delimiter ) << std::endl;
         }
+        else if( is_map && !key.empty() )
+        {
+            std::cout << key << delimiter << join( fields, values, delimiter ) << std::endl;
+        }
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << "name-value-to-csv: " << ex.what() << std::endl; }
diff --git a/name_value/test/name-value-to-csv/map/expected b/name_value/test/name-value-to-csv/map/expected
new file mode 100644
index 000000000..494667105
--- /dev/null
+++ b/name_value/test/name-value-to-csv/map/expected
@@ -0,0 +1,5 @@
+map/basics[0]/output/line[0]="x,0,1"
+map/basics[0]/output/line[1]="y,2,"
+map/basics[0]/status=0
+map/basics[1]/output="x,0,1"
+map/basics[1]/status=0
diff --git a/name_value/test/name-value-to-csv/map/input b/name_value/test/name-value-to-csv/map/input
new file mode 100644
index 000000000..247604259
--- /dev/null
+++ b/name_value/test/name-value-to-csv/map/input
@@ -0,0 +1,2 @@
+map/basics[0]="( echo p/x/a/b=0; echo p/x/c=1; echo p/y/a/b=2 ) | name-value-to-csv --map --prefix=p --fields a/b,c"
+map/basics[1]="( echo p/x/a/b=0; echo p/x/c=1 ) | name-value-to-csv --map --prefix=p --fields a/b,c"
diff --git a/name_value/test/name-value-to-csv/map/test b/name_value/test/name-value-to-csv/map/test
new file mode 100755
index 000000000..988ba14ee
--- /dev/null
+++ b/name_value/test/name-value-to-csv/map/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+comma_test_commands

From f184dae43756624d8419c99d5e5313917b1e0629 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Aug 2022 11:46:57 +1000
Subject: [PATCH 0523/1056] comma-application-util:
 comma-application-swiss-init: options_unnamed implemented

---
 bash/comma-application-util | 1 +
 1 file changed, 1 insertion(+)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 998444614..49141e15f 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -303,6 +303,7 @@ function comma-application-swiss-init()
         local operation_options; operation_options=$( ${comma_application_swiss_operation}-options | comma-options-to-name-value "$@" ) || die "invalid options"
         eval "$( grep -v '^"' <<< "$operation_options" | sed 's#^#options_#' | comma_path_value_mangle )"
     fi
+    mapfile -t options_unnamed < <( ( echo "$options"; echo "$operation_options" ) | grep '^"' | sed -e 's#^"##' -e 's#"$##' )
 }
 
 export -f comma-application-swiss-init

From f1d9f01d7d9bae9c53407790a1e93e398e1d31f5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Aug 2022 14:49:33 +1000
Subject: [PATCH 0524/1056] name-value-to-csv --unquote implemented

---
 name_value/applications/name-value-to-csv.cpp | 13 +++++++++----
 1 file changed, 9 insertions(+), 4 deletions(-)

diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index 666b6178a..32be635df 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -30,6 +30,7 @@ static void usage( bool )
     std::cerr << "    --unindexed-fields=<fields>; if no --fields specified, output unindexed fields once, if --fields specified, append given unindexed fields to all records" << std::endl;
     std::cerr << "    --unindexed-stream,--stream; read a stream of key-value pairs, on every input record output csv record with the field value set and other fields empty, see example below" << std::endl;
     std::cerr << "    --unindexed-stream-update,--update; read a stream of key-value pairs, on every input record output all up-to-date values of fields present in --unindexed-fields, see example below" << std::endl;
+    std::cerr << "    --unquote; unquote string values" << std::endl;
     std::cerr << "    --unsorted; the input data is not sorted by index" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
@@ -88,6 +89,9 @@ static std::string join( const std::vector< std::string >& fields, values_t& val
     return oss.str();
 }
 
+static bool unquote; // true if --unquote was given on the command line
+static std::string _unquoted( const std::string& s ) { return unquote && s.size() >= 2 && s.front() == '"' && s.back() == '"' ? s.substr( 1, s.size() - 2 ) : s; } // if unquote is set, removes exactly one enclosing pair of double quotes; unbalanced or inner quotes are left intact
+
 int main( int ac, char** av )
 {
     try
@@ -109,6 +113,7 @@ int main( int ac, char** av )
         if( fields[0].empty() && unindexed_fields.empty() ) { std::cerr << "name-value-to-csv: please specify --fields or --unindexed-fields" << std::endl; return 1; }
         bool unindexed = fields[0].empty();
         values_t unindexed_values;
+        unquote = options.exists( "--unquote" );
         bool unsorted = options.exists( "--unsorted" );
         char delimiter = options.value( "--delimiter,-d", ',' );
         char equal_sign = options.value( "--equal-sign,-e", '=' );
@@ -136,8 +141,8 @@ int main( int ac, char** av )
             if( name.substr( 0, prefix.size() ) != prefix ) { continue; }
             if( unindexed )
             {
-                if( prefix.empty() ) { values[name] = s.substr( e + 1 ); }
-                else if( name[ prefix.size() ] == '/' ) { values[ name.substr( prefix.size() + 1 ) ] = s.substr( e + 1 ); }
+                if( prefix.empty() ) { values[name] = _unquoted( s.substr( e + 1 ) ); }
+                else if( name[ prefix.size() ] == '/' ) { values[ name.substr( prefix.size() + 1 ) ] = _unquoted( s.substr( e + 1 ) ); }
                 continue;
             }
             if( is_map )
@@ -148,7 +153,7 @@ int main( int ac, char** av )
                 std::string current_key = name.substr( prefix.size() + 1, b - prefix.size() - 1 );
                 if( unsorted ) {} // todo
                 if( !key.empty() && current_key != key ) { std::cout << key << delimiter << join( fields, values, delimiter ) << std::endl; }
-                values[name.substr( b + 1 )] = s.substr( e + 1 );
+                values[name.substr( b + 1 )] = _unquoted( s.substr( e + 1 ) );
                 key = current_key;
             }
             else
@@ -161,7 +166,7 @@ int main( int ac, char** av )
                 if( unsorted || !unindexed_fields.empty() ) { map[current_index][name.substr( b + 2 )] = s.substr( e + 1 ); continue; }
                 if( index && current_index < *index ) { std::cerr << "name-value-to-csv: expected sorted index, got index " << current_index << " after " << *index << " in line: '" << comma::strip( s ) << "'" << std::endl; return 1; }
                 if( index && current_index > *index ) { std::cout << join( fields, values, delimiter ) << std::endl; }
-                values[name.substr( b + 2 )] = s.substr( e + 1 );
+                values[name.substr( b + 2 )] = _unquoted( s.substr( e + 1 ) );
                 index = current_index;
             }
         }

From 6d85d67b5285bfb98c8539776b59bae32efd8ddf Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Aug 2022 15:00:10 +1000
Subject: [PATCH 0525/1056] name-value-to-csv: --unquote: basic test added

---
 name_value/test/name-value-to-csv/basic/expected | 12 +++++++++---
 name_value/test/name-value-to-csv/basic/input    |  8 +++-----
 name_value/test/name-value-to-csv/basic/options  |  1 -
 name_value/test/name-value-to-csv/basic/test     |  3 +++
 4 files changed, 15 insertions(+), 9 deletions(-)
 delete mode 100644 name_value/test/name-value-to-csv/basic/options
 create mode 100755 name_value/test/name-value-to-csv/basic/test

diff --git a/name_value/test/name-value-to-csv/basic/expected b/name_value/test/name-value-to-csv/basic/expected
index 335e6a7c6..8491ee5b1 100644
--- a/name_value/test/name-value-to-csv/basic/expected
+++ b/name_value/test/name-value-to-csv/basic/expected
@@ -1,3 +1,9 @@
-line[0]="a,1"
-line[1]="b,2"
-status=0
+basics[0]/output/line[0]="a,1"
+basics[0]/output/line[1]="b,2"
+basics[0]/status=0
+unquote[0]/output/line[0]="\"a\",1"
+unquote[0]/output/line[1]="\"b\",2"
+unquote[0]/status=0
+unquote[1]/output/line[0]="a,1"
+unquote[1]/output/line[1]="b,2"
+unquote[1]/status=0
diff --git a/name_value/test/name-value-to-csv/basic/input b/name_value/test/name-value-to-csv/basic/input
index 7e2e2a24d..a50ad6f2c 100644
--- a/name_value/test/name-value-to-csv/basic/input
+++ b/name_value/test/name-value-to-csv/basic/input
@@ -1,5 +1,3 @@
-[0]/name=a
-[0]/value=1
-[1]/name=b
-[1]/value=2
-
+basics[0]="( echo [0]/name=a; echo [0]/value=1; echo [1]/name=b; echo [1]/value=2 ) | name-value-to-csv --fields name,value"
+unquote[0]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2 ) | name-value-to-csv --fields name,value"
+unquote[1]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2 ) | name-value-to-csv --fields name,value --unquote"
diff --git a/name_value/test/name-value-to-csv/basic/options b/name_value/test/name-value-to-csv/basic/options
deleted file mode 100644
index 5241b8824..000000000
--- a/name_value/test/name-value-to-csv/basic/options
+++ /dev/null
@@ -1 +0,0 @@
---fields=name,value
diff --git a/name_value/test/name-value-to-csv/basic/test b/name_value/test/name-value-to-csv/basic/test
new file mode 100755
index 000000000..988ba14ee
--- /dev/null
+++ b/name_value/test/name-value-to-csv/basic/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+comma_test_commands

From 16edc3ff461cf1abad47eaa354f84efdb92c9e51 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Aug 2022 15:45:01 +1000
Subject: [PATCH 0526/1056] comma-application-util: swiss init: unnamed
 options: bug fixed

---
 bash/comma-application-util | 35 +++++------------------------------
 1 file changed, 5 insertions(+), 30 deletions(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 49141e15f..8d8d72703 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -1,34 +1,7 @@
 #!/bin/bash
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
 # Copyright (c) 2020 Vsevolod Vlaskine
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 ## @page comma-application-util comma-application-util
 # this script is designed to be included in another script directly, for example:
@@ -292,7 +265,8 @@ function comma-application-swiss-init()
     function verbose() { (( ! options_verbose )) || echo "$comma_application_name: ${comma_application_swiss_operation}: $@" >&2; }
     function die() { say "$@"; exit 1; }
     [[ $( type -t ${comma_application_swiss_operation}-run ) == "function" ]] || die "expected operation, got '${comma_application_swiss_operation}'" # quick and dirty
-    local options; options=$( ( echo "$common_options"; comma-application-common-options ) | comma-options-to-name-value "$@" ) || die "invalid options"
+    local options_described=$( echo "$common_options"; comma-application-common-options )
+    local options; options=$( comma-options-to-name-value "$@" <<< "$options_described" ) || die "invalid options"
     eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
     #(( !options_verbose )) || verbose_option="--verbose"
     #(( !options_input_fields )) || { eval "echo \$${operation//-/_}_input_fields"; exit 0; } # quick and dirty
@@ -300,10 +274,11 @@ function comma-application-swiss-init()
     #(( !options_output_fields )) || { eval "echo \$${operation//-/_}_output_fields"; exit 0; } # quick and dirty
     #(( !options_output_format )) || { eval "echo \$${operation//-/_}_output_format"; exit 0; } # quick and dirty
     if [[ $( type -t ${comma_application_swiss_operation}-options ) == "function" ]]; then
-        local operation_options; operation_options=$( ${comma_application_swiss_operation}-options | comma-options-to-name-value "$@" ) || die "invalid options"
+        local operation_options_described=$( ${comma_application_swiss_operation}-options )
+        local operation_options; operation_options=$( comma-options-to-name-value "$@" <<< "$operation_options_described" ) || die "invalid options"
         eval "$( grep -v '^"' <<< "$operation_options" | sed 's#^#options_#' | comma_path_value_mangle )"
     fi
-    mapfile -t options_unnamed < <( ( echo "$options"; echo "$operation_options" ) | grep '^"' | sed -e 's#^"##' -e 's#"$##' )
+    mapfile -t options_unnamed < <( ( echo "$options_described"; echo "$operation_options_described"; ) | comma-options-to-name-value "$@" | grep '^"' | sed -e 's#^"##' -e 's#"$##' )
 }
 
 export -f comma-application-swiss-init

From c5f43480b6c5b034cf01efd448235912703a5143 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 17 Aug 2022 14:31:24 +1000
Subject: [PATCH 0527/1056] name_value/parser: trivial brush-up

---
 name_value/parser.h | 64 +++++++--------------------------------------
 1 file changed, 10 insertions(+), 54 deletions(-)

diff --git a/name_value/parser.h b/name_value/parser.h
index 4143ff2f0..9cb4e16aa 100644
--- a/name_value/parser.h
+++ b/name_value/parser.h
@@ -1,51 +1,16 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author cedric wohlleber
 
-#ifndef COMMA_APPLICATION_NAME_VALUE_PARSER_H
-#define COMMA_APPLICATION_NAME_VALUE_PARSER_H
-
-#include <map>
+#pragma once
 
-#include "../base/exception.h"
 #include "../visiting/apply.h"
 #include "../name_value/map.h"
 #include "../name_value/impl/options.h"
 #include "../name_value/impl/from_name_value.h"
 #include "../name_value/impl/to_name_value.h"
 
-namespace comma
-{
-namespace name_value
-{
+namespace comma { namespace name_value {
     
 /// parser for semicolon-separated name-value string
 class parser
@@ -78,25 +43,18 @@ class parser
     void put( std::string& line, const S& s ) const;
 
 private:
-    impl::options m_options;
+    impl::options _options;
 };
 
+inline parser::parser( char delimiter, char value_delimiter, bool full_path_as_name ): _options( delimiter, value_delimiter, full_path_as_name ) {}
 
-inline parser::parser( char delimiter, char value_delimiter, bool full_path_as_name ):
-    m_options( delimiter, value_delimiter, full_path_as_name )
-{
-}
-
-inline parser::parser( const std::string& fields, char delimiter, char value_delimiter, bool full_path_as_name ):
-    m_options( fields, delimiter, value_delimiter, full_path_as_name )
-{
-}
+inline parser::parser( const std::string& fields, char delimiter, char value_delimiter, bool full_path_as_name ): _options( fields, delimiter, value_delimiter, full_path_as_name ) {}
 
 template < typename S >
 inline S parser::get( const std::string& line, const S& default_s ) const
 {
-    map::map_type m = map( line, m_options ).get();
-    name_value::impl::from_name_value from_name_value( m, m_options.m_full_path_as_name );
+    map::map_type m = map( line, _options ).get();
+    name_value::impl::from_name_value from_name_value( m, _options.m_full_path_as_name );
     S s = default_s;
     visiting::apply( from_name_value ).to( s );
     return s;
@@ -105,11 +63,9 @@ inline S parser::get( const std::string& line, const S& default_s ) const
 template < typename S >
 inline std::string parser::put( const S& s ) const
 {
-    name_value::impl::to_name_value toname_value( m_options.m_value_delimiter, m_options.m_full_path_as_name );
+    name_value::impl::to_name_value toname_value( _options.m_value_delimiter, _options.m_full_path_as_name );
     visiting::apply( toname_value ).to( s );
-    return join( toname_value.strings(), m_options.m_delimiter );
+    return join( toname_value.strings(), _options.m_delimiter );
 }
 
-} }
-
-#endif // COMMA_APPLICATION_NAME_VALUE_PARSER_H
+} } // namespace comma { namespace name_value {

From 2c7345ab7c0ca69d8e82f6e83e967b06bed097a9 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 17 Aug 2022 18:22:41 +1000
Subject: [PATCH 0528/1056] csv-random: make: gaussian: implementing...

---
 csv/applications/csv-random.cpp | 37 ++++++++++++++++++++-------------
 1 file changed, 23 insertions(+), 14 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 658cbc507..504bfe993 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -13,6 +13,7 @@
 #include "../../application/command_line_options.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
+#include "../../string/string.h"
 
 static void usage( bool verbose )
 {
@@ -30,7 +31,10 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "        options" << std::endl;
     std::cerr << "            --append; append random numbers to stdin input" << std::endl;
-    std::cerr << "            --distribution=<distribution>; default=uniform; todo: more distributions to plug in, just ask" << std::endl;
+    std::cerr << "            --distribution=<distribution>[;<options>]; default=uniform; values: uniform, gaussian, normal; todo: more distributions to plug in, just ask" << std::endl;
+    std::cerr << "                uniform[;<min>;<max>]: if <min>, <max> not present, --range values will be used" << std::endl;
+    std::cerr << "                gaussian[;<mean>;<sigma>]" << std::endl;
+    std::cerr << "                normal: alias for gaussian" << std::endl;
     std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
     std::cerr << "            --output-binary; output random numbers as binary, or specify --binary=<format> for stdin input" << std::endl;
     std::cerr << "            --range=[<min>,<max>]; desired value range, default: whatever stl defines (usually numeric limits)" << std::endl;
@@ -207,12 +211,15 @@ static int run_impl( const comma::command_line_options& options )
 
 static int run( const comma::command_line_options& options ) // quick and dirty
 {
-    const auto& distribution = options.value< std::string >( "--distribution", "uniform" );
+    const auto& params = comma::split( options.value< std::string >( "--distribution", "uniform" ), ',' );
+    const std::string& distribution = params[0];
     const auto& format = comma::csv::format( options.value< std::string >( "--type", "ui" ) );
     if ( format.collapsed_string().find( ',' ) != std::string::npos ) { std::cerr << "csv-random make: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl; return 1; }
     if( distribution == "uniform" )
     {
-        switch ( format.offset( 0 ).type )
+        if( params.size() != 1 && params.size() != 3 ) { std::cerr << "csv-random make: uniform: expected uniform[,<min>,<max>]; got: \"" << options.value< std::string >( "--distribution" ) << "\"" << std::endl; return 1; }
+        if( params.size() == 3 ) { std::cerr << "csv-random make: uniform: parameters handling: implementing..." << std::endl; return 1; }
+        switch( format.offset( 0 ).type )
         {
             case csv::format::int8: return run_impl< char, std::uniform_int_distribution >( options );
             case csv::format::uint8: return run_impl< unsigned char, std::uniform_int_distribution >( options );
@@ -224,7 +231,17 @@ static int run( const comma::command_line_options& options ) // quick and dirty
             case csv::format::uint64: return run_impl< comma::uint64, std::uniform_int_distribution >( options );
             case csv::format::float_t: return run_impl< float, std::uniform_real_distribution >( options );
             case csv::format::double_t: return run_impl< double, std::uniform_real_distribution >( options );
-            default: std::cerr << "csv-random make: expected type; got: '" << format.string() << "'" << std::endl; return 1;
+            default: std::cerr << "csv-random make: uniform distribution: expected type; got: '" << format.string() << "'" << std::endl; return 1;
+        }
+    }
+    if( distribution == "gaussian" || distribution == "normal" )
+    {
+        std::cerr << "csv-random make: normal: implementing..." << std::endl; return 1;
+        switch( format.offset( 0 ).type )
+        {
+            case csv::format::float_t: return run_impl< float, std::normal_distribution >( options );
+            case csv::format::double_t: return run_impl< double, std::normal_distribution >( options );
+            default: std::cerr << "csv-random make: normal distribution: expected floating point --type; got unsupported type: '" << format.string() << "'" << std::endl; return 1;
         }
     }
     std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
@@ -331,11 +348,7 @@ static int run_impl( const comma::command_line_options& options, std::size_t cou
             {
                 std::cin.read( &buf[0], buf.size() );
                 if( std::cin.gcount() == 0 ) { return 0; }
-                if( std::cin.gcount() != static_cast< int >( buf.size() ) )
-                {
-                    std::cerr << "csv-random true-random: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl;
-                    return 1;
-                }
+                if( std::cin.gcount() != static_cast< int >( buf.size() ) ) { std::cerr << "csv-random true-random: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
             }
             else
             {
@@ -360,11 +373,7 @@ static int run_impl( const comma::command_line_options& options, std::size_t cou
 static int run( const comma::command_line_options& options )
 {
     const auto format = comma::csv::format( options.value< std::string >( "--type", "ui" ) );
-    if( format.collapsed_string().find( ',' ) != std::string::npos )
-    {
-        std::cerr << "csv-random true-random: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl;
-        return 1;
-    }
+    if( format.collapsed_string().find( ',' ) != std::string::npos ) { std::cerr << "csv-random true-random: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl; return 1; }
     switch( format.offset( 0 ).type ) {
         case csv::format::int8: return run_impl< char >( options, format.count() );
         case csv::format::uint8: return run_impl< unsigned char >( options, format.count() );

From d326b116c27e62bd98c2cd62f873a99d9f1bf315 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 18 Aug 2022 11:23:01 +1000
Subject: [PATCH 0529/1056] csv-random: make: normal distribution plugged in

---
 csv/applications/csv-random.cpp | 94 +++++++++++++++++++++------------
 1 file changed, 60 insertions(+), 34 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 504bfe993..b69045527 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -11,6 +11,7 @@
 #include <vector>
 
 #include "../../application/command_line_options.h"
+#include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../string/string.h"
@@ -118,7 +119,7 @@ template <> struct type_traits< unsigned char > { static unsigned int cast( cons
 namespace make {
 
 template < typename T, template < typename > class Distribution, typename Engine >
-static int run_impl( Distribution< T >& distribution, bool append, bool binary, std::size_t count )
+static int run_impl( Distribution< T >& distribution, bool append, bool binary, std::size_t count, const boost::optional< std::pair< T, T > >& range )
 {
     Engine engine = ::seed ? Engine( *::seed ) : Engine();
     if( !::csv.flush ) { std::cin.tie( nullptr ); }
@@ -181,66 +182,91 @@ static int run_impl( Distribution< T >& distribution, bool append, bool binary,
     return 0;
 }
 
+template < typename T > static std::vector< T > _as( const std::vector< std::string >& v, unsigned int begin ) // todo? move to library?
+{
+    std::vector< T > r( v.size() - begin );
+    for( unsigned int i = begin; i < v.size(); r[ i - begin ] = boost::lexical_cast< T >( v[i] ), ++i );
+    return r;
+}
+
+template < typename T, template < typename > class Distribution, unsigned int Size > struct distribution_traits { static Distribution< T > make( const std::vector< T >& p ); }; // quick and dirty
+template < typename T, template < typename > class Distribution > struct distribution_traits< T, Distribution, 0 > { static Distribution< T > make( const std::vector< T >& p ) { return Distribution< T >(); } };
+template < typename T, template < typename > class Distribution > struct distribution_traits< T, Distribution, 1 > { static Distribution< T > make( const std::vector< T >& p ) { return Distribution< T >( p[0] ); } };
+template < typename T, template < typename > class Distribution > struct distribution_traits< T, Distribution, 2 > { static Distribution< T > make( const std::vector< T >& p ) { return Distribution< T >( p[0], p[1] ); } };
+
+template < typename T, template < typename > class Distribution > static Distribution< T > make_distribution( const std::vector< std::string >& params ) // quick and dirty
+{
+    const auto& p = _as< T >( params, 1 );
+    switch( p.size() ) // quick and dirty; does not scale, but for now just to make it working
+    {
+        case 0: return distribution_traits< T, Distribution, 0 >::make( p );
+        case 1: return distribution_traits< T, Distribution, 1 >::make( p );
+        case 2: return distribution_traits< T, Distribution, 2 >::make( p );
+        default: COMMA_THROW( comma::exception, "distribution traits for " << p.size() << " parameters: not implemented; just ask" );
+    }
+}
+
 template < typename T, template < typename > class Distribution >
-static int run_impl( const comma::command_line_options& options )
+static int run_impl( const std::vector< std::string >& params, const comma::command_line_options& options )
 {
     const auto& append = options.exists( "--append" );
     const auto& binary = options.exists( "--output-binary" ) || ::csv.binary();
     const auto& engine = options.value< std::string >( "--engine", "mt19937_64" );
     const auto& count = comma::csv::format( options.value< std::string >( "--type", "ui" ) ).count();
-    const auto& r = options.optional< std::string >( "--range" ); // todo: parse distribution parameters
-    Distribution< T > distribution;
-    if( r )
-    {
-        const auto& range = comma::csv::ascii< std::pair< T, T > >().get( *r );
-        distribution = Distribution< T >( range.first, range.second );
-    }
-    if( engine == "minstd_rand0" ) { return run_impl< T, Distribution, std::minstd_rand0 >( distribution, append, binary, count ); }
-    if( engine == "minstd_rand" ) { return run_impl< T, Distribution, std::minstd_rand >( distribution, append, binary, count ); }
-    if( engine == "mt19937" ) { return run_impl< T, Distribution, std::mt19937 >( distribution, append, binary, count ); }
-    if( engine == "mt19937_64" ) { return run_impl< T, Distribution, std::mt19937_64 >( distribution, append, binary, count ); }
-    if( engine == "ranlux24_base" ) { return run_impl< T, Distribution, std::ranlux24_base >( distribution, append, binary, count ); }
-    if( engine == "ranlux48_base" ) { return run_impl< T, Distribution, std::ranlux48_base >( distribution, append, binary, count ); }
-    if( engine == "ranlux24" ) { return run_impl< T, Distribution, std::ranlux24 >( distribution, append, binary, count ); }
-    if( engine == "ranlux48" ) { return run_impl< T, Distribution, std::ranlux48 >( distribution, append, binary, count ); }
-    if( engine == "knuth_b" ) { return run_impl< T, Distribution, std::knuth_b >( distribution, append, binary, count ); }
-    if( engine == "default_random_engine" ) { return run_impl< T, Distribution, std::default_random_engine >( distribution, append, binary, count ); }
+    boost::optional< std::pair< T, T > > range;
+    if( options.exists( "--range" ) ) { range = comma::csv::ascii< std::pair< T, T > >().get( options.value< std::string >( "--range" ) ); }
+    Distribution< T > distribution = make_distribution< T, Distribution >( params );
+    if( engine == "minstd_rand0" ) { return run_impl< T, Distribution, std::minstd_rand0 >( distribution, append, binary, count, range ); }
+    if( engine == "minstd_rand" ) { return run_impl< T, Distribution, std::minstd_rand >( distribution, append, binary, count, range ); }
+    if( engine == "mt19937" ) { return run_impl< T, Distribution, std::mt19937 >( distribution, append, binary, count, range ); }
+    if( engine == "mt19937_64" ) { return run_impl< T, Distribution, std::mt19937_64 >( distribution, append, binary, count, range ); }
+    if( engine == "ranlux24_base" ) { return run_impl< T, Distribution, std::ranlux24_base >( distribution, append, binary, count, range ); }
+    if( engine == "ranlux48_base" ) { return run_impl< T, Distribution, std::ranlux48_base >( distribution, append, binary, count, range ); }
+    if( engine == "ranlux24" ) { return run_impl< T, Distribution, std::ranlux24 >( distribution, append, binary, count, range ); }
+    if( engine == "ranlux48" ) { return run_impl< T, Distribution, std::ranlux48 >( distribution, append, binary, count, range ); }
+    if( engine == "knuth_b" ) { return run_impl< T, Distribution, std::knuth_b >( distribution, append, binary, count, range ); }
+    if( engine == "default_random_engine" ) { return run_impl< T, Distribution, std::default_random_engine >( distribution, append, binary, count, range ); }
     std::cerr << "csv-random make: expected engine; got: '" << engine << "'" << std::endl;
     return 1;
 }
 
 static int run( const comma::command_line_options& options ) // quick and dirty
 {
-    const auto& params = comma::split( options.value< std::string >( "--distribution", "uniform" ), ',' );
+    auto params = comma::split( options.value< std::string >( "--distribution", "uniform" ), ',' );
     const std::string& distribution = params[0];
     const auto& format = comma::csv::format( options.value< std::string >( "--type", "ui" ) );
     if ( format.collapsed_string().find( ',' ) != std::string::npos ) { std::cerr << "csv-random make: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl; return 1; }
     if( distribution == "uniform" )
     {
+        if( options.exists( "--range" ) ) // super-quick and dirty to preserve backward compatibility
+        {
+            if( params.size() > 1 ) { std::cerr << "csv-random make: uniform: either use --range or uniform[,<min>,<max>], not both" << std::endl; return 1; }
+            const auto& r = comma::split( options.value< std::string >( "--range" ), ',' );
+            params = { "uniform", r[0], r[1] };
+        }
         if( params.size() != 1 && params.size() != 3 ) { std::cerr << "csv-random make: uniform: expected uniform[,<min>,<max>]; got: \"" << options.value< std::string >( "--distribution" ) << "\"" << std::endl; return 1; }
-        if( params.size() == 3 ) { std::cerr << "csv-random make: uniform: parameters handling: implementing..." << std::endl; return 1; }
         switch( format.offset( 0 ).type )
         {
-            case csv::format::int8: return run_impl< char, std::uniform_int_distribution >( options );
-            case csv::format::uint8: return run_impl< unsigned char, std::uniform_int_distribution >( options );
-            case csv::format::int16: return run_impl< comma::int16, std::uniform_int_distribution >( options );
-            case csv::format::uint16: return run_impl< comma::uint16, std::uniform_int_distribution >( options );
-            case csv::format::int32: return run_impl< comma::int32, std::uniform_int_distribution >( options );
-            case csv::format::uint32: return run_impl< comma::uint32, std::uniform_int_distribution >( options );
-            case csv::format::int64: return run_impl< comma::int64, std::uniform_int_distribution >( options );
-            case csv::format::uint64: return run_impl< comma::uint64, std::uniform_int_distribution >( options );
-            case csv::format::float_t: return run_impl< float, std::uniform_real_distribution >( options );
-            case csv::format::double_t: return run_impl< double, std::uniform_real_distribution >( options );
+            case csv::format::int8: return run_impl< char, std::uniform_int_distribution >( params, options );
+            case csv::format::uint8: return run_impl< unsigned char, std::uniform_int_distribution >( params, options );
+            case csv::format::int16: return run_impl< comma::int16, std::uniform_int_distribution >( params, options );
+            case csv::format::uint16: return run_impl< comma::uint16, std::uniform_int_distribution >( params, options );
+            case csv::format::int32: return run_impl< comma::int32, std::uniform_int_distribution >( params, options );
+            case csv::format::uint32: return run_impl< comma::uint32, std::uniform_int_distribution >( params, options );
+            case csv::format::int64: return run_impl< comma::int64, std::uniform_int_distribution >( params, options );
+            case csv::format::uint64: return run_impl< comma::uint64, std::uniform_int_distribution >( params, options );
+            case csv::format::float_t: return run_impl< float, std::uniform_real_distribution >( params, options );
+            case csv::format::double_t: return run_impl< double, std::uniform_real_distribution >( params, options );
             default: std::cerr << "csv-random make: uniform distribution: expected type; got: '" << format.string() << "'" << std::endl; return 1;
         }
     }
     if( distribution == "gaussian" || distribution == "normal" )
     {
-        std::cerr << "csv-random make: normal: implementing..." << std::endl; return 1;
+        if( params.size() != 1 && params.size() != 3 ) { std::cerr << "csv-random make: gaussian: expected gaussian[,<mean>,<sigma>]; got: \"" << options.value< std::string >( "--distribution" ) << "\"" << std::endl; return 1; }
         switch( format.offset( 0 ).type )
         {
-            case csv::format::float_t: return run_impl< float, std::normal_distribution >( options );
-            case csv::format::double_t: return run_impl< double, std::normal_distribution >( options );
+            case csv::format::float_t: return run_impl< float, std::normal_distribution >( params, options );
+            case csv::format::double_t: return run_impl< double, std::normal_distribution >( params, options );
             default: std::cerr << "csv-random make: normal distribution: expected floating point --type; got unsupported type: '" << format.string() << "'" << std::endl; return 1;
         }
     }

From 052cc4f5a99f839709055e669a950be68e0d00cc Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 18 Aug 2022 11:47:40 +1000
Subject: [PATCH 0530/1056] csv-random: --range plugged in

---
 csv/applications/csv-random.cpp | 23 ++++++++++++++++-------
 1 file changed, 16 insertions(+), 7 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index b69045527..e5189572d 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -38,7 +38,7 @@ static void usage( bool verbose )
     std::cerr << "                normal: alias for gaussian" << std::endl;
     std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
     std::cerr << "            --output-binary; output random numbers as binary, or specify --binary=<format> for stdin input" << std::endl;
-    std::cerr << "            --range=[<min>,<max>]; desired value range, default: whatever stl defines (usually numeric limits)" << std::endl;
+    std::cerr << "            --range=[<min>,<max>]; desired value range: attention! currently, will pick value until gets something in range" << std::endl;
     std::cerr << "            --type=<type>; default=ui; supported values: b, ub, w, uw, i, ui, l, ul, f, d; can have more than one <type> i.e. 3ui" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    true-random: output non-deterministic uniformly distributed unsigned int random numbers (if non-deterministic source is not available" << std::endl;
@@ -122,6 +122,15 @@ template < typename T, template < typename > class Distribution, typename Engine
 static int run_impl( Distribution< T >& distribution, bool append, bool binary, std::size_t count, const boost::optional< std::pair< T, T > >& range )
 {
     Engine engine = ::seed ? Engine( *::seed ) : Engine();
+    auto _pick = [&]() -> T
+    {
+        if( !range ) { return distribution( engine ); }
+        while( true ) // todo? parametrise? while( true ) is quite cruel
+        {
+            T r = distribution( engine );
+            if( r >= range->first && r <= range->second ) { return r; }
+        }
+    };
     if( !::csv.flush ) { std::cin.tie( nullptr ); }
     if( append )
     {
@@ -136,7 +145,7 @@ static int run_impl( Distribution< T >& distribution, bool append, bool binary,
                 std::cout.write( &buf[0], buf.size() );
                 for( std::size_t i = 0; i < count; ++i )
                 {
-                    T r = distribution( engine );
+                    T r = _pick();
                     std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
                 }
                 if( ::csv.flush ) { std::cout.flush(); }
@@ -149,7 +158,7 @@ static int run_impl( Distribution< T >& distribution, bool append, bool binary,
             std::getline( std::cin, s );
             if( s.empty() ) { continue; }
             std::cout << s;
-            for( std::size_t i = 0; i < count; ++i ) { std::cout << ::csv.delimiter << type_traits< T >::cast( distribution( engine ) ); }
+            for( std::size_t i = 0; i < count; ++i ) { std::cout << ::csv.delimiter << type_traits< T >::cast( _pick() ); }
             std::cout << std::endl;
             if( ::csv.flush ) { std::cout.flush(); }
         }
@@ -161,7 +170,7 @@ static int run_impl( Distribution< T >& distribution, bool append, bool binary,
         {
             for( std::size_t i = 0; i < count; ++i )
             {
-                T r = distribution( engine );
+                T r = _pick();
                 std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
             }
             if( ::csv.flush ) { std::cout.flush(); }
@@ -173,7 +182,7 @@ static int run_impl( Distribution< T >& distribution, bool append, bool binary,
         std::string comma;
         for( std::size_t i = 0; i < count; ++i )
         {
-            std::cout << comma << type_traits< T >::cast( distribution( engine ) );
+            std::cout << comma << type_traits< T >::cast( _pick() );
             comma = ::csv.delimiter;
         }
         std::cout << std::endl;
@@ -214,7 +223,7 @@ static int run_impl( const std::vector< std::string >& params, const comma::comm
     const auto& engine = options.value< std::string >( "--engine", "mt19937_64" );
     const auto& count = comma::csv::format( options.value< std::string >( "--type", "ui" ) ).count();
     boost::optional< std::pair< T, T > > range;
-    if( options.exists( "--range" ) ) { range = comma::csv::ascii< std::pair< T, T > >().get( options.value< std::string >( "--range" ) ); }
+    if( options.exists( "--range" ) && params[0] != "uniform" ) { range = comma::csv::ascii< std::pair< T, T > >().get( options.value< std::string >( "--range" ) ); } // quick and dirty
     Distribution< T > distribution = make_distribution< T, Distribution >( params );
     if( engine == "minstd_rand0" ) { return run_impl< T, Distribution, std::minstd_rand0 >( distribution, append, binary, count, range ); }
     if( engine == "minstd_rand" ) { return run_impl< T, Distribution, std::minstd_rand >( distribution, append, binary, count, range ); }
@@ -262,7 +271,7 @@ static int run( const comma::command_line_options& options ) // quick and dirty
     }
     if( distribution == "gaussian" || distribution == "normal" )
     {
-        if( params.size() != 1 && params.size() != 3 ) { std::cerr << "csv-random make: gaussian: expected gaussian[,<mean>,<sigma>]; got: \"" << options.value< std::string >( "--distribution" ) << "\"" << std::endl; return 1; }
+        if( params.size() != 1 && params.size() != 3 ) { std::cerr << "csv-random make: gaussian: expected gaussian[,<mean>,<stddev>]; got: \"" << options.value< std::string >( "--distribution" ) << "\"" << std::endl; return 1; }
         switch( format.offset( 0 ).type )
         {
             case csv::format::float_t: return run_impl< float, std::normal_distribution >( params, options );

From e9bfb1e20a2b3403ec83f1db01ce46a5a5a0f2b1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 Aug 2022 10:37:45 +1000
Subject: [PATCH 0531/1056] name-value-to-csv: quoting bug fixed, basic tests
 added

---
 name_value/applications/name-value-to-csv.cpp | 21 +++++++++----------
 .../test/name-value-to-csv/basic/expected     |  9 ++++++++
 name_value/test/name-value-to-csv/basic/input |  3 +++
 3 files changed, 22 insertions(+), 11 deletions(-)

diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index 32be635df..19ebb77db 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -89,9 +89,6 @@ static std::string join( const std::vector< std::string >& fields, values_t& val
     return oss.str();
 }
 
-static bool unquote;
-static std::string _unquoted( const std::string s ) { return unquote && s.size() >= 2 ? comma::strip( s, "\"" ) : s; }
-
 int main( int ac, char** av )
 {
     try
@@ -113,7 +110,7 @@ int main( int ac, char** av )
         if( fields[0].empty() && unindexed_fields.empty() ) { std::cerr << "name-value-to-csv: please specify --fields or --unindexed-fields" << std::endl; return 1; }
         bool unindexed = fields[0].empty();
         values_t unindexed_values;
-        unquote = options.exists( "--unquote" );
+        bool unquote = options.exists( "--unquote" );
         bool unsorted = options.exists( "--unsorted" );
         char delimiter = options.value( "--delimiter,-d", ',' );
         char equal_sign = options.value( "--equal-sign,-e", '=' );
@@ -124,25 +121,27 @@ int main( int ac, char** av )
         std::string key;
         bool is_map = options.exists( "--dict,--map" );
         if( is_map && unsorted ) { comma::say() << "combination of --map and --unsorted: todo, just ask" << std::endl; return 1; }
+        std::string::size_type e = std::string::npos;
+        auto value = [&]( const std::string& s ) { const std::string& t = s.substr( e + 1 ); return unquote && t.size() >= 2 ? comma::strip( t, "\"" ) : t; };
         while( std::cin.good() && !std::cin.eof() )
         {
             std::string s;
             std::getline( std::cin, s );
             if( comma::strip( s, " \t" ).empty() || comma::strip( s, " \t" )[0] == '#' ) { continue; }
-            auto e = s.find_first_of( equal_sign ); // todo: use boost::spirit
+            e = s.find_first_of( equal_sign ); // todo: use boost::spirit
             if( e == std::string::npos ) { std::cerr << "name-value-to-csv: expected path-value pair; got: '" << s << "'" << std::endl; return 1; }
             std::string name = s.substr( 0, e );
             if( unindexed_fields_set.find( name ) != unindexed_fields_set.end() )
             {
-                unindexed_values[name] = s.substr( e + 1 );
+                unindexed_values[name] = value( s );
                 if( unindexed_stream ) { std::cout << join( unindexed_fields, unindexed_values, delimiter, !unindexed_stream_update ) << std::endl; }
                 continue;
             }
             if( name.substr( 0, prefix.size() ) != prefix ) { continue; }
             if( unindexed )
             {
-                if( prefix.empty() ) { values[name] = _unquoted( s.substr( e + 1 ) ); }
-                else if( name[ prefix.size() ] == '/' ) { values[ name.substr( prefix.size() + 1 ) ] = _unquoted( s.substr( e + 1 ) ); }
+                if( prefix.empty() ) { values[name] = value( s ); }
+                else if( name[ prefix.size() ] == '/' ) { values[ name.substr( prefix.size() + 1 ) ] = value( s ); }
                 continue;
             }
             if( is_map )
@@ -153,7 +152,7 @@ int main( int ac, char** av )
                 std::string current_key = name.substr( prefix.size() + 1, b - prefix.size() - 1 );
                 if( unsorted ) {} // todo
                 if( !key.empty() && current_key != key ) { std::cout << key << delimiter << join( fields, values, delimiter ) << std::endl; }
-                values[name.substr( b + 1 )] = _unquoted( s.substr( e + 1 ) );
+                values[name.substr( b + 1 )] = value( s );
                 key = current_key;
             }
             else
@@ -163,10 +162,10 @@ int main( int ac, char** av )
                 if( b == std::string::npos ) { std::cerr << "name-value-to-csv: with prefix \"" << prefix << "\" expected path-value pair with valid indices; got: '" << s << "'" << std::endl; return 1; }
                 if( s[ b + 1 ] != '/' ) { continue; }
                 unsigned int current_index = boost::lexical_cast< unsigned int >( name.substr( prefix.size() + 1, b - prefix.size() - 1 ) );
-                if( unsorted || !unindexed_fields.empty() ) { map[current_index][name.substr( b + 2 )] = s.substr( e + 1 ); continue; }
+                if( unsorted || !unindexed_fields.empty() ) { map[current_index][name.substr( b + 2 )] = value( s ); continue; }
                 if( index && current_index < *index ) { std::cerr << "name-value-to-csv: expected sorted index, got index " << current_index << " after " << *index << " in line: '" << comma::strip( s ) << "'" << std::endl; return 1; }
                 if( index && current_index > *index ) { std::cout << join( fields, values, delimiter ) << std::endl; }
-                values[name.substr( b + 2 )] = _unquoted( s.substr( e + 1 ) );
+                values[name.substr( b + 2 )] = value( s );
                 index = current_index;
             }
         }
diff --git a/name_value/test/name-value-to-csv/basic/expected b/name_value/test/name-value-to-csv/basic/expected
index 8491ee5b1..0f2b23313 100644
--- a/name_value/test/name-value-to-csv/basic/expected
+++ b/name_value/test/name-value-to-csv/basic/expected
@@ -7,3 +7,12 @@ unquote[0]/status=0
 unquote[1]/output/line[0]="a,1"
 unquote[1]/output/line[1]="b,2"
 unquote[1]/status=0
+unquote[2]/output/line[0]="\"a\",1"
+unquote[2]/output/line[1]="\"b\",2"
+unquote[2]/status=0
+unquote[3]/output/line[0]="\"a\",1,3,z"
+unquote[3]/output/line[1]="\"b\",2,3,z"
+unquote[3]/status=0
+unquote[4]/output/line[0]="a,1,3,z"
+unquote[4]/output/line[1]="b,2,3,z"
+unquote[4]/status=0
diff --git a/name_value/test/name-value-to-csv/basic/input b/name_value/test/name-value-to-csv/basic/input
index a50ad6f2c..6a89da8fb 100644
--- a/name_value/test/name-value-to-csv/basic/input
+++ b/name_value/test/name-value-to-csv/basic/input
@@ -1,3 +1,6 @@
 basics[0]="( echo [0]/name=a; echo [0]/value=1; echo [1]/name=b; echo [1]/value=2 ) | name-value-to-csv --fields name,value"
 unquote[0]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2 ) | name-value-to-csv --fields name,value"
 unquote[1]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2 ) | name-value-to-csv --fields name,value --unquote"
+unquote[2]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2; echo c=3 ) | name-value-to-csv --fields name,value"
+unquote[3]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2; echo c=3; echo d="z" ) | name-value-to-csv --fields name,value --unindexed-fields c,d"
+unquote[4]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2; echo c=3; echo d="z" ) | name-value-to-csv --fields name,value --unindexed-fields c,d --unquote"

From af5f59d52b56e50b266cb3144962ead85f9ae980 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 Aug 2022 11:24:54 +1000
Subject: [PATCH 0532/1056] csv-thin: minor brush-up

---
 csv/applications/csv-thin.cpp | 46 +++++++----------------------------
 1 file changed, 9 insertions(+), 37 deletions(-)

diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index a71e24183..aee6464ee 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -165,14 +138,13 @@ int main( int ac, char** av )
         deterministic = options.exists( "--deterministic,-d" );
         invert = options.exists( "--invert,-i" );
         seed = options.optional< comma::uint32 >( "--seed" );
-        if( options.exists( "--period" )) { period = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--period" ) * 1000000 )); }
+        if( options.exists( "--period" )) { period = boost::posix_time::microseconds( static_cast< unsigned int >( options.value< double >( "--period" ) * 1000000 ) ); }
         #ifdef WIN32
         if( binary ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
-
         if( options.exists( "--fields" ))
         {
-            if( !period ) { COMMA_THROW( comma::exception, "--fields requires --period option" ); }
+            if( !period ) { comma::say() << "--fields requires --period option" << std::endl; }
             comma::csv::input_stream< timestamped > istream( std::cin, comma::csv::options( options ) );
             while( std::cin.good() && !std::cin.eof() )
             {
@@ -192,9 +164,9 @@ int main( int ac, char** av )
         if( !period )
         {
             v = options.unnamed( "--deterministic,-d", "-.*" );
-            if( v.empty() ) { std::cerr << "csv-thin: please specify rate" << std::endl; usage(); }
+            if( v.empty() ) { comma::say() << "please specify rate" << std::endl; usage(); }
             rate = boost::lexical_cast< double >( v[0] );
-            if( comma::math::less( rate, 0 ) || comma::math::less( 1, rate ) ) { std::cerr << "csv-thin: expected rate between 0 and 1, got " << rate << std::endl; usage(); }
+            if( comma::math::less( rate, 0 ) || comma::math::less( 1, rate ) ) { comma::say() << "expected rate between 0 and 1, got " << rate << std::endl; usage(); }
         }
         if( binary ) // quick and dirty, improve performance by reading larger buffer
         {
@@ -203,7 +175,7 @@ int main( int ac, char** av )
             boost::optional< comma::csv::format > f;
             if( !format_string.empty() ) { f.reset( comma::csv::format( format_string ) ); }
             if( !size ) { size = f->size(); }
-            if( f && f->size() != size ) { std::cerr << "csv-thin: expected consistent size, got --size " << size << " and --binary of size " << f->size() << std::endl; return 1; }
+            if( f && f->size() != size ) { comma::say() << "expected consistent size, got --size " << size << " and --binary of size " << f->size() << std::endl; return 1; }
             unsigned int factor = 65536 / size; // arbitrary
             if( factor == 0 ) { factor = 1; }
             std::vector< char > buf( size * factor );
@@ -217,7 +189,7 @@ int main( int ac, char** av )
                 //std::size_t e = available < int( size ) ? size : available - available % size;
                 std::cin.read( &buf[0], size ); // quick and dirty
                 if( std::cin.gcount() <= 0 ) { break; }
-                if( std::cin.gcount() < int( size ) ) { std::cerr << "csv-thin: expected " << size << " bytes; got only " << std::cin.gcount() << std::endl; return 1; }
+                if( std::cin.gcount() < int( size ) ) { comma::say() << "expected " << size << " bytes; got only " << std::cin.gcount() << std::endl; return 1; }
                 if( keep() ) { std::cout.write( &buf[0], size ); std::cout.flush(); }
             }
             #else
@@ -229,7 +201,7 @@ int main( int ac, char** av )
                 int count = ::read( comma::io::stdin_fd, cur + offset, capacity );
                 if( count <= 0 )
                 {
-                    if( offset != 0 ) { std::cerr << "csv-thin: expected at least " << size << " bytes, got only " << offset << std::endl; return 1; }
+                    if( offset != 0 ) { comma::say() << "expected at least " << size << " bytes, got only " << offset << std::endl; return 1; }
                     break;
                 }
                 offset += count;
@@ -254,7 +226,7 @@ int main( int ac, char** av )
         }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << "csv-thin: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-thin: unknown exception" << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }

From a380ee8ad59989be68c00e5a4643ee40466b1387 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 Aug 2022 11:26:28 +1000
Subject: [PATCH 0533/1056] csv-thin: exit on error: verbose output improved

---
 csv/applications/csv-thin.cpp | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index aee6464ee..238a5c506 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -54,7 +54,7 @@ static void usage( bool verbose = false )
     std::cerr << "    using timestamp from input:  cat full.csv | csv-thin --period 2 --fields t" << std::endl;
     std::cerr << "    binary data:                 cat full.bin | csv-thin 0.1 --binary 3d" << std::endl;
     std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 static double rate;
@@ -164,9 +164,9 @@ int main( int ac, char** av )
         if( !period )
         {
             v = options.unnamed( "--deterministic,-d", "-.*" );
-            if( v.empty() ) { comma::say() << "please specify rate" << std::endl; usage(); }
+            if( v.empty() ) { comma::say() << "please specify rate" << std::endl; return 1; }
             rate = boost::lexical_cast< double >( v[0] );
-            if( comma::math::less( rate, 0 ) || comma::math::less( 1, rate ) ) { comma::say() << "expected rate between 0 and 1, got " << rate << std::endl; usage(); }
+            if( comma::math::less( rate, 0 ) || comma::math::less( 1, rate ) ) { comma::say() << "expected rate between 0 and 1, got " << rate << std::endl; return 1; }
         }
         if( binary ) // quick and dirty, improve performance by reading larger buffer
         {

From 64a03310426576dc7ba09a1873f0e791da4f25c4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Sep 2022 12:54:53 +1000
Subject: [PATCH 0534/1056] comma-timeout-group: --help: typo fixed

---
 io/load.h                                 | 43 +++++++++++++++++
 util/applications/comma-timeout-group.cpp | 59 ++++++-----------------
 2 files changed, 58 insertions(+), 44 deletions(-)
 create mode 100644 io/load.h

diff --git a/io/load.h b/io/load.h
new file mode 100644
index 000000000..fe05fb204
--- /dev/null
+++ b/io/load.h
@@ -0,0 +1,43 @@
+// Copyright (c) 2022 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <fstream>
+#include <string>
+#include <vector>
+#include <boost/filesystem.hpp>
+#include "../base/exception.h"
+
+namespace comma { namespace io {
+
+/// convenience function to load a vector-like contiguous container from file
+template < typename T, template < typename S > class A = std::vector >
+A< T >& load_array( A< T >& a, const std::string& path );
+    
+/// convenience function to load a vector-like contiguous container from file
+/// @note allocates and returns the container, thus it is up to the user to use move semantics
+template < typename T, template < typename S > class A = std::vector >
+A< T > load_array( const std::string& path );
+
+
+template < typename T, template < typename S > class A >
+inline A< T >& load_array( A< T >& a, const std::string& path )
+{
+    std::ifstream ifs( path );
+    if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << path << "\"" ); }
+    a.resize( boost::filesystem::file_size( path ) / sizeof( T ) );
+    auto r = ifs.read( reinterpret_cast< char * >( &a[0] ), a.size() * sizeof( T ) );
+    if( r != a.size() * sizeof( T ) ) { COMMA_THROW( comma::exception, "expected to read " << a.size() * sizeof( T ) << " bytes (" << a.size() << " elements " << sizeof( T ) << " byte(s) each) from \"" << path << "\"; got: " << r << " byte(s)" ); }
+    return a;
+}
+
+template < typename T, template < typename S > class A >
+inline A< T > load_array( const std::string& path )
+{
+    A< T > a;
+    return load_array( a, path );
+}
+    
+} } // namespace comma { namespace io {
diff --git a/util/applications/comma-timeout-group.cpp b/util/applications/comma-timeout-group.cpp
index 5ab4eceed..9e514e4b8 100644
--- a/util/applications/comma-timeout-group.cpp
+++ b/util/applications/comma-timeout-group.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author dmitry mikhin
 
@@ -179,29 +151,28 @@ void usage( bool )
         "\n        -or-"
         "\n        comma-timeout-group --wait-for-process-group=5 --enforce-group 10 cmd"
         "\n            as above, but if comma-timeout-group is built without procps support"
-        "\n            exit with error"
-        "\n"
-        "\n";
+        "\n            exit with error";
+    std::cerr << msg_general << std::endl;
     exit( 0 );
 }
 
 // many values are used in the signal handler, no way to pass via arguments, hence, global
 // the rest just moved here to keep all in one place
-sig_atomic_t timed_out = 0;
-int signal_to_use = SIGTERM;  // same default as kill and timeout commands
-int child_pid = 0;
-bool verbose = false;
-bool verbose_signal_handler = false;
-bool report_timeout = false;
-bool preserve_status = false;
-double timeout = 0.0;
-double kill_after = 0.0;
+static sig_atomic_t timed_out = 0;
+static int signal_to_use = SIGTERM;  // same default as kill and timeout commands
+static int child_pid = 0;
+static bool verbose = false;
+static bool verbose_signal_handler = false;
+static bool report_timeout = false;
+static bool preserve_status = false;
+static double timeout = 0.0;
+static double kill_after = 0.0;
 #ifdef HAVE_PROCPS_DEV
-bool wait_for_process_group = false;
-const bool can_wait_for_process_group = true;
-unsigned int wait_for_process_group_delay = 100000;
+static bool wait_for_process_group = false;
+static const bool can_wait_for_process_group = true;
+static unsigned int wait_for_process_group_delay = 100000;
 #else
-const bool can_wait_for_process_group = false;
+static const bool can_wait_for_process_group = false;
 #endif
 
 double seconds_from_string( const std::string& s, bool allow_forever = false )

From 2e130512d5190d88074a6243c4b753cb080540b6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Sep 2022 12:55:14 +1000
Subject: [PATCH 0535/1056] io::load_array() implemented

---
 io/load.h               |  2 +-
 io/test/stream_test.cpp | 32 +++-----------------------------
 2 files changed, 4 insertions(+), 30 deletions(-)

diff --git a/io/load.h b/io/load.h
index fe05fb204..8691b3159 100644
--- a/io/load.h
+++ b/io/load.h
@@ -27,7 +27,7 @@ inline A< T >& load_array( A< T >& a, const std::string& path )
 {
     std::ifstream ifs( path );
     if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << path << "\"" ); }
-    a.resize( boost::filesystem::file_size( path ) / sizeof( T ) );
+    a.resize( boost::filesystem::file_size( path ) / sizeof( T ) ); // todo? will file_size work on symlinks?
     auto r = ifs.read( reinterpret_cast< char * >( &a[0] ), a.size() * sizeof( T ) );
     if( r != a.size() * sizeof( T ) ) { COMMA_THROW( comma::exception, "expected to read " << a.size() * sizeof( T ) << " bytes (" << a.size() << " elements " << sizeof( T ) << " byte(s) each) from \"" << path << "\"; got: " << r << " byte(s)" ); }
     return a;
diff --git a/io/test/stream_test.cpp b/io/test/stream_test.cpp
index 27133a78b..4fdab8db1 100644
--- a/io/test/stream_test.cpp
+++ b/io/test/stream_test.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <cstdio>
 #include <fstream>
@@ -34,6 +7,7 @@
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
 #include <boost/filesystem/operations.hpp>
+#include "../load.h" // just to make sure it compiles
 #include "../select.h"
 #include "../stream.h"
 
@@ -54,14 +28,14 @@ TEST( io, file_stream )
         boost::filesystem::remove( "./test.file" );
     }
     // todo: more testing?
-    system( "mkfifo test.pipe" );
+    EXPECT_EQ( system( "mkfifo test.pipe" ), 0 );
     EXPECT_TRUE( boost::filesystem::exists( "./test.pipe" ) );
     EXPECT_TRUE( !boost::filesystem::is_regular_file( "./test.pipe" ) );
     EXPECT_TRUE( ::open( "./test.pipe", O_RDONLY | O_NONBLOCK ) > 0 );
     comma::io::ostream os( "./test.pipe" );
     EXPECT_TRUE( os() != NULL );
     EXPECT_TRUE( os->good() );
-    system( "rm ./test.pipe" );
+    EXPECT_EQ( system( "rm ./test.pipe" ), 0 );
 }
 
 TEST( io, std_stream )

From 0b70b375e1449d9eb1b2df640d8eaf3d4bf4fdcf Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Sep 2022 13:56:31 +1000
Subject: [PATCH 0536/1056] io::load_array(): fixed

---
 io/load.h | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/io/load.h b/io/load.h
index 8691b3159..fd3f22af5 100644
--- a/io/load.h
+++ b/io/load.h
@@ -13,17 +13,17 @@
 namespace comma { namespace io {
 
 /// convenience function to load a vector-like contiguous container from file
-template < typename T, template < typename S > class A = std::vector >
-A< T >& load_array( A< T >& a, const std::string& path );
+template < typename T, template < typename S, typename A > class C = std::vector, typename A = std::allocator< T > >
+C< T, A >& load_array( C< T, A >& a, const std::string& path );
     
 /// convenience function to load a vector-like contiguous container from file
 /// @note allocates and returns the container, thus it is up to the user to use move semantics
-template < typename T, template < typename S > class A = std::vector >
-A< T > load_array( const std::string& path );
+template < typename T, template < typename S, typename A > class C = std::vector, typename A = std::allocator< T > >
+C< T, A > load_array( const std::string& path );
 
 
-template < typename T, template < typename S > class A >
-inline A< T >& load_array( A< T >& a, const std::string& path )
+template < typename T, template < typename S, typename A > class C = std::vector, typename A >
+inline C< T, A >& load_array( C< T, A >& a, const std::string& path )
 {
     std::ifstream ifs( path );
     if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << path << "\"" ); }
@@ -33,10 +33,10 @@ inline A< T >& load_array( A< T >& a, const std::string& path )
     return a;
 }
 
-template < typename T, template < typename S > class A >
-inline A< T > load_array( const std::string& path )
+template < typename T, template < typename S, typename A > class C = std::vector, typename A >
+inline C< T, A > load_array( const std::string& path )
 {
-    A< T > a;
+    C< T, A > a;
     return load_array( a, path );
 }
     

From 3f34df818604b442a3499edd182ebef511230c7a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Sep 2022 13:58:48 +1000
Subject: [PATCH 0537/1056] io::load_array(): gcount fixed

---
 io/load.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/io/load.h b/io/load.h
index fd3f22af5..35ee617fc 100644
--- a/io/load.h
+++ b/io/load.h
@@ -28,8 +28,8 @@ inline C< T, A >& load_array( C< T, A >& a, const std::string& path )
     std::ifstream ifs( path );
     if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << path << "\"" ); }
     a.resize( boost::filesystem::file_size( path ) / sizeof( T ) ); // todo? will file_size work on symlinks?
-    auto r = ifs.read( reinterpret_cast< char * >( &a[0] ), a.size() * sizeof( T ) );
-    if( r != a.size() * sizeof( T ) ) { COMMA_THROW( comma::exception, "expected to read " << a.size() * sizeof( T ) << " bytes (" << a.size() << " elements " << sizeof( T ) << " byte(s) each) from \"" << path << "\"; got: " << r << " byte(s)" ); }
+    ifs.read( reinterpret_cast< char * >( &a[0] ), a.size() * sizeof( T ) );
+    if( ifs.gcount() != int( a.size() * sizeof( T ) ) ) { COMMA_THROW( comma::exception, "expected to read " << a.size() * sizeof( T ) << " bytes (" << a.size() << " elements " << sizeof( T ) << " byte(s) each) from \"" << path << "\"; got: " << ifs.gcount() << " byte(s)" ); }
     return a;
 }
 

From 0436a7b528c31bb5b16374e18d6f289f486fb3a4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 13 Oct 2022 13:23:03 +1100
Subject: [PATCH 0538/1056] io-console: --help: exit with success; restoring
 terminal: made exception-safe

---
 io/applications/io-console.cpp | 65 ++++++++++++----------------------
 1 file changed, 22 insertions(+), 43 deletions(-)

diff --git a/io/applications/io-console.cpp b/io/applications/io-console.cpp
index fc12de231..6076306e1 100644
--- a/io/applications/io-console.cpp
+++ b/io/applications/io-console.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <termios.h>
 #include <iostream>
@@ -34,6 +7,23 @@
 #include "../../application/signal_flag.h"
 #include "../select.h"
 
+class no_echo_term
+{
+    public:
+        no_echo_term()
+        {
+            ::tcgetattr( STDIN_FILENO, &_old );
+            termios t = _old;
+            t.c_lflag &= ~( ICANON | ECHO );
+            ::tcsetattr( STDIN_FILENO, TCSANOW, &t );
+        }
+
+        ~no_echo_term() { ::tcsetattr( STDIN_FILENO, TCSANOW, &_old ); }
+
+    private:
+        struct termios _old;
+};
+
 int main( int argc, char** argv )
 {
     try
@@ -44,22 +34,20 @@ int main( int argc, char** argv )
             ( "help,h", "display help message" )
             ( "heartbeat,b", "output byte with value 0x00 when key pressed" )
             ( "period,t", boost::program_options::value< double >( &period )->default_value( 0.1, "0.1" ), "period in seconds between heartbeats" );
-
         boost::program_options::variables_map vm;
         boost::program_options::store( boost::program_options::parse_command_line( argc, argv, description), vm );
         boost::program_options::notify( vm );
-
         if ( vm.count( "help" ) )
         {
+            std::cerr << std::endl;
             std::cerr << "take key presses, output key numeric values to stdout" << std::endl;
             std::cerr << "usage: io-console [<options>]" << std::endl;
             std::cerr << description << std::endl;
-            return 1;
+            std::cerr << std::endl;
+            return 0;
         }
-
         boost::scoped_ptr< comma::io::select > select;
-        unsigned int seconds = 0;
-        unsigned int nanoseconds = 0;
+        unsigned int seconds{0}, nanoseconds{0};
         if ( vm.count( "heartbeat" ) )
         {
             select.reset( new comma::io::select() );
@@ -67,15 +55,7 @@ int main( int argc, char** argv )
             seconds = std::floor( period );
             nanoseconds = std::floor( double( seconds == 0 ? period : std::fmod( period, seconds ) ) * 1e9 );
         }
-        
-        // remove echo from the console
-        struct termios oldTerm;
-        struct termios newTerm;
-        ::tcgetattr( STDIN_FILENO, &oldTerm );
-        newTerm = oldTerm;
-        newTerm.c_lflag &= ~( ICANON | ECHO );
-        ::tcsetattr( STDIN_FILENO, TCSANOW, &newTerm );
-        
+        no_echo_term t;
         comma::signal_flag signal;
         while( !signal && std::cout.good() && !std::cout.bad() )
         {
@@ -88,7 +68,6 @@ int main( int argc, char** argv )
             std::cout.write( &c, 1 );
             std::cout.flush();
         }
-        ::tcsetattr( STDIN_FILENO, TCSANOW, &oldTerm ); // restore the console
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << argv[0] << ": " << ex.what() << std::endl; }

From 52c39e7e0297e146be9ac8e6303878db92bd83ee Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 2 Nov 2022 11:44:28 +1100
Subject: [PATCH 0539/1056] comma-test-run: allow process substitution for
 white and black lists

---
 util/applications/comma-test-run | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 2dcc5b32d..0021178c1 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -254,6 +254,9 @@ ${brown}White(and black)-listing tests${none}
         comma-test-run --white-list=white.list
     Do not remove leading dots or append input file names or anything similar.
 
+    This can also be done with an on-the-fly generated file:
+        comma-test-run --black-list <( echo ./exclude-me )
+
 ${brown}White(and black)-listing pro hint${none}
     Assume some tests failed:
         comma-test-run > comma-test-run.log 2>&1 ; echo \$?
@@ -1063,11 +1066,11 @@ function apply_white_black_list() { apply_white_list | apply_black_list ; }
 # if "test" is absent, use the "test" in the closest parent directory
 function test_directories()
 {
-    if [[ -n "$options_white_list" && -f "$options_white_list" ]]; then
+    if [[ -n "$options_white_list" && -e "$options_white_list" ]]; then
         message_ "$name: applying white list from file '$options_white_list'"
         options_white_list="^(\./)?($( sed 's#\./##' <$options_white_list | grep -v ^# | grep -v ^$ | tr \\n '|' | sed 's/|$//'  ))";
     fi
-    if [[ -n "$options_black_list" && -f "$options_black_list" ]]; then
+    if [[ -n "$options_black_list" && -e "$options_black_list" ]]; then
         message_ "$name: applying black list from file '$options_black_list'"
         options_black_list="^(\./)?($( sed 's#\./##' <$options_black_list | grep -v ^# | grep -v ^$ | tr \\n '|' | sed 's/|$//' ))";
     fi

From 52cda98774622ef04fe10ad2a9a44bfed02657a4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 7 Nov 2022 11:36:59 +1100
Subject: [PATCH 0540/1056] csv::options::make_output_options() convenience
 method implemented

---
 csv/options.h | 13 +++++++++++++
 1 file changed, 13 insertions(+)

diff --git a/csv/options.h b/csv/options.h
index d813587f8..66ce870cf 100644
--- a/csv/options.h
+++ b/csv/options.h
@@ -23,6 +23,10 @@ class options
         /// constructor
         options( const comma::command_line_options& options, const std::string& defaultFields = "", bool full_xpath = true );
 
+        /// convenience method: make output options from input options (propagate binary setting, flush); todo? add more parameters?
+        template < typename T >
+        static options make_output_options( const options& input_options );
+
         /// return usage to incorporate into application usage
         static std::string usage( const std::string& default_fields = "", bool verbose = true );
 
@@ -91,4 +95,13 @@ class options
         boost::optional< csv::format > format_;
 };
 
+template < typename T >
+inline options make_output_options( const options& input_options )
+{
+    options o;
+    o.flush = input_options.flush;
+    if( input_options.binary() ) { o.format( format::value< T >() ); }
+    return o;
+}
+
 } } // namespace comma { namespace csv {

From 22aa01adf8a3195f3cac23e03908675905eb63a6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 7 Nov 2022 11:43:54 +1100
Subject: [PATCH 0541/1056] csv::options::make_output_options(): typo fixed

---
 csv/options.h | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/csv/options.h b/csv/options.h
index 66ce870cf..a94c95ecf 100644
--- a/csv/options.h
+++ b/csv/options.h
@@ -10,6 +10,12 @@
 
 namespace comma { namespace csv {
 
+class options;
+
+/// convenience method: make output options from input options (propagate binary setting, flush); todo? add more parameters?
+template < typename T >
+static options make_output_options( const options& input_options );
+
 /// a helper class to extract csv-related command line options
 class options
 {
@@ -23,10 +29,6 @@ class options
         /// constructor
         options( const comma::command_line_options& options, const std::string& defaultFields = "", bool full_xpath = true );
 
-        /// convenience method: make output options from input options (propagate binary setting, flush); todo? add more parameters?
-        template < typename T >
-        static options make_output_options( const options& input_options );
-
         /// return usage to incorporate into application usage
         static std::string usage( const std::string& default_fields = "", bool verbose = true );
 

From 73ebd2fb430e5e1080e4ea06d78cfc4a16570bea Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 13 Nov 2022 00:36:00 +1100
Subject: [PATCH 0542/1056] name_value: fixing array handling in ptree visitors

---
 name_value/impl/to_name_value.h | 105 ++++++--------------------------
 name_value/ptree.h              | 105 ++++++++------------------------
 2 files changed, 42 insertions(+), 168 deletions(-)

diff --git a/name_value/impl/to_name_value.h b/name_value/impl/to_name_value.h
index d57c6c2e6..653a2a42c 100644
--- a/name_value/impl/to_name_value.h
+++ b/name_value/impl/to_name_value.h
@@ -1,37 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2022 Vsevolod Vlaskine
 
+/// @authors cedric wohlleber, vsevolod vlaskine
 
-/// @author cedric wohlleber
-
-#ifndef COMMA_APPLICATION_TO_NAME_VALUE_H
-#define COMMA_APPLICATION_TO_NAME_VALUE_H
+#pragma once
 
 #include <map>
 #include <boost/lexical_cast.hpp>
@@ -53,41 +25,36 @@ class to_name_value
     /// constructor
     /// @param delimiter delimiter between name and value
     /// @param full_path_as_name use full path as name
-    to_name_value( char delimiter = '=', bool full_path_as_name = true ):
-        m_delimiter(delimiter), m_full_path_as_name(full_path_as_name){};
+    to_name_value( char delimiter = '=', bool full_path_as_name = true ): m_delimiter(delimiter), m_full_path_as_name( full_path_as_name ) {};
 
     /// apply
-    template < typename K, typename T > void apply( const K& name, const boost::optional< T >& value );
+    template < typename K, typename T > void apply( const K& name, const boost::optional< T >& value ) { if( value ) { apply( name, *value ); } }
     
     /// apply
-    template < typename K, typename T > void apply( const K& name, const boost::scoped_ptr< T >& value );
+    template < typename K, typename T > void apply( const K& name, const boost::scoped_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
     
     /// apply
-    template < typename K, typename T > void apply( const K& name, const boost::shared_ptr< T >& value );        
+    template < typename K, typename T > void apply( const K& name, const boost::shared_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
         
     /// apply
-    template < typename K, typename T >
-    void apply( const K& name, const T& value );
+    template < typename K, typename T > void apply( const K& name, const T& value );
 
     /// apply to non-leaf elements
-    template < typename K, typename T >
-    void apply_next( const K& name, const T& value );
+    template < typename K, typename T > void apply_next( const K& name, const T& value ) { comma::visiting::visit( name, value, *this ); }
 
     /// apply to leaf elements
-    template < typename K, typename T >
-    void apply_final( const K& name, const T& value );
+    template < typename K, typename T > void apply_final( const K& name, const T& value );
 
     /// return named values as strings
     const std::vector< std::string >& strings() const { return m_strings; }
 
 private:
-    template < typename T >
-        std::string as_string( T v )
-        {
-            std::ostringstream oss;
-            oss << v;
-            return oss.str();
-        }
+    template < typename T > std::string as_string( T v )
+    {
+        std::ostringstream oss;
+        oss << v;
+        return oss.str();
+    }
         
     char m_delimiter;
     bool m_full_path_as_name;
@@ -96,24 +63,6 @@ class to_name_value
      
 };
 
-template < typename K, typename T >
-inline void to_name_value::apply( const K& name, const boost::optional< T >& value )
-{
-    if( value ) { apply( name, *value ); }
-}
-
-template < typename K, typename T >
-inline void to_name_value::apply( const K& name, const boost::scoped_ptr< T >& value )
-{
-    if( value ) { apply( name, *value ); }
-}
-
-template < typename K, typename T >
-inline void to_name_value::apply( const K& name, const boost::shared_ptr< T >& value )
-{
-    if( value ) { apply( name, *value ); }
-}
-
 template < typename K, typename T >
 inline void to_name_value::apply( const K& name, const T& value )
 {
@@ -123,27 +72,7 @@ inline void to_name_value::apply( const K& name, const T& value )
     m_xpath = m_xpath.head();
 }
 
-
-
 template < typename K, typename T >
-inline void to_name_value::apply_next( const K& name, const T& value ) { comma::visiting::visit( name, value, *this ); }
-
-template < typename K, typename T >
-inline void to_name_value::apply_final( const K&, const T& value )
-{
-    std::string string;
-    if( m_full_path_as_name )
-    {
-        string += m_xpath.to_string();
-    }
-    else
-    {
-        string += m_xpath.elements.back().to_string();
-    }
-    string += m_delimiter + as_string( value );
-    m_strings.push_back( string );
-}
+inline void to_name_value::apply_final( const K&, const T& value ) { m_strings.push_back( std::string( m_full_path_as_name ? m_xpath.to_string() : m_xpath.elements.back().to_string() ) + m_delimiter + as_string( value ) ); }
 
 } } } // namespace comma { namespace name_value { namespace impl {
-
-#endif // COMMA_APPLICATION_TO_NAME_VALUE_H
diff --git a/name_value/ptree.h b/name_value/ptree.h
index aacb5a83e..2cacf281c 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -1,38 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-
-/// @author cedric wohlleber
-/// @author vsevolod vlaskine
-
-#ifndef COMMA_NAME_VALUE_PTREE_H_
-#define COMMA_NAME_VALUE_PTREE_H_
+// Copyright (c) 2022 Vsevolod Vlaskine
+
+/// @authors cedric wohlleber, vsevolod vlaskine
+
+#pragma once
 
 #include <iostream>
 #include <sstream>
@@ -125,30 +96,13 @@ struct property_tree // quick and dirty
             /// @param ptree: property tree for the structure to fill
             /// @param root: path to the root of the subtree to visit
             /// @param branch: path to the subtree to visit (i.e. other branches will be pruned)
-            from( const boost::property_tree::ptree& ptree )
-                : ptree_( ptree )
-                , cur_( ptree )
-                , permissive_( false )
-            {
-            }
-            from( const boost::property_tree::ptree& ptree, bool permissive )
-                : ptree_( ptree )
-                , cur_( ptree )
-                , permissive_( permissive )
-            {
-            }
-            from( const boost::property_tree::ptree& ptree, const char* root, bool permissive = false )
-                : ptree_( ptree )
-                , cur_( get_tree( ptree_, xpath( root ) ) )
-                , permissive_( permissive )
-            {
-            }
-            from( const boost::property_tree::ptree& ptree, const xpath& root, bool permissive = false )
-                : ptree_( ptree )
-                , cur_( get_tree( ptree_, root ) )
-                , permissive_( permissive )
-            {
-            }
+            from( const boost::property_tree::ptree& ptree ): ptree_( ptree ), cur_( ptree ), permissive_( false ) {}
+
+            from( const boost::property_tree::ptree& ptree, bool permissive ): ptree_( ptree ), cur_( ptree ), permissive_( permissive ) {}
+
+            from( const boost::property_tree::ptree& ptree, const char* root, bool permissive = false ): ptree_( ptree ), cur_( get_tree( ptree_, xpath( root ) ) ), permissive_( permissive ) {}
+
+            from( const boost::property_tree::ptree& ptree, const xpath& root, bool permissive = false ): ptree_( ptree ), cur_( get_tree( ptree_, root ) ), permissive_( permissive ) {}
 
             //ptree_visitor( const boost::property_tree::ptree& ptree, const xpath& root, const xpath& branch, bool permissive = false ) : ptree_( ptree ), cur_( &ptree ), path_( root ), branch_( branch ), permissive_( permissive ) {}
 
@@ -172,7 +126,7 @@ struct property_tree // quick and dirty
 
             /// apply to vector
             template < typename K, typename T, typename A >
-            void apply_next( const K& key, std::vector< T, A >& value )
+            void apply_next( const K& key, std::vector< T, A >& value ) // todo? std::array? boost::array?
             {
                 std::string name = boost::lexical_cast< std::string >( key );
                 boost::optional< const boost::property_tree::ptree& > t = cur_ && !name.empty() ? cur_->get_child_optional( name ) : cur_;
@@ -252,6 +206,7 @@ struct property_tree // quick and dirty
             const boost::property_tree::ptree& ptree_;
             boost::optional< const boost::property_tree::ptree& > cur_;
             const bool permissive_;
+
             void value_( const std::string& name, boost::optional< boost::posix_time::ptime >& v ) // quick and dirty, imlement traits instead
             {
                 if( !cur_ ) { return; }
@@ -259,6 +214,7 @@ struct property_tree // quick and dirty
                 if( !s ) { s = cur_->get_optional< std::string >( "<xmlattr>." + name ); }
                 if( s ) { v = boost::posix_time::from_iso_string( *s ); }
             }
+
             template < typename T > void value_( const std::string& name, boost::optional< T >& v )
             {
                 if( !cur_ ) { return; }
@@ -284,20 +240,16 @@ class to_ptree
         to_ptree( boost::property_tree::ptree& ptree, const char* root ) : ptree_( ptree ), path_( root ) {}
 
         /// apply_next on boost optional
-        template < typename K, typename T >
-        void apply_next( const K& name, const boost::optional< T >& value )
+        template < typename K, typename T > void apply_next( const K& name, const boost::optional< T >& value )
         {
-            if( value )
-            {
-                visiting::do_while<    !boost::is_fundamental< T >::value
-                                    && !boost::is_same< T, boost::posix_time::ptime >::value
-                                    && !boost::is_same< T, std::string >::value >::visit( name, *value, *this );
-            }
+            if( !value ) { return; }
+            visiting::do_while<    !boost::is_fundamental< T >::value
+                                && !boost::is_same< T, boost::posix_time::ptime >::value
+                                && !boost::is_same< T, std::string >::value >::visit( name, *value, *this );
         }
 
-        /// apply
-        template < typename K, typename T, typename A >
-        void apply( const K& name, const std::vector< T, A >& value )
+        /// apply to vector
+        template < typename K, typename T, typename A > void apply( const K& name, const std::vector< T, A >& value ) // do we even need it?
         {
             if( !( path_ <= branch_ ) ) { return; } // visit, only if on the branch
             append_( name );
@@ -313,8 +265,7 @@ class to_ptree
         }
 
         /// apply
-        template < typename K, typename T >
-        void apply( const K& name, const T& value )
+        template < typename K, typename T > void apply( const K& name, const T& value )
         {
             if( !( path_ <= branch_ ) ) { return; } // visit, only if on the branch
             const std::string& s = boost::lexical_cast< std::string >( name );
@@ -326,15 +277,10 @@ class to_ptree
         }
 
         /// apply to non-leaf elements
-        template < typename K, typename T >
-        void apply_next( const K& name, const T& value )
-        {
-            comma::visiting::visit( name, value, *this );
-        }
+        template < typename K, typename T > void apply_next( const K& name, const T& value ) { comma::visiting::visit( name, value, *this ); }
 
         /// apply to leaf elements
-        template < typename K, typename T >
-        void apply_final( const K&, const T& value ) { ptree_.put( path_.to_string( '.' ), value_( value ) ); }
+        template < typename K, typename T > void apply_final( const K&, const T& value ) { ptree_.put( path_.to_string( '.' ), value_( value ) ); }
 
     private:
         boost::property_tree::ptree& ptree_;
@@ -354,4 +300,3 @@ class to_ptree
 
 } // namespace comma
 
-#endif /*COMMA_NAME_VALUE_PTREE_H_*/

From 4c99cc752f07e34e53b0bee3242bd3157ede0b31 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 13 Nov 2022 01:46:55 +1100
Subject: [PATCH 0543/1056] name_value: fixing array handling in ptree
 visitors...

---
 name_value/ptree.h | 79 ++++++++++++++++++++++++++--------------------
 1 file changed, 44 insertions(+), 35 deletions(-)

diff --git a/name_value/ptree.h b/name_value/ptree.h
index 2cacf281c..83d23a722 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -5,17 +5,19 @@
 
 #pragma once
 
+#include <array>
 #include <iostream>
 #include <sstream>
-#include <boost/version.hpp>
-#include <boost/lexical_cast.hpp>
+#include <boost/array.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
+#include <boost/lexical_cast.hpp>
 #include <boost/property_tree/ptree.hpp>
 #include <boost/property_tree/info_parser.hpp>
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
 #include <boost/unordered_set.hpp>
+#include <boost/version.hpp>
 #include "../base/exception.h"
 #include "../base/types.h"
 #include "../string/string.h"
@@ -74,9 +76,11 @@ struct property_tree // quick and dirty
 
     /// convert path-value-style string into boost parameter tree
     static boost::property_tree::ptree from_path_value_string( const std::string& s, char equal_sign = '=', char delimiter = ',', path_value::check_repeated_paths check_type = path_value::no_check, bool use_index = true );
+
     static boost::property_tree::ptree& from_path_value_string( boost::property_tree::ptree& ptree, const std::string& s, char equal_sign, char delimiter, path_value::check_repeated_paths check_type = path_value::no_check, bool use_index = true );
 
     static void read_xml( std::istream& is, boost::property_tree::ptree& ptree );
+
     static void write_xml( std::ostream& os, const boost::property_tree::ptree& ptree, const xml_writer_settings_t& xml_writer_settings  = xml_writer_settings_t()  );
     
     /// read as path-value from input stream
@@ -106,51 +110,25 @@ struct property_tree // quick and dirty
 
             //ptree_visitor( const boost::property_tree::ptree& ptree, const xpath& root, const xpath& branch, bool permissive = false ) : ptree_( ptree ), cur_( &ptree ), path_( root ), branch_( branch ), permissive_( permissive ) {}
 
-            /// apply
-            template < typename K, typename T >
-            void apply( const K& key, T& value )
+            template < typename K, typename T > void apply( const K& key, T& value )
             {
                 visiting::do_while<    !boost::is_fundamental< T >::value
                                     && !boost::is_same< T, boost::posix_time::ptime >::value
                                     && !boost::is_same< T, std::string >::value >::visit( key, value, *this );
             }
 
-            /// apply on boost optional
-            template < typename K, typename T >
-            void apply_next( const K& name, boost::optional< T >& value )
+            template < typename K, typename T > void apply_next( const K& name, boost::optional< T >& value )
             {
                 if( !cur_ || cur_->find( name ) == cur_->not_found() ) { return; }
                 if( !value ) { value = T(); }
                 apply( name, *value );
             }
 
-            /// apply to vector
-            template < typename K, typename T, typename A >
-            void apply_next( const K& key, std::vector< T, A >& value ) // todo? std::array? boost::array?
-            {
-                std::string name = boost::lexical_cast< std::string >( key );
-                boost::optional< const boost::property_tree::ptree& > t = cur_ && !name.empty() ? cur_->get_child_optional( name ) : cur_;
-                if( t )
-                {
-                    const boost::property_tree::ptree& parent = *cur_;
-                    value.resize( t->size() );
-                    std::size_t i = 0;
-                    for( boost::property_tree::ptree::const_assoc_iterator j = t->ordered_begin(); j != t->not_found(); ++j, ++i )
-                    {
-                        cur_ = j->second;
-                        //std::size_t index = j->first == "" ? i : boost::lexical_cast< std::size_t >( j->first ); // way quick and dirty
-                        //if( index >= t->size() ) { COMMA_THROW( comma::exception, "expected index less than " << t->size() << "; got: " << index ); }
-                        visiting::do_while<    !boost::is_fundamental< T >::value
-                                            && !boost::is_same< T, boost::posix_time::ptime >::value
-                                            && !boost::is_same< T, std::string >::value >::visit( "", value[i], *this );
-                    }
-                    cur_ = parent;
-                }
-                else if( !permissive_ )
-                {
-                    COMMA_THROW( comma::exception, "key " << key << " not found" );
-                }
-            }
+            template < typename K, typename T, typename A > void apply_next( const K& key, std::vector< T, A >& value ) { _apply_to_arraylike( key, value ); }
+
+            template < typename K, typename T, unsigned int Size > void apply_next( const K& key, boost::array< T, Size >& value ) { _apply_to_arraylike( key, value ); }
+
+            template < typename K, typename T, unsigned int Size > void apply_next( const K& key, std::array< T, Size >& value ) { _apply_to_arraylike( key, value ); }
 
             /// apply to map
             template < typename K, typename L, typename T, typename A >
@@ -221,6 +199,37 @@ struct property_tree // quick and dirty
                 v = name.empty() ? cur_->get_value_optional< T >() : cur_->get_optional< T >( name );
                 if( !v ) { v = cur_->get_optional< T >( "<xmlattr>." + name ); }
             }
+
+            template < typename T, typename A > void resize_( std::vector< T, A >& a, unsigned int size ) { a.resize( size ); }
+
+            template < typename A > void resize_( A& a, unsigned int size ) {}
+
+            template < typename K, typename A >
+            void _apply_to_arraylike( const K& key, A& value ) // todo? std::array? boost::array?
+            {
+                std::string name = boost::lexical_cast< std::string >( key );
+                boost::optional< const boost::property_tree::ptree& > t = cur_ && !name.empty() ? cur_->get_child_optional( name ) : cur_;
+                if( t )
+                {
+                    const boost::property_tree::ptree& parent = *cur_;
+                    resize_( value, t->size() );
+                    std::size_t i = 0;
+                    for( boost::property_tree::ptree::const_assoc_iterator j = t->ordered_begin(); j != t->not_found(); ++j, ++i )
+                    {
+                        cur_ = j->second;
+                        //std::size_t index = j->first == "" ? i : boost::lexical_cast< std::size_t >( j->first ); // way quick and dirty
+                        //if( index >= t->size() ) { COMMA_THROW( comma::exception, "expected index less than " << t->size() << "; got: " << index ); }
+                        visiting::do_while<    !boost::is_fundamental< typename A::value_type >::value
+                                            && !boost::is_same< typename A::value_type, boost::posix_time::ptime >::value
+                                            && !boost::is_same< typename A::value_type, std::string >::value >::visit( "", value[i], *this );
+                    }
+                    cur_ = parent;
+                }
+                else if( !permissive_ )
+                {
+                    COMMA_THROW( comma::exception, "key " << key << " not found" );
+                }
+            }
     };
 };
 

From 2c2badf800f690faf04481289356b23d60bd0c73 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 13 Nov 2022 02:10:40 +1100
Subject: [PATCH 0544/1056] name_value: fixing array handling in ptree
 visitors...

---
 name_value/test/ptree_test.cpp | 33 ++++-----------------------------
 1 file changed, 4 insertions(+), 29 deletions(-)

diff --git a/name_value/test/ptree_test.cpp b/name_value/test/ptree_test.cpp
index b59941bf4..59c27d9ae 100644
--- a/name_value/test/ptree_test.cpp
+++ b/name_value/test/ptree_test.cpp
@@ -1,34 +1,10 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
+#include <array>
+#include <vector>
+#include <boost/array.hpp>
 #include <boost/function.hpp>
 #include <boost/optional.hpp>
 #include <boost/property_tree/json_parser.hpp>
@@ -272,7 +248,6 @@ TEST( ptree, from_path_value )
         EXPECT_EQ( 2, m[6].nested->moon );
         EXPECT_EQ( "world",  *m[6].nested->value );
     }
-
 }
 
 TEST( ptree, permissive_visiting )

From c7682d406019b3024c8707166ad113387e645a24 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 15 Nov 2022 15:36:46 +1100
Subject: [PATCH 0545/1056] visiting::traits: std::tuple traits implemented;
 basic unit test added

---
 visiting/test/visiting_test.cpp | 38 +++++++++------------------------
 visiting/traits.h               | 32 +++++++++++++++++++++++++++
 2 files changed, 42 insertions(+), 28 deletions(-)

diff --git a/visiting/test/visiting_test.cpp b/visiting/test/visiting_test.cpp
index 02aa44ed7..919ed624c 100644
--- a/visiting/test/visiting_test.cpp
+++ b/visiting/test/visiting_test.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
 #include <sstream>
@@ -225,6 +198,15 @@ TEST( visiting, container )
     }
 }
 
+TEST( visiting, tuple )
+{
+    std::tuple< int, double, std::string > t{ 5, 10, "hello" };
+    std::ostringstream oss;
+    o_stream_visitor v( oss );
+    visiting::apply( v, t );
+    EXPECT_EQ( oss.str(), "{ int:0=5 double:1=10 string:2=\"hello\" }" );
+}
+
 } } } /// namespace comma { namespace visiting { namespace test {
 
 int main( int argc, char* argv[] )
diff --git a/visiting/traits.h b/visiting/traits.h
index 57ea8baf0..d133162a4 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -1,4 +1,5 @@
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
@@ -11,6 +12,7 @@
 #include <map>
 #include <set>
 #include <string>
+#include <tuple>
 #include <unordered_map>
 #include <unordered_set>
 #include <vector>
@@ -50,6 +52,36 @@ struct traits< std::pair< T, S > >
     }    
 };
 
+namespace detail {
+
+template < unsigned int I, unsigned int Size > struct elementwise
+{
+    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( Size - I, std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( Size - I, std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+};
+
+template < unsigned int Size > struct elementwise< 1, Size >
+{
+    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( Size - 1, std::get< Size - 1 >( t ) ); }
+    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( Size - 1, std::get< Size - 1 >( t ) ); }
+};
+
+} // namespace detail {
+
+template < typename... T >
+struct traits< std::tuple< T... > >
+{
+    typedef std::tuple< T... > tuple_t;
+
+    static const unsigned int size{ std::tuple_size< tuple_t >::value };
+
+    static_assert( size > 0 );
+
+    template < typename K, typename V > static void visit( const K& key, tuple_t& t, V& v ) { detail::elementwise< size, size >::visit( t, v ); }
+    
+    template < typename K, typename V > static void visit( const K&, const tuple_t& t, V& v ) { detail::elementwise< size, size >::visit( t, v ); }
+};
+
 namespace impl {
 
 template < typename K, typename V, typename Visitor >

From b39b7797b393248ec13215f45996f17c3a7ffe57 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 15 Nov 2022 16:27:23 +1100
Subject: [PATCH 0546/1056] visiting::traits: std::tuple traits: using element
 names for now since indices introduce a bit of pain in the serializers (but
 indices are much better)

---
 visiting/test/visiting_test.cpp |  2 +-
 visiting/traits.h               | 18 ++++++++++++++----
 2 files changed, 15 insertions(+), 5 deletions(-)

diff --git a/visiting/test/visiting_test.cpp b/visiting/test/visiting_test.cpp
index 919ed624c..040650814 100644
--- a/visiting/test/visiting_test.cpp
+++ b/visiting/test/visiting_test.cpp
@@ -204,7 +204,7 @@ TEST( visiting, tuple )
     std::ostringstream oss;
     o_stream_visitor v( oss );
     visiting::apply( v, t );
-    EXPECT_EQ( oss.str(), "{ int:0=5 double:1=10 string:2=\"hello\" }" );
+    EXPECT_EQ( oss.str(), "{ int:elem_0=5 double:elem_1=10 string:elem_2=\"hello\" }" );
 }
 
 } } } /// namespace comma { namespace visiting { namespace test {
diff --git a/visiting/traits.h b/visiting/traits.h
index d133162a4..1d0c73b97 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -54,16 +54,26 @@ struct traits< std::pair< T, S > >
 
 namespace detail {
 
+template < unsigned int I > const char* element_name(); // super-quick and dirty for now, certainly improve it (somehow)
+template <> inline const char* element_name< 0 >() { return "elem_0"; }
+template <> inline const char* element_name< 1 >() { return "elem_1"; }
+template <> inline const char* element_name< 2 >() { return "elem_2"; }
+template <> inline const char* element_name< 3 >() { return "elem_3"; }
+template <> inline const char* element_name< 4 >() { return "elem_4"; }
+template <> inline const char* element_name< 5 >() { return "elem_5"; }
+template <> inline const char* element_name< 6 >() { return "elem_6"; }
+template <> inline const char* element_name< 7 >() { return "elem_7"; }
+
 template < unsigned int I, unsigned int Size > struct elementwise
 {
-    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( Size - I, std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
-    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( Size - I, std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( element_name< Size - I >(), std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( element_name< Size - I >(), std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
 };
 
 template < unsigned int Size > struct elementwise< 1, Size >
 {
-    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( Size - 1, std::get< Size - 1 >( t ) ); }
-    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( Size - 1, std::get< Size - 1 >( t ) ); }
+    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( element_name< Size - 1 >(), std::get< Size - 1 >( t ) ); }
+    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( element_name< Size - 1 >(), std::get< Size - 1 >( t ) ); }
 };
 
 } // namespace detail {

From fa05c572c5055e8540595320aa23c0a3dc143e1c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 15 Nov 2022 17:05:13 +1100
Subject: [PATCH 0547/1056] visiting::traits: std::tuple traits: reverted to
 indices as tuple keys to stay more consistent with e.g. python tuples; tuple
 support needs to be added to all the visitors, though

---
 visiting/test/visiting_test.cpp |  2 +-
 visiting/traits.h               | 44 +++++++++++++++++++++------------
 2 files changed, 29 insertions(+), 17 deletions(-)

diff --git a/visiting/test/visiting_test.cpp b/visiting/test/visiting_test.cpp
index 040650814..a0e062d9f 100644
--- a/visiting/test/visiting_test.cpp
+++ b/visiting/test/visiting_test.cpp
@@ -204,7 +204,7 @@ TEST( visiting, tuple )
     std::ostringstream oss;
     o_stream_visitor v( oss );
     visiting::apply( v, t );
-    EXPECT_EQ( oss.str(), "{ int:elem_0=5 double:elem_1=10 string:elem_2=\"hello\" }" );
+    EXPECT_EQ( oss.str(), "{ int:0=5 double:1=10 string:2=\"hello\" }" ); // EXPECT_EQ( oss.str(), "{ int:elem_0=5 double:elem_1=10 string:elem_2=\"hello\" }" );
 }
 
 } } } /// namespace comma { namespace visiting { namespace test {
diff --git a/visiting/traits.h b/visiting/traits.h
index 1d0c73b97..87b2429e9 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -54,26 +54,38 @@ struct traits< std::pair< T, S > >
 
 namespace detail {
 
-template < unsigned int I > const char* element_name(); // super-quick and dirty for now, certainly improve it (somehow)
-template <> inline const char* element_name< 0 >() { return "elem_0"; }
-template <> inline const char* element_name< 1 >() { return "elem_1"; }
-template <> inline const char* element_name< 2 >() { return "elem_2"; }
-template <> inline const char* element_name< 3 >() { return "elem_3"; }
-template <> inline const char* element_name< 4 >() { return "elem_4"; }
-template <> inline const char* element_name< 5 >() { return "elem_5"; }
-template <> inline const char* element_name< 6 >() { return "elem_6"; }
-template <> inline const char* element_name< 7 >() { return "elem_7"; }
-
-template < unsigned int I, unsigned int Size > struct elementwise
-{
-    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( element_name< Size - I >(), std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
-    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( element_name< Size - I >(), std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+// template < unsigned int I > const char* element_name(); // super-quick and dirty for now, it would be better to use numeric indices, but then all visitors need to support tuple correctly
+// template <> inline const char* element_name< 0 >() { return "first"; }
+// template <> inline const char* element_name< 1 >() { return "second"; }
+// template <> inline const char* element_name< 2 >() { return "third"; }
+// template <> inline const char* element_name< 3 >() { return "fourth"; }
+// template <> inline const char* element_name< 4 >() { return "fifth"; }
+// template <> inline const char* element_name< 5 >() { return "sixth"; }
+// template <> inline const char* element_name< 6 >() { return "seventh"; }
+// template <> inline const char* element_name< 7 >() { return "eighth"; }
+
+// template < unsigned int I, unsigned int Size > struct elementwise
+// {
+//     template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( element_name< Size - I >(), std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+//     template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( element_name< Size - I >(), std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+// };
+
+// template < unsigned int Size > struct elementwise< 1, Size >
+// {
+//     template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( element_name< Size - 1 >(), std::get< Size - 1 >( t ) ); }
+//     template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( element_name< Size - 1 >(), std::get< Size - 1 >( t ) ); }
+// };
+
+template < unsigned int I, unsigned int Size > struct elementwise // todo! add tuple support to all visitors
+{
+    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( Size - I, std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( Size - I, std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
 };
 
 template < unsigned int Size > struct elementwise< 1, Size >
 {
-    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( element_name< Size - 1 >(), std::get< Size - 1 >( t ) ); }
-    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( element_name< Size - 1 >(), std::get< Size - 1 >( t ) ); }
+    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( Size - 1, std::get< Size - 1 >( t ) ); }
+    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( Size - 1, std::get< Size - 1 >( t ) ); }
 };
 
 } // namespace detail {

From 956a789f1a5b7a30df7077a6221f503b1bf6b40d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 17 Nov 2022 11:32:46 +1100
Subject: [PATCH 0548/1056] csv-sort: --fixed-block: basics added

---
 csv/applications/csv-sort.cpp               | 134 ++++++++------------
 csv/test/csv-sort/fixed_block_size/expected |  14 ++
 csv/test/csv-sort/fixed_block_size/input    |   2 +
 csv/test/csv-sort/fixed_block_size/test     |   5 +
 4 files changed, 71 insertions(+), 84 deletions(-)
 create mode 100644 csv/test/csv-sort/fixed_block_size/expected
 create mode 100644 csv/test/csv-sort/fixed_block_size/input
 create mode 100755 csv/test/csv-sort/fixed_block_size/test

diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index b6a3a8d73..3f81323af 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @authors matthew imhoff, dewey nguyen, vsevolod vlaskine
 
@@ -63,6 +36,7 @@ static void usage( bool more )
     std::cerr << std::endl;
     std::cerr << "Options:" << std::endl;
     std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
+    std::cerr << "    --block-size,--size=<n>; number of input records in the block assuming all blocks are of the same size" << std::endl;
     std::cerr << "    --discard-out-of-order,--discard-unsorted: instead of sorting, discard records out of order" << std::endl;
     std::cerr << "    --first: first line matching given keys; first line in the block, if block field present; no sorting will be done; if sorting required, use unique instead" << std::endl;
     std::cerr << "           fields" << std::endl;
@@ -125,20 +99,33 @@ static comma::csv::options csv;
 static bool is_min = false;
 static bool is_max = false;
 
+class block_counter // todo? move block handling to library
+{
+    public:
+        block_counter( comma::uint32 b = 0, comma::uint32 s = 0 ): _block( 0 ), _size( 0 ) {}
+        comma::uint32 operator()() const { return _block; }
+        comma::uint32 size() const { return _size; }
+        bool fixed() const { return _size > 0; }
+        template < typename T > bool operator==( const T& t ) const { return _size > 0 ? _block < _size : t.block == _block; }
+        template < typename T > bool operator!=( const T& t ) const { return !operator==( t ); }
+        template < typename T > comma::uint32 update( const T& t ) { _block = _size > 0 ? _block + 1 == _size ? 0 : _block + 1 : t.block; return _block; }
+        template < typename T > bool ready( const T& t ) const { return _size > 0 ? _block + 1 == _size : t.block != _block; }
+    private:
+        comma::uint32 _block{0}; 
+        comma::uint32 _size{0}; 
+};
+
+static block_counter block;
+
 struct ordering_t
 {
-    enum types {
-        str_type,
-        long_type,
-        double_type,
-        time_type
-    };
+    enum types { str_type, long_type, double_type, time_type };
     
-    types type;
-    int   index;
+    types type{double_type};
+    int index{0};
 };
 
-std::vector< ordering_t > ordering;
+static std::vector< ordering_t > ordering;
 
 struct input_t
 {
@@ -148,20 +135,12 @@ struct input_t
     {
         for( std::size_t i = 0; i < ordering.size(); ++i )
         { 
-            switch (ordering[i].type)
+            switch( ordering[i].type )
             {
-                case ordering_t::str_type:
-                    if (keys.strings[ordering[i].index] != rhs.keys.strings[ ordering[i].index ]) { return false; }
-                    break;
-                case ordering_t::long_type:
-                    if (keys.longs[ordering[i].index] != rhs.keys.longs[ ordering[i].index ]) { return false; }
-                    break;
-                case ordering_t::double_type:
-                    if (keys.doubles[ordering[i].index] != rhs.keys.doubles[ ordering[i].index ]) { return false; }
-                    break;
-                case ordering_t::time_type:
-                    if (keys.time[ordering[i].index] != rhs.keys.time[ ordering[i].index ]) { return false; }
-                    break;
+                case ordering_t::str_type: if (keys.strings[ordering[i].index] != rhs.keys.strings[ ordering[i].index ]) { return false; } break;
+                case ordering_t::long_type: if (keys.longs[ordering[i].index] != rhs.keys.longs[ ordering[i].index ]) { return false; } break;
+                case ordering_t::double_type: if (keys.doubles[ordering[i].index] != rhs.keys.doubles[ ordering[i].index ]) { return false; } break;
+                case ordering_t::time_type: if (keys.time[ordering[i].index] != rhs.keys.time[ ordering[i].index ]) { return false; } break;
             }
         }
         return true;
@@ -195,20 +174,17 @@ struct input_t
     }
     
     typedef std::map< input_t, std::vector< std::string > > map;
-    
 };
 
 struct input_with_block : public input_t
 {
-    comma::uint32 block;
-    input_with_block() : block( 0 ) {}
+    comma::uint32 block{0};
 };
 
 struct input_with_ids_t : public input_t
 {
     comma::csv::impl::unstructured ids;
-    comma::uint32 block;
-    input_with_ids_t() : block( 0 ) {}
+    comma::uint32 block{0};
 };
 
 namespace comma { namespace visiting {
@@ -282,8 +258,9 @@ static int handle_discard_out_of_order( comma::csv::input_stream< input_with_blo
     {
         const input_with_block* p = istream.read();
         if( !p ) { break; }
-        if( last && p->block == last->block && ( ( reverse && *last < *p ) || ( !reverse && *p < *last ) ) ) { continue; }
+        if( last && block == *p && ( reverse ? *last < *p : *p < *last ) ) { continue; }
         last = *p;
+        block.update( *p );
         output_last_( istream );
     }
     return 0;
@@ -294,11 +271,10 @@ static int handle_first( comma::csv::input_stream< input_with_ids_t >& istream,
     typedef boost::unordered_set< comma::csv::impl::unstructured, comma::csv::impl::unstructured::hash > set_t;
     typedef boost::unordered_map< comma::csv::impl::unstructured, set_t, comma::csv::impl::unstructured::hash > map_t;
     map_t keys;
-    comma::uint32 block = 0;
     if( !first_line.empty() )
     { 
         input_with_ids_t input = comma::csv::ascii< input_with_ids_t >( csv, default_input ).get( first_line );
-        block = input.block;
+        block.update( input );
         keys[ input.ids ].insert( input.keys );
         std::cout << first_line << std::endl;
     }
@@ -306,7 +282,7 @@ static int handle_first( comma::csv::input_stream< input_with_ids_t >& istream,
     {
         const input_with_ids_t* p = istream.read();
         if( !p ) { break; }
-        if( p->block != block ) { block = p->block; keys.clear(); }
+        if( block.ready( *p ) ) { block.update( *p ); keys.clear(); }
         if( keys[ p->ids ].insert( p->keys ).second ) { output_last_( istream ); }
     }
     return 0;
@@ -318,11 +294,10 @@ static int handle_first( comma::csv::input_stream< input_with_ids_t >& istream,
 //     typedef boost::unordered_set< comma::csv::impl::unstructured, comma::csv::impl::unstructured::hash > set_t;
 //     typedef boost::unordered_map< comma::csv::impl::unstructured, set_t, comma::csv::impl::unstructured::hash > map_t;
 //     map_t keys;
-//     comma::uint32 block = 0;
 //     if( !first_line.empty() )
 //     { 
 //         input_with_ids_t input = comma::csv::ascii< input_with_ids_t >( csv, default_input ).get( first_line );
-//         block = input.block;
+//         block.update( input );
 //         keys[ input.ids ].insert( input.keys );
 //         //std::cout << first_line << std::endl;
 //     }
@@ -330,7 +305,7 @@ static int handle_first( comma::csv::input_stream< input_with_ids_t >& istream,
 //     {
 //         const input_with_ids_t* p = istream.read();
 //         if( !p ) { break; }
-//         if( p->block != block ) { block = p->block; keys.clear(); }
+//         if( block != *p ) { block.update( *p ); keys.clear(); }
 //         if( keys[ p->ids ].insert( p->keys ).second ) { output_last_( istream ); }
 //     }
 //     return 0;
@@ -339,14 +314,13 @@ static int handle_first( comma::csv::input_stream< input_with_ids_t >& istream,
 static int handle_sliding_window( comma::csv::input_stream< input_with_block >& istream, const std::string& first_line, const input_with_block& default_input, bool reverse, unsigned int sliding_window )
 {
     if( sliding_window < 2 ) { std::cerr << "csv-sort: expected sliding window greater than 1, got: " << sliding_window << std::endl; return 1; }
-    comma::uint32 block = 0;
     unsigned int count = 0;
     typedef std::map< input_t, std::deque< std::string > > map_t;
     map_t map;
     if( !first_line.empty() )
     { 
         input_with_block input = comma::csv::ascii< input_with_block >( csv, default_input ).get( first_line );
-        block = input.block;
+        block.update( input );
         map_t::mapped_type& d = map[ input ];
         d.push_back( first_line );
         ++count;
@@ -354,14 +328,14 @@ static int handle_sliding_window( comma::csv::input_stream< input_with_block >&
     while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) || !map.empty() )
     {
         const input_with_block* p = istream.read();
-        if( !p || p->block != block )
+        if( !p || block != *p )
         {
             if( reverse ) { output_( map.rbegin(), map.rend() ); } else { output_( map.begin(), map.end() ); }
             map.clear();
             count = 0;
         }
         if( !p ) { break; }
-        block = p->block;
+        block.update( *p );
         map_t::mapped_type& d = map[ *p ];
         if( istream.is_binary() )
         {
@@ -484,10 +458,8 @@ int handle_operations_with_ids( const comma::command_line_options& options )
     is_max = options.exists( "--max" );
     if( keys_size != 1 ) { std::cerr << "csv-sort: error, please specify exactly one field for --min/--max operation." << std::endl; return 1; }
     if ( verbose ) { std::cerr << "csv-sort: minimum mode: " << ( is_min ) << ", maximum mode: " << is_max  << std::endl; }
-    comma::uint32 block = 0;    // previous block number, use default of 0
     limit_map_t min_map;
     limit_map_t max_map;
-    
     bool first = true;
     if (!first_line.empty()) 
     { 
@@ -499,7 +471,7 @@ int handle_operations_with_ids( const comma::command_line_options& options )
         max_map[input.ids] = data;
         is_same_map[input.ids] = true;
         input_order.push_back( input.ids );
-        block = input.block;
+        block.update( input );
         first = false;
     }
     while( stdin_stream.ready() || ( std::cin.good() && !std::cin.eof() ) )
@@ -507,38 +479,32 @@ int handle_operations_with_ids( const comma::command_line_options& options )
         const input_with_ids_t* p = stdin_stream.read();
         if( !p ) { break; }
 //         std::cerr  << "p: " << comma::join( stdin_stream.ascii().last(), csv.delimiter ) << " - " << p->keys.longs[0] << std::endl;
-        
         if( first )
         {
             limit_data_t& data = min_map[p->ids];
             data.keys = *p;
             data.add_current_record( stdin_stream );
-            
             max_map[p->ids] = data;
             is_same_map[p->ids] = true;
             input_order.push_back( p->ids );
-            
-            block = p->block;
+            block.update( *p );
             first = false;
         }
-        else if( p->block != block )
+        else if( block != *p )
         {
             // Dump and clear previous
             output_current_block( min_map, max_map );
             min_map.clear();
             max_map.clear();
             input_order.clear();
-            
             // Set the same record for both min and max, it's a new block, new IDs
             limit_data_t& data = min_map[p->ids];
             data.keys = *p;
             data.add_current_record( stdin_stream );
-            
             max_map[p->ids] = data;
             is_same_map[p->ids] = true;
             input_order.push_back( p->ids );
-            
-            block = p->block;
+            block.update( *p );
         }
         else    /// The same block and not first record
         {
@@ -607,18 +573,17 @@ static int random( const comma::command_line_options& options )
     if( csv.has_field( "block" ) )
     {
         comma::csv::input_stream< input_with_block > is( std::cin, csv );
-        comma::uint32 block = 0;
         while( is.ready() || std::cin.good() )
         {
             const input_with_block* p = is.read();
-            if( !p || p->block != block )
+            if( !p || block != *p )
             {
                 std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
                 std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( generator ); } ); // quick and dirty, watch performance
                 for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
                 if( csv.flush ) { std::cout.flush(); }
                 records.clear();
-                if( p ) { block = p->block; }
+                if( p ) { block.update( *p ); }
             }
             if( !p ) { break; }
             if( csv.binary() )
@@ -709,6 +674,8 @@ static int sort( const comma::command_line_options& options )
     }
     csv.fields = comma::join( w, ',' );
     if ( verbose ) { std::cerr << "csv-sort: fields: " << csv.fields << std::endl; }
+    block = block_counter( 0, options.value( "--block-size,--size", 0 ) );
+    if( csv.has_field( "block" ) && block.fixed() ) { comma::say() << "'block' field and --block-size are mutually exclusive" << std::endl; return 1; }
     comma::csv::input_stream< input_with_block > istream( std::cin, csv, default_input );
     #ifdef WIN32
     if( istream.is_binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
@@ -717,25 +684,24 @@ static int sort( const comma::command_line_options& options )
     if( options.exists( "--discard-out-of-order,--discard-unsorted" ) ) { return handle_discard_out_of_order( istream, first_line, default_input, reverse ); }
     auto sliding_window = options.optional< unsigned int >( "--sliding-window,--window" );
     if( sliding_window ) { return handle_sliding_window( istream, first_line, default_input, reverse, *sliding_window ); }
-    comma::uint32 block = 0;
     input_t::map map;
     if( !first_line.empty() )
     { 
         input_with_block input = comma::csv::ascii< input_with_block >( csv, default_input ).get( first_line );
-        block = input.block;
+        block.update( input );
         input_t::map::mapped_type& d = map[ input ];
         d.push_back( first_line );
     }
     while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) || !map.empty() )
     {
         const input_with_block* p = istream.read();
-        if( !p || p->block != block )
+        if( !p || block != *p )
         {
             if( reverse ) { output_( map.rbegin(), map.rend() ); } else { output_( map.begin(), map.end() ); }
             map.clear();
         }
         if( !p ) { break; }
-        block = p->block;
+        block.update( *p );
         input_t::map::mapped_type& d = map[ *p ];
         if( unique && !d.empty() ) { continue; }
         if( istream.is_binary() )
diff --git a/csv/test/csv-sort/fixed_block_size/expected b/csv/test/csv-sort/fixed_block_size/expected
new file mode 100644
index 000000000..6d4553119
--- /dev/null
+++ b/csv/test/csv-sort/fixed_block_size/expected
@@ -0,0 +1,14 @@
+fixed_block_size/basic/output/line[0]="a"
+fixed_block_size/basic/output/line[1]="b"
+fixed_block_size/basic/output/line[2]="c"
+fixed_block_size/basic/output/line[3]="d"
+fixed_block_size/basic/output/line[4]="e"
+fixed_block_size/basic/output/line[5]="f"
+fixed_block_size/last_block/output/line[0]="a"
+fixed_block_size/last_block/output/line[1]="b"
+fixed_block_size/last_block/output/line[2]="c"
+fixed_block_size/last_block/output/line[3]="d"
+fixed_block_size/last_block/output/line[4]="e"
+fixed_block_size/last_block/output/line[5]="f"
+fixed_block_size/last_block/output/line[6]="x"
+fixed_block_size/last_block/output/line[7]="y"
diff --git a/csv/test/csv-sort/fixed_block_size/input b/csv/test/csv-sort/fixed_block_size/input
new file mode 100644
index 000000000..5af45a4ac
--- /dev/null
+++ b/csv/test/csv-sort/fixed_block_size/input
@@ -0,0 +1,2 @@
+fixed_block_size/basic="( echo c ; echo b ; echo a ; echo f ; echo e; echo d ) | csv-sort --fields a --block-size 3"
+fixed_block_size/last_block="( echo c ; echo b ; echo a ; echo f ; echo e; echo d; echo y; echo x ) | csv-sort --fields a --block-size 3"
diff --git a/csv/test/csv-sort/fixed_block_size/test b/csv/test/csv-sort/fixed_block_size/test
new file mode 100755
index 000000000..152895e63
--- /dev/null
+++ b/csv/test/csv-sort/fixed_block_size/test
@@ -0,0 +1,5 @@
+#!/bin/bash
+
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands

From 2439f7f594d558f8218556f3ce11f9f0ac0696e3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 17 Nov 2022 11:41:23 +1100
Subject: [PATCH 0549/1056] csv::block_counter implemented; still to do:
 something like input_stream_with_block...

---
 csv/applications/csv-sort.cpp | 25 ++++---------------------
 csv/block.h                   | 25 +++++++++++++++++++++++++
 2 files changed, 29 insertions(+), 21 deletions(-)
 create mode 100644 csv/block.h

diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index 3f81323af..47828c1c5 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -18,6 +18,7 @@
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
+#include "../../csv/block.h"
 #include "../../csv/stream.h"
 #include "../../csv/traits.h"
 #include "../../io/stream.h"
@@ -98,24 +99,7 @@ static bool verbose;
 static comma::csv::options csv;
 static bool is_min = false;
 static bool is_max = false;
-
-class block_counter // todo? move block handling to library
-{
-    public:
-        block_counter( comma::uint32 b = 0, comma::uint32 s = 0 ): _block( 0 ), _size( 0 ) {}
-        comma::uint32 operator()() const { return _block; }
-        comma::uint32 size() const { return _size; }
-        bool fixed() const { return _size > 0; }
-        template < typename T > bool operator==( const T& t ) const { return _size > 0 ? _block < _size : t.block == _block; }
-        template < typename T > bool operator!=( const T& t ) const { return !operator==( t ); }
-        template < typename T > comma::uint32 update( const T& t ) { _block = _size > 0 ? _block + 1 == _size ? 0 : _block + 1 : t.block; return _block; }
-        template < typename T > bool ready( const T& t ) const { return _size > 0 ? _block + 1 == _size : t.block != _block; }
-    private:
-        comma::uint32 _block{0}; 
-        comma::uint32 _size{0}; 
-};
-
-static block_counter block;
+static comma::csv::block_counter block;
 
 struct ordering_t
 {
@@ -655,8 +639,7 @@ static int sort( const comma::command_line_options& options )
         if( order[i].empty() || order[i] == "block" ) { continue; }
         for( std::size_t k = 0; k < v.size(); ++k )
         {
-            if( v[k].empty() || v[k] != order[i] ) 
-            { 
+            if( v[k].empty() || v[k] != order[i] ) { 
                 if( k + 1 == v.size() ) { std::cerr << "csv-sort: order field name \"" << order[i] << "\" not found in input fields \"" << csv.fields << "\"" << std::endl; return 1; }
                 continue; 
             }
@@ -674,7 +657,7 @@ static int sort( const comma::command_line_options& options )
     }
     csv.fields = comma::join( w, ',' );
     if ( verbose ) { std::cerr << "csv-sort: fields: " << csv.fields << std::endl; }
-    block = block_counter( 0, options.value( "--block-size,--size", 0 ) );
+    block = comma::csv::block_counter( 0, options.value( "--block-size,--size", 0 ) );
     if( csv.has_field( "block" ) && block.fixed() ) { comma::say() << "'block' field and --block-size are mutually exclusive" << std::endl; return 1; }
     comma::csv::input_stream< input_with_block > istream( std::cin, csv, default_input );
     #ifdef WIN32
diff --git a/csv/block.h b/csv/block.h
new file mode 100644
index 000000000..8dd73e77a
--- /dev/null
+++ b/csv/block.h
@@ -0,0 +1,25 @@
+// Copyright (c) 2022 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+namespace comma { namespace csv {
+
+class block_counter
+{
+    public:
+        block_counter( comma::uint32 b = 0, comma::uint32 s = 0 ): _block( 0 ), _size( 0 ) {}
+        comma::uint32 operator()() const { return _block; }
+        comma::uint32 size() const { return _size; }
+        bool fixed() const { return _size > 0; }
+        template < typename T > bool operator==( const T& t ) const { return _size > 0 ? _block < _size : t.block == _block; }
+        template < typename T > bool operator!=( const T& t ) const { return !operator==( t ); }
+        template < typename T > comma::uint32 update( const T& t ) { _block = _size > 0 ? _block + 1 == _size ? 0 : _block + 1 : t.block; return _block; }
+        template < typename T > bool ready( const T& t ) const { return _size > 0 ? _block + 1 == _size : t.block != _block; }
+    private:
+        comma::uint32 _block{0}; 
+        comma::uint32 _size{0}; 
+};
+
+} } // namespace comma { namespace csv {

From b2ef6cfb7c1c742b14493379c556d5018d59cbfa Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 17 Nov 2022 12:42:25 +1100
Subject: [PATCH 0550/1056] csv-sort: --block-size: a couple of bugs fixed

---
 csv/applications/csv-sort.cpp               |  8 ++-
 csv/block.h                                 | 23 +++++---
 csv/test/csv-sort/fixed_block_size/expected | 60 ++++++++++++++++-----
 csv/test/csv-sort/fixed_block_size/input    |  9 +++-
 4 files changed, 76 insertions(+), 24 deletions(-)

diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index 47828c1c5..d271b7fb4 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -657,8 +657,6 @@ static int sort( const comma::command_line_options& options )
     }
     csv.fields = comma::join( w, ',' );
     if ( verbose ) { std::cerr << "csv-sort: fields: " << csv.fields << std::endl; }
-    block = comma::csv::block_counter( 0, options.value( "--block-size,--size", 0 ) );
-    if( csv.has_field( "block" ) && block.fixed() ) { comma::say() << "'block' field and --block-size are mutually exclusive" << std::endl; return 1; }
     comma::csv::input_stream< input_with_block > istream( std::cin, csv, default_input );
     #ifdef WIN32
     if( istream.is_binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
@@ -678,13 +676,17 @@ static int sort( const comma::command_line_options& options )
     while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) || !map.empty() )
     {
         const input_with_block* p = istream.read();
+        //if( p ) { std::cerr << "==> a: block != *p: " << ( block != *p ) << " size: " << block.size() << " current_size: " << block.current_size() << " map.size(): " << map.size() << std::endl; }
         if( !p || block != *p )
         {
+            //std::cerr << "==> b: block != *p: " << ( block != *p ) << " size: " << block.size() << " current_size: " << block.current_size() << std::endl;
             if( reverse ) { output_( map.rbegin(), map.rend() ); } else { output_( map.begin(), map.end() ); }
             map.clear();
         }
         if( !p ) { break; }
+        //std::cerr << "==> c: block: " << block() << " current_size: " << block.current_size() << std::endl;
         block.update( *p );
+        //std::cerr << "==> d: block: " << block() << " current_size: " << block.current_size() << std::endl;
         input_t::map::mapped_type& d = map[ *p ];
         if( unique && !d.empty() ) { continue; }
         if( istream.is_binary() )
@@ -711,6 +713,8 @@ int main( int ac, char** av )
         if( options.exists( "--last" ) ) { std::cerr << "csv-sort: --last: not implemented; todo" << std::endl; return 1; }
         verbose = options.exists( "--verbose,-v" );
         csv = comma::csv::options( options );
+        block = comma::csv::block_counter( 0, options.value( "--block-size,--size", 0 ) );
+        if( csv.has_field( "block" ) && block.fixed() ) { comma::say() << "'block' field and --block-size are mutually exclusive; got csv fields: '" << csv.fields << "'" << std::endl; return 1; }
         return   options.exists( "--first,--min,--max" )
                ? handle_operations_with_ids( options )
                : options.exists( "--random" )
diff --git a/csv/block.h b/csv/block.h
index 8dd73e77a..62cfe1617 100644
--- a/csv/block.h
+++ b/csv/block.h
@@ -9,17 +9,28 @@ namespace comma { namespace csv {
 class block_counter
 {
     public:
-        block_counter( comma::uint32 b = 0, comma::uint32 s = 0 ): _block( 0 ), _size( 0 ) {}
+        block_counter( comma::uint32 b = 0, comma::uint32 s = 0 ): _block( b ), _size( s ) {}
         comma::uint32 operator()() const { return _block; }
         comma::uint32 size() const { return _size; }
+        comma::uint32 current_size() const { return _current_size; }
         bool fixed() const { return _size > 0; }
-        template < typename T > bool operator==( const T& t ) const { return _size > 0 ? _block < _size : t.block == _block; }
+        template < typename T > bool operator==( const T& t ) const { return _size > 0 ? _current_size < _size : t.block == _block; } // dodgy?
         template < typename T > bool operator!=( const T& t ) const { return !operator==( t ); }
-        template < typename T > comma::uint32 update( const T& t ) { _block = _size > 0 ? _block + 1 == _size ? 0 : _block + 1 : t.block; return _block; }
-        template < typename T > bool ready( const T& t ) const { return _size > 0 ? _block + 1 == _size : t.block != _block; }
+        template < typename T > void update( const T& t );
+        template < typename T > bool ready( const T& t ) const { return _size > 0 ? _current_size == _size : t.block != _block; }
     private:
-        comma::uint32 _block{0}; 
-        comma::uint32 _size{0}; 
+        comma::uint32 _block{0};
+        comma::uint32 _size{0};
+        comma::uint32 _current_size{0}; 
 };
 
+template < typename T > inline void block_counter::update( const T& t )
+{ 
+    if( _size == 0 ) { _block = t.block; return; }
+    ++_current_size;
+    if( _current_size <= _size ) { return; }
+    _current_size = 1;
+    ++_block;
+}
+
 } } // namespace comma { namespace csv {
diff --git a/csv/test/csv-sort/fixed_block_size/expected b/csv/test/csv-sort/fixed_block_size/expected
index 6d4553119..5b277ef74 100644
--- a/csv/test/csv-sort/fixed_block_size/expected
+++ b/csv/test/csv-sort/fixed_block_size/expected
@@ -1,14 +1,46 @@
-fixed_block_size/basic/output/line[0]="a"
-fixed_block_size/basic/output/line[1]="b"
-fixed_block_size/basic/output/line[2]="c"
-fixed_block_size/basic/output/line[3]="d"
-fixed_block_size/basic/output/line[4]="e"
-fixed_block_size/basic/output/line[5]="f"
-fixed_block_size/last_block/output/line[0]="a"
-fixed_block_size/last_block/output/line[1]="b"
-fixed_block_size/last_block/output/line[2]="c"
-fixed_block_size/last_block/output/line[3]="d"
-fixed_block_size/last_block/output/line[4]="e"
-fixed_block_size/last_block/output/line[5]="f"
-fixed_block_size/last_block/output/line[6]="x"
-fixed_block_size/last_block/output/line[7]="y"
+fixed_block_size/ascii/block_field/output/line[0]="0,d"
+fixed_block_size/ascii/block_field/output/line[1]="0,e"
+fixed_block_size/ascii/block_field/output/line[2]="0,f"
+fixed_block_size/ascii/block_field/output/line[3]="1,a"
+fixed_block_size/ascii/block_field/output/line[4]="1,b"
+fixed_block_size/ascii/block_field/output/line[5]="1,c"
+fixed_block_size/ascii/block_field/status=0
+fixed_block_size/ascii/basic/output/line[0]="d"
+fixed_block_size/ascii/basic/output/line[1]="e"
+fixed_block_size/ascii/basic/output/line[2]="f"
+fixed_block_size/ascii/basic/output/line[3]="a"
+fixed_block_size/ascii/basic/output/line[4]="b"
+fixed_block_size/ascii/basic/output/line[5]="c"
+fixed_block_size/ascii/basic/status=0
+fixed_block_size/ascii/last_block/output/line[0]="x"
+fixed_block_size/ascii/last_block/output/line[1]="y"
+fixed_block_size/ascii/last_block/output/line[2]="z"
+fixed_block_size/ascii/last_block/output/line[3]="d"
+fixed_block_size/ascii/last_block/output/line[4]="e"
+fixed_block_size/ascii/last_block/output/line[5]="f"
+fixed_block_size/ascii/last_block/output/line[6]="x"
+fixed_block_size/ascii/last_block/output/line[7]="y"
+fixed_block_size/ascii/last_block/status=0
+fixed_block_size/binary/block_field/output/line[0]="0,d"
+fixed_block_size/binary/block_field/output/line[1]="0,e"
+fixed_block_size/binary/block_field/output/line[2]="0,f"
+fixed_block_size/binary/block_field/output/line[3]="1,a"
+fixed_block_size/binary/block_field/output/line[4]="1,b"
+fixed_block_size/binary/block_field/output/line[5]="1,c"
+fixed_block_size/binary/block_field/status=0
+fixed_block_size/binary/basic/output/line[0]="d"
+fixed_block_size/binary/basic/output/line[1]="e"
+fixed_block_size/binary/basic/output/line[2]="f"
+fixed_block_size/binary/basic/output/line[3]="a"
+fixed_block_size/binary/basic/output/line[4]="b"
+fixed_block_size/binary/basic/output/line[5]="c"
+fixed_block_size/binary/basic/status=0
+fixed_block_size/binary/last_block/output/line[0]="x"
+fixed_block_size/binary/last_block/output/line[1]="y"
+fixed_block_size/binary/last_block/output/line[2]="z"
+fixed_block_size/binary/last_block/output/line[3]="d"
+fixed_block_size/binary/last_block/output/line[4]="e"
+fixed_block_size/binary/last_block/output/line[5]="f"
+fixed_block_size/binary/last_block/output/line[6]="x"
+fixed_block_size/binary/last_block/output/line[7]="y"
+fixed_block_size/binary/last_block/status=0
diff --git a/csv/test/csv-sort/fixed_block_size/input b/csv/test/csv-sort/fixed_block_size/input
index 5af45a4ac..1c1e78f16 100644
--- a/csv/test/csv-sort/fixed_block_size/input
+++ b/csv/test/csv-sort/fixed_block_size/input
@@ -1,2 +1,7 @@
-fixed_block_size/basic="( echo c ; echo b ; echo a ; echo f ; echo e; echo d ) | csv-sort --fields a --block-size 3"
-fixed_block_size/last_block="( echo c ; echo b ; echo a ; echo f ; echo e; echo d; echo y; echo x ) | csv-sort --fields a --block-size 3"
+fixed_block_size/ascii/block_field="( echo 0,f ; echo 0,e ; echo 0,d ; echo 1,c ; echo 1,b; echo 1,a ) | csv-sort --fields block,a"
+fixed_block_size/ascii/basic="( echo f ; echo e ; echo d ; echo c ; echo b; echo a ) | csv-sort --fields a --block-size 3"
+fixed_block_size/ascii/last_block="( echo z ; echo y ; echo x ; echo f ; echo e; echo d; echo y; echo x ) | csv-sort --fields a --block-size 3"
+
+fixed_block_size/binary/block_field="( echo 0,f ; echo 0,e ; echo 0,d ; echo 1,c ; echo 1,b; echo 1,a ) | csv-to-bin ui,c | csv-sort --fields block,a --binary=ui,c | csv-from-bin ui,c"
+fixed_block_size/binary/basic="( echo f ; echo e ; echo d ; echo c ; echo b; echo a ) | csv-to-bin c | csv-sort --fields a --block-size 3 --binary c | csv-from-bin c"
+fixed_block_size/binary/last_block="( echo z ; echo y ; echo x ; echo f ; echo e; echo d; echo y; echo x ) | csv-to-bin c | csv-sort --fields a --block-size 3 --binary c | csv-from-bin c"

From d2e7e07015023fc47924d0762102cfc8f98be3af Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 17 Nov 2022 18:44:27 +1100
Subject: [PATCH 0551/1056] application: comma::say() and comma::verbose:
 instead of using boost::filesystem (which caused grief elsewhere), just split
 path and take back()

---
 application/command_line_options.cpp |  4 ++--
 application/verbose.cpp              | 35 +++-------------------------
 2 files changed, 5 insertions(+), 34 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index edf9687f0..7b7608fdf 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -9,7 +9,7 @@
 #include <unordered_map>
 #include <boost/bind.hpp>
 #include <boost/config/warning_disable.hpp>
-#include "boost/filesystem.hpp"
+//#include "boost/filesystem.hpp"
 #include "boost/iostreams/stream.hpp"
 #include "boost/iostreams/device/null.hpp"
 #include <boost/optional.hpp>
@@ -36,7 +36,7 @@ std::ostream& saymore() { return say( comma::application::detail::verbose ? std:
 void command_line_options::_init_verbose( bool v, const std::string& path )
 {
     comma::verbose.init( v, path ); // todo: deprecate, use comma::say() and comma::saymore() instead
-    comma::application::detail::name = boost::filesystem::basename( path );
+    comma::application::detail::name = comma::split( path, '/' ).back(); // boost::filesystem::basename( path );
     comma::application::detail::verbose = v;
 }
 
diff --git a/application/verbose.cpp b/application/verbose.cpp
index b1fb2e394..b620ae127 100644
--- a/application/verbose.cpp
+++ b/application/verbose.cpp
@@ -1,33 +1,7 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2015 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-#include <boost/filesystem.hpp>
+//#include <boost/filesystem.hpp>
+#include "../string/string.h"
 #include "verbose.h"
 
 namespace comma {
@@ -39,10 +13,7 @@ verbose_t::operator bool () const {return enabled_;}
 const std::string& verbose_t::app_name() const {return app_name_;}
 void verbose_t::init(bool enabled, const std::string& argv0)
 {
-    if(!argv0.empty())
-    {
-        app_name_=boost::filesystem::basename(argv0);
-    }
+    if(!argv0.empty()) { app_name_ = comma::split( argv0, '/' ).back(); } // app_name_=boost::filesystem::basename(argv0);
     enabled_=enabled;
     start_of_line=true;
 }

From c4d1d73d9322f67ede1b44bdc6e13d779e93e9b2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 18 Nov 2022 18:17:09 +1100
Subject: [PATCH 0552/1056] packed: 6-byte little/big endian integers added;
 todo: unit test

---
 packed/big_endian.h    | 34 +++++--------------------
 packed/detail/endian.h | 58 +++---------------------------------------
 packed/little_endian.h | 33 +++++-------------------
 3 files changed, 16 insertions(+), 109 deletions(-)

diff --git a/packed/big_endian.h b/packed/big_endian.h
index 230eafb04..b837587d1 100644
--- a/packed/big_endian.h
+++ b/packed/big_endian.h
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
@@ -49,6 +21,10 @@ typedef detail::endian< detail::big, 4, false > big_endian_uint32;
 typedef detail::endian< detail::big, 4, true > big_endian_int32;
 typedef big_endian_uint32 net_uint32;
 typedef big_endian_int32 net_int32;
+typedef detail::endian< detail::big, 6, false > big_endian_uint48;
+typedef detail::endian< detail::big, 6, true > big_endian_int48;
+typedef big_endian_uint48 net_uint48;
+typedef big_endian_int48 net_int48;
 typedef detail::endian< detail::big, 4, true, true > big_endian_float32;
 typedef detail::endian< detail::big, 8, true, true > big_endian_float64;
 typedef big_endian_float32 big_endian_float;
@@ -67,6 +43,8 @@ typedef detail::endian< detail::big, 3, false > uint24;
 typedef detail::endian< detail::big, 3, true > int24;
 typedef detail::endian< detail::big, 4, false > uint32;
 typedef detail::endian< detail::big, 4, true > int32;
+typedef detail::endian< detail::big, 6, false > uint48; // go figure... there are actual people in the world using it in their protocol packets...
+typedef detail::endian< detail::big, 6, true > int48;
 typedef detail::endian< detail::big, 8, false > uint64;
 typedef detail::endian< detail::big, 8, true > int64;
 typedef detail::endian< detail::big, 4, true, true > float32;
diff --git a/packed/detail/endian.h b/packed/detail/endian.h
index 8f013980d..8f3832d48 100644
--- a/packed/detail/endian.h
+++ b/packed/detail/endian.h
@@ -1,58 +1,6 @@
-// This file is provided in addition to comma and is not an integral
-// part of comma library.
-// Copyright (c) 2018 Vsevolod Vlaskine
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-// comma is a generic and flexible library
+
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2018 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
@@ -76,6 +24,8 @@ template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating =
 template < endiannes Endianness > struct endian_traits< Endianness, 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
 template < endiannes Endianness > struct endian_traits< Endianness, 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
 template < endiannes Endianness > struct endian_traits< Endianness, 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 6, true > { typedef comma::int64 type; typedef comma::uint64 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 6, false > { typedef comma::uint64 type; typedef comma::uint64 uint_of_same_size; };
 template < endiannes Endianness > struct endian_traits< Endianness, 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
 
 template < typename T > struct net_traits;
diff --git a/packed/little_endian.h b/packed/little_endian.h
index 7f8b16d70..a85fbcc2d 100644
--- a/packed/little_endian.h
+++ b/packed/little_endian.h
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author Matthew Herrmann 2007
 /// @author vsevolod vlaskine
@@ -48,6 +21,10 @@ typedef detail::endian< detail::little, 4, true > little_endian32;
 typedef detail::endian< detail::little, 4, false > little_endian_uint32;
 typedef little_endian32 int32;
 typedef little_endian_uint32 uint32;
+typedef detail::endian< detail::little, 6, true > little_endian48;
+typedef detail::endian< detail::little, 6, false > little_endian_uint48;
+typedef little_endian48 int48;
+typedef little_endian_uint48 uint48;
 typedef detail::endian< detail::little, 8, true > little_endian64;
 typedef detail::endian< detail::little, 8, false > little_endian_uint64;
 typedef little_endian64 int64;
@@ -66,6 +43,8 @@ typedef detail::endian< detail::little, 3, false > uint24;
 typedef detail::endian< detail::little, 3, true > int24;
 typedef detail::endian< detail::little, 4, false > uint32;
 typedef detail::endian< detail::little, 4, true > int32;
+typedef detail::endian< detail::little, 6, false > uint48;
+typedef detail::endian< detail::little, 6, true > int48;
 typedef detail::endian< detail::little, 8, false > uint64;
 typedef detail::endian< detail::little, 8, true > int64;
 typedef detail::endian< detail::little, 4, true, true > float32;

From 00ff25827844972b5971b4f90e4bc7c977ff1ab3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Nov 2022 12:32:27 +1100
Subject: [PATCH 0553/1056] csv/names: fields_exist(): allow_empty flag added

---
 csv/names.cpp | 36 +++---------------------------------
 csv/names.h   | 37 +++----------------------------------
 2 files changed, 6 insertions(+), 67 deletions(-)

diff --git a/csv/names.cpp b/csv/names.cpp
index 76666407c..1a29c5f71 100644
--- a/csv/names.cpp
+++ b/csv/names.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -36,10 +8,11 @@
 
 namespace comma { namespace csv {
 
-bool fields_exist( const std::vector< std::string >& fields, const std::vector< std::string >& subset )
+bool fields_exist( const std::vector< std::string >& fields, const std::vector< std::string >& subset, bool allow_empty )
 {
     for( unsigned int i = 0; i < subset.size(); ++i )
     {
+        if( allow_empty && subset[i].empty() ) { continue; }
         bool found = false;
         for( unsigned int j = 0; !found && j < fields.size(); found = fields[j] == subset[i], ++j );
         if( !found ) { return false; }
@@ -47,9 +20,6 @@ bool fields_exist( const std::vector< std::string >& fields, const std::vector<
     return true;
 }
 
-bool fields_exist( const std::string& fields, const std::string& subset, char delimiter )
-{
-    return fields_exist( comma::split( fields, delimiter ), comma::split( subset, delimiter ) );
-}
+bool fields_exist( const std::string& fields, const std::string& subset, char delimiter, bool allow_empty ) { return fields_exist( comma::split( fields, delimiter, true ), comma::split( subset, delimiter, true ), allow_empty ); }
 
 } } // namespace comma { namespace csv {
diff --git a/csv/names.h b/csv/names.h
index 37a4d2ede..fdc4af7df 100644
--- a/csv/names.h
+++ b/csv/names.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_NAMES_H_
-#define COMMA_CSV_NAMES_H_
+#pragma once
 
 #include "../csv/impl/to_names.h"
 #include "../string/string.h"
@@ -59,8 +30,8 @@ std::vector< std::string > names( const S& sample = S() ) { return names( true,
 
 /// return true, if all the fields from subset present in fields
 /// @todo make a generic subset application
-bool fields_exist( const std::vector< std::string >& fields, const std::vector< std::string >& subset );
-bool fields_exist( const std::string& fields, const std::string& subset, char delimiter = ',' );
+bool fields_exist( const std::vector< std::string >& fields, const std::vector< std::string >& subset, bool allow_empty = false );
+bool fields_exist( const std::string& fields, const std::string& subset, char delimiter = ',', bool allow_empty = false );
 
 template < typename S >
 inline std::vector< std::string > names( const std::string& paths, bool useFullxpath, const S& sample )
@@ -85,5 +56,3 @@ inline std::vector< std::string > names( const std::string& paths, bool useFullx
 }
 
 } } // namespace comma { namespace csv {
-
-#endif // COMMA_CSV_NAMES_H_

From 0bb1ff82f6d923cf50a414faeca97644df368cc1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 29 Nov 2022 10:42:21 +1100
Subject: [PATCH 0554/1056] name_value::map::assert_mutually_exclusive(): in
 progress...

---
 csv/applications/CMakeLists.txt | 14 +++---
 csv/applications/csv-paste.cpp  | 30 ++----------
 io/applications/CMakeLists.txt  |  2 +-
 name_value/map.cpp              | 80 ++++++++++++++++++++++++++++++
 name_value/map.h                | 87 +++++----------------------------
 5 files changed, 104 insertions(+), 109 deletions(-)
 create mode 100644 name_value/map.cpp

diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index fd2077b72..98d7f5ed1 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -43,22 +43,22 @@ add_executable( csv-to-sql ${dir}/csv-to-sql.cpp )
 target_link_libraries ( csv-format ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-size ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-bin-cut ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv comma_xpath )
-target_link_libraries ( csv-split comma_csv comma_application comma_io comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
+target_link_libraries ( csv-split comma_csv comma_application comma_io comma_string comma_xpath comma_name_value ${comma_ALL_EXTERNAL_LIBRARIES} )
 target_link_libraries ( csv-from-columns ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string )
-target_link_libraries ( csv-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
+target_link_libraries ( csv-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string comma_name_value )
 target_link_libraries ( csv-sort ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
-target_link_libraries ( csv-select ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_xpath comma_string )
-target_link_libraries ( csv-paste ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv comma_io )
+target_link_libraries ( csv-select ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_xpath comma_string comma_name_value )
+target_link_libraries ( csv-paste ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv comma_io comma_name_value )
 target_link_libraries ( csv-time ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
 target_link_libraries ( csv-time-delay ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_string comma_xpath )
-target_link_libraries ( csv-time-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_string comma_xpath )
+target_link_libraries ( csv-time-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_string comma_xpath comma_name_value )
 target_link_libraries ( csv-time-stamp ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_string )
 target_link_libraries ( csv-to-bin ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application ) # profiler )
 target_link_libraries ( csv-from-bin ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application )
 target_link_libraries ( csv-calc ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_string )
 target_link_libraries ( csv-calc-new ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_string )
 target_link_libraries ( csv-crc ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_string )
-target_link_libraries ( csv-play ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_io )
+target_link_libraries ( csv-play ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_io comma_name_value )
 target_link_libraries ( csv-shape ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-shuffle ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-thin ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_io )
@@ -134,7 +134,7 @@ set_target_properties( csv-enumerate PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-enumerate RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-intervals ${dir}/csv-intervals.cpp )
-target_link_libraries ( csv-intervals ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath )
+target_link_libraries ( csv-intervals ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_name_value )
 set_target_properties( csv-intervals PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-intervals RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
          
diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index 1fbc51677..583319aa1 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -89,6 +62,7 @@ static void usage( bool verbose )
     std::cerr << "                 WARNING: --size: deprecated, since it is confusing for files" << std::endl;
     std::cerr << "            --index; instead of block number output record index in the block" << std::endl;
     std::cerr << "            --reverse; if --index, output index in descending order" << std::endl;
+    std::cerr << "            --shape=<shape>; iterate through indices of a given shape; <shape>: same meaning as in numpy, e.g. 'line-number;shape=10,5,4'" << std::endl;
     std::cerr << "            --step=<value>; default=1; line number increment/decrement step" << std::endl;        
     std::cerr << "        examples (try them)" << std::endl;
     std::cerr << "            line number" << std::endl;
@@ -204,6 +178,7 @@ class line_number : public source
                 bool reverse;
                 comma::int32 step;
                 comma::int32 begin;
+                std::vector< comma::uint32 > shape;
                 std::string format;
                 
                 options( const boost::optional< comma::int32 >& b = boost::optional< comma::int32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false, int s = 1 )
@@ -217,6 +192,7 @@ class line_number : public source
                 
                 options( const std::string& properties, const comma::command_line_options& o ) // quick and dirty: use visiting instead
                 {
+                    o.assert_mutually_exclusive( "--shape", "--block-size,--size,--reverse,--begin" );
                     options defaults( boost::optional< comma::int32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ), o.value< comma::int32 >( "--step", 1 ) );
                     comma::name_value::map map( properties, ';', '=' );
                     size = map.value< comma::uint32 >( map.get().find( "block-size" ) != map.get().end() ? "block-size" : "size", defaults.size ); // quick and dirty
diff --git a/io/applications/CMakeLists.txt b/io/applications/CMakeLists.txt
index 152b00f28..83428dc3b 100644
--- a/io/applications/CMakeLists.txt
+++ b/io/applications/CMakeLists.txt
@@ -39,7 +39,7 @@ if( NOT WIN32 )
     install( TARGETS io-ls RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
     add_executable( io-publish ${dir}/io-publish.cpp )
-    target_link_libraries( io-publish comma_base comma_io comma_application comma_xpath ) # profiler )
+    target_link_libraries( io-publish comma_base comma_io comma_application comma_xpath comma_name_value ) # profiler )
     set_target_properties( io-publish PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-publish RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
diff --git a/name_value/map.cpp b/name_value/map.cpp
new file mode 100644
index 000000000..421f6bffa
--- /dev/null
+++ b/name_value/map.cpp
@@ -0,0 +1,80 @@
+// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2022 Vsevolod Vlaskine
+
+/// @authors cedric wohlleber, vsevolod vlaskine
+
+#include "../base/exception.h"
+#include "map.h"
+
+namespace comma { namespace name_value {
+
+map::map( const std::string& line, char delimiter, char value_delimiter, bool unique, const std::string& allowed_names ): _line( line ) { init_( impl::options( delimiter, value_delimiter ), unique, allowed_names ); }
+
+map::map( const std::string& line, const std::string& fields, char delimiter, char value_delimiter, bool unique, const std::string& allowed_names ): _line( line ) { init_( impl::options( fields, delimiter, value_delimiter ), unique, allowed_names ); }
+map::map( const std::string& line, const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names ): _line( line ) { init_( options, unique, allowed_names ); }
+
+static std::vector< std::string > get_named_values( const std::string& line, const comma::name_value::impl::options& options )
+{
+    std::vector< std::string > named_values = split_escaped( line, options.m_delimiter, &(options.m_quotes[0]), options.m_escape );
+    for( std::size_t i = 0; i < options.m_names.size() && i < named_values.size(); ++i )
+    {
+        if( options.m_names[i].empty() ) { continue; }
+        if( split( named_values[i], options.m_value_delimiter ).size() != 1U ) { COMMA_THROW( comma::exception, "expected unnamed value for " << options.m_names[i] << ", got: " << named_values[i] ); }
+        named_values[i] = options.m_names[i] + options.m_value_delimiter + named_values[i];
+    }
+    return named_values;
+}
+
+void map::init_( const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names )
+{
+    std::unordered_set< std::string > allowed;
+    for( auto name: comma::split( allowed_names, ',', true ) ) { allowed.insert( name ); }
+    const std::vector< std::string >& named_values = get_named_values( _line, options );
+    for( std::size_t i = 0; i < named_values.size(); ++i )
+    {
+        std::vector< std::string > pair = split_escaped( named_values[i], options.m_value_delimiter, &( options.m_quotes[0]), options.m_escape );
+        if( !allowed.empty() && allowed.find( pair[0] ) == allowed.end() ) { COMMA_THROW( comma::exception, "name \"" << pair[0] << "\" is not among allowed names: " << allowed_names ); }
+        if( unique && pair.size() > 0 && _map.find( pair[0] ) != _map.end() ) { COMMA_THROW( comma::exception, "expected unique names, got more than one \"" << pair[0] << "\"" ); }
+        switch( pair.size() )
+        {
+            case 1: _map.insert( std::make_pair( pair[0], std::string() ) ); break; // quick and dirty
+            case 2: _map.insert( std::make_pair( pair[0], pair[1] ) ); break;
+            default: { COMMA_THROW( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
+        }
+    }
+}
+
+std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( delimiter, value_delimiter ) ); }
+
+std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, const std::string& fields, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( fields, delimiter, value_delimiter ) ); }
+
+std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, const impl::options& options )
+{
+    std::vector< std::pair< std::string, std::string > > v;
+    const std::vector< std::string >& named_values = get_named_values( line, options );
+    for( std::size_t i = 0; i < named_values.size(); ++i )
+    {
+        std::vector< std::string > pair = split_escaped( named_values[i], options.m_value_delimiter, &(options.m_quotes[0]), options.m_escape );
+        switch( pair.size() )
+        {
+            case 1: v.push_back( std::make_pair( pair[0], std::string() ) ); break; // quick and dirty
+            case 2: v.push_back( std::make_pair( pair[0], pair[1] ) ); break;
+            default: { COMMA_THROW_STREAM( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
+        }
+    }
+    return v;
+}
+
+bool map::exists( const std::string& name ) const { return _map.find( name ) != _map.end(); }
+
+void map::assert_mutually_exclusive( const std::string& f )
+{
+
+}
+
+void map::assert_mutually_exclusive( const std::string& f, const std::string& g )
+{
+
+}
+
+} } // namespace comma { namespace name_value {
diff --git a/name_value/map.h b/name_value/map.h
index c56fc4d4a..9f787b90c 100644
--- a/name_value/map.h
+++ b/name_value/map.h
@@ -60,87 +60,30 @@ class map
         /// return name-value map
         const map_type& get() const { return _map; }
 
+        /// throw exception if incompatible fields are present
+        void assert_mutually_exclusive( const std::string& f );
+
+        /// throw exception if incompatible fields are present
+        void assert_mutually_exclusive( const std::string& f, const std::string& g );
+
     private:
         void init_( const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names );
         const std::string _line;
         map_type _map;
 };
 
-inline map::map( const std::string& line, char delimiter, char value_delimiter, bool unique, const std::string& allowed_names ): _line( line ) { init_( impl::options( delimiter, value_delimiter ), unique, allowed_names ); }
-
-inline map::map( const std::string& line, const std::string& fields, char delimiter, char value_delimiter, bool unique, const std::string& allowed_names ): _line( line ) { init_( impl::options( fields, delimiter, value_delimiter ), unique, allowed_names ); }
-
-inline map::map( const std::string& line, const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names ): _line( line ) { init_( options, unique, allowed_names ); }
-
-inline static std::vector< std::string > get_named_values( const std::string& line, const comma::name_value::impl::options& options )
-{
-    std::vector< std::string > named_values = split_escaped( line, options.m_delimiter, &(options.m_quotes[0]), options.m_escape );
-    for( std::size_t i = 0; i < options.m_names.size() && i < named_values.size(); ++i )
-    {
-        if( options.m_names[i].empty() ) { continue; }
-        if( split( named_values[i], options.m_value_delimiter ).size() != 1U ) { COMMA_THROW( comma::exception, "expected unnamed value for " << options.m_names[i] << ", got: " << named_values[i] ); }
-        named_values[i] = options.m_names[i] + options.m_value_delimiter + named_values[i];
-    }
-    return named_values;
-}
-
-inline void map::init_( const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names )
-{
-    std::unordered_set< std::string > allowed;
-    for( auto name: comma::split( allowed_names, ',', true ) ) { allowed.insert( name ); }
-    const std::vector< std::string >& named_values = get_named_values( _line, options );
-    for( std::size_t i = 0; i < named_values.size(); ++i )
-    {
-        std::vector< std::string > pair = split_escaped( named_values[i], options.m_value_delimiter, &( options.m_quotes[0]), options.m_escape );
-        if( !allowed.empty() && allowed.find( pair[0] ) == allowed.end() ) { COMMA_THROW( comma::exception, "name \"" << pair[0] << "\" is not among allowed names: " << allowed_names ); }
-        if( unique && pair.size() > 0 && _map.find( pair[0] ) != _map.end() ) { COMMA_THROW( comma::exception, "expected unique names, got more than one \"" << pair[0] << "\"" ); }
-        switch( pair.size() )
-        {
-            case 1: _map.insert( std::make_pair( pair[0], std::string() ) ); break; // quick and dirty
-            case 2: _map.insert( std::make_pair( pair[0], pair[1] ) ); break;
-            default: { COMMA_THROW( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
-        }
-    }
-}
-
-inline std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( delimiter, value_delimiter ) ); }
-
-inline std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, const std::string& fields, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( fields, delimiter, value_delimiter ) ); }
-
-inline std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, const impl::options& options )
-{
-    std::vector< std::pair< std::string, std::string > > v;
-    const std::vector< std::string >& named_values = get_named_values( line, options );
-    for( std::size_t i = 0; i < named_values.size(); ++i )
-    {
-        std::vector< std::string > pair = split_escaped( named_values[i], options.m_value_delimiter, &(options.m_quotes[0]), options.m_escape );
-        switch( pair.size() )
-        {
-            case 1: v.push_back( std::make_pair( pair[0], std::string() ) ); break; // quick and dirty
-            case 2: v.push_back( std::make_pair( pair[0], pair[1] ) ); break;
-            default: { COMMA_THROW_STREAM( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
-        }
-    }
-    return v;
-}
-
-inline bool map::exists( const std::string& name ) const { return _map.find( name ) != _map.end(); }
-
 namespace detail {
 
-template < typename T >
-inline T lexical_cast( const std::string& s ) { return boost::lexical_cast< T >( s ); }
+template < typename T > inline T lexical_cast( const std::string& s ) { return boost::lexical_cast< T >( s ); }
 
-template <>
-inline bool lexical_cast< bool >( const std::string& s )
+template <> inline bool lexical_cast< bool >( const std::string& s )
 {
     if( s == "" || s == "true" ) { return true; }
     if( s == "false" ) { return false; }
     return boost::lexical_cast< bool >( s );
 }
 
-template <>
-inline boost::posix_time::ptime lexical_cast< boost::posix_time::ptime >( const std::string& s )
+template <> inline boost::posix_time::ptime lexical_cast< boost::posix_time::ptime >( const std::string& s )
 {
     if ( s == "not-a-date-time" ) { return boost::posix_time::not_a_date_time; }
     else if ( s == "+infinity" || s == "+inf" || s == "inf" ) { return boost::posix_time::pos_infin; }
@@ -150,8 +93,7 @@ inline boost::posix_time::ptime lexical_cast< boost::posix_time::ptime >( const
 
 } // namespace detail {
 
-template < typename T >
-inline std::vector< T > map::values( const std::string& name ) const
+template < typename T > inline std::vector< T > map::values( const std::string& name ) const
 {
     std::vector< T > v;
     for( typename map_type::const_iterator it = _map.begin(); it != _map.end(); ++it )
@@ -161,23 +103,20 @@ inline std::vector< T > map::values( const std::string& name ) const
     return v;
 }
 
-template < typename T >
-inline T map::value( const std::string& name, const T& default_value ) const
+template < typename T > inline T map::value( const std::string& name, const T& default_value ) const
 {
     const std::vector< T >& v = values< T >( name );
     return v.empty() ? default_value : v[0];
 }
 
-template < typename T >
-inline T map::value( const std::string& name ) const
+template < typename T > inline T map::value( const std::string& name ) const
 {
     const std::vector< T >& v = values< T >( name );
     if( v.empty() ) { COMMA_THROW_STREAM( comma::exception, "'" << name << "' not found in \"" << _line << "\"" ); }
     return v[0];
 }
 
-template < typename T >
-inline boost::optional< T > map::optional( const std::string& name ) const
+template < typename T > inline boost::optional< T > map::optional( const std::string& name ) const
 {
     const std::vector< T >& v = values< T >( name );
     return v.empty() ? boost::optional< T >() : boost::optional< T >( v[0] );

From 7d781efe0b418f53de4c6fc40bee413b4701980b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 29 Nov 2022 11:38:42 +1100
Subject: [PATCH 0555/1056] csv-paste: line-number: shape implemented

---
 csv/applications/csv-paste.cpp | 58 ++++++++++++++++++++++++----------
 csv/test/csv-paste/expected    | 28 ++++++++++++++++
 csv/test/csv-paste/input       |  3 ++
 name_value/map.cpp             | 24 +++++++++++---
 name_value/map.h               |  4 +--
 5 files changed, 95 insertions(+), 22 deletions(-)

diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index 583319aa1..8eacc7c71 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -195,15 +195,26 @@ class line_number : public source
                     o.assert_mutually_exclusive( "--shape", "--block-size,--size,--reverse,--begin" );
                     options defaults( boost::optional< comma::int32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ), o.value< comma::int32 >( "--step", 1 ) );
                     comma::name_value::map map( properties, ';', '=' );
-                    size = map.value< comma::uint32 >( map.get().find( "block-size" ) != map.get().end() ? "block-size" : "size", defaults.size ); // quick and dirty
-                    index = map.value< bool >( "index", defaults.index );
-                    reverse = map.value< bool >( "reverse", defaults.reverse );
-                    step = map.value< comma::int32 >( "step", defaults.step );
-                    auto b = map.optional< comma::int32 >( "begin" );
-                    if( !b ) { b = o.optional< comma::int32 >( "--begin" ); }
-                    begin = begin_( b );
+                    map.assert_mutually_exclusive( "shape", "block-size,size,reverse,begin,step" );
+                    std::string s = map.value< std::string >( "shape", o.value< std::string >( "--shape", "" ) );
                     format = map.value< std::string >( "binary", "" );
-                    if( !format.empty() && format != "ui" ) { std::cerr << "csv-paste: currently only ui supported for line-number; got: '" << format << "'" << std::endl; exit( 1 ); } // quick and dirty for now
+                    if( s.empty() )
+                    {
+                        size = map.value< comma::uint32 >( map.get().find( "block-size" ) != map.get().end() ? "block-size" : "size", defaults.size ); // quick and dirty
+                        index = map.value< bool >( "index", defaults.index );
+                        reverse = map.value< bool >( "reverse", defaults.reverse );
+                        step = map.value< comma::int32 >( "step", defaults.step );
+                        auto b = map.optional< comma::int32 >( "begin" );
+                        if( !b ) { b = o.optional< comma::int32 >( "--begin" ); }
+                        begin = begin_( b );
+                        if( !format.empty() && format != "ui" ) { std::cerr << "csv-paste: currently only ui supported for line-number; got: '" << format << "'" << std::endl; exit( 1 ); } // quick and dirty for now
+                    }
+                    else
+                    {
+                        auto v = comma::split( s, ',' );
+                        shape.resize( v.size() );
+                        for( unsigned int i = 0; i < v.size(); ++i ) { shape[i] = boost::lexical_cast< unsigned int >( v[i] ); }
+                    }
                 }
                 
             private:
@@ -215,23 +226,25 @@ class line_number : public source
         };
         
         line_number( bool is_binary, const options& options )
-            : source( options.format.empty() ? ( is_binary ? "binary=ui" : "" ) : "binary=" + options.format ) // quick and dirty
+            : source( options.format.empty() ? ( is_binary ? options.shape.empty() ? std::string ( "binary=ui" ) : "binary=" + boost::lexical_cast< std::string >( options.shape.size() ) + "ui" : std::string() ) : "binary=" + options.format ) // quick and dirty
             , options_( options )
             , count_( 0 )
             , value_( options_.begin )
+            , values_( options_.shape.size(), 0 )
         {
         }
         
         const std::string* read()
         { 
-            serialized_ = boost::lexical_cast< std::string >( value_ );
+            serialized_ = values_.empty() ? boost::lexical_cast< std::string >( value_ ) : comma::join( values_, ',' );
             update_();
             return &serialized_;
         }
         
         const char* read( char* buf ) // quick and dirty
         {
-            comma::csv::format::traits< comma::int32 >::to_bin( value_, buf );
+            if( values_.empty() ) { comma::csv::format::traits< comma::int32 >::to_bin( value_, buf ); }
+            else { for( unsigned int i = 0; i < values_.size(); ++i, buf += sizeof( comma::int32 ) ) { comma::csv::format::traits< comma::int32 >::to_bin( values_[i], buf ); } }
             update_();
             return buf;
         }
@@ -240,19 +253,32 @@ class line_number : public source
         options options_;
         comma::uint32 count_;
         comma::int32 value_;
+        std::vector< comma::uint32 > values_;
         std::string serialized_;
         
         void update_()
         {
-            ++count_; //count_ += options_.step;
-            if( count_ < options_.size )
+            if( values_.empty() )
             {
-                if( options_.index ) { value_ += options_.reverse ? -options_.step : options_.step; }
+                ++count_; //count_ += options_.step;
+                if( count_ < options_.size )
+                {
+                    if( options_.index ) { value_ += options_.reverse ? -options_.step : options_.step; }
+                }
+                else
+                {
+                    value_ = options_.index ? options_.begin : ( value_ + options_.step );
+                    count_ = 0;
+                }
             }
             else
             {
-                value_ = options_.index ? options_.begin : ( value_ + options_.step );
-                count_ = 0;
+                for( int i = values_.size() - 1; i >= 0; --i )
+                {
+                    ++values_[i];
+                    if( values_[i] < options_.shape[i] ) { break; }
+                    values_[i] = 0;
+                }
             }
         }
 };
diff --git a/csv/test/csv-paste/expected b/csv/test/csv-paste/expected
index 2b8f54240..ff6857aae 100644
--- a/csv/test/csv-paste/expected
+++ b/csv/test/csv-paste/expected
@@ -142,3 +142,31 @@ head[1]/status=0
 head[2]/output/line[0]="0"
 head[2]/output/line[1]="1"
 head[2]/status=0
+
+line_number/shape[0]/output/line[0]="0,0"
+line_number/shape[0]/output/line[1]="0,1"
+line_number/shape[0]/output/line[2]="0,2"
+line_number/shape[0]/output/line[3]="1,0"
+line_number/shape[0]/output/line[4]="1,1"
+line_number/shape[0]/output/line[5]="1,2"
+line_number/shape[0]/output/line[6]="0,0"
+line_number/shape[0]/output/line[7]="0,1"
+line_number/shape[0]/output/line[8]="0,2"
+line_number/shape[0]/output/line[9]="1,0"
+line_number/shape[0]/output/line[10]="1,1"
+line_number/shape[0]/output/line[11]="1,2"
+line_number/shape[0]/status=0
+
+line_number/shape[1]/output/line[0]="0,0"
+line_number/shape[1]/output/line[1]="0,1"
+line_number/shape[1]/output/line[2]="0,2"
+line_number/shape[1]/output/line[3]="1,0"
+line_number/shape[1]/output/line[4]="1,1"
+line_number/shape[1]/output/line[5]="1,2"
+line_number/shape[1]/output/line[6]="0,0"
+line_number/shape[1]/output/line[7]="0,1"
+line_number/shape[1]/output/line[8]="0,2"
+line_number/shape[1]/output/line[9]="1,0"
+line_number/shape[1]/output/line[10]="1,1"
+line_number/shape[1]/output/line[11]="1,2"
+line_number/shape[1]/status=0
diff --git a/csv/test/csv-paste/input b/csv/test/csv-paste/input
index de0b2313b..7976dbbaf 100644
--- a/csv/test/csv-paste/input
+++ b/csv/test/csv-paste/input
@@ -42,3 +42,6 @@ line_number/step[7]="csv-paste "line-number;block-size=5;index;reverse;begin=4;s
 head[0]="csv-paste 'line-number;size=10;index' --head=0"
 head[1]="csv-paste 'line-number;size=10;index' --head=1"
 head[2]="csv-paste 'line-number;size=10;index' --head=2"
+
+line_number/shape[0]="csv-paste 'line-number;shape=2,3' --head=12"
+line_number/shape[1]="csv-paste 'line-number;shape=2,3;binary=2ui' --head=12 | csv-from-bin 2ui"
diff --git a/name_value/map.cpp b/name_value/map.cpp
index 421f6bffa..9c78e0f6c 100644
--- a/name_value/map.cpp
+++ b/name_value/map.cpp
@@ -67,14 +67,30 @@ std::vector< std::pair< std::string, std::string > > map::as_vector( const std::
 
 bool map::exists( const std::string& name ) const { return _map.find( name ) != _map.end(); }
 
-void map::assert_mutually_exclusive( const std::string& f )
-{
+void map::assert_mutually_exclusive( const std::string& f ) { assert_mutually_exclusive( comma::split( f, ',' ) ); }
 
-}
+void map::assert_mutually_exclusive( const std::string& f, const std::string& g ) { assert_mutually_exclusive( comma::split( f, ',' ), comma::split( g, ',' ) ); }
 
-void map::assert_mutually_exclusive( const std::string& f, const std::string& g )
+void map::assert_mutually_exclusive( const std::vector< std::string >& f )
 {
+    std::string found;
+    for( const auto& s: f )
+    {
+        if( _map.find( s ) == _map.end() ) { continue; }
+        if( !found.empty() ) { COMMA_THROW( comma::exception, found << " and " << s << " are mutually exclusive" ); }
+        found = s;
+    }
+}
 
+void map::assert_mutually_exclusive( const std::vector< std::string >& f, const std::vector< std::string >& g )
+{
+    std::string found;
+    for( const auto& s: f ) { if( _map.find( s ) != _map.end() ) { found = s; break; } }
+    if( found.empty() ) { return; }
+    for( const auto& s: g )
+    {
+        if( _map.find( s ) != _map.end() ) { COMMA_THROW( comma::exception, found << " and " << s << " are mutually exclusive" ); }
+    }    
 }
 
 } } // namespace comma { namespace name_value {
diff --git a/name_value/map.h b/name_value/map.h
index 9f787b90c..1a15e116b 100644
--- a/name_value/map.h
+++ b/name_value/map.h
@@ -62,9 +62,9 @@ class map
 
         /// throw exception if incompatible fields are present
         void assert_mutually_exclusive( const std::string& f );
-
-        /// throw exception if incompatible fields are present
         void assert_mutually_exclusive( const std::string& f, const std::string& g );
+        void assert_mutually_exclusive( const std::vector< std::string >& f );
+        void assert_mutually_exclusive( const std::vector< std::string >& f, const std::vector< std::string >& g );
 
     private:
         void init_( const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names );

From 3cc845ff29dd1823c96697f5db4bedc0ddbc3741 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 25 Jan 2023 19:20:34 +1100
Subject: [PATCH 0556/1056] csv-random: --range: correctly handling char and
 unsigned char added

---
 csv/applications/csv-random.cpp | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index e5189572d..e582227b5 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -191,10 +191,14 @@ static int run_impl( Distribution< T >& distribution, bool append, bool binary,
     return 0;
 }
 
+template < typename T > struct cast_traits { typedef T type; };
+template <> struct cast_traits< char > { typedef int type; };
+template <> struct cast_traits< unsigned char > { typedef unsigned int type; };
+
 template < typename T > static std::vector< T > _as( const std::vector< std::string >& v, unsigned int begin ) // todo? move to library?
 {
     std::vector< T > r( v.size() - begin );
-    for( unsigned int i = begin; i < v.size(); r[ i - begin ] = boost::lexical_cast< T >( v[i] ), ++i );
+    for( unsigned int i = begin; i < v.size(); r[ i - begin ] = boost::lexical_cast< typename cast_traits< T >::type >( v[i] ), ++i );
     return r;
 }
 

From 410b6f2f1cd3327f2c81d7323d8437658f9eab5d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 14 Feb 2023 14:18:39 +1100
Subject: [PATCH 0557/1056] comma_execute_and_wait: documentation fixed,
 example added

---
 bash/process/comma-process-util | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/bash/process/comma-process-util b/bash/process/comma-process-util
index 011ca4e26..5cec38f29 100755
--- a/bash/process/comma-process-util
+++ b/bash/process/comma-process-util
@@ -454,9 +454,13 @@ declare -r terminate_comma_execute_and_wait
 # @description runs a given command as a background task and waits for it to terminate
 #
 # Usage:
-#   comma_execute_and_wait command[,command2[,command3]] [--signals=signal1,signal2,...] \
+#   comma_execute_and_wait command[ command2[ command3]] [--signals=signal1,signal2,...] \
 #                          [--max-wait=max_wait] [--process|--group] [--any|--all] \
 #                          [--pid-fifo=<named pipe>]
+# Quick example:
+#   function _hello() { echo "hello $1"; }
+#   export -f _hello
+#   comma_execute_and_wait --group "some-command-line-util --some-option" "bash -c _hello world"
 #
 # The function executes the given command(s) (non-option argument) in a background process(es)
 # and waits for its completion (or timeout, see below).

From ec232c8d1a02e190bfe3cb8b3663c4c999021ceb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 16 Feb 2023 11:46:45 +1100
Subject: [PATCH 0558/1056] csv-time-stamp: --flush implemented

---
 csv/applications/csv-time-stamp.cpp | 51 +++++------------------------
 1 file changed, 8 insertions(+), 43 deletions(-)

diff --git a/csv/applications/csv-time-stamp.cpp b/csv/applications/csv-time-stamp.cpp
index cf77da7e3..e989c1a1f 100644
--- a/csv/applications/csv-time-stamp.cpp
+++ b/csv/applications/csv-time-stamp.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author cedric wohlleber
 
@@ -43,7 +15,7 @@
 #include "../../base/types.h"
 #include "../../csv/format.h"
 
-static void usage()
+static void usage( bool verbose )
 {
     std::cerr << std::endl;
     std::cerr << "prepend input with timestamp" << std::endl;
@@ -54,6 +26,7 @@ static void usage()
     std::cerr << "    --binary,-b=<format>: binary format" << std::endl;
     std::cerr << "    --size=<size>: binary input of size" << std::endl;
     std::cerr << "    --delimiter,-d <delimiter>: ascii only; default ','" << std::endl;
+    std::cerr << "    --flush; flush stdout after each record" << std::endl;
     std::cerr << "    --local: if present, local time; default: utc" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples:" << std::endl;
@@ -61,29 +34,22 @@ static void usage()
     std::cerr << "    cat input.bin | csv-time-stamp --binary=3ui" << std::endl;
     std::cerr << "    cat input.bin | csv-time-stamp --size=12" << std::endl;
     std::cerr << std::endl;
-    std::cerr << std::endl;
-    exit( -1 );
+    exit( 1 );
 }
 
 int main( int ac, char** av )
 {
     try
     {
-        comma::command_line_options options( ac, av );
-        if( options.exists( "--help" ) || options.exists( "-h" ) ) { usage(); }
-
+        comma::command_line_options options( ac, av, usage );
         bool local = options.exists( "--local" );
         char delimiter = options.value( "--delimiter,-d", ',' );
-
         boost::optional< comma::csv::format > format;
-        if( options.exists( "--binary,-b" ))
-        {
-            format = comma::csv::format( options.value< std::string >( "--binary,-b" ));
-        }
+        if( options.exists( "--binary,-b" )) { format = comma::csv::format( options.value< std::string >( "--binary,-b" )); }
         bool binary = options.exists( "--binary,-b,--size" );
         std::size_t size = options.value( "--size", 0 );
+        bool flush = options.exists( "--flush" );
         if( binary && size == 0 ) { size = format->size(); }
-
         #ifdef WIN32
         if( binary )
         {
@@ -91,7 +57,6 @@ int main( int ac, char** av )
             _setmode( _fileno( stdout ), _O_BINARY );
         }
         #endif
-
         if( binary )
         {
             boost::array< char, 65536 > buf;
@@ -112,7 +77,7 @@ int main( int ac, char** av )
                         std::cout.write( ( char* )( &timestamp ), time_size );
                         std::cout.write( cur, size );
                     }
-                    std::cout.flush();
+                    if( flush ) { std::cout.flush(); }
                     if( cur == end ) { cur = begin; }
                 }
                 int r = ::read( 0, cur + offset, end - cur - offset );
@@ -135,5 +100,5 @@ int main( int ac, char** av )
     }
     catch( std::exception& ex ) { std::cerr << "csv-time-stamp: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-time-stamp: unknown exception" << std::endl; }
-    usage();
+    return 1;
 }

From efbcabc3b62fed8cee0dedff41fb427d157678d0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 17 Feb 2023 17:39:29 +1100
Subject: [PATCH 0559/1056] comma::split_as(): optional default value added

---
 string/split.h | 21 +++++++++++----------
 1 file changed, 11 insertions(+), 10 deletions(-)

diff --git a/string/split.h b/string/split.h
index a21310dbc..47203f748 100644
--- a/string/split.h
+++ b/string/split.h
@@ -7,6 +7,7 @@
 #include <string>
 #include <vector>
 #include <boost/lexical_cast.hpp>
+#include <boost/optional.hpp>
 
 namespace comma {
 
@@ -16,19 +17,19 @@ bool is_one_of( char c, const char* characters );
 
 } // namespace string {
 
-/// split string into tokens (a quick implementation); always contains at least one element
+/// split string into tokens (a quick implementation); always contains at least one element unless empty_if_empty_input is true
 std::vector< std::string > split( const std::string& s, const char* separators = " ", bool empty_if_empty_input = false );
 
-/// split string into tokens (a quick implementation); always contains at least one element
+/// split string into tokens (a quick implementation); always contains at least one element unless empty_if_empty_input is true
 std::vector< std::string > split( const std::string& s, char separator, bool empty_if_empty_input = false );
 
-/// split string into tokens (a quick implementation) and cast to a given type; always contains at least one element
+/// split string into tokens (a quick implementation) and cast to a given type
 template < typename T >
-std::vector< T > split_as( const std::string& s, const char* separators );
+std::vector< T > split_as( const std::string& s, const char* separators, const boost::optional< T >& default_value = boost::none );
 
-/// split string into tokens (a quick implementation) and cast to a given type; always contains at least one element
+/// split string into tokens (a quick implementation) and cast to a given type
 template < typename T >
-std::vector< T > split_as( const std::string& s, char separator );
+std::vector< T > split_as( const std::string& s, char separator, const boost::optional< T >& default_value = boost::none );
 
 /// Split string into tokens; always contains at least one element;
 /// skips backslash escaped separator, handle non-nested quotes;
@@ -55,18 +56,18 @@ std::vector< std::string > split_bracketed( const std::string& s, const char * s
 std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket = '(', char rbracket = ')', bool strip_brackets = true );
 
 template < typename T >
-inline std::vector< T > split_as( const std::string& s, const char* separators )
+inline std::vector< T > split_as( const std::string& s, const char* separators, const boost::optional< T >& default_value )
 {
     const auto& v = split( s, separators, true );
     std::vector< T > t( v.size() );
-    for( unsigned int i = 0; i < v.size(); ++i ) { t[i] = boost::lexical_cast< T >( v[i] ); }
+    for( unsigned int i = 0; i < v.size(); ++i ) { t[i] = v[i].empty() && default_value ? *default_value : boost::lexical_cast< T >( v[i] ); }
     return t;
 }
 
-template < typename T > inline std::vector< T > split_as( const std::string& s, char separator )
+template < typename T > inline std::vector< T > split_as( const std::string& s, char separator, const boost::optional< T >& default_value )
 {
     const char separators[] = { separator, 0 };
-    return split_as< T >( s, separators );
+    return split_as< T >( s, separators, default_value );
 }
 
 } // namespace comma {

From a97039a54adb3f2e80b56801913c667ec6b449c6 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 21 Feb 2023 18:28:47 +1100
Subject: [PATCH 0560/1056] csv-random.cpp: reflowed help text to fit on 80
 column screen

---
 csv/applications/csv-random.cpp | 162 +++++++++++++++++++-------------
 1 file changed, 98 insertions(+), 64 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index e582227b5..0344550f7 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -18,71 +18,105 @@
 
 static void usage( bool verbose )
 {
-    std::cerr << std::endl;
-    std::cerr << "random operations on input stream" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --seed=[<unsigned int>]; random seed" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "operations" << std::endl;
-    std::cerr << "    make: output pseudo-random numbers" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "        usage: csv-random make [<options>] > random.csv" << std::endl;
-    std::cerr << "               cat records.csv | csv-random make --append [<options>] > appended.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "        options" << std::endl;
-    std::cerr << "            --append; append random numbers to stdin input" << std::endl;
-    std::cerr << "            --distribution=<distribution>[;<options>]; default=uniform; values: uniform, gaussian, normal; todo: more distributions to plug in, just ask" << std::endl;
-    std::cerr << "                uniform[;<min>;<max>]: if <min>, <max> not present, --range values will be used" << std::endl;
-    std::cerr << "                gaussian[;<mean>;<sigma>]" << std::endl;
-    std::cerr << "                normal: alias for gaussian" << std::endl;
-    std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
-    std::cerr << "            --output-binary; output random numbers as binary, or specify --binary=<format> for stdin input" << std::endl;
-    std::cerr << "            --range=[<min>,<max>]; desired value range: attention! currently, will pick value until gets something in range" << std::endl;
-    std::cerr << "            --type=<type>; default=ui; supported values: b, ub, w, uw, i, ui, l, ul, f, d; can have more than one <type> i.e. 3ui" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    true-random: output non-deterministic uniformly distributed unsigned int random numbers (if non-deterministic source is not available" << std::endl;
-    std::cerr << "                 e.g. a hardware device, output will be pseudo-random" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "        usage: csv-random true-random [<options>]" << std::endl;
-    std::cerr << "               cat records.csv | csv-random true-random --append <options> > appended.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "        options" << std::endl;
-    std::cerr << "            --append; append random number to stdin input" << std::endl;
-    std::cerr << "            --once; output random number only once" << std::endl;
-    std::cerr << "            --output-binary; output random numbers as binary, or specify --binary=<format> for stdin input" << std::endl;
-    std::cerr << "            --type=<type>; default=ui; todo: supported values: ui; e.g: --type=3ui; --type=ui,ui,ui; etc" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "        example" << std::endl;
-    std::cerr << "            > csv-random make --seed=$( csv-random true-random --once )" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    sample: output a uniformly distributed sample of input records of a given size; record order preserved" << std::endl;
-    std::cerr << "            limitation: current implementation accumulates input records before outputting" << std::endl;
-    std::cerr << "                        if records are large, it may be memory-inefficient; can be improved, just ask" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "        usage: cat records.csv | csv-random sample [<options>] > sample.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "        options" << std::endl;
-    std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
-    std::cerr << "            --fields=[<fields>]; if 'block' field present sample each block, otherwise read whole input and then sample" << std::endl;
-    std::cerr << "            --ratio=[<ratio>]; portion of each block to output, if block is too small, nothing will be output for it" << std::endl;
-    std::cerr << "            --size=<n>; default=1; number of records to output in each block, if smaller than block size, output the whole block" << std::endl;
-    std::cerr << "            --sliding-window,--window=[<size>]; todo: sample on sliding window of <size> records" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    shuffle: output input records in pseudo-random order" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "        usage: cat records.csv | csv-random shuffle [<options>] > shuffled.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "        options" << std::endl;
-    std::cerr << "            --engine=<engine>; default=mt19937_64; supported values: minstd_rand0, minstd_rand, mt19937, mt19937_64, ranlux24_base, ranlux48_base, ranlux24, ranlux48, knuth_b, default_random_engine" << std::endl;
-    std::cerr << "            --fields=[<fields>]; if 'block' field present, shuffle each block, otherwise read whole input and then shuffle" << std::endl;
-    std::cerr << "            --ratio=[<ratio>]; portion of each block to output, same as for \"sample\" operation, but shuffled" << std::endl;
-    std::cerr << "            --size=<n>; default=1; number of records to output in each block, same as for \"sample\" operation, but shuffled" << std::endl;
-    std::cerr << "            --sliding-window,--window=[<size>]; todo: shuffle on sliding window of <size> records" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "csv options:" << std::endl;
+    std::cerr << "\nrandom operations on input stream";
+    std::cerr << '\n';
+    std::cerr << "\nusage: csv-random <operation> [<options>]";
+    std::cerr << "\n";
+    std::cerr << "\n    where <operation> is one of:";
+    std::cerr << "\n        make: output pseudo-random numbers";
+    std::cerr << "\n        true-random: output non-deterministic uniformly distributed numbers";
+    std::cerr << "\n        sample: output a uniformly distributed sample of input records";
+    std::cerr << "\n        shuffle: output input records in pseudo-random order";
+    std::cerr << '\n';
+    std::cerr << "\noptions";
+    std::cerr << "\n    --seed=[<unsigned int>]; random seed";
+    std::cerr << '\n';
+    std::cerr << "\noperations";
+    std::cerr << "\n    make: output pseudo-random numbers";
+    std::cerr << '\n';
+    std::cerr << "\n        usage: csv-random make [<options>] > random.csv";
+    std::cerr << "\n               cat input.csv | csv-random make --append [<options>]";
+    std::cerr << '\n';
+    std::cerr << "\n        options";
+    std::cerr << "\n            --append; append random numbers to stdin input";
+    std::cerr << "\n            --distribution=<distribution>[;<options>]";
+    std::cerr << "\n                where <distribution> is one of:";
+    std::cerr << "\n                    uniform[;<min>;<max>] (default)";
+    std::cerr << "\n                        if <min>, <max> not present, --range values will be used";
+    std::cerr << "\n                    gaussian[;<mean>;<sigma>]";
+    std::cerr << "\n                    normal: alias for gaussian";
+    std::cerr << "\n                todo: more distributions to plug in, just ask";
+    std::cerr << "\n            --engine=<engine>";
+    std::cerr << "\n                where <engine> is one of: minstd_rand0, minstd_rand, mt19937,";
+    std::cerr << "\n                    mt19937_64 (default), ranlux24_base, ranlux48_base,";
+    std::cerr << "\n                    ranlux24, ranlux48, knuth_b, default_random_engine";
+    std::cerr << "\n            --output-binary; output random numbers as binary";
+    std::cerr << "\n                    specify --binary=<format> for stdin input";
+    std::cerr << "\n            --range=[<min>,<max>]; desired value range";
+    std::cerr << "\n                attention! will pick value until gets something in range";
+    std::cerr << "\n            --type=<type>; default=ui; supported values: b,ub,w,uw,i,ui,l,ul,f,d";
+    std::cerr << "\n                can have more than one <type> i.e. 3ui";
+    std::cerr << '\n';
+    std::cerr << "\n    true-random: output non-deterministic uniformly distributed unsigned int";
+    std::cerr << "\n                 random numbers (if non-deterministic source is not available)";
+    std::cerr << "\n                 e.g. a hardware device, output will be pseudo-random";
+    std::cerr << '\n';
+    std::cerr << "\n        usage: csv-random true-random [<options>]";
+    std::cerr << "\n               cat input.csv | csv-random true-random --append [<options>]";
+    std::cerr << '\n';
+    std::cerr << "\n        options";
+    std::cerr << "\n            --append; append random number to stdin input";
+    std::cerr << "\n            --once; output random number only once";
+    std::cerr << "\n            --output-binary; output random numbers as binary";
+    std::cerr << "\n                    specify --binary=<format> for stdin input";
+    std::cerr << "\n            --type=<type>; default=ui; todo: supported values: ui;";
+    std::cerr << "\n                    e.g: --type=3ui; --type=ui,ui,ui; etc";
+    std::cerr << '\n';
+    std::cerr << "\n        example";
+    std::cerr << "\n            > csv-random make --seed=$( csv-random true-random --once )";
+    std::cerr << '\n';
+    std::cerr << "\n    sample: output uniformly distributed sample of input records of a given size";
+    std::cerr << "\n            record order preserved";
+    std::cerr << "\n            limitation: current implementation accumulates input records before";
+    std::cerr << "\n            outputting, if records are large, it may be memory-inefficient;";
+    std::cerr << "\n            can be improved, just ask";
+    std::cerr << '\n';
+    std::cerr << "\n        usage: cat records.csv | csv-random sample [<options>] > sample.csv";
+    std::cerr << '\n';
+    std::cerr << "\n        options";
+    std::cerr << "\n            --engine=<engine>";
+    std::cerr << "\n                where <engine> is one of: minstd_rand0, minstd_rand, mt19937,";
+    std::cerr << "\n                    mt19937_64 (default), ranlux24_base, ranlux48_base,";
+    std::cerr << "\n                    ranlux24, ranlux48, knuth_b, default_random_engine";
+    std::cerr << "\n            --fields=[<fields>]; if 'block' field present sample each block,";
+    std::cerr << "\n                    otherwise read whole input and then sample";
+    std::cerr << "\n            --ratio=[<ratio>]; portion of each block to output,";
+    std::cerr << "\n                    if block is too small, nothing will be output for it";
+    std::cerr << "\n            --size=<n>; default=1; number of records to output in each block,";
+    std::cerr << "\n                    if smaller than block size, output the whole block";
+    std::cerr << "\n            --sliding-window,--window=[<size>]; todo: sample on sliding window";
+    std::cerr << "\n                    of <size> records";
+    std::cerr << '\n';
+    std::cerr << "\n    shuffle: output input records in pseudo-random order";
+    std::cerr << '\n';
+    std::cerr << "\n        usage: cat records.csv | csv-random shuffle [<options>] > shuffled.csv";
+    std::cerr << '\n';
+    std::cerr << "\n        options";
+    std::cerr << "\n            --engine=<engine>";
+    std::cerr << "\n                where <engine> is one of: minstd_rand0, minstd_rand, mt19937,";
+    std::cerr << "\n                    mt19937_64 (default), ranlux24_base, ranlux48_base,";
+    std::cerr << "\n                    ranlux24, ranlux48, knuth_b, default_random_engine";
+    std::cerr << "\n            --fields=[<fields>]; if 'block' field present, shuffle each block,";
+    std::cerr << "\n                    otherwise read whole input and then shuffle";
+    std::cerr << "\n            --ratio=[<ratio>]; portion of each block to output,";
+    std::cerr << "\n                    same as for \"sample\" operation, but shuffled";
+    std::cerr << "\n            --size=<n>; default=1; number of records to output in each block,";
+    std::cerr << "\n                    same as for \"sample\" operation, but shuffled";
+    std::cerr << "\n            --sliding-window,--window=[<size>]; todo: shuffle on sliding window";
+    std::cerr << "\n                    of <size> records";
+    std::cerr << '\n';
+    std::cerr << "\ncsv options:";
     std::cerr << comma::csv::options::usage( "", verbose ) << std::endl;
-    std::cerr << std::endl;
     exit( 0 );
 }
 

From 9af56f310ddc5da3e38835026eb216ff42c4c8fb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 22 Feb 2023 15:55:36 +1100
Subject: [PATCH 0561/1056] visiting::traits: traits for std::complex added

---
 visiting/traits.h | 21 +++++++++++++++++++++
 1 file changed, 21 insertions(+)

diff --git a/visiting/traits.h b/visiting/traits.h
index 87b2429e9..ecf92aaa8 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -9,6 +9,7 @@
 #include <stdlib.h>
 #endif
 #include <array>
+#include <complex>
 #include <map>
 #include <set>
 #include <string>
@@ -52,6 +53,26 @@ struct traits< std::pair< T, S > >
     }    
 };
 
+template < typename T >
+struct traits< std::complex< T > >
+{
+    template < typename K, typename V > static void visit( const K& key, std::complex< T >& t, V& v )
+    {
+        T s = t.real();
+        v.apply( "real", s );
+        t.real( s );
+        v = t.imag();
+        v.apply( "imag", s );
+        t.imag( s );
+    }
+    
+    template < typename K, typename V > static void visit( const K& key, const std::complex< T >& t, V& v )
+    {
+        v.apply( "real", t.real() );
+        v.apply( "imag", t.imag() );
+    }    
+};
+
 namespace detail {
 
 // template < unsigned int I > const char* element_name(); // super-quick and dirty for now, it would be better to use numeric indices, but then all visitors need to support tuple correctly

From 15cbec330bee6c1ecee2b348a4c6e468ab358390 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 22 Feb 2023 17:09:36 +1100
Subject: [PATCH 0562/1056] visiting/traits: trivial typo fixed

---
 visiting/traits.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/visiting/traits.h b/visiting/traits.h
index ecf92aaa8..5887f2855 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -61,7 +61,7 @@ struct traits< std::complex< T > >
         T s = t.real();
         v.apply( "real", s );
         t.real( s );
-        v = t.imag();
+        s = t.imag();
         v.apply( "imag", s );
         t.imag( s );
     }

From ae4c39a6e363c2e38b8a40e9d00258bd387c0434 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 24 Feb 2023 16:38:50 +1100
Subject: [PATCH 0563/1056] comma-name-value-util: comma_path_value_mangle:
 value quoted

---
 bash/comma-name-value-util | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/bash/comma-name-value-util b/bash/comma-name-value-util
index 4db89e62d..4b809b4b5 100644
--- a/bash/comma-name-value-util
+++ b/bash/comma-name-value-util
@@ -60,8 +60,8 @@ function comma_path_value_mangle()
         [[ -n "$path" && ! "$path" =~ ^[#\"] ]] || continue
         name=${path//\//$delimiter}
         name=${name//-/$delimiter}
-        value=${value#\"}
-        value=${value%\"}
+        value="${value#\"}"
+        value="${value%\"}"
         echo "$name='$value'"
     done
 }

From 1f0da4c1be266233a15252e139940da19342c9d0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 14 Mar 2023 14:38:23 +1100
Subject: [PATCH 0564/1056] application/signal_flag.h: reset(): can pass value
 to it now; default value: false, backward-compatible

---
 application/signal_flag.h | 32 ++------------------------------
 1 file changed, 2 insertions(+), 30 deletions(-)

diff --git a/application/signal_flag.h b/application/signal_flag.h
index 62266f636..f9aad6886 100644
--- a/application/signal_flag.h
+++ b/application/signal_flag.h
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -66,8 +38,8 @@ struct signal_flag : public boost::noncopyable
         /// for those who does not like to type
         operator bool() const { return is_set_; }
 
-        /// reset to false
-        void reset() { is_set_ = false; }
+        /// reset to a given value
+        void reset( bool value = false ) { is_set_ = value; }
 
     private:
         static bool is_set_;

From 9880f7822b22b171ff791216617b7f86ff1a9111 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 21 Mar 2023 11:39:57 +1100
Subject: [PATCH 0565/1056] csv::read_as() convenience function implemented

---
 csv/stream.h | 68 +++++++++++++++++++++++++++-------------------------
 1 file changed, 35 insertions(+), 33 deletions(-)

diff --git a/csv/stream.h b/csv/stream.h
index 2f7ba849e..7400ac4f7 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_STREAM_H_
-#define COMMA_CSV_STREAM_H_
+#pragma once
 
 #ifdef WIN32
 #include <stdio.h>
@@ -39,6 +10,7 @@
 #include <io.h>
 #endif
 
+#include <fstream>
 #include <iostream>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/noncopyable.hpp>
@@ -53,10 +25,21 @@ namespace comma { namespace csv {
 /// @todo document
 namespace detail { void unsynchronize_with_stdio(); }
 
-template < typename S > class output_stream;
+/// generic input stream
 template < typename S > class input_stream;
+
+/// generic output stream
+template < typename S > class output_stream;
+
+/// tied input and output streams
 template < typename S, typename T > class tied;
 
+/// input stream passed through
+template < typename S > class passed;
+
+/// convenience functions: read input stream into a container that has push_back() method
+template < typename V > V read_as( std::istream& is, const options& o = options() );
+template < typename V > V read_as( const std::string& filename, const options& o = options() );
 
 /// ascii csv input stream
 template < typename S >
@@ -847,6 +830,25 @@ inline void output_stream< S >::append_output( input_stream< T >& is, const S& s
     }
 }*/
 
-} } // namespace comma { namespace csv {
+template < typename V > V read_as( std::istream& is, const options& o )
+{
+    input_stream< typename V::value_type > istream( is, o );
+    V v;
+    while( istream.ready() || is.good() )
+    {
+        auto p = istream.read();
+        if( !p ) { break; }
+        v.push_back( *p );
+    }
+    return v;
+}
 
-#endif /*COMMA_CSV_STREAM_H_*/
+template < typename V > V read_as( const std::string& filename, const options& o )
+{
+    std::ifstream ifs;
+    ifs.open( &filename[0], o.binary() ? std::ios_base::in | std::ios_base::binary : std::ios_base::in );
+    if( ifs.is_open() ) { return read_as< V >( ifs, o ); }
+    COMMA_THROW( comma::exception, "failed to open '" << filename << "'" );
+}
+
+} } // namespace comma { namespace csv {

From b1bf6c9b89ef34ca3939a9fcd72a69c7adffec72 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 26 Mar 2023 12:58:31 +1100
Subject: [PATCH 0566/1056] command_line_options::assert_exists_if()
 implemented

---
 application/command_line_options.cpp | 9 +++++++++
 application/command_line_options.h   | 3 +++
 2 files changed, 12 insertions(+)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 7b7608fdf..72021fff4 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -172,6 +172,15 @@ void command_line_options::assert_mutually_exclusive( const std::string& names )
     }
 }
 
+void command_line_options::assert_exists_if( const std::string& first, const std::string& second ) const
+{
+    if( !exists( first ) ) { return; }
+    for( const auto& o: comma::split( second, ',', true ) )
+    {
+        if( !exists( o ) ) { COMMA_THROW( comma::exception, "if " << first << ", please specify " << o ); }
+    }
+}
+
 void command_line_options::assert_exists( const std::string& names ) const { if( !exists( names ) ) { COMMA_THROW( comma::exception, "please specify one of the following: " << names  ); } }
 
 void command_line_options::assert_mutually_exclusive( const std::string& first, const std::string& second ) const
diff --git a/application/command_line_options.h b/application/command_line_options.h
index 71ee9746f..b4b9380ca 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -114,6 +114,9 @@ class command_line_options
         /// throw, if not at least one of options in the list exists, trivial convenience method
         void assert_exists( const std::string& comma_separated_names ) const;
 
+        /// throw, if first option is present, but any of options in the csv list in second is not
+        void assert_exists_if( const std::string& first, const std::string& second ) const;
+
         /// description
         struct description
         {

From 0169529d4eef7509e234a28fbc96aca2199919db Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 30 Mar 2023 17:02:42 +1100
Subject: [PATCH 0567/1056] comma_path_value_mangle: support [] subscripts in
 input path

replacing them with the given delimiter (underscore by default)
---
 bash/comma-name-value-util                                   | 2 ++
 .../comma_name_value_util/comma_path_value_mangle/expected   | 5 +++++
 bash/test/comma_name_value_util/comma_path_value_mangle/test | 5 +++++
 3 files changed, 12 insertions(+)

diff --git a/bash/comma-name-value-util b/bash/comma-name-value-util
index 4b809b4b5..4405ad058 100644
--- a/bash/comma-name-value-util
+++ b/bash/comma-name-value-util
@@ -60,6 +60,8 @@ function comma_path_value_mangle()
         [[ -n "$path" && ! "$path" =~ ^[#\"] ]] || continue
         name=${path//\//$delimiter}
         name=${name//-/$delimiter}
+        name=${name//[/$delimiter}
+        name=${name//]/}        # just remove trailing ] since it's always followed by / or the end of the line
         value="${value#\"}"
         value="${value%\"}"
         echo "$name='$value'"
diff --git a/bash/test/comma_name_value_util/comma_path_value_mangle/expected b/bash/test/comma_name_value_util/comma_path_value_mangle/expected
index 7c500cc85..2df059ba9 100644
--- a/bash/test/comma_name_value_util/comma_path_value_mangle/expected
+++ b/bash/test/comma_name_value_util/comma_path_value_mangle/expected
@@ -4,3 +4,8 @@ basic/var_b='22'
 no_newline_at_end/var_a=basic/var_a
 no_newline_at_end/var_b=basic/var_b
 
+path/a_b_c='1'
+dashes/a_b_c='1'
+path_with_dashes/a_b_c='1'
+subscript/a_b_0='1'
+subscript_followed_by_path/a_b_0_c='1'
diff --git a/bash/test/comma_name_value_util/comma_path_value_mangle/test b/bash/test/comma_name_value_util/comma_path_value_mangle/test
index e619aa266..06dabc782 100755
--- a/bash/test/comma_name_value_util/comma_path_value_mangle/test
+++ b/bash/test/comma_name_value_util/comma_path_value_mangle/test
@@ -10,3 +10,8 @@ echo "$input" | comma_path_value_mangle | sed 's|^|basic/|'
 
 echo -n "$input" | comma_path_value_mangle | sed 's|^|no_newline_at_end/|'
 
+echo "a/b/c=1" | comma_path_value_mangle | sed 's|^|path/|'
+echo "a-b-c=1" | comma_path_value_mangle | sed 's|^|dashes/|'
+echo "a/b-c=1" | comma_path_value_mangle | sed 's|^|path_with_dashes/|'
+echo "a/b[0]=1" | comma_path_value_mangle | sed 's|^|subscript/|'
+echo "a/b[0]/c=1" | comma_path_value_mangle | sed 's|^|subscript_followed_by_path/|'

From 2af63612ef52ddad3d64dd3a54876476dbd1f3a0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 May 2023 11:09:45 +1000
Subject: [PATCH 0568/1056] packed: string: a constructor added; using pragma
 in includes; traits: placeholder added, first cut of string traits
 implemented

---
 packed/bits.h               | 33 +-----------------------
 packed/byte.h               | 33 +-----------------------
 packed/field.h              | 33 +-----------------------
 packed/packed.h             | 27 --------------------
 packed/string.h             | 50 ++++++-------------------------------
 packed/struct.h             | 33 +-----------------------
 packed/test/packed_test.cpp | 29 +--------------------
 packed/traits.h             | 37 +++++++++++++++++++++++++++
 8 files changed, 50 insertions(+), 225 deletions(-)
 create mode 100644 packed/traits.h

diff --git a/packed/bits.h b/packed/bits.h
index 177c84968..c8d049de1 100644
--- a/packed/bits.h
+++ b/packed/bits.h
@@ -1,38 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_BITS_HEADER_H_
-#define COMMA_PACKED_BITS_HEADER_H_
+#pragma once
 
 #include <limits>
 #include <string.h>
@@ -127,5 +98,3 @@ struct reversed_bits : public packed::field< reversed_bits< B, Default >, B, siz
 };
 
 } } // namespace comma { namespace packed {
-
-#endif // COMMA_PACKED_BITS_HEADER_H_
diff --git a/packed/byte.h b/packed/byte.h
index c3259b616..0ef66af3a 100644
--- a/packed/byte.h
+++ b/packed/byte.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_BYTE_HEADER_H_
-#define COMMA_PACKED_BYTE_HEADER_H_
+#pragma once
 
 #if defined(__linux__) || defined(__APPLE__) || defined(__QNXNTO__)
 #include <arpa/inet.h>
@@ -98,5 +69,3 @@ struct const_byte : public packed::field< const_byte< C >, unsigned char, sizeof
 typedef byte uint8;
 
 } } // namespace comma { namespace packed {
-
-#endif // #ifndef COMMA_PACKED_BYTE_HEADER_H_
diff --git a/packed/field.h b/packed/field.h
index 7ed6323ca..4d703e630 100644
--- a/packed/field.h
+++ b/packed/field.h
@@ -1,38 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_FIELD_H_
-#define COMMA_PACKED_FIELD_H_
+#pragma once
 
 #include <string.h>
 #include <type_traits> // #include <boost/static_assert.hpp>
@@ -97,5 +68,3 @@ class field
 };
 
 } } // namespace comma { namespace packed {
-
-#endif // COMMA_PACKED_FIELD_H_
diff --git a/packed/packed.h b/packed/packed.h
index cb6775ed2..8616828a6 100644
--- a/packed/packed.h
+++ b/packed/packed.h
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #pragma once
 
diff --git a/packed/string.h b/packed/string.h
index 56106579e..45adf736a 100644
--- a/packed/string.h
+++ b/packed/string.h
@@ -1,38 +1,10 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
-/// @author Dewey Nguyen 2014-2014
+/// @author Dewey Nguyen 2014
 
-#ifndef COMMA_PACKED_STRING_H_
-#define COMMA_PACKED_STRING_H_
+#pragma once
 
 #include <cmath>
 #include <iomanip>
@@ -56,11 +28,11 @@ class string : public packed::field< string< S, Padding >, std::string, S >
 
         typedef packed::field< string< S, Padding >, std::string, S > base_type;
 
-        static const std::string& default_value()
-        {
-            static const std::string s;// static const std::string s( S, Padding );
-            return s;
-        }
+        string() = default;
+
+        string( const std::string& rhs ) { pack( this->data(), rhs ); }
+
+        static const std::string& default_value() { static const std::string s; return s; } // static const std::string s( S, Padding );
 
         static void pack( char* storage, const std::string& value )
         {
@@ -69,16 +41,12 @@ class string : public packed::field< string< S, Padding >, std::string, S >
             ::memcpy( storage, &value[0], value.size() );
         }
 
-        static std::string unpack( const char* storage )
-        {
-            return comma::strip( std::string( storage, size ), Padding );
-        }
+        static std::string unpack( const char* storage ) { return comma::strip( std::string( storage, size ), Padding ); }
 
         const string& operator=( const std::string& rhs ) { return base_type::operator=( rhs ); }
 
         const string& operator=( const char* rhs ) { return base_type::operator=( std::string( rhs, size ) ); }
 
-        /// a convenience method, if string represents numeric values
         template < typename T > T as() const { return boost::lexical_cast< T >( this->operator()() ); }
 };
 
@@ -174,5 +142,3 @@ class ascii_hex : public packed::field< ascii_hex< T, S, Padding >, T, S >
 };
 
 } } // namespace comma { namespace packed {
-
-#endif // #ifndef COMMA_PACKED_STRING_H_
diff --git a/packed/struct.h b/packed/struct.h
index 2bee4948d..ba559e7ee 100644
--- a/packed/struct.h
+++ b/packed/struct.h
@@ -1,38 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_STRUCT_HPP_
-#define COMMA_PACKED_STRUCT_HPP_
+#pragma once
 
 #include <cstring>
 #include <type_traits>
@@ -58,5 +29,3 @@ class packed_struct
 };
 
 } } // namespace comma { namespace packed {
-
-#endif // #ifndef COMMA_PACKED_STRUCT_HPP_
diff --git a/packed/test/packed_test.cpp b/packed/test/packed_test.cpp
index 4509a38d2..8c7eb8ea1 100644
--- a/packed/test/packed_test.cpp
+++ b/packed/test/packed_test.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 #ifndef WIN32
 #include <stdlib.h>
@@ -36,6 +8,7 @@
 #include <gtest/gtest.h>
 #include <boost/array.hpp>
 #include "../../packed/packed.h"
+#include "../../packed/traits.h"
 #include "../../math/compare.h"
 #include "../../packed/bits.h"
 #include "../../base/types.h"
diff --git a/packed/traits.h b/packed/traits.h
new file mode 100644
index 000000000..b8dd0cf0e
--- /dev/null
+++ b/packed/traits.h
@@ -0,0 +1,37 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author Vsevolod Vlaskine
+
+#pragma once
+
+#include <memory>
+#include <string>
+#include "../visiting/traits.h"
+#include "string.h"
+
+namespace comma { namespace visiting {
+
+// todo: add traits for other types
+
+template < std::size_t Size, char Padding > struct traits< comma::packed::string< Size, Padding > >
+{
+    template < typename Key, class Visitor > static void visit( const Key& k, comma::packed::string< Size, Padding >& p, Visitor& v )
+    {
+        // todo? quick and dirty for now; should we support naked pointers in visitors?
+        // todo? should we replace Padding with 0?
+        std::string s( p.data(), Size ); // copy all Size raw bytes of the field, padding included
+        v.apply( k, s ); // the visitor works on the copy and may change it
+        std::memset( p.data(), Padding, Size ); // refill the whole field with Padding before writing back
+        std::memcpy( p.data(), &s[0], std::min( s.size(), Size ) ); // write back at most Size bytes; anything longer is cut off
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key& k, const comma::packed::string< Size, Padding >& p, Visitor& v )
+    {
+        // todo? quick and dirty for now; should we support naked pointers in visitors?
+        // todo? should we replace Padding with 0?
+        std::string s( p.data(), Size ); // copy all Size raw bytes of the field, padding included
+        v.apply( k, s ); // const overload: the copy is visited, nothing is written back to p
+    }
+};
+
+} } // namespace comma { namespace visiting {

From 2bb0dc0a30c5c4d7fed37e86910e955643d2896b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 May 2023 11:24:28 +1000
Subject: [PATCH 0569/1056] packed::string: constructor added

---
 packed/string.h | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/packed/string.h b/packed/string.h
index 45adf736a..9da7e56b5 100644
--- a/packed/string.h
+++ b/packed/string.h
@@ -32,6 +32,8 @@ class string : public packed::field< string< S, Padding >, std::string, S >
 
         string( const std::string& rhs ) { pack( this->data(), rhs ); }
 
+        string( const char* rhs ) { operator=( std::string( rhs ).substr( 0, size ) ); } // read rhs only up to its terminating NUL and keep at most size chars; operator=( const char* ) would read size bytes even from a shorter rhs
+
         static const std::string& default_value() { static const std::string s; return s; } // static const std::string s( S, Padding );
 
         static void pack( char* storage, const std::string& value )

From eb55f17cb008eed2889cbac68502dd6469642c9f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 May 2023 15:31:48 +1000
Subject: [PATCH 0570/1056] base: comma_assert, comma_throw_if implemented

---
 base/CMakeLists.txt      |  4 ++++
 base/exception.h         | 38 +++++---------------------------------
 base/test/CMakeLists.txt | 13 +++++++++++++
 base/test/base_test.cpp  | 26 ++++++++++++++++++++++++++
 4 files changed, 48 insertions(+), 33 deletions(-)
 create mode 100644 base/test/CMakeLists.txt
 create mode 100644 base/test/base_test.cpp

diff --git a/base/CMakeLists.txt b/base/CMakeLists.txt
index 772b1e337..9e2cbd69b 100644
--- a/base/CMakeLists.txt
+++ b/base/CMakeLists.txt
@@ -12,3 +12,7 @@ install( TARGETS ${TARGET_NAME}
          RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime       # .exe, .dll
          LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime       # .so, mod.dll
          ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development ) # .a, .lib
+
+IF( comma_BUILD_TESTS )
+    ADD_SUBDIRECTORY( test )
+ENDIF( comma_BUILD_TESTS )
\ No newline at end of file
diff --git a/base/exception.h b/base/exception.h
index d6d388ce7..090c2d060 100644
--- a/base/exception.h
+++ b/base/exception.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_BASE_EXCEPTION_H
-#define COMMA_BASE_EXCEPTION_H
+#pragma once
 
 #include <stdexcept>
 #include <sstream>
@@ -72,6 +43,10 @@ namespace comma {
 
 #endif // COMMA_RETHROW
 
+#define COMMA_ASSERT( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW( comma::exception, "throwing because condition: " << #condition << " is false; " << strmessage ); } } // throws comma::exception when condition does not hold
+
+#define COMMA_THROW_IF( condition, strmessage ) { if( condition ) { COMMA_THROW( comma::exception, "throw if condition: " << #condition << "; " << strmessage ); } }
+
 class exception : public std::runtime_error
 {
     public:
@@ -177,6 +152,3 @@ inline void exception::formatted_string_()
 }
 
 }  // namespace comma
-
-#endif //COMMA_BASE_EXCEPTION_H
-
diff --git a/base/test/CMakeLists.txt b/base/test/CMakeLists.txt
new file mode 100644
index 000000000..0e78c696c
--- /dev/null
+++ b/base/test/CMakeLists.txt
@@ -0,0 +1,13 @@
+set( KIT base )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/base/test/base_test.cpp b/base/test/base_test.cpp
new file mode 100644
index 000000000..ea78c602c
--- /dev/null
+++ b/base/test/base_test.cpp
@@ -0,0 +1,26 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include "../exception.h"
+#include <gtest/gtest.h>
+
+namespace comma {
+
+TEST( base, exception )
+{
+    COMMA_ASSERT( true, "all good" );
+    COMMA_ASSERT( 2 * 2 == 4, "all good" );
+    EXPECT_THROW( COMMA_ASSERT( false, "all bad" ), comma::exception );
+    EXPECT_THROW( COMMA_ASSERT( 2 * 2 == 5, "all bad" ), comma::exception );
+    COMMA_THROW_IF( false, "all good" );
+    COMMA_THROW_IF( 2 * 2 == 5, "all good" );
+    EXPECT_THROW( COMMA_THROW_IF( true, "all bad" ), comma::exception );
+    EXPECT_THROW( COMMA_THROW_IF( 2 * 2 == 4, "all bad" ), comma::exception );
+}
+
+} // namespace comma {
+
+int main( int argc, char* argv[] )
+{    
+    ::testing::InitGoogleTest( &argc, argv );
+    return RUN_ALL_TESTS();
+}

From a59be97a8becd018d0f1c347485af5686a9d8ddf Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 May 2023 16:03:48 +1000
Subject: [PATCH 0571/1056] string: choice: first cut implemented

---
 string/choice.h             | 36 +++++++++++++++++++++++++++
 string/split.cpp            | 28 ---------------------
 string/string.cpp           | 33 +------------------------
 string/string.h             | 33 +------------------------
 string/test/string_test.cpp | 49 +++++++++++++++----------------------
 5 files changed, 58 insertions(+), 121 deletions(-)
 create mode 100644 string/choice.h

diff --git a/string/choice.h b/string/choice.h
new file mode 100644
index 000000000..3c57ea044
--- /dev/null
+++ b/string/choice.h
@@ -0,0 +1,36 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#pragma once
+
+#include <string>
+#include "../base/exception.h"
+
+namespace comma {
+
+template < typename Derived, typename S = std::string >
+struct choice: public S // a string of type S whose value is checked against the list returned by Derived::choices()
+{
+    choice( typename Derived::values rhs = static_cast< typename Derived::values >( 0 ) ): S( Derived::choices()[rhs] ) {} // by default takes Derived::choices()[0]
+    choice( const std::string& rhs ) { operator=( rhs ); } // validates rhs through operator= below; throws comma::exception if rhs is not a valid choice
+    choice& operator=( const std::string& rhs ) { COMMA_ASSERT( valid( rhs ), "expected value; got: '" << rhs << "'" ); S::operator=( rhs ); return *this; } // S:: qualification is essential: unqualified operator=( rhs ) resolves to this very overload and recurses forever
+    typename Derived::values to_enum() const; // position of the current value in Derived::choices(), cast to Derived::values
+    static bool valid( const std::string& rhs ); // true if rhs equals one of Derived::choices()
+};
+
+template < typename Derived, typename S >
+typename Derived::values choice< Derived, S >::to_enum() const // returns the position of the current value in Derived::choices() cast to Derived::values; throws comma::exception if no choice matches
+{
+    unsigned int i = 0; // position of the choice currently being compared
+    for( const auto& c: Derived::choices() ) { if( *this == c ) { return static_cast< typename Derived::values >( i ); } ++i; }
+    COMMA_THROW( comma::exception, "could not convert to enum value: '" << std::string( *this ) << "'" ); // in theory never here
+}
+
+template < typename Derived, typename S >
+bool choice< Derived, S >::valid( const std::string& rhs ) // true if rhs equals one of Derived::choices()
+{
+    // plain membership scan: the position of the match is not needed here, so no counter is kept
+    for( const auto& c: Derived::choices() ) { if( rhs == c ) { return true; } }
+    return false;
+}
+
+} // namespace comma {
diff --git a/string/split.cpp b/string/split.cpp
index 8a4eb6888..579c98cfa 100644
--- a/string/split.cpp
+++ b/string/split.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 /// @author mathew hounsell
diff --git a/string/string.cpp b/string/string.cpp
index 1043d3265..25b3b0a28 100644
--- a/string/string.cpp
+++ b/string/string.cpp
@@ -1,43 +1,13 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// Copyright (c) 2019 Vsevolod Vlaskine
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 /// @author mathew hounsell
 
+#include <iostream>
 #include <boost/optional.hpp>
 #include "../base/exception.h"
 #include "string.h"
 
-#include <iostream>
-
 namespace comma {
 
 std::string strip( const std::string& s, char character )
@@ -169,5 +139,4 @@ std::string common_front( const std::string& s, const std::string& t, char delim
     return s.substr( 0, i );
 }
 
-
 } // namespace comma {
diff --git a/string/string.h b/string/string.h
index a9b68392d..89dd93a44 100644
--- a/string/string.h
+++ b/string/string.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_STRING_STRING_H_
-#define COMMA_STRING_STRING_H_
+#pragma once
 
 #include <stdlib.h>
 #include <sstream>
@@ -94,5 +65,3 @@ inline std::string join( It begin, It end, char delimiter )
 }
 
 } // namespace comma {
-
-#endif // COMMA_STRING_STRING_H_
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index fe58e918d..c9abd3141 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -1,34 +1,7 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2023 vsevolod vlaskine
 
 #include "../../base/exception.h"
+#include "../choice.h"
 #include "../string.h"
 #include "../split.h"
 #include <list>
@@ -394,6 +367,24 @@ TEST( string, common_head_delimiter )
     EXPECT_EQ( common_front( "ab/cd/ef", "ab/cd/", '/' ), "ab/cd" );
 }
 
+struct fruit
+{
+    static std::vector< std::string > choices() { return { "apple", "orange", "juicymambo" }; }
+    enum values { apple, orange, juicymambo };
+};
+
+TEST( string, choice )
+{
+    EXPECT_EQ( choice< fruit >(), "apple" );
+    EXPECT_EQ( choice< fruit >().to_enum(), fruit::apple );
+    EXPECT_EQ( choice< fruit >( "orange" ), "orange" );
+    EXPECT_EQ( choice< fruit >( fruit::orange ), "orange" );
+    EXPECT_EQ( choice< fruit >( fruit::orange ).to_enum(), fruit::orange );
+    EXPECT_TRUE( choice< fruit >::valid( "juicymambo" ) );
+    EXPECT_FALSE( choice< fruit >::valid( "driedmambo" ) );
+    EXPECT_THROW( choice< fruit >( "driedmambo" ), comma::exception );
+}
+
 } // namespace comma {
 
 int main( int argc, char* argv[] )

From 780308bcf46f4445dd85e163b4286907e09a95f1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 May 2023 16:24:32 +1000
Subject: [PATCH 0572/1056] string: choice: traits implemented

---
 string/choice.h             | 29 ++++++++++++++--------
 string/test/string_test.cpp | 48 +++++++++++++++++++++++++++----------
 string/traits.h             | 32 +++++++++++++++++++++++++
 3 files changed, 87 insertions(+), 22 deletions(-)
 create mode 100644 string/traits.h

diff --git a/string/choice.h b/string/choice.h
index 3c57ea044..2d1e9acd6 100644
--- a/string/choice.h
+++ b/string/choice.h
@@ -4,33 +4,42 @@
 
 #include <string>
 #include "../base/exception.h"
+#include "string.h"
 
-namespace comma {
+namespace comma { namespace strings {
 
-template < typename Derived, typename S = std::string >
-struct choice: public S
+template < typename Derived, typename Base = std::string >
+struct choice: public Base
 {
-    choice( typename Derived::values rhs = static_cast< typename Derived::values >( 0 ) ): S( Derived::choices()[rhs] ) {}
+    typedef Base base_t;
+    choice( typename Derived::values rhs = static_cast< typename Derived::values >( 0 ) ): Base( Derived::choices()[rhs] ) {}
     choice( const std::string& rhs ) { operator=( rhs ); }
-    choice& operator=( const std::string& rhs ) { COMMA_ASSERT( valid( rhs ), "expected value; got: '" << rhs << "'" ); operator=( rhs ); return *this; }
+    choice& operator=( const std::string& rhs ) { assert_valid( rhs ); Base::operator=( rhs ); return *this; } // validate, then delegate to Base: an unqualified operator=( rhs ) resolves to this very overload and recurses forever
     typename Derived::values to_enum() const;
     static bool valid( const std::string& rhs );
+    static void assert_valid( const std::string& rhs );
 };
 
-template < typename Derived, typename S >
-typename Derived::values choice< Derived, S >::to_enum() const
+template < typename Derived, typename Base >
+typename Derived::values choice< Derived, Base >::to_enum() const
 {
     unsigned int i = 0;
     for( const auto& c: Derived::choices() ) { if( *this == c ) { return static_cast< typename Derived::values >( i ); } ++i; }
     COMMA_THROW( comma::exception, "could not convert to enum value: '" << std::string( *this ) << "'" ); // in theory never here
 }
 
-template < typename Derived, typename S >
-bool choice< Derived, S >::valid( const std::string& rhs )
+template < typename Derived, typename Base >
+bool choice< Derived, Base >::valid( const std::string& rhs )
 {
     unsigned int i = 0;
     for( const auto& c: Derived::choices() ) { if( rhs == c ) { return true; } ++i; }
     return false;
 }
 
-} // namespace comma {
+template < typename Derived, typename Base >
+void choice< Derived, Base >::assert_valid( const std::string& rhs )
+{
+    COMMA_ASSERT( valid( rhs ), "expected one of: " << comma::join( Derived::choices(), ',' ) << "; got: '" << rhs << "'" );
+}
+
+} } // namespace comma { namespace strings {
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index c9abd3141..438c25a14 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -1,11 +1,12 @@
 // Copyright (c) 2023 vsevolod vlaskine
 
+#include <list>
+#include <gtest/gtest.h>
 #include "../../base/exception.h"
 #include "../choice.h"
-#include "../string.h"
 #include "../split.h"
-#include <list>
-#include <gtest/gtest.h>
+#include "../string.h"
+#include "../traits.h"
 
 namespace comma {
 
@@ -373,16 +374,39 @@ struct fruit
     enum values { apple, orange, juicymambo };
 };
 
-TEST( string, choice )
+struct grocery_store
+{
+    strings::choice< comma::fruit > fruit;
+};
+
+namespace visiting {
+
+template <> struct traits< grocery_store >
+{
+    template < typename Key, class Visitor > static void visit( const Key& k, grocery_store& p, Visitor& v )
+    {
+        v.apply( "fruit", p.fruit );
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key& k, const grocery_store& p, Visitor& v )
+    {
+        v.apply( "fruit", p.fruit );
+    }
+};
+
+} // namespace visiting {
+
+TEST( strings, choice )
 {
-    EXPECT_EQ( choice< fruit >(), "apple" );
-    EXPECT_EQ( choice< fruit >().to_enum(), fruit::apple );
-    EXPECT_EQ( choice< fruit >( "orange" ), "orange" );
-    EXPECT_EQ( choice< fruit >( fruit::orange ), "orange" );
-    EXPECT_EQ( choice< fruit >( fruit::orange ).to_enum(), fruit::orange );
-    EXPECT_TRUE( choice< fruit >::valid( "juicymambo" ) );
-    EXPECT_FALSE( choice< fruit >::valid( "driedmambo" ) );
-    EXPECT_THROW( choice< fruit >( "driedmambo" ), comma::exception );
+    EXPECT_EQ( strings::choice< fruit >(), "apple" );
+    EXPECT_EQ( strings::choice< fruit >().to_enum(), fruit::apple );
+    EXPECT_EQ( strings::choice< fruit >( "orange" ), "orange" );
+    EXPECT_EQ( strings::choice< fruit >( fruit::orange ), "orange" );
+    EXPECT_EQ( strings::choice< fruit >( fruit::orange ).to_enum(), fruit::orange );
+    EXPECT_TRUE( strings::choice< fruit >::valid( "juicymambo" ) );
+    EXPECT_FALSE( strings::choice< fruit >::valid( "driedmambo" ) );
+    EXPECT_THROW( strings::choice< fruit >( "driedmambo" ), comma::exception );
+    // todo: test visiting...
 }
 
 } // namespace comma {
diff --git a/string/traits.h b/string/traits.h
new file mode 100644
index 000000000..bfbeb7eea
--- /dev/null
+++ b/string/traits.h
@@ -0,0 +1,32 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author Vsevolod Vlaskine
+
+#pragma once
+
+#include <string>
+#include "../base/exception.h"
+#include "../visiting/traits.h"
+#include "choice.h"
+
+namespace comma { namespace visiting {
+
+template < typename Derived, typename Base > struct traits< comma::strings::choice< Derived, Base > >
+{
+    typedef comma::strings::choice< Derived, Base > choice_t;
+
+    template < typename Key, class Visitor > static void visit( const Key& k, choice_t& p, Visitor& v )
+    {
+        std::string s( p );
+        v.apply( k, s );
+        choice_t::assert_valid( s );
+        p = s;
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key& k, const choice_t& p, Visitor& v )
+    {
+        v.apply( k, static_cast< const Base& >( p ) );
+    }
+};
+
+} } // namespace comma { namespace visiting {

From f0ca233fa1d9448b4a0304d7e0ddfda9c1e249bd Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 May 2023 16:57:30 +1000
Subject: [PATCH 0573/1056] base/exception: typos fixed in exception error
 messages

---
 base/exception.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/base/exception.h b/base/exception.h
index 090c2d060..1e3e5cc13 100644
--- a/base/exception.h
+++ b/base/exception.h
@@ -43,9 +43,9 @@ namespace comma {
 
 #endif // COMMA_RETHROW
 
-#define COMMA_ASSERT( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW( comma::exception, "throwing because condition: " << #condition << "is true; " << strmessage ); } }
+#define COMMA_ASSERT( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW( comma::exception, "condition: '" << #condition << "' is false; " << strmessage ); } }
 
-#define COMMA_THROW_IF( condition, strmessage ) { if( condition ) { COMMA_THROW( comma::exception, "throw if condition: " << #condition << "; " << strmessage ); } }
+#define COMMA_THROW_IF( condition, strmessage ) { if( condition ) { COMMA_THROW( comma::exception, "throw because condition: '" << #condition << "' is true; " << strmessage ); } }
 
 class exception : public std::runtime_error
 {

From eda0fcc3e859188ec8d6440ee2b709a4bceb218b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 May 2023 18:27:04 +1000
Subject: [PATCH 0574/1056] string: choice: traits: improved

---
 string/traits.h | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/string/traits.h b/string/traits.h
index bfbeb7eea..bc8316fda 100644
--- a/string/traits.h
+++ b/string/traits.h
@@ -17,10 +17,8 @@ template < typename Derived, typename Base > struct traits< comma::strings::choi
 
     template < typename Key, class Visitor > static void visit( const Key& k, choice_t& p, Visitor& v )
     {
-        std::string s( p );
-        v.apply( k, s );
-        choice_t::assert_valid( s );
-        p = s;
+        v.apply( k, static_cast< Base& >( p ) );
+        choice_t::assert_valid( std::string( p ) );
     }
 
     template < typename Key, class Visitor > static void visit( const Key& k, const choice_t& p, Visitor& v )

From 52b680f5d822d6139d2abc50ce6d3767dd3319df Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 May 2023 18:51:53 +1000
Subject: [PATCH 0575/1056] string: choice: traits: bug fixed

---
 string/traits.h | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/string/traits.h b/string/traits.h
index bc8316fda..1363d9b31 100644
--- a/string/traits.h
+++ b/string/traits.h
@@ -6,6 +6,7 @@
 
 #include <string>
 #include "../base/exception.h"
+#include "../visiting/apply.h"
 #include "../visiting/traits.h"
 #include "choice.h"
 
@@ -17,13 +18,13 @@ template < typename Derived, typename Base > struct traits< comma::strings::choi
 
     template < typename Key, class Visitor > static void visit( const Key& k, choice_t& p, Visitor& v )
     {
-        v.apply( k, static_cast< Base& >( p ) );
+        comma::visiting::apply( v, static_cast< Base& >( p ) );
         choice_t::assert_valid( std::string( p ) );
     }
 
     template < typename Key, class Visitor > static void visit( const Key& k, const choice_t& p, Visitor& v )
     {
-        v.apply( k, static_cast< const Base& >( p ) );
+        comma::visiting::apply( v, static_cast< const Base& >( p ) );
     }
 };
 

From 7eec8b882a74f244eb53afb6bf186f9847ca4fdd Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 1 May 2023 19:05:35 +1000
Subject: [PATCH 0576/1056] string: choice: valid and assert_valid instance
 methods added

---
 string/choice.h | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/string/choice.h b/string/choice.h
index 2d1e9acd6..6cc1885ad 100644
--- a/string/choice.h
+++ b/string/choice.h
@@ -18,6 +18,8 @@ struct choice: public Base
     typename Derived::values to_enum() const;
     static bool valid( const std::string& rhs );
     static void assert_valid( const std::string& rhs );
+    bool valid() const { return valid( std::string( *this ) ); } // quick and dirty for now
+    void assert_valid() const { assert_valid( std::string( *this ) ); } // quick and dirty for now
 };
 
 template < typename Derived, typename Base >

From d32baa5515277e3334de0dad206c50ef0423e1ea Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 18 May 2023 12:17:41 +1000
Subject: [PATCH 0577/1056] python: comma.dictionary added

---
 python/comma/__init__.py                      |  29 +----
 python/comma/dictionary/__init__.py           |   3 +
 python/comma/dictionary/test/test             |   4 +
 .../comma/dictionary/test/test_dictionary.py  |  99 +++++++++++++++
 python/comma/dictionary/util.py               | 115 ++++++++++++++++++
 python/comma/numpy/test/test                  |   2 +-
 python/comma/version.py                       |   2 +-
 python/setup.py                               |   2 +-
 8 files changed, 226 insertions(+), 30 deletions(-)
 create mode 100644 python/comma/dictionary/__init__.py
 create mode 100755 python/comma/dictionary/test/test
 create mode 100644 python/comma/dictionary/test/test_dictionary.py
 create mode 100644 python/comma/dictionary/util.py

diff --git a/python/comma/__init__.py b/python/comma/__init__.py
index 2fd92eed7..f62e8a2e0 100644
--- a/python/comma/__init__.py
+++ b/python/comma/__init__.py
@@ -1,33 +1,8 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+# Copyright (c) 2013 Vsevolod Vlaskine
 
 from . import csv
+from . import dictionary
 from . import io
 from . import numpy
 from . import signal
diff --git a/python/comma/dictionary/__init__.py b/python/comma/dictionary/__init__.py
new file mode 100644
index 000000000..8fab06d41
--- /dev/null
+++ b/python/comma/dictionary/__init__.py
@@ -0,0 +1,3 @@
+# Copyright (c) 2023 Vsevolod Vlaskine
+
+from .util import at, has, leaves, set
diff --git a/python/comma/dictionary/test/test b/python/comma/dictionary/test/test
new file mode 100755
index 000000000..dd2083842
--- /dev/null
+++ b/python/comma/dictionary/test/test
@@ -0,0 +1,4 @@
+#!/bin/bash
+
+name=$( basename "$0" ) # quoted so that a script path containing spaces is not word-split
+pytest 1>&2 && echo "$name: succeeded" >&2 || { echo "$name: failed" >&2; exit 1; }
diff --git a/python/comma/dictionary/test/test_dictionary.py b/python/comma/dictionary/test/test_dictionary.py
new file mode 100644
index 000000000..07f0037d2
--- /dev/null
+++ b/python/comma/dictionary/test/test_dictionary.py
@@ -0,0 +1,99 @@
+import pytest
+from comma import dictionary
+
+def test_dictionary_at():
+    d = { 'a': { 'b': { 'c': { 'd': 1, 'f': 2 }, 'g': 3 } }, 'p': [ 4, 5, { 'q': 6 } ], 'r': { 's': [ [ 7, 8 ] ] } }
+    assert dictionary.at( d, 'a/b/c' ) == { 'd': 1, 'f': 2 }
+    assert dictionary.at( d, 'a.b.c', delimiter = '.' ) == { 'd': 1, 'f': 2 }
+    assert dictionary.at( d, 'a/b/c/d' ) == 1
+    assert dictionary.at( d, 'a/b/g' ) == 3
+    assert dictionary.at( d, 'a', full = True ) == { 'a': { 'b': { 'c': { 'd': 1, 'f': 2 }, 'g': 3 } } }
+    assert dictionary.at( d, 'a/b', full = True ) == { 'a': { 'b': { 'c': { 'd': 1, 'f': 2 }, 'g': 3 } } }
+    assert dictionary.at( d, 'a/b/c', full = True ) == { 'a': { 'b': { 'c': { 'd': 1, 'f': 2 } } } }
+    assert dictionary.at( d, 'a/b/c/d', full = True ) == { 'a': { 'b': { 'c': { 'd': 1 } } } }
+    assert dictionary.at( d, 'a/b/g', full = True ) == { 'a': { 'b': { 'g': 3 } } }
+    with pytest.raises( KeyError ): dictionary.at( d, 'x' )
+    with pytest.raises( KeyError ): dictionary.at( d, 'x/y' )
+    with pytest.raises( KeyError ): dictionary.at( d, 'a/z' )
+    with pytest.raises( KeyError ): dictionary.at( d, 'a/b/c/e' )
+    with pytest.raises( TypeError ): dictionary.at( d, 'a/b/c/d/x' )
+    assert dictionary.at( d, 'x', no_throw = True ) is None
+    assert dictionary.at( d, 'a/x', no_throw = True ) is None
+    assert dictionary.at( d, 'a/b/x', no_throw = True ) is None
+    assert dictionary.at( d, 'a/b/c/x', no_throw = True ) is None
+    assert dictionary.at( d, 'a/b/c/d/x', no_throw = True ) is None
+    assert dictionary.at( d, 'p' ) == [ 4, 5, { 'q': 6 } ]
+    assert dictionary.at( d, 'p[0]' ) == 4
+    assert dictionary.at( d, 'p[1]' ) == 5
+    assert dictionary.at( d, 'p[2]' ) == { 'q': 6 }
+    assert dictionary.at( d, 'p[2]/q' ) == 6
+    assert dictionary.at( d, 'r' ) == { 's': [ [ 7, 8 ] ] }
+    assert dictionary.at( d, 'r/s' ) == [ [ 7, 8 ] ]
+    assert dictionary.at( d, 'r/s[0][0]' ) == 7
+    assert dictionary.at( d, 'r/s[0][1]' ) == 8
+    with pytest.raises( IndexError ): dictionary.at( d, 'r/s[0][2]' )
+    with pytest.raises( KeyError ): dictionary.at( d, 'r/s[0][2]', full = True )
+    assert dictionary.at( d, 'r/s[0][2]', full = True, no_throw = True ) is None
+    assert dictionary.at( { 'a': [11,22,33,44] }, 'a[1:3]' ) == [22, 33]
+    assert dictionary.at( { 'a': [11,22,33,44] }, 'a[1:]' ) == [22, 33, 44]
+    assert dictionary.at([11, 22, 33, 44], '[1:]') == [22, 33, 44]
+    assert dictionary.at([11, {'a': 22}, 33, 44], '[1]/a') == 22
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[1]') == 4
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[2]') == {'g': 6}
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[2]/g') == 6
+    assert dictionary.at({'a': {}, 'e': [3, 4, {'g': 6}]}, 'e[2]/g') == 6
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[0]', no_throw=True) == 3
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[2]', no_throw=True) == {'g': 6}
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[2]/g', no_throw=True) == 6
+
+def test_dictionary_has():
+    d = { 'a': { 'b': { 'c': { 'd': 1 } } } }
+    assert dictionary.has( d, 'a/b/c' )
+    assert dictionary.has( d, 'a.b.c', delimiter = '.' )
+    assert dictionary.has( d, 'a/b/c/d' )
+    assert not dictionary.has( d, 'x' )
+    assert not dictionary.has( d, 'x/y' )
+    assert not dictionary.has( d, 'a/z' )
+    assert not dictionary.has( d, 'a/b/c/e' )
+    assert not dictionary.has( d, 'a/b/c/d/x' )
+    assert not dictionary.has( d, 'a/b/c/d/x/y' )
+
+def test_dictionary_leaves():
+    assert list( dictionary.leaves( { 'a': 1, 'b': 2, 'c': 3 } ) ) == [ ( 'a', 1 ), ( 'b', 2 ), ( 'c', 3 ) ]
+    assert list( dictionary.leaves( ['a', 'b', 'c', 'd'] ) ) == [ ('[0]', 'a'), ('[1]', 'b'), ('[2]', 'c'), ('[3]', 'd') ]
+    assert list( dictionary.leaves( {'a': {'b': [0, 1]}, 'c': 2} ) ) == [('a/b[0]', 0), ('a/b[1]', 1), ('c', 2)]
+    assert list( dictionary.leaves( [ {'a': 0}, {'b': {'c':1, 'd': 2}} ] ) ) == [('[0]/a', 0), ('[1]/b/c', 1), ('[1]/b/d', 2)]
+    assert list( dictionary.leaves( { 'a': [ {'b': 0}, {'c': 1} ] } ) ) == [('a[0]/b', 0), ('a[1]/c', 1)]
+    assert list( dictionary.leaves( { 'a': { 'b': { 'c': 0 } } } ) ) == [ ( 'a/b/c', 0 ) ]
+    assert list( dictionary.leaves( 'a' ) ) == [ ( '', 'a' ) ]
+    assert list( dictionary.leaves( {} ) ) == []
+    assert list( dictionary.leaves( [] ) ) == []
+
+def test_dictionary_set():
+    d = {}
+    dictionary.set( d, 'a/b/c', 5 )
+    assert dictionary.at( d, 'a/b/c' ) == 5
+    dictionary.set( d, 'a/b/c', 10 )
+    assert dictionary.at( d, 'a/b/c' ) == 10
+    dictionary.set( d, 'a.b.c', 15, delimiter = '.' )
+    assert dictionary.at( d, 'a/b/c' ) == 15
+    assert dictionary.set( {}, 'a.b.c', 15, delimiter = '.' ) == { 'a': { 'b': { 'c': 15 } } }
+    d = dictionary.set( {}, 'a.x.y', 3, delimiter = '.' )
+    assert dictionary.set( d, 'a.b.c', 15, delimiter = '.' ) == { 'a': { 'b': { 'c': 15 }, 'x': { 'y': 3 } } }
+    assert d == { 'a': { 'b': { 'c': 15 }, 'x': { 'y': 3 } } }
+    e = { 'a': [0,[11,22,33],{'b': 4},5,6,7] }
+    dictionary.set(e, 'a[0]', 5)
+    dictionary.set(e, 'a[3]', 55)
+    assert e['a'][0] == 5
+    assert e['a'][3] == 55
+    dictionary.set(e, 'a[1][1]', 777)
+    assert e['a'][1][1] == 777
+    dictionary.set(e, 'a[2]/b', 8)
+    dictionary.set(e, 'a[3:5]', [88,99])
+    assert e['a'][3:5] == [88,99]
+    f = [0,1,2,3,{'a': 4}]
+    dictionary.set(f, '[2:4]', [22,33])
+    assert f[2:4] == [22,33]
+    dictionary.set(f, '[4]/a', 44)
+    dictionary.set(f, '[4]/b', 55)
+    assert f[4] == {'a': 44, 'b': 55 }
diff --git a/python/comma/dictionary/util.py b/python/comma/dictionary/util.py
new file mode 100644
index 000000000..b6bc49eb8
--- /dev/null
+++ b/python/comma/dictionary/util.py
@@ -0,0 +1,115 @@
+'''
+operations on dict and dict-like objects with string keys
+made for convenience, not for performance
+'''
+
+import copy, functools, typing
+
+def at( d, path, delimiter = '/', no_throw = False, full = False ): # todo: default=...
+    '''
+    return value at a given path in a dictionary
+    
+    params
+    ------
+        d: dictionary
+        path: path in dictionary, e.g 'a/b/c/d'
+        delimiter: path delimiter
+        no_throw: if path not found, return None instead of throwing exception
+        full: output dictionary, not just the key value, see example below
+    
+    examples
+    --------
+        >>> d = { "a": { "b": { "c": 5, "d": 6 } }, "e": [ 7, [ 8, 9, 10 ] ] }
+        >>> comma.dictionary.at( d, "a/b/c" )
+        5
+        >>> comma.dictionary.at( d, "a/b/c", full = True )
+        { "a": { "b": { "c": 5 } } }
+        >>> comma.dictionary.at( d, 'e[0]' )
+        7
+        >>> comma.dictionary.at( d, 'e[1]' )
+        [ 8, 9, 10 ]
+        >>> comma.dictionary.at( d, 'e[1][2]' )
+        10
+        >>> comma.dictionary.at( d, 'e[1][1:]' )
+        [ 9, 10 ]
+        >>> e = [1, 2, {'a': 3} ]
+        >>> comma.dictionary.at( e, '[2]/a' )
+        3
+    '''
+    s = path.split( delimiter )
+    def _value( d, k ):
+        if not k:
+            if no_throw: return None
+            raise ValueError( f'"{path}" has an empty element; remove initial, trailing, or duplicated delimiters' )
+        n = k.split( '[', 1 )
+        if len( n ) == 1: return None if no_throw and ( not isinstance( d, dict ) or not k in d ) else d[k]
+        if full:
+            if no_throw: return None
+            raise KeyError( f'on path "{path}": full=True not supported for array indices, since it cannot be done consistently' )
+        if no_throw:
+            try: return eval( f'd[{n[1]}' if n[0] == '' else f'd[n[0]][{n[1]}', { 'd': d, 'n': n } )
+            except: return None
+        return eval( f'd[{n[1]}' if n[0] == '' else f'd[n[0]][{n[1]}', {'d': d, 'n': n} )
+    r = functools.reduce( lambda d, k: _value( d, k ), s, d )
+    return None if r is None else functools.reduce( lambda d, k: { k: d }, [ r ] + s[::-1] ) if full else r
+
+def has( d, path, delimiter = '/' ):
+    '''
+    return true if element at a given dictionary path exists
+
+    todo: support list indices
+    
+    examples
+    --------
+        >>> d = { "a": { "b": { "c": 1, "d": 2, "e": [ 3, 4, { "f": 5 } ] } } }
+        >>> comma.dictionary.has( d, "a/b/c" )
+        True
+        >>> comma.dictionary.has( d, [ "a", "b", "c" ] )
+        True
+        >>> comma.dictionary.has( d, [ "a", "b", "x" ] )
+        False
+    '''
+    p = path.split( delimiter ) if isinstance( path, str ) else path
+    return functools.reduce( lambda d, k: ( d[k[1]] if k[0] + 1 < len( p ) else True ) if isinstance( d, dict ) and k[1] in d else False, enumerate( p ), d )
+
+def set( d, path, value, delimiter = '/' ):
+    '''
+    assign value to a nested dictionary/list element
+    
+    examples
+    --------
+        >>> d = { "a": { "b": 1, "c": [ 2, 3 ], "d": { "e": 4 } } }
+        >>> comma.dictionary.set( d, 'a/c[1]', 5 )
+        { "a": { "b": 1, "c": [ 2, 5 ], "d": { "e": 4 } } }
+    '''
+    def _set( d, p ):
+        s = p[0].split( '[', 1 )
+        if len( p ) == 1:
+            if len( s ) == 1: d[p[0]] = value
+            else: exec( f'd[{s[1]} = value' if s[0] == '' else f'd["{s[0]}"][{s[1]} = value', { 'd': d, 'value': value } )
+        else:
+            if len( s ) == 1:
+                if not p[0] in d: d[p[0]] = {}
+                _set( d[p[0]], p[ 1: ] )
+            else:
+                if ( len( s ) == 1 or s[0] != '' ) and not s[0] in d: raise KeyError( f'on path {path}: {s[0]} not found' )
+                _set( eval( f'd[{s[1]}' if s[0] == '' else f'd["{s[0]}"][{s[1]}', { 'd': d } ), p[1:])
+    _set( d, path.split( delimiter ) )
+    return d
+
+def leaves( d, path=None ):
+    '''
+    iterator through the leaf items of a nested dictionary or list, yields path-value pairs
+
+    example
+    -------
+        >>> list( comma.dictionary.leaves( { "x": { "y": [ { "z": 0 }, {"w": 2 } ], "v": "hello" } } ) )
+        [('x/y[0]/z', 0), ('x/y[1]/w', 2), ('x/v', 'hello')]
+    '''
+    if path is None: path = ''
+    if isinstance( d, dict ):
+        for key, value in d.items(): yield from leaves( value, f'{path}/{key}' )
+    elif isinstance( d, list ):
+        for i, value in enumerate(d): yield from leaves( value, f'{path}[{i}]' )
+    else:
+        yield path[1:] if path and path[0] == '/' else path, d
diff --git a/python/comma/numpy/test/test b/python/comma/numpy/test/test
index 6724cd089..4ee19ed9c 100755
--- a/python/comma/numpy/test/test
+++ b/python/comma/numpy/test/test
@@ -3,5 +3,5 @@
 name=$( basename $0 )
 
 for t in test_*.py; do
-    python3 $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed" >&2; exit 1; }
+    python3 $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed; see $name/output/stdout.log for details" >&2; exit 1; }
 done
diff --git a/python/comma/version.py b/python/comma/version.py
index 6e9c8afd9..bda5995cb 100644
--- a/python/comma/version.py
+++ b/python/comma/version.py
@@ -1,4 +1,4 @@
 # Copyright (c) 2011 The University of Sydney
 
 # if you change this file, check that it still works with ../setup.py, which gets the comma version by reading this file
-__version__ = "1.0.1"
+__version__ = "1.1.0"
diff --git a/python/setup.py b/python/setup.py
index 7aa189ff2..4b947fbf4 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -30,7 +30,7 @@
         maintainer_email    = 'vsevolod.vlaskine@gmail.com',
         python_requires     = '>=3.6',
         #install_requires    = [ 'numpy' ], # todo? does it need to be uncommented for packaging
-        packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
+        packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.dictionary', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma': 'comma', 'comma.cpp_bindings': 'comma/cpp_bindings' },
         package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] },
         entry_points        = { 'console_scripts': ['csv-eval=comma.csv.applications.csv_eval:main'] } #scripts             = [ "comma/csv/applications/csv-eval" ]

From 9b613627fbbfa65136a7eb3cc0aac4f5b20ce991 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 19 May 2023 13:50:32 +1000
Subject: [PATCH 0578/1056] COMMA_THROW_BRIEF, COMMA_ASSERT_BRIEF implemented

---
 base/exception.h    | 127 +++++++++++++++++++-------------------------
 base/last_error.cpp |  72 ++++++++-----------------
 base/last_error.h   |  41 ++------------
 3 files changed, 83 insertions(+), 157 deletions(-)

diff --git a/base/exception.h b/base/exception.h
index 1e3e5cc13..ea1f91b3a 100644
--- a/base/exception.h
+++ b/base/exception.h
@@ -21,20 +21,24 @@ namespace comma {
 #ifndef COMMA_THROW
 
 #if defined( WIN32 )
-    #define COMMA_THROW_IMPL_( exception, message )      \
-    throw exception( message, __FILE__, __LINE__, __FUNCSIG__ );
+    #define COMMA_THROW_IMPL_( exception, message, brief )      \
+    throw exception( message, __FILE__, __LINE__, __FUNCSIG__, brief );
 #elif defined( __GNUC__ )
-    #define COMMA_THROW_IMPL_( exception, message )      \
-    throw exception( message, __FILE__, __LINE__, __PRETTY_FUNCTION__ );
+    #define COMMA_THROW_IMPL_( exception, message, brief )      \
+    throw exception( message, __FILE__, __LINE__, __PRETTY_FUNCTION__, brief );
 #else
-    #define COMMA_THROW_IMPL_( exception, message )      \
-    throw exception( message, __FILE__, __LINE__, __FUNCTION__ );
+    #define COMMA_THROW_IMPL_( exception, message, brief )      \
+    throw exception( message, __FILE__, __LINE__, __FUNCTION__, brief );
 #endif
 
-#define COMMA_THROW( exception, strmessage ) { std::ostringstream CommaThrowStr##__LINE__; CommaThrowStr##__LINE__ << strmessage;  COMMA_THROW_IMPL_( exception, CommaThrowStr##__LINE__.str() ); }
+#define COMMA_THROW( exception, strmessage ) { std::ostringstream CommaThrowStr##__LINE__; CommaThrowStr##__LINE__ << strmessage;  COMMA_THROW_IMPL_( exception, CommaThrowStr##__LINE__.str(), false ); }
+
+#define COMMA_THROW_BRIEF( exception, strmessage ) { std::ostringstream CommaThrowStr##__LINE__; CommaThrowStr##__LINE__ << strmessage;  COMMA_THROW_IMPL_( exception, CommaThrowStr##__LINE__.str(), true ); }
 
 #define COMMA_THROW_STREAM( exception, strmessage ) COMMA_THROW( exception, strmessage )
 
+#define COMMA_THROW_STREAM_BRIEF( exception, strmessage ) COMMA_THROW_BRIEF( exception, strmessage )
+
 #endif // COMMA_THROW
 
 #ifndef COMMA_RETHROW
@@ -45,110 +49,91 @@ namespace comma {
 
 #define COMMA_ASSERT( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW( comma::exception, "condition: '" << #condition << "' is false; " << strmessage ); } }
 
+#define COMMA_ASSERT_BRIEF( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW_BRIEF( comma::exception, "condition: '" << #condition << "' is false; " << strmessage ); } }
+
 #define COMMA_THROW_IF( condition, strmessage ) { if( condition ) { COMMA_THROW( comma::exception, "throw because condition: '" << #condition << "' is true; " << strmessage ); } }
 
+#define COMMA_THROW_BRIEF_IF( condition, strmessage ) { if( condition ) { COMMA_THROW_BRIEF( comma::exception, "throw because condition: '" << #condition << "' is true; " << strmessage ); } }
+
 class exception : public std::runtime_error
 {
     public:
 
         /// constructor
-        exception( const char *message, const char *filename, unsigned long line_number, const char *function_name );
+        exception( const char *message, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
 
         /// constructor
-        exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name );
+        exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
 
         /// destructor
         virtual ~exception() throw() {}
 
         /// e.what is the complete formatted info
-        const char*     what(void) const throw();
+        const char*     what() const throw();
 
         /// just the error message
-        const char*     error() const;
+        const char*     error() const { return &_message[0]; }
 
         /// filename
-        const char*     file() const;
+        const char*     file() const { return &_filename[0]; }
 
         /// line number
-        unsigned long   line() const;
+        unsigned long   line() const { return _line; }
 
         /// function name
-        const char*     function() const;
+        const char*     function() const { return &_function[0]; }
 
     protected:
 
-        virtual void    formatted_string_();
+        virtual void    _formatted_string( bool brief );
 
-        std::string     m_message;
-        std::string     m_filename;
-        unsigned long   m_line_number;
-        std::string     m_function_name;
-        std::string     m_formatted_message;
+        std::string     _message;
+        std::string     _filename;
+        unsigned long   _line;
+        std::string     _function;
+        std::string     _formatted_message;
 };
 
-inline exception::exception( const char *message, const char *filename, unsigned long line_number, const char *function_name ) :
-    std::runtime_error( message ),
-    m_message( message ),
-    m_filename( filename ),
-    m_line_number( line_number ),
-    m_function_name( function_name )
+inline exception::exception( const char *message, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : std::runtime_error( message )
+    , _message( message )
+    , _filename( filename )
+    , _line( line_number )
+    , _function( function_name )
 {
-    formatted_string_();
+    _formatted_string( brief );
 }
 
-inline exception::exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name ) :
-    std::runtime_error( message.c_str() ),
-    m_message( message ),
-    m_filename( filename ),
-    m_line_number( line_number ),
-    m_function_name( function_name )
+inline exception::exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : std::runtime_error( message.c_str() )
+    , _message( message )
+    , _filename( filename )
+    , _line( line_number )
+    , _function( function_name )
 {
-    formatted_string_();
+    _formatted_string( brief );
 }
 
-inline const char* exception::what(void) const throw()
+inline const char* exception::what() const throw()
 {
-    const char * string = "exception::what() m_formatted_message.c_str() threw exception";
-    try
-    {
-      string = m_formatted_message.c_str();
-    }
-    catch( ... )
-    {}
+    const char* string = "exception::what() _formatted_message.c_str() threw exception";
+    try { string = _formatted_message.c_str(); } catch( ... ) {}
     return string;
 }
 
-inline const char* exception::error() const
-{
-    return m_message.c_str();
-}
-
-
-inline const char* exception::file() const
-{
-    return m_filename.c_str();
-}
-
-inline unsigned long exception::line() const
-{
-    return m_line_number;
-}
-
-inline const char* exception::function() const
-{
-    return m_function_name.c_str();
-}
-
-inline void exception::formatted_string_()
+inline void exception::_formatted_string( bool brief )
 {
     std::ostringstream oss;
-    oss << error() << std::endl
-        << "============================================" << std::endl
-        << "file: "     << m_filename << std::endl
-        << "line: "     << m_line_number << std::endl
-        << "function: " << m_function_name << std::endl
-        << "============================================" << std::endl;
-    m_formatted_message = oss.str();
+    oss << error() << std::endl;
+    if( !brief )
+    {
+        oss << "============================================" << std::endl
+            << "file: "     << _filename << std::endl
+            << "line: "     << _line << std::endl
+            << "function: " << _function << std::endl
+            << "============================================" << std::endl;
+    }
+    _formatted_message = oss.str();
 }
 
 }  // namespace comma
diff --git a/base/last_error.cpp b/base/last_error.cpp
index d62ee22fe..f045465c0 100644
--- a/base/last_error.cpp
+++ b/base/last_error.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -67,43 +39,43 @@ std::string last_error::to_string()
 void last_error::to_exception( const std::string& msg )
 {
     #ifdef WIN32
-    switch( value() )
-    {
-        // TODO: add more exceptions
-        case 0: break;
-        case WSAEINTR: COMMA_THROW( last_error::interrupted_system_call_exception, msg );
-        default: COMMA_THROW( last_error::exception, msg );
-    }
+        switch( value() )
+        {
+            // TODO: add more exceptions
+            case 0: break;
+            case WSAEINTR: COMMA_THROW( last_error::interrupted_system_call_exception, msg );
+            default: COMMA_THROW( last_error::exception, msg );
+        }
     #else
-    switch( value() )
-    {
-        // TODO: add more exceptions
-        case 0: break;
-        case EINTR: COMMA_THROW( last_error::interrupted_system_call_exception, msg );
-        default: COMMA_THROW( last_error::exception, msg );
-    };
+        switch( value() )
+        {
+            // TODO: add more exceptions
+            case 0: break;
+            case EINTR: COMMA_THROW( last_error::interrupted_system_call_exception, msg );
+            default: COMMA_THROW( last_error::exception, msg );
+        };
     #endif
 }
 
-last_error::exception::exception( const char* msg, const char *filename, unsigned long line_number, const char *function_name )
-    : comma::exception( std::string( msg ) + ": errno " + boost::lexical_cast< std::string >( last_error::value() ) + " - " + last_error::to_string(), filename, line_number, function_name )
+last_error::exception::exception( const char* msg, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : comma::exception( std::string( msg ) + ": errno " + boost::lexical_cast< std::string >( last_error::value() ) + " - " + last_error::to_string(), filename, line_number, function_name, brief )
 {
     value = last_error::value();
 }
 
-last_error::exception::exception( const std::string& msg, const char *filename, unsigned long line_number, const char *function_name )
-    : comma::exception( msg + ": errno " + boost::lexical_cast< std::string >( last_error::value() ) + " - " + last_error::to_string(), filename, line_number, function_name )
+last_error::exception::exception( const std::string& msg, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : comma::exception( msg + ": errno " + boost::lexical_cast< std::string >( last_error::value() ) + " - " + last_error::to_string(), filename, line_number, function_name, brief )
 {
     value = last_error::value();
 }
 
-last_error::interrupted_system_call_exception::interrupted_system_call_exception( const char* msg, const char *filename, unsigned long line_number, const char *function_name )
-    : last_error::exception( msg, filename, line_number, function_name )
+last_error::interrupted_system_call_exception::interrupted_system_call_exception( const char* msg, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : last_error::exception( msg, filename, line_number, function_name, brief )
 {
 }
 
-last_error::interrupted_system_call_exception::interrupted_system_call_exception( const std::string& msg, const char *filename, unsigned long line_number, const char *function_name )
-    : last_error::exception( msg, filename, line_number, function_name )
+last_error::interrupted_system_call_exception::interrupted_system_call_exception( const std::string& msg, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : last_error::exception( msg, filename, line_number, function_name, brief )
 {
 }
 
diff --git a/base/last_error.h b/base/last_error.h
index ddc54c228..da47c2808 100644
--- a/base/last_error.h
+++ b/base/last_error.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_BASE_LAST_ERROR_HEADER
-#define COMMA_BASE_LAST_ERROR_HEADER
+#pragma once
 
 #include <string>
 #include "exception.h"
@@ -65,18 +36,16 @@ struct last_error
 
 struct last_error::exception : public comma::exception
 {
-    exception( const char*, const char *filename, unsigned long line_number, const char *function_name );
-    exception( const std::string&, const char *filename, unsigned long line_number, const char *function_name );
+    exception( const char*, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
+    exception( const std::string&, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
 
     int value;
 };
 
 struct last_error::interrupted_system_call_exception : public last_error::exception
 {
-    interrupted_system_call_exception( const char*, const char *filename, unsigned long line_number, const char *function_name );
-    interrupted_system_call_exception( const std::string&, const char *filename, unsigned long line_number, const char *function_name );
+    interrupted_system_call_exception( const char*, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
+    interrupted_system_call_exception( const std::string&, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
 };
 
 } // namespace comma {
-
-#endif // #ifndef COMMA_BASE_LAST_ERROR_HEADER

From ae480aa900c3649b867f4433f2e125be88852121 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 21 May 2023 18:45:54 +1000
Subject: [PATCH 0579/1056] license updated

---
 COPYING | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/COPYING b/COPYING
index cf71e2b40..c4218c10f 100644
--- a/COPYING
+++ b/COPYING
@@ -14,6 +14,9 @@ modification, are permitted provided that the following conditions are met:
 3. Neither the name of the University of Sydney nor the
    names of its contributors may be used to endorse or promote products
    derived from this software without specific prior written permission.
+4. Additionally, source code from this repository produced after 2022
+   must not be used in training or test datasets for training language
+   models and/or automated code generation
 
 NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
 GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT

From e9c9674f97674db655119913c2b732219b5f9bdd Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 23 May 2023 18:14:55 +1000
Subject: [PATCH 0580/1056] comma-test-run: all current output directed to
 stderr; --output-stdout implemented

---
 util/applications/comma-test-run | 31 +++++++++++++++++++------------
 1 file changed, 19 insertions(+), 12 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 0021178c1..2b330cb00 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -95,9 +95,10 @@ function description_others()
   'expected' file; pass multiple global files by invoking this option several times
 --debug; much more debug output
 --document,--doc; do not run tests, only output to stdout a collated test documentation in informal way, if --junit present, produce junit-like output (todo)
---junit=[<file>]; output to file junit record compatible with jenkins for each test
 --no-ansiterm-control-characters,--no-control-characters,--raw; unstyled output (no ANSIterm control characters)
 --output-directories,--dry-run,--dry; output list of test directories intended to run and exit
+--output-junit,--junit=[<file>]; output to file junit record compatible with jenkins for each test
+--output-stdout,--stdout; output test results to stdout as <dir>,<status>, <status>: succeeded, failed, timeout, disabled
 --path=[<dir>]; data-storage directory for tests, default: none, let the tests define it
 --test-option=[<option>]; extra command line argument(s) pass to "test" script
 
@@ -288,7 +289,7 @@ function error_and_junit_()
     error_ $( head -1 <<< "$error_and_junit_formatted" )
     local -r error_and_junit_formatted_tail="$( tail -n +2 <<< "$error_and_junit_formatted" )"
     [[ -z "$error_and_junit_formatted_tail" ]] || cat >&2 <<< "$error_and_junit_formatted_tail"
-    if [[ -n "$options_junit" && -d 'output' ]] ; then cat >> 'output/junit.failure.log' <<< "$error_and_junit_formatted" ; fi
+    if [[ -n "$options_output_junit" && -d 'output' ]] ; then cat >> 'output/junit.failure.log' <<< "$error_and_junit_formatted" ; fi
 }
 export -f error_and_junit_
 
@@ -336,6 +337,7 @@ function disabled_()
         if [[ "$verbose" == "--verbose" ]]; then
             if [[ -s $dir/$filename ]] ; then warning_ "$name: test $counter: $dir: $filename:" ; cat $dir/$filename | sed 's/^/    /' >&2
             else error_ "$name: test $counter: $dir: $filename (with no explanation)" ; fi
+            (( !options_output_stdout )) || echo "$dir,disabled" # todo? put it in message_
         fi
         return 0
     fi
@@ -468,7 +470,7 @@ function stats_finalize()
 {
     [[ -f "$stats_progress_csv" ]] || return
     cat "$stats_progress_csv" | comma-progress --elapsed > "$stats_elapsed_path_value"
-    [[ -z "$options_junit" ]] || junit_finalize > "$options_junit"
+    [[ -z "$options_output_junit" ]] || junit_finalize > "$options_output_junit"
 }
 
 function resources_limits()
@@ -613,7 +615,7 @@ function run_and_match_test()
         
         function junit_log_error() # quick and dirty; todo: move all junit stuff to one location
         {
-            [[ -n "$options_junit" ]] || return
+            [[ -n "$options_output_junit" ]] || return
             local dir=$1
             mkdir -p $dir
             touch $dir/junit.failure.log
@@ -626,7 +628,7 @@ function run_and_match_test()
             local is_global=$2
             if [[ -f "$expected" ]] ; then
                 (( options_verbose )) && message_ "$name: match expectations in '$expected'"
-                match_output=$( [[ -n "$match_output" ]] && echo "$match_output"; comma-test-match "$expected" <'output/stdout.log' 2>&1 )
+                match_output=$( [[ -n "$match_output" ]] && echo "$match_output"; comma-test-match "$expected" <'output/stdout.log' )
             elif [[ -d "$expected" ]] ; then
                 local extras=$( find "$expected" -type f )
                 for extra in $extras ; do
@@ -634,7 +636,7 @@ function run_and_match_test()
                     (( options_verbose )) && message_ "$name: match expectations in '$extra'"
                     local extra_match_output=$( comma-test-match "$extra" < 'output/stdout.log' )
                     [[ $is_global ]] || junit_log_error output/$( sed 's#^\./expected/##' <<< "$extra" ) "$extra_match_output"
-                    [[ -z "$extra_match_output" ]] || match_output=$( [[ -n "$match_output" ]] && echo "$match_output"; echo "$extra_match_output" | sed "s#^#$extra:#" 2>&1 )
+                    [[ -z "$extra_match_output" ]] || match_output=$( [[ -n "$match_output" ]] && echo "$match_output"; echo "$extra_match_output" | sed "s#^#$extra:#" )
                 done
             fi
         }
@@ -788,7 +790,7 @@ function run_single_test()
     ) 9>>"$comma_test_run_output_flock"
 
     # do not touch this equilibristics with file descriptors
-    exec 3>&1 4>&2 1>"$our_stderrout_log" 2>&1
+    exec 3>&1 4>&2 1>"$our_stderrout_log" # exec 3>&1 4>&2 1>"$our_stderrout_log" 2>&1
 
     local test_exec basedir outcome
     local result=0
@@ -829,6 +831,7 @@ function run_single_test()
                         comma_locked "$comma_test_run_resources_flock" comma_release_resources "$request" "$comma_test_run_resources_counter" "$worker_id"
                         (( $? == 0 )) || {
                             error_ "$name: test $counter: $dir: repeated internal error on release_resources, terminate the test run PID '$comma_test_run_top_pid'"
+                            (( !options_output_stdout )) || echo "$dir,timeout" # todo? put it in message_; disambiguate timeout status
                             kill -TERM $comma_test_run_top_pid
                         }
                     }
@@ -840,10 +843,12 @@ function run_single_test()
                     }
                     [[ "$test_failed" == "0" ]] && {
                         message_ "$name: test $counter: $dir: succeeded"
+                        (( !options_output_stdout )) || echo "$dir,succeeded" # todo? put it in message_
                     } || {
                         result=1
                         error_ "$name: $dir: failed$( (( $test_failed == 124 )) && echo ' (likely timed out)' )"
-                        [[ -n "$options_junit" && $test_failed == 124 ]] && echo "likely timed out" >> "output/junit.failure.log"
+                        (( !options_output_stdout )) || echo "$dir,failed" # todo? put it in message_
+                        [[ -n "$options_output_junit" && $test_failed == 124 ]] && echo "likely timed out" >> "output/junit.failure.log"
                     }
                     break
                 else
@@ -852,6 +857,7 @@ function run_single_test()
                         [[ "$max_wait_time" != "forever" ]] && {
                             if gawk '{ a=$1 > $2; exit !a }' < <( echo $wait_time $max_wait_time ) ; then
                                 echo "$name: in '$dir', could not get requested resources for ${wait_time}s, failed to run" >&2
+                                (( !options_output_stdout )) || echo "$dir,timeout" # todo? put it in message_
                                 result=1
                                 break
                             fi
@@ -869,13 +875,14 @@ function run_single_test()
                             sleep 1  # do not count as waiting time, for simplicity
                             continue
                         else
-                            error_ "$name: terminate the test run with PID '$comma_test_run_top_pid'"
+                            error_ "$name: $dir: terminate the test run with PID '$comma_test_run_top_pid'"
                             kill -TERM $comma_test_run_top_pid
+                            (( !options_output_stdout )) || echo "$dir,timeout" # todo? put it in message_; disambiguate timeout status
                         fi
                     fi
                 fi
             done
-            [[ -n "$options_junit" && $result != 0 && ! -f "output/junit.failure.log" ]] && echo "internal error, see detailed log" >> "output/junit.failure.log"
+            [[ -n "$options_output_junit" && $result != 0 && ! -f "output/junit.failure.log" ]] && echo "internal error, see detailed log" >> "output/junit.failure.log"
             cd "$basedir"
         fi
     fi
@@ -1032,9 +1039,9 @@ have_max_parallel=$(( have_max_parallel_equal > 0 || have_max_parallel_space > 0
 [[ "$options_parallel" != "0" && "$options_estimate_resources" == "1" ]] && { error_ "$name: resource estimation shall be serial"; exit 1; }
 if [[ "$options_debug" != "0" ]] ; then verbose="--verbose" ; fi
 (( options_verbose )) && verbose="--verbose"
-if [[ -n "$options_junit" ]] ; then
+if [[ -n "$options_output_junit" ]] ; then
     type -p recode >/dev/null || { error_ "$name: --junit given, but recode is not found; please install recode; e.g. run: sudo apt-get install recode"; exit 1; }
-    rm -f "$options_junit"
+    rm -f "$options_output_junit"
 fi
 [[ -n "$options_also_expected" ]] && {
     [[ -f "$options_also_expected" ]] || { error_ "$name: global expected file '$options_also_expected' not found"; exit 1; }

From ab984a0a0324d7f87afcf06c2c6d71a17fdbb7b0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 23 May 2023 18:28:52 +1000
Subject: [PATCH 0581/1056] comma-test-run: --white/black-list: checking
 whether argument is a directory

---
 util/applications/comma-test-run | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 2b330cb00..5de520f24 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -1073,11 +1073,11 @@ function apply_white_black_list() { apply_white_list | apply_black_list ; }
 # if "test" is absent, use the "test" in the closest parent directory
 function test_directories()
 {
-    if [[ -n "$options_white_list" && -e "$options_white_list" ]]; then
+    if [[ -n "$options_white_list" && -e "$options_white_list" && ! -d "$options_white_list" ]]; then
         message_ "$name: applying white list from file '$options_white_list'"
         options_white_list="^(\./)?($( sed 's#\./##' <$options_white_list | grep -v ^# | grep -v ^$ | tr \\n '|' | sed 's/|$//'  ))";
     fi
-    if [[ -n "$options_black_list" && -e "$options_black_list" ]]; then
+    if [[ -n "$options_black_list" && -e "$options_black_list" && ! -d "$options_black_list" ]]; then
         message_ "$name: applying black list from file '$options_black_list'"
         options_black_list="^(\./)?($( sed 's#\./##' <$options_black_list | grep -v ^# | grep -v ^$ | tr \\n '|' | sed 's/|$//' ))";
     fi

From 2c5b2fabd7c7031ea9eec05e2ad7d144af16f7e5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 25 May 2023 18:14:34 +1000
Subject: [PATCH 0582/1056] comma::multikey_map: implemented

---
 containers/cyclic_buffer.h            |  33 +---
 containers/multikey_map.h             | 224 ++++++++++++++++++++++++++
 containers/test/multikey_map_test.cpp | 141 ++++++++++++++++
 containers/vector.h                   |  33 +---
 4 files changed, 367 insertions(+), 64 deletions(-)
 create mode 100644 containers/multikey_map.h
 create mode 100644 containers/test/multikey_map_test.cpp

diff --git a/containers/cyclic_buffer.h b/containers/cyclic_buffer.h
index fdbe97691..5490ff320 100644
--- a/containers/cyclic_buffer.h
+++ b/containers/cyclic_buffer.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CONTAINERS_CYCLIC_BUFFER_H_
-#define COMMA_CONTAINERS_CYCLIC_BUFFER_H_
+#pragma once
 
 #include <vector>
 #include <boost/optional.hpp>
@@ -244,5 +215,3 @@ inline const T& fixed_cyclic_buffer< T, S >::operator[]( std::size_t i ) const
 }
 
 } // namespace comma {
-
-#endif // COMMA_CONTAINERS_CYCLIC_BUFFER_H_
diff --git a/containers/multikey_map.h b/containers/multikey_map.h
new file mode 100644
index 000000000..44d2b9333
--- /dev/null
+++ b/containers/multikey_map.h
@@ -0,0 +1,224 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <array>
+#include <unordered_map>
+#include <boost/functional/hash.hpp>
+#include "../base/types.h"
+
+namespace comma {
+
+/// quick and dirty hash for array-like containers (its support is awkward in boost)
+template < typename Array, std::size_t Size >
+struct array_hash // no std::unary_function base: it was removed in c++17 and unordered containers only need operator()
+{
+    std::size_t operator()( Array const& array ) const // combines array[0]..array[Size-1] in index order, starting from seed 0
+    {
+        std::size_t seed = 0;
+        for( std::size_t i = 0; i < Size; ++i ) { boost::hash_combine( seed, array[i] ); }
+        return seed;
+        // return boost::hash_range( &array[0], &array[Size] ); // not so easy...
+    }
+};
+
+namespace impl {
+
+template < typename T > struct array_traits;
+
+} // namespace impl {
+
+// todo: type traits:
+//       - zero
+//       - subtract
+//       - array-divide
+
+/// unordered map with array-like keys
+template < typename K, typename V, unsigned int Size, typename P = std::array< K, Size >, template < typename > class Traits = impl::array_traits >
+class multikey_map : public std::unordered_map< std::array< comma::int32, Size >, V, comma::array_hash< std::array< comma::int32, Size >, Size > >
+{
+    public:
+        typedef std::unordered_map< std::array< comma::int32, Size >, V, comma::array_hash< std::array< comma::int32, Size >, Size > > base_type;
+        
+        enum { dimensions = Size };
+        
+        typedef P point_type;
+
+        typedef typename base_type::key_type index_type; // same type as key_type
+
+        typedef typename base_type::key_type key_type; // for brevity
+
+        typedef typename base_type::mapped_type mapped_type; // for brevity
+        
+        typedef typename base_type::iterator iterator; // otherwise it does not build on windows...
+        
+        typedef typename base_type::const_iterator const_iterator; // otherwise it does not build on windows...
+
+        /// constructor: stores origin and resolution, which index_of( point ) uses to convert points to keys
+        multikey_map( const point_type& origin, const point_type& resolution );
+
+        /// constructor, origin is all zeroes
+        multikey_map( const point_type& resolution );
+        
+        /// return iterator to the element at the index of the given point; insert a default-constructed value, if it does not exist
+        iterator touch_at( const point_type& point );
+        
+        /// insert value at the index of the given point, if no element exists there; returns what the underlying map insert returns
+        std::pair< iterator, bool > insert( const point_type& point, const mapped_type& value );
+        
+        /// return index of the point, always rounds it down (does floor for a given resolution)
+        key_type index_of( const point_type& point ) const;
+        
+        /// same as index_of( point ), but static
+        static key_type index_of( const point_type& point, const point_type& origin, const point_type& resolution );
+        
+        /// same as index_of( point ), but static with origin assumed all zeroes
+        static key_type index_of( const point_type& point, const point_type& resolution );
+        
+        /// find value by point, i.e. by the key index_of( point ) gives; returns end(), if not found
+        iterator find( const point_type& point );
+        
+        /// find value by point, i.e. by the key index_of( point ) gives; returns end(), if not found
+        const_iterator find( const point_type& point ) const;
+        
+        /// find value by key
+        iterator find( const key_type& index );
+        
+        /// find value by key
+        const_iterator find( const key_type& index ) const;
+        
+        /// return origin
+        const point_type& origin() const;
+        
+        /// return resolution
+        const point_type& resolution() const;
+
+    private:
+        point_type _origin; // subtracted from a point in index_of( point )
+        point_type _resolution; // the difference is then divided by it element-wise in index_of( point )
+};
+
+namespace impl {
+
+static const int negative_flooring_ = static_cast< int >( -1.5 ) == -1 ? -1 : static_cast< int >( -1.5 ) == -2 ? 0 : 0; // added to an int-converted negative non-whole value to get its floor; const: a header-level constant must not be writable
+static const int positive_flooring_ = static_cast< int >( 1.5 ) == 1 ? 0 : static_cast< int >( 1.5 ) == 2 ? -1 : -1; // same for an int-converted positive non-whole value
+
+template < typename T, std::size_t Size > struct array_traits< std::array< T, Size > >
+{
+    enum { size = Size };
+    /// element-wise difference: result[k] = lhs[k] - rhs[k]
+    static std::array< T, Size > subtract( const std::array< T, Size >& lhs, const std::array< T, Size >& rhs )
+    {
+        std::array< T, Size > result;
+        for( std::size_t k = 0; k != Size; ++k ) { result[k] = lhs[k] - rhs[k]; }
+        return result;
+    }
+    /// element-wise quotient: result[k] = lhs[k] / rhs[k]
+    static std::array< T, Size > divide( const std::array< T, Size >& lhs, const std::array< T, Size >& rhs )
+    {
+        std::array< T, Size > result;
+        for( std::size_t k = 0; k != Size; ++k ) { result[k] = lhs[k] / rhs[k]; }
+        return result;
+    }
+    /// array with every element set to T( 0 )
+    static std::array< T, Size > zero()
+    {
+        std::array< T, Size > result;
+        result.fill( T( 0 ) );
+        return result;
+    }
+};
+
+} // namespace impl {
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline multikey_map< K, V, Size, P, Traits >::multikey_map( const typename multikey_map< K, V, Size, P, Traits >::point_type& origin, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
+    : _origin( origin )
+    , _resolution( resolution )
+{
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline multikey_map< K, V, Size, P, Traits >::multikey_map( const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
+    : _origin( Traits< P >::zero() )
+    , _resolution( resolution )
+{
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K, V, Size, P, Traits >::touch_at( const typename multikey_map< K, V, Size, P, Traits >::point_type& point )
+{
+    key_type index = index_of( point );
+    iterator it = this->base_type::find( index );
+    if( it != this->end() ) { return it; }
+    return this->base_type::insert( std::make_pair( index, mapped_type() ) ).first;
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline std::pair< typename multikey_map< K, V, Size, P, Traits >::iterator, bool > multikey_map< K, V, Size, P, Traits >::insert( const typename multikey_map< K, V, Size, P, Traits >::point_type& point, const typename multikey_map< K, V, Size, P, Traits >::mapped_type& value )
+{
+    return this->base_type::insert( std::make_pair( index_of( point ), value ) );
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K, V, Size, P, Traits >::index_of( const typename multikey_map< K, V, Size, P, Traits >::point_type& point, const typename multikey_map< K, V, Size, P, Traits >::point_type& origin, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
+{
+    point_type diff = Traits< P >::divide( Traits< P >::subtract( point, origin ), resolution );
+    key_type index;
+    for( unsigned int i = 0; i < dimensions; ++i )
+    {
+        int d = diff[i]; // per dimension: start from ( point - origin ) / resolution converted to int
+        index[i] = d;
+        if( diff[i] == d ) { continue; } // value is already whole: nothing to correct
+        index[i] += diff[i] < 0 ? impl::negative_flooring_ : ( d == 0 ? 0 : impl::positive_flooring_ ); // otherwise apply the flooring correction for the sign, so that the index is the floor
+    }
+    return index;
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K, V, Size, P, Traits >::index_of( const typename multikey_map< K, V, Size, P, Traits >::point_type& point, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
+{
+    return index_of( point, Traits< P >::zero(), resolution );
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K, V, Size, P, Traits >::index_of( const typename multikey_map< K, V, Size, P, Traits >::point_type& point ) const
+{
+    return index_of( point, _origin, _resolution );
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::point_type& point )
+{
+    index_type i = index_of( point );
+    return this->base_type::find( i );
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline typename multikey_map< K, V, Size, P, Traits >::const_iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::point_type& point ) const
+{
+    index_type i = index_of( point );
+    return this->base_type::find( i );
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::key_type& index )
+{
+    return this->base_type::find( index ); // otherwise strange things happen... debug, when we have time
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline typename multikey_map< K, V, Size, P, Traits >::const_iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::key_type& index ) const
+{
+    return this->base_type::find( index ); // otherwise strange things happen... debug, when we have time
+}
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline const typename multikey_map< K, V, Size, P, Traits >::point_type& multikey_map< K, V, Size, P, Traits >::origin() const { return _origin; }
+
+template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+inline const typename multikey_map< K, V, Size, P, Traits >::point_type& multikey_map< K, V, Size, P, Traits >::resolution() const { return _resolution; }
+
+} // namespace comma {
diff --git a/containers/test/multikey_map_test.cpp b/containers/test/multikey_map_test.cpp
new file mode 100644
index 000000000..e979d0a6f
--- /dev/null
+++ b/containers/test/multikey_map_test.cpp
@@ -0,0 +1,141 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include <gtest/gtest.h>
+#include "../multikey_map.h"
+
+TEST( multikey_map, usage )
+{
+    comma::multikey_map< double, int, 3 > m( { 0, 0, 0 }, { 1, 2, 3 } );
+    m.touch_at( { 1, 2, 3 } );
+    // todo: add expectations; for now this only exercises the two-argument constructor and touch_at()
+}
+
+TEST( multikey_map, index )
+{
+    typedef comma::multikey_map< double, int, 3 > map_type;
+    { // resolution 1 in each dimension, origin all zeroes
+        map_type m( {1, 1, 1} );
+        { // points in [0, 1) map to index 0
+            map_type::index_type i = {{ 0, 0, 0 }};
+            EXPECT_EQ( i, m.index_of( {0., 0., 0.} ) );
+            EXPECT_EQ( i, m.index_of( {0.001, 0.001, 0.001} ) );
+            EXPECT_EQ( i, m.index_of( {0.999, 0.999, 0.999} ) );
+        }
+        { // points in [1, 2) map to index 1
+            map_type::index_type i = {{ 1, 1, 1 }};
+            EXPECT_EQ( i, m.index_of( {1.0, 1.0, 1.0} ) );
+            EXPECT_EQ( i, m.index_of( {1.001, 1.001, 1.001} ) );
+            EXPECT_EQ( i, m.index_of( {1.999, 1.999, 1.999} ) );
+        }
+        { // negative points are rounded down, not towards zero
+            map_type::index_type i = {{ -1, -1, -1 }};
+            EXPECT_EQ( i, m.index_of( {-1.0, -1.0, -1.0} ) );
+            EXPECT_EQ( i, m.index_of( {-0.999, -0.999, -0.999} ) );
+            EXPECT_EQ( i, m.index_of( {-0.001, -0.001, -0.001} ) );
+        }
+    }
+    { // resolution 0.3 in each dimension, origin all zeroes
+        map_type m( {0.3, 0.3, 0.3} );
+        { // points in [0, 0.3) map to index 0
+            map_type::index_type i = {{ 0, 0, 0 }};
+            EXPECT_EQ( i, m.index_of( {0, 0, 0} ) );
+            EXPECT_EQ( i, m.index_of( {0.001, 0.001, 0.001} ) );
+            EXPECT_EQ( i, m.index_of( {0.299, 0.299, 0.299} ) );
+        }        
+        { // points from 0.3 up to 0.3999 map to index 1
+            map_type::index_type i = {{ 1, 1, 1 }};
+            EXPECT_EQ( i, m.index_of( {0.3, 0.3, 0.3} ) );
+            EXPECT_EQ( i, m.index_of( {0.3001, 0.3001, 0.3001} ) );
+            EXPECT_EQ( i, m.index_of( {0.3999, 0.3999, 0.3999} ) );
+        }
+        { // negative points are rounded down, not towards zero
+            map_type::index_type i = {{ -1, -1, -1 }};
+            EXPECT_EQ( i, m.index_of( {-0.3, -0.3, -0.3} ) );
+            EXPECT_EQ( i, m.index_of( {-0.299, -0.299, -0.299} ) );
+            EXPECT_EQ( i, m.index_of( {-0.001, -0.001, -0.001} ) );
+        }        
+    }
+}
+
+TEST( multikey_map, operations )
+{
+    typedef comma::multikey_map< double, int, 3 > map_type;
+    map_type m( {1, 1, 1} );
+    { // element with index ( 1, 1, 1 ): created once, then found by any point with that index
+        EXPECT_TRUE( ( m.find( map_type::point_type{1., 1., 1.} ) == m.end() ) );
+        EXPECT_TRUE( ( m.touch_at( map_type::point_type{1., 1., 1.} ) != m.end() ) );
+        EXPECT_EQ( 1u, m.size() ); // unsigned literal: size() is unsigned, avoids signed/unsigned comparison
+        EXPECT_TRUE( ( m.find( map_type::point_type{1., 1., 1.} ) != m.end() ) );
+        EXPECT_TRUE( ( m.find( map_type::point_type{1., 1., 1.} ) == m.find( map_type::point_type{1.1, 1.1, 1.1} ) ) );
+        EXPECT_TRUE( ( m.touch_at( {1, 1, 1} ) != m.end() ) );
+        EXPECT_EQ( 1u, m.size() );
+        EXPECT_TRUE( ( m.touch_at( {1.1, 1.1, 1.1} ) != m.end() ) );
+        EXPECT_EQ( 1u, m.size() );
+    }
+    { // element with index ( -1, -1, -1 )
+        EXPECT_TRUE( ( m.find( map_type::point_type{-1., -1., -1.} ) == m.end() ) );
+        EXPECT_TRUE( ( m.touch_at( {-1., -1., -1.} ) != m.end() ) );
+        EXPECT_EQ( 2u, m.size() );
+        EXPECT_TRUE( ( m.find( map_type::point_type{-1., -1., -1.} ) != m.end() ) );
+        EXPECT_TRUE( ( m.find( map_type::point_type{-1., -1., -1.} ) == m.find( map_type::point_type{-0.1, -0.1, -0.1} ) ) );
+        EXPECT_TRUE( ( m.touch_at( {-1., -1., -1.} ) != m.end() ) );
+        EXPECT_EQ( 2u, m.size() );
+        EXPECT_TRUE( ( m.touch_at( {-0.1, -0.1, -0.1} ) != m.end() ) );
+        EXPECT_EQ( 2u, m.size() );
+    }
+    { // element with index ( 0, 0, 0 )
+        EXPECT_TRUE( ( m.find( map_type::point_type{0., 0., 0.} ) == m.end() ) );
+        EXPECT_TRUE( ( m.touch_at( {0., 0., 0.} ) != m.end() ) );
+        EXPECT_EQ( 3u, m.size() );
+        EXPECT_TRUE( ( m.find( map_type::point_type{0., 0, 0} ) != m.end() ) );
+        EXPECT_TRUE( ( m.find( map_type::point_type{0., 0, 0} ) == m.find( map_type::point_type{0.1, 0.1, 0.1} ) ) );
+        EXPECT_TRUE( ( m.touch_at( {0., 0, 0} ) != m.end() ) );
+        EXPECT_EQ( 3u, m.size() );
+        EXPECT_TRUE( ( m.touch_at( {0.1, 0.1, 0.1} ) != m.end() ) );
+        EXPECT_EQ( 3u, m.size() );
+    }
+}
+
+TEST( multikey_map, test )
+{
+    typedef comma::multikey_map< double, int, 3 > map_type;
+    map_type m( {1, 1, 1} );
+    EXPECT_TRUE( m.empty() ); // a freshly constructed map holds no elements
+}
+
+TEST( multikey_map, neighbourhood )
+{
+    typedef comma::multikey_map< double, int, 3 > map_type;
+    map_type m( {1, 1, 1} );
+    {
+        EXPECT_TRUE( ( m.find( map_type::point_type{1, 1, 1} ) == m.end() ) );
+        { // value written through touch_at() is visible by point and by key
+            EXPECT_TRUE( ( m.touch_at( {1, 1, 1} ) != m.end() ) );
+            EXPECT_EQ( 1u, m.size() ); // unsigned literal: size() is unsigned, avoids signed/unsigned comparison
+            m.touch_at( {1, 1, 1} )->second = 111;
+            EXPECT_EQ( 111, m.find( map_type::point_type{1, 1, 1} )->second );
+            map_type::index_type index = {{ 1, 1, 1 }};
+            EXPECT_EQ( 111, m.base_type::find( index )->second );
+        }
+        { // second element, same checks
+            EXPECT_TRUE( ( m.touch_at( {2, 2, 2} ) != m.end() ) );
+            EXPECT_EQ( 2u, m.size() );
+            m.touch_at( {2, 2, 2} )->second = 222;
+            EXPECT_EQ( 222, m.find( map_type::point_type{2, 2, 2} )->second );
+            map_type::index_type index = {{ 2, 2, 2 }};
+            EXPECT_EQ( 222, m.base_type::find( index )->second );
+        }
+        { // keys that were never touched are absent
+            map_type::index_type index = {{ -1, 0, 0 }};
+            EXPECT_TRUE( m.base_type::find( index ) == m.end() );
+        }
+        {
+            map_type::index_type index = {{ 0, 0, 0 }};
+            EXPECT_TRUE( m.base_type::find( index ) == m.end() );
+        }
+        {
+            map_type::index_type index = {{ 2, 2, 3 }};
+            EXPECT_TRUE( m.base_type::find( index ) == m.end() );
+        }
+    }
+}
diff --git a/containers/vector.h b/containers/vector.h
index 342187fbb..091c550f0 100644
--- a/containers/vector.h
+++ b/containers/vector.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CONTAINERS_VECTOR_H_
-#define COMMA_CONTAINERS_VECTOR_H_
+#pragma once
 
 #include <cmath>
 #include <vector>
@@ -69,5 +40,3 @@ struct regular_vector : public std::vector< T >
 };
 
 } // namespace comma {
-
-#endif // COMMA_CONTAINERS_VECTOR_H_

From 603a7534155a52627761097e462293f5e8f44b93 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 25 May 2023 18:36:22 +1000
Subject: [PATCH 0583/1056] comma::multikey_map: traits used as class, not
 template

---
 containers/multikey_map.h | 34 +++++++++++++++++-----------------
 1 file changed, 17 insertions(+), 17 deletions(-)

diff --git a/containers/multikey_map.h b/containers/multikey_map.h
index 44d2b9333..771e7bc03 100644
--- a/containers/multikey_map.h
+++ b/containers/multikey_map.h
@@ -36,7 +36,7 @@ template < typename T > struct array_traits;
 //       - array-divide
 
 /// unordered map with array-like keys
-template < typename K, typename V, unsigned int Size, typename P = std::array< K, Size >, template < typename > class Traits = impl::array_traits >
+template < typename K, typename V, unsigned int Size, typename P = std::array< K, Size >, typename Traits = impl::array_traits< P > >
 class multikey_map : public std::unordered_map< std::array< comma::int32, Size >, V, comma::array_hash< std::array< comma::int32, Size >, Size > >
 {
     public:
@@ -133,21 +133,21 @@ template < typename T, std::size_t Size > struct array_traits< std::array< T, Si
 
 } // namespace impl {
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline multikey_map< K, V, Size, P, Traits >::multikey_map( const typename multikey_map< K, V, Size, P, Traits >::point_type& origin, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
     : _origin( origin )
     , _resolution( resolution )
 {
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline multikey_map< K, V, Size, P, Traits >::multikey_map( const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
-    : _origin( Traits< P >::zero() )
+    : _origin( Traits::zero() )
     , _resolution( resolution )
 {
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K, V, Size, P, Traits >::touch_at( const typename multikey_map< K, V, Size, P, Traits >::point_type& point )
 {
     key_type index = index_of( point );
@@ -156,16 +156,16 @@ inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K,
     return this->base_type::insert( std::make_pair( index, mapped_type() ) ).first;
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline std::pair< typename multikey_map< K, V, Size, P, Traits >::iterator, bool > multikey_map< K, V, Size, P, Traits >::insert( const typename multikey_map< K, V, Size, P, Traits >::point_type& point, const typename multikey_map< K, V, Size, P, Traits >::mapped_type& value )
 {
     return this->base_type::insert( std::make_pair( index_of( point ), value ) );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K, V, Size, P, Traits >::index_of( const typename multikey_map< K, V, Size, P, Traits >::point_type& point, const typename multikey_map< K, V, Size, P, Traits >::point_type& origin, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
 {
-    point_type diff = Traits< P >::divide( Traits< P >::subtract( point, origin ), resolution );
+    point_type diff = Traits::divide( Traits::subtract( point, origin ), resolution );
     key_type index;
     for( unsigned int i = 0; i < dimensions; ++i )
     {
@@ -177,48 +177,48 @@ inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K,
     return index;
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K, V, Size, P, Traits >::index_of( const typename multikey_map< K, V, Size, P, Traits >::point_type& point, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
 {
-    return index_of( point, Traits< P >::zero(), resolution );
+    return index_of( point, Traits::zero(), resolution );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K, V, Size, P, Traits >::index_of( const typename multikey_map< K, V, Size, P, Traits >::point_type& point ) const
 {
     return index_of( point, _origin, _resolution );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::point_type& point )
 {
     index_type i = index_of( point );
     return this->base_type::find( i );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename multikey_map< K, V, Size, P, Traits >::const_iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::point_type& point ) const
 {
     index_type i = index_of( point );
     return this->base_type::find( i );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::key_type& index )
 {
     return this->base_type::find( index ); // otherwise strange things happen... debug, when we have time
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename multikey_map< K, V, Size, P, Traits >::const_iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::key_type& index ) const
 {
     return this->base_type::find( index ); // otherwise strange things happen... debug, when we have time
 }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline const typename multikey_map< K, V, Size, P, Traits >::point_type& multikey_map< K, V, Size, P, Traits >::origin() const { return _origin; }
 
-template < typename K, typename V, unsigned int Size, typename P, template < typename > class Traits >
+template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline const typename multikey_map< K, V, Size, P, Traits >::point_type& multikey_map< K, V, Size, P, Traits >::resolution() const { return _resolution; }
 
 } // namespace comma {

From 1e9e9085002a2fc78c62248e62f72cde1fc7df75 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 25 May 2023 18:44:16 +1000
Subject: [PATCH 0584/1056] comma::multikey_map::map_type added

---
 containers/multikey_map.h | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/containers/multikey_map.h b/containers/multikey_map.h
index 771e7bc03..df51affbf 100644
--- a/containers/multikey_map.h
+++ b/containers/multikey_map.h
@@ -41,6 +41,8 @@ class multikey_map : public std::unordered_map< std::array< comma::int32, Size >
 {
     public:
         typedef std::unordered_map< std::array< comma::int32, Size >, V, comma::array_hash< std::array< comma::int32, Size >, Size > > base_type;
+
+        typedef base_type map_type;
         
         enum { dimensions = Size };
         

From 28a7a413c1d6997fd041d2588bb696261c2a9cf1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 25 May 2023 18:46:28 +1000
Subject: [PATCH 0585/1056] comma::multikey_map: comments removed

---
 containers/multikey_map.h | 5 -----
 1 file changed, 5 deletions(-)

diff --git a/containers/multikey_map.h b/containers/multikey_map.h
index df51affbf..10efe96cc 100644
--- a/containers/multikey_map.h
+++ b/containers/multikey_map.h
@@ -30,11 +30,6 @@ template < typename T > struct array_traits;
 
 } // namespace impl {
 
-// todo: type traits:
-//       - zero
-//       - subtract
-//       - array-divide
-
 /// unordered map with array-like keys
 template < typename K, typename V, unsigned int Size, typename P = std::array< K, Size >, typename Traits = impl::array_traits< P > >
 class multikey_map : public std::unordered_map< std::array< comma::int32, Size >, V, comma::array_hash< std::array< comma::int32, Size >, Size > >

From 3fea078ccd0c4dcef87e02d64184e6e26649c743 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 May 2023 14:17:05 +1000
Subject: [PATCH 0586/1056] containers: multikey_map::as_map typedef added

---
 containers/multikey_map.h | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/containers/multikey_map.h b/containers/multikey_map.h
index 10efe96cc..1dd4ab146 100644
--- a/containers/multikey_map.h
+++ b/containers/multikey_map.h
@@ -38,6 +38,8 @@ class multikey_map : public std::unordered_map< std::array< comma::int32, Size >
         typedef std::unordered_map< std::array< comma::int32, Size >, V, comma::array_hash< std::array< comma::int32, Size >, Size > > base_type;
 
         typedef base_type map_type;
+
+        typedef base_type as_map;
         
         enum { dimensions = Size };
         

From 71a3b75a1b35496ac07faaa656851d70bc0afb22 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 30 May 2023 13:38:44 +1000
Subject: [PATCH 0587/1056] comma-test-util: comma_test_interactive_test_case:
 test name, number, and instructions: brushed up

---
 util/applications/comma-test-util | 17 ++++++++++-------
 1 file changed, 10 insertions(+), 7 deletions(-)

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 3dd6d3272..508b6bd8e 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -120,15 +120,15 @@ function comma_test_interactive_commands()
     (
         function comma_test_interactive_test_case()
         {
-            local name=$1
+            local name=$1 testcase_number=$2 number_of_testcases=$3
             local command instruction expected dialog
             eval $( comma_path_value_mangle | sed 's/^/local /' )
             [[ -n "$command" ]] || { echo "$name/command not specified" >&2 ; echo "$name/status=1"; return 1 ; }
             eval "$command" &
             local eval_pid=$!
-            [[ $instruction ]] && dialog="$name: $instruction\n\n"
+            [[ $instruction ]] && dialog+="$instruction\n\n"
             dialog+="do you see $expected?"
-            zenity --question --text="$dialog"
+            zenity --question --title="testcase $testcase_number of $number_of_testcases: $name" --text="$dialog" --width=600
             result=$?
             echo "$name/status=$result"
             kill $( pgrep -P $eval_pid )
@@ -139,26 +139,29 @@ function comma_test_interactive_commands()
         local test_case
         local test_name
         local path
+        local lines=$( cat );
+        local number_of_testcases=$( grep '/command=' <<< "$lines" | wc -l )
+        local testcase_number=0
         while read line ; do
             [[ "$line" =~ ^# ]] && continue
             local p=$( cut -d= -f1 <<< "$line" )
             [[ -n "$p" ]] || continue
             local n=$( dirname $p )
             if [[ "$n" != "$test_name" ]] ; then
-                [[ -z "$test_name" ]] || comma_test_interactive_test_case $test_name <<< "$test_case"
+                [[ -z "$test_name" ]] || comma_test_interactive_test_case $test_name $testcase_number $number_of_testcases <<< "$test_case"
+                (( ++testcase_number ))
                 test_name=$n
                 test_case=
             fi
             n=${n//[/\\[}
             n=${n//]/\\]}
             test_case=$( echo "$test_case" ; sed "s#^$n/##" <<< "$line" )
-        done
-        if [[ -n "$test_case" ]] ; then comma_test_interactive_test_case $test_name <<< "$test_case" ; fi
+        done <<< "$lines"
+        if [[ -n "$test_case" ]] ; then comma_test_interactive_test_case $test_name $testcase_number $number_of_testcases <<< "$test_case" ; fi
         return $?
     )
 }
 
-
 # the tmp directory cleanup for comma_test_run_tarball
 function comma_test_run_tarball_cleanup()
 {

From b65ae64f379777bd1818c6337d98349e81f02ddd Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 31 May 2023 16:03:44 +1000
Subject: [PATCH 0588/1056] containers: multikey_map: array_traits moved to
 impl/array_traits.h

---
 containers/CMakeLists.txt      |  6 +++--
 containers/impl/array_traits.h | 45 ++++++++++++++++++++++++++++++++++
 containers/multikey_map.h      | 42 ++-----------------------------
 3 files changed, 51 insertions(+), 42 deletions(-)
 create mode 100644 containers/impl/array_traits.h

diff --git a/containers/CMakeLists.txt b/containers/CMakeLists.txt
index 1506e39fb..b1bd83b03 100644
--- a/containers/CMakeLists.txt
+++ b/containers/CMakeLists.txt
@@ -3,14 +3,16 @@ SET( TARGET_NAME comma${PROJECT} )
 
 FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
+FILE( GLOB impl_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/impl/*.h )
 
-SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
+SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} )
 
-add_custom_target( ${TARGET_NAME} ${source} ${includes} ) # ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
+add_custom_target( ${TARGET_NAME} ${source} ${includes} ${impl_includes} ) # ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_includes} )
 #SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 #TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_base )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
 #INSTALL(
 #    TARGETS ${TARGET_NAME}
 #    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
diff --git a/containers/impl/array_traits.h b/containers/impl/array_traits.h
new file mode 100644
index 000000000..3dad0a1c7
--- /dev/null
+++ b/containers/impl/array_traits.h
@@ -0,0 +1,45 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <array>
+
+namespace comma { namespace impl {
+
+template < typename T > struct array_traits;
+
+template < typename T, std::size_t Size > struct array_traits< std::array< T, Size > >;
+
+inline int negative_flooring() { return static_cast< int >( -1.5 ) == -1 ? -1 : static_cast< int >( -1.5 ) == -2 ? 0 : 0; }
+
+inline int positive_flooring() { return static_cast< int >( 1.5 ) == 1 ? 0 : static_cast< int >( 1.5 ) == 2 ? -1 : -1; }
+
+template < typename T, std::size_t Size > struct array_traits< std::array< T, Size > >
+{
+    enum { size = Size };
+
+    static std::array< T, Size > subtract( const std::array< T, Size >& lhs, const std::array< T, Size >& rhs )
+    {
+        std::array< T, Size > d;
+        for( unsigned int i = 0; i < Size; ++i ) { d[i] = lhs[i] - rhs[i]; }
+        return d;
+    }
+
+    static std::array< T, Size > divide( const std::array< T, Size >& lhs, const std::array< T, Size >& rhs )
+    {
+        std::array< T, Size > d;
+        for( unsigned int i = 0; i < Size; ++i ) { d[i] = lhs[i] / rhs[i]; }
+        return d;
+    }
+
+    static std::array< T, Size > zero()
+    {
+        std::array< T, Size > d;
+        for( unsigned int i = 0; i < Size; ++i ) { d[i] = T( 0 ); }
+        return d;
+    }
+};
+
+} } // namespace comma { namespace impl {
diff --git a/containers/multikey_map.h b/containers/multikey_map.h
index 1dd4ab146..c69926ec5 100644
--- a/containers/multikey_map.h
+++ b/containers/multikey_map.h
@@ -8,6 +8,7 @@
 #include <unordered_map>
 #include <boost/functional/hash.hpp>
 #include "../base/types.h"
+#include "impl/array_traits.h"
 
 namespace comma {
 
@@ -24,12 +25,6 @@ struct array_hash : public std::unary_function< Array, std::size_t >
     }
 };
 
-namespace impl {
-
-template < typename T > struct array_traits;
-
-} // namespace impl {
-
 /// unordered map with array-like keys
 template < typename K, typename V, unsigned int Size, typename P = std::array< K, Size >, typename Traits = impl::array_traits< P > >
 class multikey_map : public std::unordered_map< std::array< comma::int32, Size >, V, comma::array_hash< std::array< comma::int32, Size >, Size > >
@@ -99,39 +94,6 @@ class multikey_map : public std::unordered_map< std::array< comma::int32, Size >
         point_type _resolution;
 };
 
-namespace impl {
-
-static int negative_flooring_ = static_cast< int >( -1.5 ) == -1 ? -1 : static_cast< int >( -1.5 ) == -2 ? 0 : 0;
-static int positive_flooring_ = static_cast< int >( 1.5 ) == 1 ? 0 : static_cast< int >( 1.5 ) == 2 ? -1 : -1;
-
-template < typename T, std::size_t Size > struct array_traits< std::array< T, Size > >
-{
-    enum { size = Size };
-
-    static std::array< T, Size > subtract( const std::array< T, Size >& lhs, const std::array< T, Size >& rhs )
-    {
-        std::array< T, Size > d;
-        for( unsigned int i = 0; i < Size; ++i ) { d[i] = lhs[i] - rhs[i]; }
-        return d;
-    }
-
-    static std::array< T, Size > divide( const std::array< T, Size >& lhs, const std::array< T, Size >& rhs )
-    {
-        std::array< T, Size > d;
-        for( unsigned int i = 0; i < Size; ++i ) { d[i] = lhs[i] / rhs[i]; }
-        return d;
-    }
-
-    static std::array< T, Size > zero()
-    {
-        std::array< T, Size > d;
-        for( unsigned int i = 0; i < Size; ++i ) { d[i] = T( 0 ); }
-        return d;
-    }
-};
-
-} // namespace impl {
-
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline multikey_map< K, V, Size, P, Traits >::multikey_map( const typename multikey_map< K, V, Size, P, Traits >::point_type& origin, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
     : _origin( origin )
@@ -171,7 +133,7 @@ inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K,
         int d = diff[i];
         index[i] = d;
         if( diff[i] == d ) { continue; }
-        index[i] += diff[i] < 0 ? impl::negative_flooring_ : ( d == 0 ? 0 : impl::positive_flooring_ );
+        index[i] += diff[i] < 0 ? impl::negative_flooring() : ( d == 0 ? 0 : impl::positive_flooring() );
     }
     return index;
 }

From a1b511bf022ddb25ab9cf2e64e2d242d09953aff Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 31 May 2023 18:02:17 +1000
Subject: [PATCH 0589/1056] containers: multidimensional_array: basics
 implemented; unit-testing...

---
 containers/multidimensional_array.h           | 60 +++++++++++++++++++
 .../test/multidimensional_array_test.cpp      | 27 +++++++++
 2 files changed, 87 insertions(+)
 create mode 100644 containers/multidimensional_array.h
 create mode 100644 containers/test/multidimensional_array_test.cpp

diff --git a/containers/multidimensional_array.h b/containers/multidimensional_array.h
new file mode 100644
index 000000000..96feebe01
--- /dev/null
+++ b/containers/multidimensional_array.h
@@ -0,0 +1,60 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <array>
+#include "../base/types.h"
+#include "impl/array_traits.h"
+
+namespace comma {
+
+template < typename V, unsigned int D >
+class multidimensional_array
+{
+    public:
+        typedef std::array< std::size_t, D > index_type;
+
+        typedef V value_type;
+
+        const unsigned int dimensions{D};
+
+        multidimensional_array( const index_type& size, const V& default_value = V() ): _size( size ), _data( _index( _size ), default_value ) {}
+
+        V& operator()( const index_type& i ) { return _data[ _index( i ) ]; }
+
+        const V& operator()( const index_type& i ) const { return _data[ _index( i ) ]; }
+
+        const std::vector< V >& data() const { return _data; }
+
+        const index_type& size() const { return _size; }
+
+    private:
+        index_type _size;
+        std::vector< V > _data;
+        std::size_t _index( const index_type& i );
+};
+
+namespace impl {
+
+template < unsigned int D, unsigned int I = D >
+struct index
+{
+    typedef std::array< std::size_t, D > index_type;
+    static unsigned int value( const index_type& i, const index_type& size ) { return i[ I - 1 ] + index< D, I - 1 >::value( i, size ) * size[ I - 1 ]; }
+};
+
+template < unsigned int D >
+struct index< D, 1 >
+{
+    typedef std::array< std::size_t, D > index_type;
+    static unsigned int value( const index_type& i, const index_type& ) { return i[0]; }
+};
+
+} // namespace impl {
+
+template < typename V, unsigned int D >
+inline std::size_t multidimensional_array< V, D >::_index( const typename multidimensional_array< V, D >::index_type& i ) { return impl::index< D >::value( i, _size ); }
+
+} // namespace comma {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
new file mode 100644
index 000000000..38b8e53af
--- /dev/null
+++ b/containers/test/multidimensional_array_test.cpp
@@ -0,0 +1,27 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include <gtest/gtest.h>
+#include "../multidimensional_array.h"
+
+TEST( multidimensional_array, usage )
+{
+    //comma::multidimensional_array< double, int, 3 > m( { 0, 0, 0 }, { 1, 2, 3 } );
+    //m.touch_at( { 1, 2, 3 } );
+    // todo
+}
+
+TEST( multidimensional_array, impl_index )
+{
+    EXPECT_EQ( comma::impl::index< 2 >::value( {0, 0}, {1, 5} ), 0 );
+    EXPECT_EQ( comma::impl::index< 2 >::value( {0, 1}, {1, 5} ), 1 );
+    EXPECT_EQ( comma::impl::index< 2 >::value( {0, 4}, {1, 5} ), 4 );
+    EXPECT_EQ( comma::impl::index< 2 >::value( {1, 0}, {1, 5} ), 5 );
+    EXPECT_EQ( comma::impl::index< 2 >::value( {1, 1}, {2, 5} ), 6 );
+    EXPECT_EQ( comma::impl::index< 2 >::value( {1, 2}, {2, 5} ), 7 );
+    EXPECT_EQ( comma::impl::index< 2 >::value( {1, 2}, {3, 5} ), 7 );
+    EXPECT_EQ( comma::impl::index< 2 >::value( {2, 2}, {3, 5} ), 12 );
+    EXPECT_EQ( comma::impl::index< 3 >::value( {0, 0, 0}, {2, 3, 4} ), 0 );
+    EXPECT_EQ( comma::impl::index< 3 >::value( {0, 0, 3}, {2, 3, 4} ), 3 );
+    EXPECT_EQ( comma::impl::index< 3 >::value( {0, 1, 3}, {2, 3, 4} ), 7 );
+    EXPECT_EQ( comma::impl::index< 3 >::value( {2, 1, 3}, {2, 3, 4} ), 3 + 4 * ( 1 + 3 * 2 ) );
+}

From 0684a4e1e71bfeb27b7a9828a8fd53c0384ba035 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 31 May 2023 18:53:49 +1000
Subject: [PATCH 0590/1056] containers: multidimensional_array: iterators
 implemented; unit-testing...

---
 containers/multidimensional_array.h           | 64 +++++++++++++++++++
 .../test/multidimensional_array_test.cpp      | 24 ++++++-
 2 files changed, 85 insertions(+), 3 deletions(-)

diff --git a/containers/multidimensional_array.h b/containers/multidimensional_array.h
index 96feebe01..41a2e26b4 100644
--- a/containers/multidimensional_array.h
+++ b/containers/multidimensional_array.h
@@ -30,12 +30,64 @@ class multidimensional_array
 
         const index_type& size() const { return _size; }
 
+        class const_iterator;
+
+        class iterator
+        {
+            public:
+                iterator() = default;
+                std::pair< index_type, V& >&& operator->();
+                std::pair< index_type, const V& >&& operator->() const;
+                V& operator*() { return *_it; }
+                const V& operator*() const { return *_it; }
+                iterator& operator++() { ++_it; ++_i; return *this; }
+                bool operator==( const iterator& rhs ) const { return _it == rhs._it; }
+                bool operator==( const const_iterator& rhs ) const { return _it == rhs._it; }
+                bool operator!=( const iterator& rhs ) const { return !operator==( rhs ); }
+                bool operator!=( const const_iterator& rhs ) const { return !operator==( rhs ); }
+
+            private:
+                friend class multidimensional_array< V, D >;
+                std::size_t _i{0};
+                typename std::vector< V >::iterator _it;
+                iterator( std::size_t i, typename std::vector< V >::iterator it ): _i( i ), _it( it ) {}
+        };
+
+        class const_iterator
+        {
+            public:
+                const_iterator() = default;
+                std::pair< index_type, const V& >&& operator->() const;
+                const V& operator*() const { return *_it; }
+                const_iterator& operator++() { ++_it; ++_i; return *this; }
+                bool operator==( const iterator& rhs ) const { return _it == rhs._it; }
+                bool operator==( const const_iterator& rhs ) const { return _it == rhs._it; }
+                bool operator!=( const iterator& rhs ) const { return !operator==( rhs ); }
+                bool operator!=( const const_iterator& rhs ) const { return !operator==( rhs ); }
+
+            private:
+                friend class multidimensional_array< V, D >;
+                std::size_t _i{0};
+                typename std::vector< V >::iterator _it;
+                const_iterator( std::size_t i, typename std::vector< V >::iterator it ): _i( i ), _it( it ) {}
+        };
+
+        iterator begin() { return iterator( 0, _data.begin() ); }
+
+        const_iterator begin() const { return const_iterator( 0, _data.begin() ); }
+
+        iterator end() { return iterator( _data.size(), _data.end() ); }
+
+        const_iterator end() const { return const_iterator( _data.size(), _data.end() ); }
+
     private:
         index_type _size;
         std::vector< V > _data;
         std::size_t _index( const index_type& i );
 };
 
+
+
 namespace impl {
 
 template < unsigned int D, unsigned int I = D >
@@ -43,6 +95,8 @@ struct index
 {
     typedef std::array< std::size_t, D > index_type;
     static unsigned int value( const index_type& i, const index_type& size ) { return i[ I - 1 ] + index< D, I - 1 >::value( i, size ) * size[ I - 1 ]; }
+    static void value( std::size_t j, index_type& i, const index_type& size ) { i[ I - 1 ] = j % size[ I - 1 ]; index< D, I - 1 >::value( j / size[ I - 1 ], i, size ); }
+    static index_type value( std::size_t j, const index_type& size ) { index_type i; value( j, i, size ); return i; }
 };
 
 template < unsigned int D >
@@ -50,6 +104,7 @@ struct index< D, 1 >
 {
     typedef std::array< std::size_t, D > index_type;
     static unsigned int value( const index_type& i, const index_type& ) { return i[0]; }
+    static void value( std::size_t j, index_type& i, const index_type& size ) { i[0] = j; }
 };
 
 } // namespace impl {
@@ -57,4 +112,13 @@ struct index< D, 1 >
 template < typename V, unsigned int D >
 inline std::size_t multidimensional_array< V, D >::_index( const typename multidimensional_array< V, D >::index_type& i ) { return impl::index< D >::value( i, _size ); }
 
+template < typename V, unsigned int D >
+std::pair< typename multidimensional_array< V, D >::index_type, V& >&& multidimensional_array< V, D >::iterator::operator->() { return std::make_pair( impl::index< D >::value( _i, _size ), *_it ); }
+
+template < typename V, unsigned int D >
+std::pair< typename multidimensional_array< V, D >::index_type, const V& >&& multidimensional_array< V, D >::iterator::operator->() const { return std::make_pair( impl::index< D >::value( _i, _size ), *_it ); }
+
+template < typename V, unsigned int D >
+std::pair< typename multidimensional_array< V, D >::index_type, const V& >&& multidimensional_array< V, D >::const_iterator::operator->() const { return std::make_pair( impl::index< D >::value( _i, _size ), *_it ); }
+
 } // namespace comma {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 38b8e53af..52718180c 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -5,12 +5,10 @@
 
 TEST( multidimensional_array, usage )
 {
-    //comma::multidimensional_array< double, int, 3 > m( { 0, 0, 0 }, { 1, 2, 3 } );
-    //m.touch_at( { 1, 2, 3 } );
     // todo
 }
 
-TEST( multidimensional_array, impl_index )
+TEST( multidimensional_array, impl_index_value )
 {
     EXPECT_EQ( comma::impl::index< 2 >::value( {0, 0}, {1, 5} ), 0 );
     EXPECT_EQ( comma::impl::index< 2 >::value( {0, 1}, {1, 5} ), 1 );
@@ -25,3 +23,23 @@ TEST( multidimensional_array, impl_index )
     EXPECT_EQ( comma::impl::index< 3 >::value( {0, 1, 3}, {2, 3, 4} ), 7 );
     EXPECT_EQ( comma::impl::index< 3 >::value( {2, 1, 3}, {2, 3, 4} ), 3 + 4 * ( 1 + 3 * 2 ) );
 }
+
+TEST( multidimensional_array, impl_index_inverted_value )
+{
+    typedef std::array< std::size_t, 3 > array_t;
+    { array_t a{0, 0, 0}; EXPECT_EQ( comma::impl::index< 3 >::value( 0, {2, 3, 4} ), a ); }
+    { array_t a{0, 0, 1}; EXPECT_EQ( comma::impl::index< 3 >::value( 1, {2, 3, 4} ), a ); }
+    { array_t a{2, 1, 3}; EXPECT_EQ( comma::impl::index< 3 >::value( 3 + 4 * ( 1 + 3 * 2 ), {2, 3, 4} ), a ); }
+    // todo: way more tests
+}
+
+TEST( multidimensional_array, basics )
+{
+    {
+        comma::multidimensional_array< int, 3 > a( {2, 3, 4}, 0 );
+        unsigned int i = 0;
+        for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
+        EXPECT_EQ( a( {2, 1, 3} ), 3 + 4 * ( 1 + 3 * 2 ) );
+        // todo: more tests
+    }
+}

From c71812c43a0b3888bb26d08e70d7bad1f8eb820b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 1 Jun 2023 12:05:04 +1000
Subject: [PATCH 0591/1056] containers: multidimensional_array: a couple of
 bugs fixed; unit-testing: basics done

---
 containers/multidimensional_array.h           | 30 +++++----
 .../test/multidimensional_array_test.cpp      | 64 ++++++++++++++++---
 2 files changed, 72 insertions(+), 22 deletions(-)

diff --git a/containers/multidimensional_array.h b/containers/multidimensional_array.h
index 41a2e26b4..9f0451d30 100644
--- a/containers/multidimensional_array.h
+++ b/containers/multidimensional_array.h
@@ -20,7 +20,7 @@ class multidimensional_array
 
         const unsigned int dimensions{D};
 
-        multidimensional_array( const index_type& size, const V& default_value = V() ): _size( size ), _data( _index( _size ), default_value ) {}
+        multidimensional_array( const index_type& size, const V& default_value = V() ): _size( size ), _data( _product( _size ), default_value ) {}
 
         V& operator()( const index_type& i ) { return _data[ _index( i ) ]; }
 
@@ -36,11 +36,10 @@ class multidimensional_array
         {
             public:
                 iterator() = default;
-                std::pair< index_type, V& >&& operator->();
-                std::pair< index_type, const V& >&& operator->() const;
                 V& operator*() { return *_it; }
                 const V& operator*() const { return *_it; }
                 iterator& operator++() { ++_it; ++_i; return *this; }
+                index_type index() const;
                 bool operator==( const iterator& rhs ) const { return _it == rhs._it; }
                 bool operator==( const const_iterator& rhs ) const { return _it == rhs._it; }
                 bool operator!=( const iterator& rhs ) const { return !operator==( rhs ); }
@@ -50,16 +49,17 @@ class multidimensional_array
                 friend class multidimensional_array< V, D >;
                 std::size_t _i{0};
                 typename std::vector< V >::iterator _it;
-                iterator( std::size_t i, typename std::vector< V >::iterator it ): _i( i ), _it( it ) {}
+                index_type _size;
+                iterator( std::size_t i, typename std::vector< V >::iterator it, const index_type& size ): _i( i ), _it( it ), _size( size ) {}
         };
 
         class const_iterator
         {
             public:
                 const_iterator() = default;
-                std::pair< index_type, const V& >&& operator->() const;
                 const V& operator*() const { return *_it; }
                 const_iterator& operator++() { ++_it; ++_i; return *this; }
+                index_type index() const;
                 bool operator==( const iterator& rhs ) const { return _it == rhs._it; }
                 bool operator==( const const_iterator& rhs ) const { return _it == rhs._it; }
                 bool operator!=( const iterator& rhs ) const { return !operator==( rhs ); }
@@ -69,21 +69,23 @@ class multidimensional_array
                 friend class multidimensional_array< V, D >;
                 std::size_t _i{0};
                 typename std::vector< V >::iterator _it;
-                const_iterator( std::size_t i, typename std::vector< V >::iterator it ): _i( i ), _it( it ) {}
+                index_type _size;
+                const_iterator( std::size_t i, typename std::vector< V >::iterator it, const index_type& size ): _i( i ), _it( it ), _size( size ) {}
         };
 
-        iterator begin() { return iterator( 0, _data.begin() ); }
+        iterator begin() { return iterator( 0, _data.begin(), _size ); }
 
-        const_iterator begin() const { return const_iterator( 0, _data.begin() ); }
+        const_iterator begin() const { return const_iterator( 0, _data.begin(), _size ); }
 
-        iterator end() { return iterator( _data.size(), _data.end() ); }
+        iterator end() { return iterator( _data.size(), _data.end(), _size ); }
 
-        const_iterator end() const { return const_iterator( _data.size(), _data.end() ); }
+        const_iterator end() const { return const_iterator( _data.size(), _data.end(), _size ); }
 
     private:
         index_type _size;
         std::vector< V > _data;
         std::size_t _index( const index_type& i );
+        std::size_t _product( const index_type& i );
 };
 
 
@@ -97,6 +99,7 @@ struct index
     static unsigned int value( const index_type& i, const index_type& size ) { return i[ I - 1 ] + index< D, I - 1 >::value( i, size ) * size[ I - 1 ]; }
     static void value( std::size_t j, index_type& i, const index_type& size ) { i[ I - 1 ] = j % size[ I - 1 ]; index< D, I - 1 >::value( j / size[ I - 1 ], i, size ); }
     static index_type value( std::size_t j, const index_type& size ) { index_type i; value( j, i, size ); return i; }
+    static std::size_t product( const index_type& i ) { return i[ I - 1 ] * index< D, I - 1 >::product( i ); }
 };
 
 template < unsigned int D >
@@ -105,6 +108,7 @@ struct index< D, 1 >
     typedef std::array< std::size_t, D > index_type;
     static unsigned int value( const index_type& i, const index_type& ) { return i[0]; }
     static void value( std::size_t j, index_type& i, const index_type& size ) { i[0] = j; }
+    static std::size_t product( const index_type& i ) { return i[0]; }
 };
 
 } // namespace impl {
@@ -113,12 +117,12 @@ template < typename V, unsigned int D >
 inline std::size_t multidimensional_array< V, D >::_index( const typename multidimensional_array< V, D >::index_type& i ) { return impl::index< D >::value( i, _size ); }
 
 template < typename V, unsigned int D >
-std::pair< typename multidimensional_array< V, D >::index_type, V& >&& multidimensional_array< V, D >::iterator::operator->() { return std::make_pair( impl::index< D >::value( _i, _size ), *_it ); }
+inline std::size_t multidimensional_array< V, D >::_product( const typename multidimensional_array< V, D >::index_type& i ) { return impl::index< D >::product( i ); }
 
 template < typename V, unsigned int D >
-std::pair< typename multidimensional_array< V, D >::index_type, const V& >&& multidimensional_array< V, D >::iterator::operator->() const { return std::make_pair( impl::index< D >::value( _i, _size ), *_it ); }
+inline typename multidimensional_array< V, D >::index_type multidimensional_array< V, D >::iterator::index() const { return impl::index< D >::value( _i, _size ); }
 
 template < typename V, unsigned int D >
-std::pair< typename multidimensional_array< V, D >::index_type, const V& >&& multidimensional_array< V, D >::const_iterator::operator->() const { return std::make_pair( impl::index< D >::value( _i, _size ), *_it ); }
+inline typename multidimensional_array< V, D >::index_type multidimensional_array< V, D >::const_iterator::index() const { return impl::index< D >::value( _i, _size ); }
 
 } // namespace comma {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 52718180c..18a611d6e 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -3,11 +3,6 @@
 #include <gtest/gtest.h>
 #include "../multidimensional_array.h"
 
-TEST( multidimensional_array, usage )
-{
-    // todo
-}
-
 TEST( multidimensional_array, impl_index_value )
 {
     EXPECT_EQ( comma::impl::index< 2 >::value( {0, 0}, {1, 5} ), 0 );
@@ -21,7 +16,17 @@ TEST( multidimensional_array, impl_index_value )
     EXPECT_EQ( comma::impl::index< 3 >::value( {0, 0, 0}, {2, 3, 4} ), 0 );
     EXPECT_EQ( comma::impl::index< 3 >::value( {0, 0, 3}, {2, 3, 4} ), 3 );
     EXPECT_EQ( comma::impl::index< 3 >::value( {0, 1, 3}, {2, 3, 4} ), 7 );
-    EXPECT_EQ( comma::impl::index< 3 >::value( {2, 1, 3}, {2, 3, 4} ), 3 + 4 * ( 1 + 3 * 2 ) );
+    EXPECT_EQ( comma::impl::index< 3 >::value( {1, 2, 3}, {2, 3, 4} ), 3 + 4 * ( 2 + 3 * 1 ) );
+    EXPECT_EQ( comma::impl::index< 3 >::value( {1, 2, 4}, {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( comma::impl::index< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
+}
+
+TEST( multidimensional_array, impl_index_product )
+{
+    EXPECT_EQ( comma::impl::index< 1 >::product( {2} ), 2 );
+    EXPECT_EQ( comma::impl::index< 2 >::product( {2, 3} ), 6 );
+    EXPECT_EQ( comma::impl::index< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( comma::impl::index< 4 >::product( {2, 3, 4, 5} ), 2 * 3 * 4 * 5 );
 }
 
 TEST( multidimensional_array, impl_index_inverted_value )
@@ -33,13 +38,54 @@ TEST( multidimensional_array, impl_index_inverted_value )
     // todo: way more tests
 }
 
-TEST( multidimensional_array, basics )
+TEST( multidimensional_array, iteration )
 {
     {
+        typedef std::array< std::size_t, 3 > array_t;
         comma::multidimensional_array< int, 3 > a( {2, 3, 4}, 0 );
+        { array_t s{2, 3, 4}; EXPECT_EQ( a.size(), s ); EXPECT_EQ( a.data().size(), 2 * 3 * 4 ); }
         unsigned int i = 0;
         for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
-        EXPECT_EQ( a( {2, 1, 3} ), 3 + 4 * ( 1 + 3 * 2 ) );
-        // todo: more tests
+        auto it = a.begin();
+        { array_t a{0, 0, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 0 ); ++it; }
+        { array_t a{0, 0, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 1 ); ++it; }
+        { array_t a{0, 0, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 2 ); ++it; }
+        { array_t a{0, 0, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 3 ); ++it; }
+        { array_t a{0, 1, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 4 ); ++it; }
+        { array_t a{0, 1, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 5 ); ++it; }
+        { array_t a{0, 1, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 6 ); ++it; }
+        { array_t a{0, 1, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 7 ); ++it; }
+        { array_t a{0, 2, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 8 ); ++it; }
+        { array_t a{0, 2, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 9 ); ++it; }
+        { array_t a{0, 2, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 10 ); ++it; }
+        { array_t a{0, 2, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 11 ); ++it; }
+        { array_t a{1, 0, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 12 ); ++it; }
+        { array_t a{1, 0, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 13 ); ++it; }
+        { array_t a{1, 0, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 14 ); ++it; }
+        { array_t a{1, 0, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 15 ); ++it; }
+        { array_t a{1, 1, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 16 ); ++it; }
+        { array_t a{1, 1, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 17 ); ++it; }
+        { array_t a{1, 1, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 18 ); ++it; }
+        { array_t a{1, 1, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 19 ); ++it; }
+        { array_t a{1, 2, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 20 ); ++it; }
+        { array_t a{1, 2, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 21 ); ++it; }
+        { array_t a{1, 2, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 22 ); ++it; }
+        { array_t a{1, 2, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 23 ); ++it; }
+        EXPECT_TRUE( it == a.end() );
     }
 }
+
+TEST( multidimensional_array, access )
+{
+    {
+        comma::multidimensional_array< int, 3 > a( {2, 3, 4}, 0 );
+        unsigned int i = 0;
+        for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
+        EXPECT_EQ( a( {0, 0, 0} ), 0 );
+        EXPECT_EQ( a( {0, 1, 0} ), 4 );
+        EXPECT_EQ( a( {1, 2, 3} ), 23 );
+        a( {0, 0, 0} ) = 111; EXPECT_EQ( a( {0, 0, 0} ), 111 );
+        a( {1, 1, 2} ) = 222; EXPECT_EQ( a( {1, 1, 2} ), 222 );
+        a( {1, 2, 3} ) = 333; EXPECT_EQ( a( {1, 2, 3} ), 333 );
+    }
+}
\ No newline at end of file

From 0cdc31445de1619b75f0c0233d8c8b66fe4ea567 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 1 Jun 2023 12:17:57 +1000
Subject: [PATCH 0592/1056] containers: interpolated_multidimensional_array: in
 progress...

---
 containers/multidimensional_array.h | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)

diff --git a/containers/multidimensional_array.h b/containers/multidimensional_array.h
index 9f0451d30..cad8c8c9e 100644
--- a/containers/multidimensional_array.h
+++ b/containers/multidimensional_array.h
@@ -88,6 +88,33 @@ class multidimensional_array
         std::size_t _product( const index_type& i );
 };
 
+template < typename V, unsigned int D, typename P = std::array< double, D > >
+class interpolated_multidimensional_array: public multidimensional_array< V, D >
+{
+    public:
+        typedef P point_type;
+
+        typedef multidimensional_array< V, D > base_type;
+
+        typedef typename base_type::index_type index_type;
+
+        typedef typename base_type::value_type value_type;
+
+        interpolated_multidimensional_array( const P& origin, const P& resolution, const index_type& size, const V& default_value = V() );
+
+        index_type index_of( const point_type& p ) const;
+
+        V& operator()( const point_type& p ) { return operator()( index_of( p ) ); }
+
+        const V& operator()( const point_type& p ) const { return operator()( index_of( p ) ); }
+
+        V interpolated( const point_type& p ) const;
+
+    private:
+        point_type _origin;
+        point_type _resolution;
+        void _assert_valid( const point_type& p );
+};
 
 
 namespace impl {

From 2ec611dfcfdd56db078e3823f92dde283e908666 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 1 Jun 2023 14:00:07 +1000
Subject: [PATCH 0593/1056] containers: multidimensional_array: storage type
 added

---
 containers/multidimensional_array.h | 50 +++++++++++++++++------------
 1 file changed, 29 insertions(+), 21 deletions(-)

diff --git a/containers/multidimensional_array.h b/containers/multidimensional_array.h
index cad8c8c9e..0a8f9a4f9 100644
--- a/containers/multidimensional_array.h
+++ b/containers/multidimensional_array.h
@@ -10,7 +10,7 @@
 
 namespace comma {
 
-template < typename V, unsigned int D >
+template < typename V, unsigned int D, typename S = std::vector< V > >
 class multidimensional_array
 {
     public:
@@ -18,6 +18,8 @@ class multidimensional_array
 
         typedef V value_type;
 
+        typedef S storage_type;
+
         const unsigned int dimensions{D};
 
         multidimensional_array( const index_type& size, const V& default_value = V() ): _size( size ), _data( _product( _size ), default_value ) {}
@@ -26,7 +28,7 @@ class multidimensional_array
 
         const V& operator()( const index_type& i ) const { return _data[ _index( i ) ]; }
 
-        const std::vector< V >& data() const { return _data; }
+        const storage_type& data() const { return _data; }
 
         const index_type& size() const { return _size; }
 
@@ -46,11 +48,11 @@ class multidimensional_array
                 bool operator!=( const const_iterator& rhs ) const { return !operator==( rhs ); }
 
             private:
-                friend class multidimensional_array< V, D >;
+                friend class multidimensional_array< V, D, S >;
                 std::size_t _i{0};
-                typename std::vector< V >::iterator _it;
+                typename storage_type::iterator _it;
                 index_type _size;
-                iterator( std::size_t i, typename std::vector< V >::iterator it, const index_type& size ): _i( i ), _it( it ), _size( size ) {}
+                iterator( std::size_t i, typename storage_type::iterator it, const index_type& size ): _i( i ), _it( it ), _size( size ) {}
         };
 
         class const_iterator
@@ -66,11 +68,11 @@ class multidimensional_array
                 bool operator!=( const const_iterator& rhs ) const { return !operator==( rhs ); }
 
             private:
-                friend class multidimensional_array< V, D >;
+                friend class multidimensional_array< V, D, S >;
                 std::size_t _i{0};
-                typename std::vector< V >::iterator _it;
+                typename storage_type::iterator _it;
                 index_type _size;
-                const_iterator( std::size_t i, typename std::vector< V >::iterator it, const index_type& size ): _i( i ), _it( it ), _size( size ) {}
+                const_iterator( std::size_t i, typename storage_type::iterator it, const index_type& size ): _i( i ), _it( it ), _size( size ) {}
         };
 
         iterator begin() { return iterator( 0, _data.begin(), _size ); }
@@ -83,18 +85,20 @@ class multidimensional_array
 
     private:
         index_type _size;
-        std::vector< V > _data;
+        storage_type _data;
         std::size_t _index( const index_type& i );
         std::size_t _product( const index_type& i );
 };
 
-template < typename V, unsigned int D, typename P = std::array< double, D > >
-class interpolated_multidimensional_array: public multidimensional_array< V, D >
+// todo: slice
+
+template < typename V, unsigned int D, typename P = std::array< double, D >, typename S = std::vector< V > >
+class interpolated_multidimensional_array: public multidimensional_array< V, D, S >
 {
     public:
         typedef P point_type;
 
-        typedef multidimensional_array< V, D > base_type;
+        typedef multidimensional_array< V, D, S > base_type;
 
         typedef typename base_type::index_type index_type;
 
@@ -102,7 +106,11 @@ class interpolated_multidimensional_array: public multidimensional_array< V, D >
 
         interpolated_multidimensional_array( const P& origin, const P& resolution, const index_type& size, const V& default_value = V() );
 
-        index_type index_of( const point_type& p ) const;
+        index_type index_of( const point_type& p ) const; // p: 1.,2.,3. -> return: 23,22,21
+
+        /// q = index_as_point( p ); // p: 1.,2.,3. -> 21.,22.,23
+        /// index_of( p ) == index_of( origin + q * resolution );
+        point_type index_as_point( const point_type& p ) const; // p: 1.,2.,3. -> 21.,22.,23
 
         V& operator()( const point_type& p ) { return operator()( index_of( p ) ); }
 
@@ -140,16 +148,16 @@ struct index< D, 1 >
 
 } // namespace impl {
 
-template < typename V, unsigned int D >
-inline std::size_t multidimensional_array< V, D >::_index( const typename multidimensional_array< V, D >::index_type& i ) { return impl::index< D >::value( i, _size ); }
+template < typename V, unsigned int D, typename S >
+inline std::size_t multidimensional_array< V, D, S >::_index( const typename multidimensional_array< V, D, S >::index_type& i ) { return impl::index< D >::value( i, _size ); }
 
-template < typename V, unsigned int D >
-inline std::size_t multidimensional_array< V, D >::_product( const typename multidimensional_array< V, D >::index_type& i ) { return impl::index< D >::product( i ); }
+template < typename V, unsigned int D, typename S >
+inline std::size_t multidimensional_array< V, D, S >::_product( const typename multidimensional_array< V, D, S >::index_type& i ) { return impl::index< D >::product( i ); }
 
-template < typename V, unsigned int D >
-inline typename multidimensional_array< V, D >::index_type multidimensional_array< V, D >::iterator::index() const { return impl::index< D >::value( _i, _size ); }
+template < typename V, unsigned int D, typename S >
+inline typename multidimensional_array< V, D, S >::index_type multidimensional_array< V, D, S >::iterator::index() const { return impl::index< D >::value( _i, _size ); }
 
-template < typename V, unsigned int D >
-inline typename multidimensional_array< V, D >::index_type multidimensional_array< V, D >::const_iterator::index() const { return impl::index< D >::value( _i, _size ); }
+template < typename V, unsigned int D, typename S >
+inline typename multidimensional_array< V, D, S >::index_type multidimensional_array< V, D, S >::const_iterator::index() const { return impl::index< D >::value( _i, _size ); }
 
 } // namespace comma {

From ca88864cfb9f40b8112b14a1ad1f1d986bcee9e4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 2 Jun 2023 17:00:46 +1000
Subject: [PATCH 0594/1056] comma::containers::multidimensional: array, slice:
 first cut implemented

---
 containers/multidimensional_array.h           | 117 ++++++++++++------
 .../test/multidimensional_array_test.cpp      |  63 +++++-----
 2 files changed, 112 insertions(+), 68 deletions(-)

diff --git a/containers/multidimensional_array.h b/containers/multidimensional_array.h
index 0a8f9a4f9..60c2bd935 100644
--- a/containers/multidimensional_array.h
+++ b/containers/multidimensional_array.h
@@ -8,29 +8,27 @@
 #include "../base/types.h"
 #include "impl/array_traits.h"
 
-namespace comma {
+namespace comma { namespace containers { namespace multidimensional {
 
-template < typename V, unsigned int D, typename S = std::vector< V > >
-class multidimensional_array
+template < typename V, unsigned int D >
+class slice
 {
     public:
         typedef std::array< std::size_t, D > index_type;
 
         typedef V value_type;
 
-        typedef S storage_type;
-
         const unsigned int dimensions{D};
 
-        multidimensional_array( const index_type& size, const V& default_value = V() ): _size( size ), _data( _product( _size ), default_value ) {}
+        slice( const index_type& shape, V* data ): _shape( shape ), _size( _product( _shape ) ), _data( data ) {}
 
-        V& operator()( const index_type& i ) { return _data[ _index( i ) ]; }
+        V& operator[]( const index_type& i ) { return _data[ _index( i ) ]; }
 
-        const V& operator()( const index_type& i ) const { return _data[ _index( i ) ]; }
+        const V& operator[]( const index_type& i ) const { return _data[ _index( i ) ]; }
 
-        const storage_type& data() const { return _data; }
+        const V* data() const { return _data; }
 
-        const index_type& size() const { return _size; }
+        const index_type& shape() const { return _shape; }
 
         class const_iterator;
 
@@ -48,11 +46,11 @@ class multidimensional_array
                 bool operator!=( const const_iterator& rhs ) const { return !operator==( rhs ); }
 
             private:
-                friend class multidimensional_array< V, D, S >;
+                friend class slice< V, D >;
                 std::size_t _i{0};
-                typename storage_type::iterator _it;
-                index_type _size;
-                iterator( std::size_t i, typename storage_type::iterator it, const index_type& size ): _i( i ), _it( it ), _size( size ) {}
+                V* _it{nullptr};
+                index_type _shape;
+                iterator( std::size_t i, V* it, const index_type& shape ): _i( i ), _it( it ), _shape( shape ) {}
         };
 
         class const_iterator
@@ -68,43 +66,84 @@ class multidimensional_array
                 bool operator!=( const const_iterator& rhs ) const { return !operator==( rhs ); }
 
             private:
-                friend class multidimensional_array< V, D, S >;
+                friend class slice< V, D >;
                 std::size_t _i{0};
-                typename storage_type::iterator _it;
-                index_type _size;
-                const_iterator( std::size_t i, typename storage_type::iterator it, const index_type& size ): _i( i ), _it( it ), _size( size ) {}
+                const V* _it{nullptr};
+                index_type _shape;
+                const_iterator( std::size_t i, V* it, const index_type& shape ): _i( i ), _it( it ), _shape( shape ) {}
         };
 
-        iterator begin() { return iterator( 0, _data.begin(), _size ); }
+        iterator begin() { return iterator( 0, _data, _shape ); }
 
-        const_iterator begin() const { return const_iterator( 0, _data.begin(), _size ); }
+        const_iterator begin() const { return const_iterator( 0, _data, _shape ); }
 
-        iterator end() { return iterator( _data.size(), _data.end(), _size ); }
+        iterator end() { return iterator( _size, _data + _size, _shape ); }
 
-        const_iterator end() const { return const_iterator( _data.size(), _data.end(), _size ); }
+        const_iterator end() const { return const_iterator( _size, _data + _size, _shape ); }
 
     private:
-        index_type _size;
-        storage_type _data;
+        index_type _shape;
+        std::size_t _size;
+        V* _data;
         std::size_t _index( const index_type& i );
-        std::size_t _product( const index_type& i );
+        static std::size_t _product( const index_type& i );
 };
 
-// todo: slice
+
+template < typename V, unsigned int D, typename S = std::vector< V > >
+class array
+{
+    public:
+        typedef slice< V, D > slice_type;
+
+        typedef typename slice_type::index_type index_type;
+
+        typedef V value_type;
+
+        typedef S storage_type;
+
+        const unsigned int dimensions{D};
+
+        array( const index_type& shape, const V& default_value = V() );
+
+        V& operator[]( const index_type& i ) { return _slice[i]; }
+
+        const V& operator[]( const index_type& i ) const { return _slice[i]; }
+
+        const storage_type& data() const { return _data; }
+
+        const index_type& shape() const { return _slice.shape(); }
+
+        typedef typename slice_type::iterator iterator;
+
+        typedef typename slice_type::const_iterator const_iterator;
+
+        iterator begin() { return _slice.begin(); }
+
+        const_iterator begin() const { return _slice.begin(); }
+
+        iterator end() { return _slice.end(); }
+
+        const_iterator end() const { return _slice.end(); }
+
+    private:
+        storage_type _data;
+        slice_type _slice;
+};
 
 template < typename V, unsigned int D, typename P = std::array< double, D >, typename S = std::vector< V > >
-class interpolated_multidimensional_array: public multidimensional_array< V, D, S >
+class interpolated_array: public array< V, D, S >
 {
     public:
         typedef P point_type;
 
-        typedef multidimensional_array< V, D, S > base_type;
+        typedef array< V, D, S > base_type;
 
         typedef typename base_type::index_type index_type;
 
         typedef typename base_type::value_type value_type;
 
-        interpolated_multidimensional_array( const P& origin, const P& resolution, const index_type& size, const V& default_value = V() );
+        interpolated_array( const P& origin, const P& resolution, const index_type& size, const V& default_value = V() );
 
         index_type index_of( const point_type& p ) const; // p: 1.,2.,3. -> return: 23,22,21
 
@@ -124,7 +163,6 @@ class interpolated_multidimensional_array: public multidimensional_array< V, D,
         void _assert_valid( const point_type& p );
 };
 
-
 namespace impl {
 
 template < unsigned int D, unsigned int I = D >
@@ -148,16 +186,19 @@ struct index< D, 1 >
 
 } // namespace impl {
 
-template < typename V, unsigned int D, typename S >
-inline std::size_t multidimensional_array< V, D, S >::_index( const typename multidimensional_array< V, D, S >::index_type& i ) { return impl::index< D >::value( i, _size ); }
+template < typename V, unsigned int D >
+inline std::size_t slice< V, D >::_index( const typename slice< V, D >::index_type& i ) { return impl::index< D >::value( i, _shape ); }
 
-template < typename V, unsigned int D, typename S >
-inline std::size_t multidimensional_array< V, D, S >::_product( const typename multidimensional_array< V, D, S >::index_type& i ) { return impl::index< D >::product( i ); }
+template < typename V, unsigned int D >
+inline std::size_t slice< V, D >::_product( const typename slice< V, D >::index_type& i ) { return impl::index< D >::product( i ); }
 
-template < typename V, unsigned int D, typename S >
-inline typename multidimensional_array< V, D, S >::index_type multidimensional_array< V, D, S >::iterator::index() const { return impl::index< D >::value( _i, _size ); }
+template < typename V, unsigned int D >
+inline typename slice< V, D >::index_type slice< V, D >::iterator::index() const { return impl::index< D >::value( _i, _shape ); }
+
+template < typename V, unsigned int D >
+inline typename slice< V, D >::index_type slice< V, D >::const_iterator::index() const { return impl::index< D >::value( _i, _shape ); }
 
 template < typename V, unsigned int D, typename S >
-inline typename multidimensional_array< V, D, S >::index_type multidimensional_array< V, D, S >::const_iterator::index() const { return impl::index< D >::value( _i, _size ); }
+array< V, D, S >::array( const index_type& shape, const V& default_value ): _data( impl::index< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
 
-} // namespace comma {
+} } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 18a611d6e..ed24dc53d 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -3,38 +3,40 @@
 #include <gtest/gtest.h>
 #include "../multidimensional_array.h"
 
+namespace cmd = comma::containers::multidimensional; 
+
 TEST( multidimensional_array, impl_index_value )
 {
-    EXPECT_EQ( comma::impl::index< 2 >::value( {0, 0}, {1, 5} ), 0 );
-    EXPECT_EQ( comma::impl::index< 2 >::value( {0, 1}, {1, 5} ), 1 );
-    EXPECT_EQ( comma::impl::index< 2 >::value( {0, 4}, {1, 5} ), 4 );
-    EXPECT_EQ( comma::impl::index< 2 >::value( {1, 0}, {1, 5} ), 5 );
-    EXPECT_EQ( comma::impl::index< 2 >::value( {1, 1}, {2, 5} ), 6 );
-    EXPECT_EQ( comma::impl::index< 2 >::value( {1, 2}, {2, 5} ), 7 );
-    EXPECT_EQ( comma::impl::index< 2 >::value( {1, 2}, {3, 5} ), 7 );
-    EXPECT_EQ( comma::impl::index< 2 >::value( {2, 2}, {3, 5} ), 12 );
-    EXPECT_EQ( comma::impl::index< 3 >::value( {0, 0, 0}, {2, 3, 4} ), 0 );
-    EXPECT_EQ( comma::impl::index< 3 >::value( {0, 0, 3}, {2, 3, 4} ), 3 );
-    EXPECT_EQ( comma::impl::index< 3 >::value( {0, 1, 3}, {2, 3, 4} ), 7 );
-    EXPECT_EQ( comma::impl::index< 3 >::value( {1, 2, 3}, {2, 3, 4} ), 3 + 4 * ( 2 + 3 * 1 ) );
-    EXPECT_EQ( comma::impl::index< 3 >::value( {1, 2, 4}, {2, 3, 4} ), 2 * 3 * 4 );
-    EXPECT_EQ( comma::impl::index< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( cmd::impl::index< 2 >::value( {0, 0}, {1, 5} ), 0 );
+    EXPECT_EQ( cmd::impl::index< 2 >::value( {0, 1}, {1, 5} ), 1 );
+    EXPECT_EQ( cmd::impl::index< 2 >::value( {0, 4}, {1, 5} ), 4 );
+    EXPECT_EQ( cmd::impl::index< 2 >::value( {1, 0}, {1, 5} ), 5 );
+    EXPECT_EQ( cmd::impl::index< 2 >::value( {1, 1}, {2, 5} ), 6 );
+    EXPECT_EQ( cmd::impl::index< 2 >::value( {1, 2}, {2, 5} ), 7 );
+    EXPECT_EQ( cmd::impl::index< 2 >::value( {1, 2}, {3, 5} ), 7 );
+    EXPECT_EQ( cmd::impl::index< 2 >::value( {2, 2}, {3, 5} ), 12 );
+    EXPECT_EQ( cmd::impl::index< 3 >::value( {0, 0, 0}, {2, 3, 4} ), 0 );
+    EXPECT_EQ( cmd::impl::index< 3 >::value( {0, 0, 3}, {2, 3, 4} ), 3 );
+    EXPECT_EQ( cmd::impl::index< 3 >::value( {0, 1, 3}, {2, 3, 4} ), 7 );
+    EXPECT_EQ( cmd::impl::index< 3 >::value( {1, 2, 3}, {2, 3, 4} ), 3 + 4 * ( 2 + 3 * 1 ) );
+    EXPECT_EQ( cmd::impl::index< 3 >::value( {1, 2, 4}, {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( cmd::impl::index< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
 }
 
 TEST( multidimensional_array, impl_index_product )
 {
-    EXPECT_EQ( comma::impl::index< 1 >::product( {2} ), 2 );
-    EXPECT_EQ( comma::impl::index< 2 >::product( {2, 3} ), 6 );
-    EXPECT_EQ( comma::impl::index< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
-    EXPECT_EQ( comma::impl::index< 4 >::product( {2, 3, 4, 5} ), 2 * 3 * 4 * 5 );
+    EXPECT_EQ( cmd::impl::index< 1 >::product( {2} ), 2 );
+    EXPECT_EQ( cmd::impl::index< 2 >::product( {2, 3} ), 6 );
+    EXPECT_EQ( cmd::impl::index< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( cmd::impl::index< 4 >::product( {2, 3, 4, 5} ), 2 * 3 * 4 * 5 );
 }
 
 TEST( multidimensional_array, impl_index_inverted_value )
 {
     typedef std::array< std::size_t, 3 > array_t;
-    { array_t a{0, 0, 0}; EXPECT_EQ( comma::impl::index< 3 >::value( 0, {2, 3, 4} ), a ); }
-    { array_t a{0, 0, 1}; EXPECT_EQ( comma::impl::index< 3 >::value( 1, {2, 3, 4} ), a ); }
-    { array_t a{2, 1, 3}; EXPECT_EQ( comma::impl::index< 3 >::value( 3 + 4 * ( 1 + 3 * 2 ), {2, 3, 4} ), a ); }
+    { array_t a{0, 0, 0}; EXPECT_EQ( cmd::impl::index< 3 >::value( 0, {2, 3, 4} ), a ); }
+    { array_t a{0, 0, 1}; EXPECT_EQ( cmd::impl::index< 3 >::value( 1, {2, 3, 4} ), a ); }
+    { array_t a{2, 1, 3}; EXPECT_EQ( cmd::impl::index< 3 >::value( 3 + 4 * ( 1 + 3 * 2 ), {2, 3, 4} ), a ); }
     // todo: way more tests
 }
 
@@ -42,8 +44,8 @@ TEST( multidimensional_array, iteration )
 {
     {
         typedef std::array< std::size_t, 3 > array_t;
-        comma::multidimensional_array< int, 3 > a( {2, 3, 4}, 0 );
-        { array_t s{2, 3, 4}; EXPECT_EQ( a.size(), s ); EXPECT_EQ( a.data().size(), 2 * 3 * 4 ); }
+        comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
+        { array_t s{2, 3, 4}; EXPECT_EQ( a.shape(), s ); EXPECT_EQ( a.data().size(), 2 * 3 * 4 ); }
         unsigned int i = 0;
         for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
         auto it = a.begin();
@@ -78,14 +80,15 @@ TEST( multidimensional_array, iteration )
 TEST( multidimensional_array, access )
 {
     {
-        comma::multidimensional_array< int, 3 > a( {2, 3, 4}, 0 );
+        comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
         unsigned int i = 0;
         for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
-        EXPECT_EQ( a( {0, 0, 0} ), 0 );
-        EXPECT_EQ( a( {0, 1, 0} ), 4 );
-        EXPECT_EQ( a( {1, 2, 3} ), 23 );
-        a( {0, 0, 0} ) = 111; EXPECT_EQ( a( {0, 0, 0} ), 111 );
-        a( {1, 1, 2} ) = 222; EXPECT_EQ( a( {1, 1, 2} ), 222 );
-        a( {1, 2, 3} ) = 333; EXPECT_EQ( a( {1, 2, 3} ), 333 );
+        typedef comma::containers::multidimensional::array< int, 3 >::index_type index_t;
+        { index_t i{0, 0, 0}; EXPECT_EQ( a[i], 0 ); }
+        { index_t i{0, 1, 0}; EXPECT_EQ( a[i], 4 ); }
+        { index_t i{1, 2, 3}; EXPECT_EQ( a[i], 23 ); }
+        { index_t i{0, 0, 0}; a[{0, 0, 0}] = 111; EXPECT_EQ( a[i], 111 ); }
+        { index_t i{1, 1, 2}; a[{1, 1, 2}] = 222; EXPECT_EQ( a[i], 222 ); }
+        { index_t i{1, 2, 3}; a[{1, 2, 3}] = 333; EXPECT_EQ( a[i], 333 ); }
     }
 }
\ No newline at end of file

From 4fa6a4eab2ddf9631bdfc6685afea42fe8ba15a5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 2 Jun 2023 18:43:50 +1000
Subject: [PATCH 0595/1056] comma::containers::multidimensional::array[] on
 slices: first cut implemented, but looking pretty ugly due to templating;
 tested, but trying to add better usage semantics

---
 containers/multidimensional_array.h           | 61 ++++++++++++--
 .../test/multidimensional_array_test.cpp      | 79 ++++++++++++++++++-
 2 files changed, 133 insertions(+), 7 deletions(-)

diff --git a/containers/multidimensional_array.h b/containers/multidimensional_array.h
index 60c2bd935..afb6fcf32 100644
--- a/containers/multidimensional_array.h
+++ b/containers/multidimensional_array.h
@@ -18,14 +18,28 @@ class slice
 
         typedef V value_type;
 
-        const unsigned int dimensions{D};
+        static const unsigned int dimensions{D};
 
         slice( const index_type& shape, V* data ): _shape( shape ), _size( _product( _shape ) ), _data( data ) {}
 
+        slice& operator=( const slice& rhs ) = default;
+
         V& operator[]( const index_type& i ) { return _data[ _index( i ) ]; }
 
         const V& operator[]( const index_type& i ) const { return _data[ _index( i ) ]; }
 
+        template < unsigned int I >
+        slice< V, D - I > operator[]( const std::array< std::size_t, I >& i );
+
+        template < unsigned int I >
+        const slice< V, D - I > operator[]( const std::array< std::size_t, I >& i ) const;
+
+        slice< V, D - 1 > operator[]( std::size_t i ) { return operator[]< 1 >( std::array< std::size_t, 1 >{i} ); }
+
+        const slice< V, D - 1 > operator[]( std::size_t i ) const { return operator[]< 1 >( std::array< std::size_t, 1 >{i} ); }
+
+        V* data() { return _data; }
+        
         const V* data() const { return _data; }
 
         const index_type& shape() const { return _shape; }
@@ -110,6 +124,18 @@ class array
 
         const V& operator[]( const index_type& i ) const { return _slice[i]; }
 
+        multidimensional::slice< V, D - 1 > operator[]( std::size_t i ) { return _slice[i]; }
+
+        template < unsigned int I >
+        multidimensional::slice< V, D - I > operator[]( const std::array< std::size_t, I >& i ) { return _slice.template operator[]< I >( i ); }
+
+        const multidimensional::slice< V, D - 1 > operator[]( std::size_t i ) const { return _slice[i]; }
+
+        template < unsigned int I >
+        const multidimensional::slice< V, D - I > operator[]( const std::array< std::size_t, I >& i ) const { return _slice.template operator[]< I >( i ); }
+
+        storage_type& data() { return _data; }
+
         const storage_type& data() const { return _data; }
 
         const index_type& shape() const { return _slice.shape(); }
@@ -169,10 +195,19 @@ template < unsigned int D, unsigned int I = D >
 struct index
 {
     typedef std::array< std::size_t, D > index_type;
-    static unsigned int value( const index_type& i, const index_type& size ) { return i[ I - 1 ] + index< D, I - 1 >::value( i, size ) * size[ I - 1 ]; }
-    static void value( std::size_t j, index_type& i, const index_type& size ) { i[ I - 1 ] = j % size[ I - 1 ]; index< D, I - 1 >::value( j / size[ I - 1 ], i, size ); }
-    static index_type value( std::size_t j, const index_type& size ) { index_type i; value( j, i, size ); return i; }
+    static unsigned int value( const index_type& i, const index_type& shape ) { return i[ I - 1 ] + index< D, I - 1 >::value( i, shape ) * shape[ I - 1 ]; }
+    static void value( std::size_t j, index_type& i, const index_type& shape ) { i[ I - 1 ] = j % shape[ I - 1 ]; index< D, I - 1 >::value( j / shape[ I - 1 ], i, shape ); }
+    static index_type value( std::size_t j, const index_type& shape ) { index_type i; value( j, i, shape ); return i; }
     static std::size_t product( const index_type& i ) { return i[ I - 1 ] * index< D, I - 1 >::product( i ); }
+    template < unsigned int J >
+    static std::pair< std::array< std::size_t, J >, std::array< std::size_t, D - J > > split( const index_type& i ) // todo: use metaprogramming, kinda same as product
+    {
+        std::pair< std::array< std::size_t, J >, std::array< std::size_t, D - J > > p;
+        unsigned int k = 0;
+        for( unsigned int n = 0; n < J; ++n, ++k ) { p.first[n] = i[k]; }
+        for( unsigned int n = 0; n < D - J; ++n, ++k ) { p.second[n] = i[k]; }
+        return p;
+    }
 };
 
 template < unsigned int D >
@@ -198,7 +233,23 @@ inline typename slice< V, D >::index_type slice< V, D >::iterator::index() const
 template < typename V, unsigned int D >
 inline typename slice< V, D >::index_type slice< V, D >::const_iterator::index() const { return impl::index< D >::value( _i, _shape ); }
 
+template < typename V, unsigned int D >
+template < unsigned int I >
+inline slice< V, D - I > slice< V, D >::operator[]( const std::array< std::size_t, I >& i )
+{
+    auto s = impl::index< D >::template split< I >( _shape );
+    return slice< V, D - I >( s.second, _data + impl::index< I >::value( i, s.first ) * impl::index< D - I >::product( s.second ) );
+}
+
+template < typename V, unsigned int D >
+template < unsigned int I >
+inline const slice< V, D - I > slice< V, D >::operator[]( const std::array< std::size_t, I >& i ) const
+{
+    auto s = impl::index< D >::template split< I >( _shape );
+    return slice< V, D - I >( s.second, _data + impl::index< I >::value( i, s.first ) * impl::index< D - I >::product( s.second ) );
+}
+
 template < typename V, unsigned int D, typename S >
-array< V, D, S >::array( const index_type& shape, const V& default_value ): _data( impl::index< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
+inline array< V, D, S >::array( const index_type& shape, const V& default_value ): _data( impl::index< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
 
 } } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index ed24dc53d..069c69c08 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -48,6 +48,8 @@ TEST( multidimensional_array, iteration )
         { array_t s{2, 3, 4}; EXPECT_EQ( a.shape(), s ); EXPECT_EQ( a.data().size(), 2 * 3 * 4 ); }
         unsigned int i = 0;
         for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
+        i = 0;
+        for( auto it = a.data().begin(); it != a.data().end(); ++it ) { EXPECT_EQ( *it, i++ ); }
         auto it = a.begin();
         { array_t a{0, 0, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 0 ); ++it; }
         { array_t a{0, 0, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 1 ); ++it; }
@@ -77,7 +79,7 @@ TEST( multidimensional_array, iteration )
     }
 }
 
-TEST( multidimensional_array, access )
+TEST( multidimensional_array, array )
 {
     {
         comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
@@ -91,4 +93,77 @@ TEST( multidimensional_array, access )
         { index_t i{1, 1, 2}; a[{1, 1, 2}] = 222; EXPECT_EQ( a[i], 222 ); }
         { index_t i{1, 2, 3}; a[{1, 2, 3}] = 333; EXPECT_EQ( a[i], 333 ); }
     }
-}
\ No newline at end of file
+}
+
+TEST( multidimensional_array, slice )
+{
+    {
+        comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
+        unsigned int i = 0;
+        for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
+        {
+            typedef comma::containers::multidimensional::array< int, 2 >::index_type index_t;
+            comma::containers::multidimensional::slice< int, 2 > s = a[0];
+            { index_t i{0, 0}; EXPECT_EQ( s[i], 0 ); }
+            { index_t i{0, 1}; EXPECT_EQ( s[i], 1 ); }
+            { index_t i{0, 2}; EXPECT_EQ( s[i], 2 ); }
+            { index_t i{0, 3}; EXPECT_EQ( s[i], 3 ); }
+            { index_t i{1, 0}; EXPECT_EQ( s[i], 4 ); }
+            { index_t i{1, 1}; EXPECT_EQ( s[i], 5 ); }
+            { index_t i{1, 2}; EXPECT_EQ( s[i], 6 ); }
+            { index_t i{1, 3}; EXPECT_EQ( s[i], 7 ); }
+            { index_t i{2, 0}; EXPECT_EQ( s[i], 8 ); }
+            { index_t i{2, 1}; EXPECT_EQ( s[i], 9 ); }
+            { index_t i{2, 2}; EXPECT_EQ( s[i], 10 ); }
+            { index_t i{2, 3}; EXPECT_EQ( s[i], 11 ); }
+            s = a[1];
+            { index_t i{0, 0}; EXPECT_EQ( s[i], 12 ); }
+            { index_t i{0, 1}; EXPECT_EQ( s[i], 13 ); }
+            { index_t i{0, 2}; EXPECT_EQ( s[i], 14 ); }
+            { index_t i{0, 3}; EXPECT_EQ( s[i], 15 ); }
+            { index_t i{1, 0}; EXPECT_EQ( s[i], 16 ); }
+            { index_t i{1, 1}; EXPECT_EQ( s[i], 17 ); }
+            { index_t i{1, 2}; EXPECT_EQ( s[i], 18 ); }
+            { index_t i{1, 3}; EXPECT_EQ( s[i], 19 ); }
+            { index_t i{2, 0}; EXPECT_EQ( s[i], 20 ); }
+            { index_t i{2, 1}; EXPECT_EQ( s[i], 21 ); }
+            { index_t i{2, 2}; EXPECT_EQ( s[i], 22 ); }
+            { index_t i{2, 3}; EXPECT_EQ( s[i], 23 ); }
+        }
+        {
+            typedef comma::containers::multidimensional::array< int, 1 >::index_type index_t;
+            {
+                comma::containers::multidimensional::slice< int, 1 > s = a.operator[]<2>( {0, 0} ); // todo! super-ugly! improve templating on operator (use impl for now)!
+                { index_t i{0}; EXPECT_EQ( s[i], 0 ); } // todo: improve usage on 1-dimensional slices
+                { index_t i{1}; EXPECT_EQ( s[i], 1 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 2 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 3 ); }
+                s = a.operator[]<2>( {0, 1} );
+                { index_t i{0}; EXPECT_EQ( s[i], 4 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 5 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 6 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 7 ); }
+                s = a.operator[]<2>( {0, 2} );
+                { index_t i{0}; EXPECT_EQ( s[i], 8 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 9 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 10 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 11 ); }
+                s = a.operator[]<2>( {1, 0} );
+                { index_t i{0}; EXPECT_EQ( s[i], 12 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 13 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 14 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 15 ); }
+                s = a.operator[]<2>( {1, 1} );
+                { index_t i{0}; EXPECT_EQ( s[i], 16 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 17 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 18 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 19 ); }
+                s = a.operator[]<2>( {1, 2} );
+                { index_t i{0}; EXPECT_EQ( s[i], 20 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 21 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 22 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 23 ); }
+            }
+        }
+    }
+}

From e3881352bb224a27d26508667ecf757a2d396d79 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 2 Jun 2023 18:54:24 +1000
Subject: [PATCH 0596/1056] comma::containers::multidimensional::array[] on
 slices: more tests added; todo! better usage semantics!

---
 .../test/multidimensional_array_test.cpp      | 23 ++++++++++++++++---
 1 file changed, 20 insertions(+), 3 deletions(-)

diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 069c69c08..1a1aa6dea 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -98,10 +98,10 @@ TEST( multidimensional_array, array )
 TEST( multidimensional_array, slice )
 {
     {
-        comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
-        unsigned int i = 0;
-        for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
         {
+            comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
+            unsigned int i = 0;
+            for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
             typedef comma::containers::multidimensional::array< int, 2 >::index_type index_t;
             comma::containers::multidimensional::slice< int, 2 > s = a[0];
             { index_t i{0, 0}; EXPECT_EQ( s[i], 0 ); }
@@ -116,6 +116,19 @@ TEST( multidimensional_array, slice )
             { index_t i{2, 1}; EXPECT_EQ( s[i], 9 ); }
             { index_t i{2, 2}; EXPECT_EQ( s[i], 10 ); }
             { index_t i{2, 3}; EXPECT_EQ( s[i], 11 ); }
+            {
+                auto t = s[0];
+                typedef comma::containers::multidimensional::array< int, 1 >::index_type index_t;
+                { index_t i{0}; EXPECT_EQ( t[i], 0 ); }
+                { index_t i{1}; EXPECT_EQ( t[i], 1 ); }
+                { index_t i{2}; EXPECT_EQ( t[i], 2 ); }
+                { index_t i{3}; EXPECT_EQ( t[i], 3 ); }
+                t = s[1];
+                { index_t i{0}; EXPECT_EQ( t[i], 4 ); }
+                { index_t i{1}; EXPECT_EQ( t[i], 5 ); }
+                { index_t i{2}; EXPECT_EQ( t[i], 6 ); }
+                { index_t i{3}; EXPECT_EQ( t[i], 7 ); }
+            }
             s = a[1];
             { index_t i{0, 0}; EXPECT_EQ( s[i], 12 ); }
             { index_t i{0, 1}; EXPECT_EQ( s[i], 13 ); }
@@ -129,8 +142,12 @@ TEST( multidimensional_array, slice )
             { index_t i{2, 1}; EXPECT_EQ( s[i], 21 ); }
             { index_t i{2, 2}; EXPECT_EQ( s[i], 22 ); }
             { index_t i{2, 3}; EXPECT_EQ( s[i], 23 ); }
+            { s[{1, 3}] = 111; std::array< std::size_t, 3 > i{1, 1, 3}; EXPECT_EQ( a[i], 111 ); }
         }
         {
+            comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
+            unsigned int i = 0;
+            for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
             typedef comma::containers::multidimensional::array< int, 1 >::index_type index_t;
             {
                 comma::containers::multidimensional::slice< int, 1 > s = a.operator[]<2>( {0, 0} ); // todo! super-ugly! improve templating on operator (use impl for now)!

From 83adc6ba259184f3cab363401e330b7390daa151 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 5 Jun 2023 18:08:32 +1000
Subject: [PATCH 0597/1056] string/choice.h: explicit call to Base::operator=()
 in operator=()

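without the explicit Base:: qualification, the unqualified operator=( rhs )
call inside choice::operator=( const std::string& ) resolves to that same
overload, so the method calls itself without bound; this showed up as a
segfault when built with g++ 7.5.0 (Ubuntu 18.04 version)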
---
 string/choice.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/string/choice.h b/string/choice.h
index 6cc1885ad..35fff959f 100644
--- a/string/choice.h
+++ b/string/choice.h
@@ -14,7 +14,7 @@ struct choice: public Base
     typedef Base base_t;
     choice( typename Derived::values rhs = static_cast< typename Derived::values >( 0 ) ): Base( Derived::choices()[rhs] ) {}
     choice( const std::string& rhs ) { operator=( rhs ); }
-    choice& operator=( const std::string& rhs ) { assert_valid( rhs ); operator=( rhs ); return *this; }
+    choice& operator=( const std::string& rhs ) { assert_valid( rhs ); Base::operator=( rhs ); return *this; }
     typename Derived::values to_enum() const;
     static bool valid( const std::string& rhs );
     static void assert_valid( const std::string& rhs );

From 3a7ba26bb57133c8616740a311088306dc59cbb5 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Mon, 5 Jun 2023 19:29:18 +1000
Subject: [PATCH 0598/1056] comma-test-run: capture stderr as well as stdout
 from comma-test-match

Not capturing stderr led to errors in the util/test/test_run/expectations tests

This reverts part of commit e9c9674f
---
 util/applications/comma-test-run | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 5de520f24..77b377273 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -628,7 +628,7 @@ function run_and_match_test()
             local is_global=$2
             if [[ -f "$expected" ]] ; then
                 (( options_verbose )) && message_ "$name: match expectations in '$expected'"
-                match_output=$( [[ -n "$match_output" ]] && echo "$match_output"; comma-test-match "$expected" <'output/stdout.log' )
+                match_output=$( [[ -n "$match_output" ]] && echo "$match_output"; comma-test-match "$expected" <'output/stdout.log' 2>&1 )
             elif [[ -d "$expected" ]] ; then
                 local extras=$( find "$expected" -type f )
                 for extra in $extras ; do

From 189c45120e1b5c3e0587b2cba095e0f12d49b20f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 Jun 2023 13:45:32 +1000
Subject: [PATCH 0599/1056] containers/multidimensional: containers refactored

---
 containers/CMakeLists.txt                     |  4 +-
 .../array.h}                                  |  4 +-
 .../map.h}                                    | 42 +++++++++----------
 .../test/multidimensional_array_test.cpp      |  2 +-
 ...test.cpp => multidimensional_map_test.cpp} | 12 +++---
 5 files changed, 33 insertions(+), 31 deletions(-)
 rename containers/{multidimensional_array.h => multidimensional/array.h} (99%)
 rename containers/{multikey_map.h => multidimensional/map.h} (63%)
 rename containers/test/{multikey_map_test.cpp => multidimensional_map_test.cpp} (91%)

diff --git a/containers/CMakeLists.txt b/containers/CMakeLists.txt
index b1bd83b03..698846fec 100644
--- a/containers/CMakeLists.txt
+++ b/containers/CMakeLists.txt
@@ -4,8 +4,9 @@ SET( TARGET_NAME comma${PROJECT} )
 FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
 FILE( GLOB impl_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/impl/*.h )
+FILE( GLOB multidimensional_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/multidimensional/*.h )
 
-SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} )
+SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} ${multidimensional_includes} )
 
 add_custom_target( ${TARGET_NAME} ${source} ${includes} ${impl_includes} ) # ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_includes} )
 #SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
@@ -13,6 +14,7 @@ add_custom_target( ${TARGET_NAME} ${source} ${includes} ${impl_includes} ) # ADD
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
+INSTALL( FILES ${multidimensional_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/multidimensional )
 #INSTALL(
 #    TARGETS ${TARGET_NAME}
 #    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
diff --git a/containers/multidimensional_array.h b/containers/multidimensional/array.h
similarity index 99%
rename from containers/multidimensional_array.h
rename to containers/multidimensional/array.h
index afb6fcf32..fa5281839 100644
--- a/containers/multidimensional_array.h
+++ b/containers/multidimensional/array.h
@@ -5,8 +5,8 @@
 #pragma once
 
 #include <array>
-#include "../base/types.h"
-#include "impl/array_traits.h"
+#include "../../base/types.h"
+#include "../impl/array_traits.h"
 
 namespace comma { namespace containers { namespace multidimensional {
 
diff --git a/containers/multikey_map.h b/containers/multidimensional/map.h
similarity index 63%
rename from containers/multikey_map.h
rename to containers/multidimensional/map.h
index c69926ec5..889c90f27 100644
--- a/containers/multikey_map.h
+++ b/containers/multidimensional/map.h
@@ -7,10 +7,10 @@
 #include <array>
 #include <unordered_map>
 #include <boost/functional/hash.hpp>
-#include "../base/types.h"
-#include "impl/array_traits.h"
+#include "../../base/types.h"
+#include "../impl/array_traits.h"
 
-namespace comma {
+namespace comma { namespace containers { namespace multidimensional {
 
 /// quick and dirty hash for array-like containers (its support is awkward in boost)
 template < typename Array, std::size_t Size >
@@ -27,10 +27,10 @@ struct array_hash : public std::unary_function< Array, std::size_t >
 
 /// unordered map with array-like keys
 template < typename K, typename V, unsigned int Size, typename P = std::array< K, Size >, typename Traits = impl::array_traits< P > >
-class multikey_map : public std::unordered_map< std::array< comma::int32, Size >, V, comma::array_hash< std::array< comma::int32, Size >, Size > >
+class map : public std::unordered_map< std::array< comma::int32, Size >, V, array_hash< std::array< comma::int32, Size >, Size > >
 {
     public:
-        typedef std::unordered_map< std::array< comma::int32, Size >, V, comma::array_hash< std::array< comma::int32, Size >, Size > > base_type;
+        typedef std::unordered_map< std::array< comma::int32, Size >, V, array_hash< std::array< comma::int32, Size >, Size > > base_type;
 
         typedef base_type map_type;
 
@@ -51,10 +51,10 @@ class multikey_map : public std::unordered_map< std::array< comma::int32, Size >
         typedef typename base_type::const_iterator const_iterator; // otherwise it does not build on windows...
 
         /// constructor
-        multikey_map( const point_type& origin, const point_type& resolution );
+        map( const point_type& origin, const point_type& resolution );
 
         /// constructor, origin is all zeroes
-        multikey_map( const point_type& resolution );
+        map( const point_type& resolution );
         
         /// insert element at the given point, if it does not exist
         iterator touch_at( const point_type& point );
@@ -95,21 +95,21 @@ class multikey_map : public std::unordered_map< std::array< comma::int32, Size >
 };
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline multikey_map< K, V, Size, P, Traits >::multikey_map( const typename multikey_map< K, V, Size, P, Traits >::point_type& origin, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
+inline map< K, V, Size, P, Traits >::map( const typename map< K, V, Size, P, Traits >::point_type& origin, const typename map< K, V, Size, P, Traits >::point_type& resolution )
     : _origin( origin )
     , _resolution( resolution )
 {
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline multikey_map< K, V, Size, P, Traits >::multikey_map( const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
+inline map< K, V, Size, P, Traits >::map( const typename map< K, V, Size, P, Traits >::point_type& resolution )
     : _origin( Traits::zero() )
     , _resolution( resolution )
 {
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K, V, Size, P, Traits >::touch_at( const typename multikey_map< K, V, Size, P, Traits >::point_type& point )
+inline typename map< K, V, Size, P, Traits >::iterator map< K, V, Size, P, Traits >::touch_at( const typename map< K, V, Size, P, Traits >::point_type& point )
 {
     key_type index = index_of( point );
     iterator it = this->base_type::find( index );
@@ -118,13 +118,13 @@ inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K,
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline std::pair< typename multikey_map< K, V, Size, P, Traits >::iterator, bool > multikey_map< K, V, Size, P, Traits >::insert( const typename multikey_map< K, V, Size, P, Traits >::point_type& point, const typename multikey_map< K, V, Size, P, Traits >::mapped_type& value )
+inline std::pair< typename map< K, V, Size, P, Traits >::iterator, bool > map< K, V, Size, P, Traits >::insert( const typename map< K, V, Size, P, Traits >::point_type& point, const typename map< K, V, Size, P, Traits >::mapped_type& value )
 {
     return this->base_type::insert( std::make_pair( index_of( point ), value ) );
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K, V, Size, P, Traits >::index_of( const typename multikey_map< K, V, Size, P, Traits >::point_type& point, const typename multikey_map< K, V, Size, P, Traits >::point_type& origin, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
+inline typename map< K, V, Size, P, Traits >::key_type map< K, V, Size, P, Traits >::index_of( const typename map< K, V, Size, P, Traits >::point_type& point, const typename map< K, V, Size, P, Traits >::point_type& origin, const typename map< K, V, Size, P, Traits >::point_type& resolution )
 {
     point_type diff = Traits::divide( Traits::subtract( point, origin ), resolution );
     key_type index;
@@ -139,47 +139,47 @@ inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K,
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K, V, Size, P, Traits >::index_of( const typename multikey_map< K, V, Size, P, Traits >::point_type& point, const typename multikey_map< K, V, Size, P, Traits >::point_type& resolution )
+inline typename map< K, V, Size, P, Traits >::key_type map< K, V, Size, P, Traits >::index_of( const typename map< K, V, Size, P, Traits >::point_type& point, const typename map< K, V, Size, P, Traits >::point_type& resolution )
 {
     return index_of( point, Traits::zero(), resolution );
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline typename multikey_map< K, V, Size, P, Traits >::key_type multikey_map< K, V, Size, P, Traits >::index_of( const typename multikey_map< K, V, Size, P, Traits >::point_type& point ) const
+inline typename map< K, V, Size, P, Traits >::key_type map< K, V, Size, P, Traits >::index_of( const typename map< K, V, Size, P, Traits >::point_type& point ) const
 {
     return index_of( point, _origin, _resolution );
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::point_type& point )
+inline typename map< K, V, Size, P, Traits >::iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::point_type& point )
 {
     index_type i = index_of( point );
     return this->base_type::find( i );
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline typename multikey_map< K, V, Size, P, Traits >::const_iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::point_type& point ) const
+inline typename map< K, V, Size, P, Traits >::const_iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::point_type& point ) const
 {
     index_type i = index_of( point );
     return this->base_type::find( i );
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline typename multikey_map< K, V, Size, P, Traits >::iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::key_type& index )
+inline typename map< K, V, Size, P, Traits >::iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::key_type& index )
 {
     return this->base_type::find( index ); // otherwise strange things happen... debug, when we have time
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline typename multikey_map< K, V, Size, P, Traits >::const_iterator multikey_map< K, V, Size, P, Traits >::find( const typename multikey_map< K, V, Size, P, Traits >::key_type& index ) const
+inline typename map< K, V, Size, P, Traits >::const_iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::key_type& index ) const
 {
     return this->base_type::find( index ); // otherwise strange things happen... debug, when we have time
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline const typename multikey_map< K, V, Size, P, Traits >::point_type& multikey_map< K, V, Size, P, Traits >::origin() const { return _origin; }
+inline const typename map< K, V, Size, P, Traits >::point_type& map< K, V, Size, P, Traits >::origin() const { return _origin; }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
-inline const typename multikey_map< K, V, Size, P, Traits >::point_type& multikey_map< K, V, Size, P, Traits >::resolution() const { return _resolution; }
+inline const typename map< K, V, Size, P, Traits >::point_type& map< K, V, Size, P, Traits >::resolution() const { return _resolution; }
 
-} // namespace comma {
+} } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 1a1aa6dea..93a71bd29 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -1,7 +1,7 @@
 // Copyright (c) 2023 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
-#include "../multidimensional_array.h"
+#include "../multidimensional/array.h"
 
 namespace cmd = comma::containers::multidimensional; 
 
diff --git a/containers/test/multikey_map_test.cpp b/containers/test/multidimensional_map_test.cpp
similarity index 91%
rename from containers/test/multikey_map_test.cpp
rename to containers/test/multidimensional_map_test.cpp
index e979d0a6f..7f30a4ced 100644
--- a/containers/test/multikey_map_test.cpp
+++ b/containers/test/multidimensional_map_test.cpp
@@ -1,18 +1,18 @@
 // Copyright (c) 2023 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
-#include "../multikey_map.h"
+#include "../multidimensional/map.h"
 
 TEST( multikey_map, usage )
 {
-    comma::multikey_map< double, int, 3 > m( { 0, 0, 0 }, { 1, 2, 3 } );
+    comma::containers::multidimensional::map< double, int, 3 > m( { 0, 0, 0 }, { 1, 2, 3 } );
     m.touch_at( { 1, 2, 3 } );
     // todo
 }
 
 TEST( multikey_map, index )
 {
-    typedef comma::multikey_map< double, int, 3 > map_type;
+    typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
     {
         map_type m( {1, 1, 1} );
         {
@@ -59,7 +59,7 @@ TEST( multikey_map, index )
 
 TEST( multikey_map, operations )
 {
-    typedef comma::multikey_map< double, int, 3 > map_type;
+    typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
     map_type m( {1, 1, 1} );
     {
         EXPECT_TRUE( ( m.find( map_type::point_type{1., 1., 1.} ) == m.end() ) );
@@ -98,14 +98,14 @@ TEST( multikey_map, operations )
 
 TEST( multikey_map, test )
 {
-    typedef comma::multikey_map< double, int, 3 > map_type;
+    typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
     map_type m( {1, 1, 1} );
     EXPECT_TRUE( m.empty() );
 }
 
 TEST( multikey_map, neighbourhood )
 {
-    typedef comma::multikey_map< double, int, 3 > map_type;
+    typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
     map_type m( {1, 1, 1} );
     {
         EXPECT_TRUE( ( m.find( map_type::point_type{1, 1, 1} ) == m.end() ) );

From 5f54e1472df862ad52959ed12e2bcb5d2406b822 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 Jun 2023 14:11:12 +1000
Subject: [PATCH 0600/1056] containers::multidimensional::array: operator[]
 replaced with at() method for slices

---
 containers/multidimensional/array.h           | 22 +++++++++----------
 .../test/multidimensional_array_test.cpp      | 20 ++++++++---------
 2 files changed, 21 insertions(+), 21 deletions(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index fa5281839..34c760ec7 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -29,14 +29,14 @@ class slice
         const V& operator[]( const index_type& i ) const { return _data[ _index( i ) ]; }
 
         template < unsigned int I >
-        slice< V, D - I > operator[]( const std::array< std::size_t, I >& i );
+        slice< V, D - I > at( const std::array< std::size_t, I >& i );
 
         template < unsigned int I >
-        const slice< V, D - I > operator[]( const std::array< std::size_t, I >& i ) const;
+        const slice< V, D - I > at( const std::array< std::size_t, I >& i ) const;
 
-        slice< V, D - 1 > operator[]( std::size_t i ) { return operator[]< 1 >( std::array< std::size_t, 1 >{i} ); }
+        slice< V, D - 1 > at( std::size_t i ) { return at< 1 >( std::array< std::size_t, 1 >{i} ); }
 
-        const slice< V, D - 1 > operator[]( std::size_t i ) const { return operator[]< 1 >( std::array< std::size_t, 1 >{i} ); }
+        const slice< V, D - 1 > at( std::size_t i ) const { return at< 1 >( std::array< std::size_t, 1 >{i} ); }
 
         V* data() { return _data; }
         
@@ -124,15 +124,15 @@ class array
 
         const V& operator[]( const index_type& i ) const { return _slice[i]; }
 
-        multidimensional::slice< V, D - 1 > operator[]( std::size_t i ) { return _slice[i]; }
+        template < unsigned int I >
+        multidimensional::slice< V, D - I > at( const std::array< std::size_t, I >& i ) { return _slice.template at< I >( i ); }
 
         template < unsigned int I >
-        multidimensional::slice< V, D - I > operator[]( const std::array< std::size_t, I >& i ) { return _slice.template operator[]< I >( i ); }
+        const multidimensional::slice< V, D - I > at( const std::array< std::size_t, I >& i ) const { return _slice.template at< I >( i ); }
 
-        const multidimensional::slice< V, D - 1 > operator[]( std::size_t i ) const { return _slice[i]; }
+        multidimensional::slice< V, D - 1 > at( std::size_t i ) { return _slice.at( i ); }
 
-        template < unsigned int I >
-        const multidimensional::slice< V, D - I > operator[]( const std::array< std::size_t, I >& i ) const { return _slice.template operator[]< I >( i ); }
+        const multidimensional::slice< V, D - 1 > at( std::size_t i ) const { return _slice.at( i ); }
 
         storage_type& data() { return _data; }
 
@@ -235,7 +235,7 @@ inline typename slice< V, D >::index_type slice< V, D >::const_iterator::index()
 
 template < typename V, unsigned int D >
 template < unsigned int I >
-inline slice< V, D - I > slice< V, D >::operator[]( const std::array< std::size_t, I >& i )
+inline slice< V, D - I > slice< V, D >::at( const std::array< std::size_t, I >& i )
 {
     auto s = impl::index< D >::template split< I >( _shape );
     return slice< V, D - I >( s.second, _data + impl::index< I >::value( i, s.first ) * impl::index< D - I >::product( s.second ) );
@@ -243,7 +243,7 @@ inline slice< V, D - I > slice< V, D >::operator[]( const std::array< std::size_
 
 template < typename V, unsigned int D >
 template < unsigned int I >
-inline const slice< V, D - I > slice< V, D >::operator[]( const std::array< std::size_t, I >& i ) const
+inline const slice< V, D - I > slice< V, D >::at( const std::array< std::size_t, I >& i ) const
 {
     auto s = impl::index< D >::template split< I >( _shape );
     return slice< V, D - I >( s.second, _data + impl::index< I >::value( i, s.first ) * impl::index< D - I >::product( s.second ) );
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 93a71bd29..9939e8b13 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -103,7 +103,7 @@ TEST( multidimensional_array, slice )
             unsigned int i = 0;
             for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
             typedef comma::containers::multidimensional::array< int, 2 >::index_type index_t;
-            comma::containers::multidimensional::slice< int, 2 > s = a[0];
+            comma::containers::multidimensional::slice< int, 2 > s = a.at( 0 );
             { index_t i{0, 0}; EXPECT_EQ( s[i], 0 ); }
             { index_t i{0, 1}; EXPECT_EQ( s[i], 1 ); }
             { index_t i{0, 2}; EXPECT_EQ( s[i], 2 ); }
@@ -117,19 +117,19 @@ TEST( multidimensional_array, slice )
             { index_t i{2, 2}; EXPECT_EQ( s[i], 10 ); }
             { index_t i{2, 3}; EXPECT_EQ( s[i], 11 ); }
             {
-                auto t = s[0];
+                auto t = s.at( 0 );
                 typedef comma::containers::multidimensional::array< int, 1 >::index_type index_t;
                 { index_t i{0}; EXPECT_EQ( t[i], 0 ); }
                 { index_t i{1}; EXPECT_EQ( t[i], 1 ); }
                 { index_t i{2}; EXPECT_EQ( t[i], 2 ); }
                 { index_t i{3}; EXPECT_EQ( t[i], 3 ); }
-                t = s[1];
+                t = s.at( 1 );
                 { index_t i{0}; EXPECT_EQ( t[i], 4 ); }
                 { index_t i{1}; EXPECT_EQ( t[i], 5 ); }
                 { index_t i{2}; EXPECT_EQ( t[i], 6 ); }
                 { index_t i{3}; EXPECT_EQ( t[i], 7 ); }
             }
-            s = a[1];
+            s = a.at( 1 );
             { index_t i{0, 0}; EXPECT_EQ( s[i], 12 ); }
             { index_t i{0, 1}; EXPECT_EQ( s[i], 13 ); }
             { index_t i{0, 2}; EXPECT_EQ( s[i], 14 ); }
@@ -150,32 +150,32 @@ TEST( multidimensional_array, slice )
             for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
             typedef comma::containers::multidimensional::array< int, 1 >::index_type index_t;
             {
-                comma::containers::multidimensional::slice< int, 1 > s = a.operator[]<2>( {0, 0} ); // todo! super-ugly! improve templating on operator (use impl for now)!
+                comma::containers::multidimensional::slice< int, 1 > s = a.at< 2 >( {0, 0} ); // todo! super-ugly! improve templating!
                 { index_t i{0}; EXPECT_EQ( s[i], 0 ); } // todo: improve usage on 1-dimensional slices
                 { index_t i{1}; EXPECT_EQ( s[i], 1 ); }
                 { index_t i{2}; EXPECT_EQ( s[i], 2 ); }
                 { index_t i{3}; EXPECT_EQ( s[i], 3 ); }
-                s = a.operator[]<2>( {0, 1} );
+                s = a.at< 2 >( {0, 1} );
                 { index_t i{0}; EXPECT_EQ( s[i], 4 ); }
                 { index_t i{1}; EXPECT_EQ( s[i], 5 ); }
                 { index_t i{2}; EXPECT_EQ( s[i], 6 ); }
                 { index_t i{3}; EXPECT_EQ( s[i], 7 ); }
-                s = a.operator[]<2>( {0, 2} );
+                s = a.at< 2 >( {0, 2} );
                 { index_t i{0}; EXPECT_EQ( s[i], 8 ); }
                 { index_t i{1}; EXPECT_EQ( s[i], 9 ); }
                 { index_t i{2}; EXPECT_EQ( s[i], 10 ); }
                 { index_t i{3}; EXPECT_EQ( s[i], 11 ); }
-                s = a.operator[]<2>( {1, 0} );
+                s = a.at< 2 >( {1, 0} );
                 { index_t i{0}; EXPECT_EQ( s[i], 12 ); }
                 { index_t i{1}; EXPECT_EQ( s[i], 13 ); }
                 { index_t i{2}; EXPECT_EQ( s[i], 14 ); }
                 { index_t i{3}; EXPECT_EQ( s[i], 15 ); }
-                s = a.operator[]<2>( {1, 1} );
+                s = a.at< 2 >( {1, 1} );
                 { index_t i{0}; EXPECT_EQ( s[i], 16 ); }
                 { index_t i{1}; EXPECT_EQ( s[i], 17 ); }
                 { index_t i{2}; EXPECT_EQ( s[i], 18 ); }
                 { index_t i{3}; EXPECT_EQ( s[i], 19 ); }
-                s = a.operator[]<2>( {1, 2} );
+                s = a.at< 2 >( {1, 2} );
                 { index_t i{0}; EXPECT_EQ( s[i], 20 ); }
                 { index_t i{1}; EXPECT_EQ( s[i], 21 ); }
                 { index_t i{2}; EXPECT_EQ( s[i], 22 ); }

From 3afbcf46befa23227f1d3c73bb90d55b9bd9db98 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 Jun 2023 16:04:27 +1000
Subject: [PATCH 0601/1056] containers::multidimensional: refactored and
 simplified

---
 containers/impl/array_traits.h                | 70 +++++++++++--------
 containers/multidimensional/array.h           | 36 +++++++---
 containers/multidimensional/map.h             | 17 ++---
 .../test/multidimensional_array_test.cpp      |  1 +
 4 files changed, 72 insertions(+), 52 deletions(-)

diff --git a/containers/impl/array_traits.h b/containers/impl/array_traits.h
index 3dad0a1c7..688a7ee30 100644
--- a/containers/impl/array_traits.h
+++ b/containers/impl/array_traits.h
@@ -6,40 +6,52 @@
 
 #include <array>
 
-namespace comma { namespace impl {
+namespace comma { namespace containers { namespace impl {
 
-template < typename T > struct array_traits;
-
-template < typename T, std::size_t Size > struct array_traits< std::array< T, Size > >;
-
-inline int negative_flooring() { return static_cast< int >( -1.5 ) == -1 ? -1 : static_cast< int >( -1.5 ) == -2 ? 0 : 0; }
-
-inline int positive_flooring() { return static_cast< int >( 1.5 ) == 1 ? 0 : static_cast< int >( 1.5 ) == 2 ? -1 : -1; }
-
-template < typename T, std::size_t Size > struct array_traits< std::array< T, Size > >
+template < typename T > inline int index( T p, T origin, T resolution )
 {
-    enum { size = Size };
-
-    static std::array< T, Size > subtract( const std::array< T, Size >& lhs, const std::array< T, Size >& rhs )
+    static constexpr int negative_flooring = static_cast< int >( -1.5 ) == -1 ? -1 : static_cast< int >( -1.5 ) == -2 ? 0 : 0;
+    static constexpr int positive_flooring = static_cast< int >( 1.5 ) == 1 ? 0 : static_cast< int >( 1.5 ) == 2 ? -1 : -1;
+    double diff = ( p - origin ) / resolution;
+    int i = diff;
+    if( i == 0 || diff != i ) { i += diff < 0 ? negative_flooring : positive_flooring; }
+    return i;
+}
+
+template < std::size_t Size > struct operations
+{
+    template < typename S, typename T > static S& add( S& s, const T& t ) { s[ Size - 1 ] += t[ Size - 1 ]; operations< Size - 1 >::multiply( s, t ); return s; }
+    template < typename S, typename T > static S& subtract( S& s, const T& t ) { s[ Size - 1 ] -= t[ Size - 1 ]; operations< Size - 1 >::subtract( s, t ); return s; }
+    template < typename S, typename T > static S& vdivide( S& s, const T& t ) { s[ Size - 1 ] /= t[ Size - 1 ]; operations< Size - 1 >::vdivide( s, t ); return s; }
+    template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[ Size - 1 ] *= t; operations< Size - 1 >::multiply( s, t ); return s; }
+    template < typename S, typename T > static double dot( S& s, const T& t ) { return s[ Size - 1 ] * t[ Size - 1 ] + operations< Size - 1 >::dot( s, t ); }
+    template < typename S > static S& fill( S&s, double value ) { s[ Size - 1 ] = 0; operations< Size - 1 >::fill( s, value ); return s; }
+    template < typename S > static S filled( double value ) { S s; fill( s, value ); return s; }
+    template < typename S > static S zero() { S s; fill( s, 0 ); return s; }
+
+    template < typename S, typename T > static S add( const S& s, const T& t ) { S r = s; add( r, t ); return r; }
+    template < typename S, typename T > static S subtract( const S& s, const T& t ) { S r = s; add( r, t ); return r; }
+    template < typename S, typename T > static S vdivide( const S& s, const T& t ) { S r = s; add( r, t ); return r; }
+    template < typename S, typename T > static S multiply( const S& s, const T& t ) { S r = s; multiply( r, t ); return r; }
+
+    template < typename S, typename I > static I& index_of( I& i, const S& p, const S& origin, const S& resolution )
     {
-        std::array< T, Size > d;
-        for( unsigned int i = 0; i < Size; ++i ) { d[i] = lhs[i] - rhs[i]; }
-        return d;
+        i[ Size - 1 ] = index( p[ Size - 1 ], origin[ Size - 1 ], resolution[ Size - 1 ] );
+        operations< Size - 1 >::index_of( i, p, origin, resolution );
+        return i;
     }
 
-    static std::array< T, Size > divide( const std::array< T, Size >& lhs, const std::array< T, Size >& rhs )
-    {
-        std::array< T, Size > d;
-        for( unsigned int i = 0; i < Size; ++i ) { d[i] = lhs[i] / rhs[i]; }
-        return d;
-    }
+    template < typename S, typename I > static I index_of( const S& p, const S& origin, const S& resolution ) { I i; index_of( i, p, origin, resolution ); return i; }
+};
 
-    static std::array< T, Size > zero()
-    {
-        std::array< T, Size > d;
-        for( unsigned int i = 0; i < Size; ++i ) { d[i] = T( 0 ); }
-        return d;
-    }
+template <> struct operations< 0 >
+{
+    template < typename S, typename T > static S& add( S& s, const T& t ) { s[0] += t[0]; return s; }
+    template < typename S, typename T > static S& subtract( S& s, const T& t ) { s[0] -= t[0]; return s; }
+    template < typename S, typename T > static S& vdivide( S& s, const T& t ) { s[0] /= t[0]; return s; }
+    template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[0] *= t; return s; }
+    template < typename S > static S& fill( S&s, double value ) { s[0] = 0; return s; }
+    template < typename S, typename I > static I& index_of( I& i, const S& p, const S& origin, const S& resolution ) { i[0] = index( p[0], origin[0], resolution[0] ); return i; }
 };
 
-} } // namespace comma { namespace impl {
+} } } // namespace comma { namespace containers { impl {
diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index 34c760ec7..5a88c59b9 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -157,8 +157,8 @@ class array
         slice_type _slice;
 };
 
-template < typename V, unsigned int D, typename P = std::array< double, D >, typename S = std::vector< V > >
-class interpolated_array: public array< V, D, S >
+template < typename V, unsigned int D, typename P = std::array< double, D >, typename Traits = impl::operations< D >, typename S = std::vector< V > >
+class grid: public array< V, D, S >
 {
     public:
         typedef P point_type;
@@ -169,23 +169,24 @@ class interpolated_array: public array< V, D, S >
 
         typedef typename base_type::value_type value_type;
 
-        interpolated_array( const P& origin, const P& resolution, const index_type& size, const V& default_value = V() );
+        grid( const P& origin, const P& resolution, const index_type& shape, const V& default_value = V() );
 
-        index_type index_of( const point_type& p ) const; // p: 1.,2.,3. -> return: 23,22,21
+        index_type index_of( const point_type& p ) const;
 
-        /// q = index_as_point( p ); // p: 1.,2.,3. -> 21.,22.,23
-        /// index_of( p ) == index_of( origin + q * resolution );
-        point_type index_as_point( const point_type& p ) const; // p: 1.,2.,3. -> 21.,22.,23
+        point_type lower_bound( const point_type& p ) const;
 
-        V& operator()( const point_type& p ) { return operator()( index_of( p ) ); }
+        V& operator()( const point_type& p ) { return this->operator[]( index_of( p ) ); }
 
-        const V& operator()( const point_type& p ) const { return operator()( index_of( p ) ); }
+        const V& operator()( const point_type& p ) const { return this->operator[]( index_of( p ) ); }
 
-        V interpolated( const point_type& p ) const;
+        const point_type& origin() const { return _origin; }
+
+        const point_type& resolution() const { return _resolution; }
 
     private:
         point_type _origin;
         point_type _resolution;
+        point_type _end;
         void _assert_valid( const point_type& p );
 };
 
@@ -252,4 +253,19 @@ inline const slice< V, D - I > slice< V, D >::at( const std::array< std::size_t,
 template < typename V, unsigned int D, typename S >
 inline array< V, D, S >::array( const index_type& shape, const V& default_value ): _data( impl::index< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
 
+// template < typename V, unsigned int D, typename P, typename Traits, typename S >
+// inline typename interpolated_array< V, D, P, Traits, S >::key_type interpolated_array< V, D, P, Traits, S >::index_of( const typename interpolated_array< V, D, P, Traits, S >::point_type& point )
+// {
+//     point_type diff = Traits::divide( Traits::subtract( _point, _origin ), _resolution ); // todo: move this all to a more generic location; reuse for array and map
+//     key_type index;
+//     for( unsigned int i = 0; i < dimensions; ++i )
+//     {
+//         int d = diff[i];
+//         index[i] = d;
+//         if( diff[i] == d ) { continue; }
+//         index[i] += diff[i] < 0 ? impl::negative_flooring() : ( d == 0 ? 0 : impl::positive_flooring() );
+//     }
+//     return index;
+// }
+
 } } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/multidimensional/map.h b/containers/multidimensional/map.h
index 889c90f27..f9fa9894d 100644
--- a/containers/multidimensional/map.h
+++ b/containers/multidimensional/map.h
@@ -26,7 +26,7 @@ struct array_hash : public std::unary_function< Array, std::size_t >
 };
 
 /// unordered map with array-like keys
-template < typename K, typename V, unsigned int Size, typename P = std::array< K, Size >, typename Traits = impl::array_traits< P > >
+template < typename K, typename V, unsigned int Size, typename P = std::array< K, Size >, typename Traits = impl::operations< Size > >
 class map : public std::unordered_map< std::array< comma::int32, Size >, V, array_hash< std::array< comma::int32, Size >, Size > >
 {
     public:
@@ -103,7 +103,7 @@ inline map< K, V, Size, P, Traits >::map( const typename map< K, V, Size, P, Tra
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline map< K, V, Size, P, Traits >::map( const typename map< K, V, Size, P, Traits >::point_type& resolution )
-    : _origin( Traits::zero() )
+    : _origin( Traits::template zero< P >() )
     , _resolution( resolution )
 {
 }
@@ -126,22 +126,13 @@ inline std::pair< typename map< K, V, Size, P, Traits >::iterator, bool > map< K
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::key_type map< K, V, Size, P, Traits >::index_of( const typename map< K, V, Size, P, Traits >::point_type& point, const typename map< K, V, Size, P, Traits >::point_type& origin, const typename map< K, V, Size, P, Traits >::point_type& resolution )
 {
-    point_type diff = Traits::divide( Traits::subtract( point, origin ), resolution );
-    key_type index;
-    for( unsigned int i = 0; i < dimensions; ++i )
-    {
-        int d = diff[i];
-        index[i] = d;
-        if( diff[i] == d ) { continue; }
-        index[i] += diff[i] < 0 ? impl::negative_flooring() : ( d == 0 ? 0 : impl::positive_flooring() );
-    }
-    return index;
+    return Traits::template index_of< P, key_type >( point, origin, resolution );
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::key_type map< K, V, Size, P, Traits >::index_of( const typename map< K, V, Size, P, Traits >::point_type& point, const typename map< K, V, Size, P, Traits >::point_type& resolution )
 {
-    return index_of( point, Traits::zero(), resolution );
+    return index_of( point, Traits::template zero< P >(), resolution );
 }
 
 template < typename K, typename V, unsigned int Size, typename P, typename Traits >
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 9939e8b13..2d409e00f 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -1,6 +1,7 @@
 // Copyright (c) 2023 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
+#include <eigen3/Eigen/Core>
 #include "../multidimensional/array.h"
 
 namespace cmd = comma::containers::multidimensional; 

From 55c87492d19cdfd919b88c3e773e6b2941c1cec7 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 Jun 2023 16:12:31 +1000
Subject: [PATCH 0602/1056] containers::multidimensional::grid: implemented;
 unit test: todo

---
 containers/multidimensional/array.h | 8 +++-----
 1 file changed, 3 insertions(+), 5 deletions(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index 5a88c59b9..c53b57d7e 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -169,11 +169,11 @@ class grid: public array< V, D, S >
 
         typedef typename base_type::value_type value_type;
 
-        grid( const P& origin, const P& resolution, const index_type& shape, const V& default_value = V() );
+        grid( const P& origin, const P& resolution, const index_type& shape, const V& default_value = V() ): base_type( shape, default_value ), _origin( origin ), _resolution( resolution ) {}
 
-        index_type index_of( const point_type& p ) const;
+        index_type index_of( const point_type& point ) const { return Traits::template index_of< P, index_type >( point, origin, resolution ); }
 
-        point_type lower_bound( const point_type& p ) const;
+        point_type lower_bound( const point_type& point ) const { return Traits::add( _origin + Traits::multiply( _resolution, index_of( point ) ) ); }
 
         V& operator()( const point_type& p ) { return this->operator[]( index_of( p ) ); }
 
@@ -186,8 +186,6 @@ class grid: public array< V, D, S >
     private:
         point_type _origin;
         point_type _resolution;
-        point_type _end;
-        void _assert_valid( const point_type& p );
 };
 
 namespace impl {

From 03a6c5afdcc5500c7d84647f99f78a1054d2793f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 7 Jun 2023 14:55:59 +1000
Subject: [PATCH 0603/1056] containers: array_traits: operations::nearest():
 first cut implemented

---
 containers/impl/array_traits.h                | 33 ++++++++++++++++--
 containers/test/array_traits_test.cpp         | 34 +++++++++++++++++++
 .../test/multidimensional_array_test.cpp      |  3 +-
 3 files changed, 66 insertions(+), 4 deletions(-)
 create mode 100644 containers/test/array_traits_test.cpp

diff --git a/containers/impl/array_traits.h b/containers/impl/array_traits.h
index 688a7ee30..1b0e66876 100644
--- a/containers/impl/array_traits.h
+++ b/containers/impl/array_traits.h
@@ -18,21 +18,30 @@ template < typename T > inline int index( T p, T origin, T resolution )
     return i;
 }
 
+template < typename I, std::size_t Size > static constexpr std::array< I, Size > neighbours; // quick and dirty, for now leaving it to the enthusiasts to implement it using metaprogramming
+template < typename I > static constexpr std::array< I, 2 > neighbours< I, 1 > = {{ {{ 0 }}, {{ 1 }} }};
+template < typename I > static constexpr std::array< I, 4 > neighbours< I, 2 > = {{ {{ 0, 0 }}, {{ 0, 1 }}, {{ 1, 0 }}, {{ 1, 1 }} }};
+template < typename I > static constexpr std::array< I, 8 > neighbours< I, 3 > = {{ {{ 0, 0, 0 }}, {{ 0, 0, 1 }}, {{ 0, 1, 0 }}, {{ 0, 1, 1 }}, {{ 1, 0, 0 }}, {{ 1, 0, 1 }}, {{ 1, 1, 0 }}, {{ 1, 1, 1 }} }};
+template < typename I > static constexpr std::array< I, 16 > neighbours< I, 4 > = {{ {{ 0, 0, 0, 0 }}, {{ 0, 0, 0, 1 }}, {{ 0, 0, 1, 0 }}, {{ 0, 0, 1, 1 }}, {{ 0, 1, 0, 0 }}, {{ 0, 1, 0, 1 }}, {{ 0, 1, 1, 0 }}, {{ 0, 1, 1, 1 }}, {{ 1, 0, 0, 0 }}, {{ 1, 0, 0, 1 }}, {{ 1, 0, 1, 0 }}, {{ 1, 0, 1, 1 }}, {{ 1, 1, 0, 0 }}, {{ 1, 1, 0, 1 }}, {{ 1, 1, 1, 0 }}, {{ 1, 1, 1, 1 }} }};
+// todo: add more dimensions as required or write that little metaprogramming piece
+
 template < std::size_t Size > struct operations
 {
     template < typename S, typename T > static S& add( S& s, const T& t ) { s[ Size - 1 ] += t[ Size - 1 ]; operations< Size - 1 >::multiply( s, t ); return s; }
     template < typename S, typename T > static S& subtract( S& s, const T& t ) { s[ Size - 1 ] -= t[ Size - 1 ]; operations< Size - 1 >::subtract( s, t ); return s; }
     template < typename S, typename T > static S& vdivide( S& s, const T& t ) { s[ Size - 1 ] /= t[ Size - 1 ]; operations< Size - 1 >::vdivide( s, t ); return s; }
     template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[ Size - 1 ] *= t; operations< Size - 1 >::multiply( s, t ); return s; }
+    template < typename S, typename T > static S& vmultiply( S& s, const T& t ) { s[ Size - 1 ] *= t[ Size - 1 ]; operations< Size - 1 >::vmultiply( s, t ); return s; }
     template < typename S, typename T > static double dot( S& s, const T& t ) { return s[ Size - 1 ] * t[ Size - 1 ] + operations< Size - 1 >::dot( s, t ); }
     template < typename S > static S& fill( S&s, double value ) { s[ Size - 1 ] = 0; operations< Size - 1 >::fill( s, value ); return s; }
     template < typename S > static S filled( double value ) { S s; fill( s, value ); return s; }
     template < typename S > static S zero() { S s; fill( s, 0 ); return s; }
 
     template < typename S, typename T > static S add( const S& s, const T& t ) { S r = s; add( r, t ); return r; }
-    template < typename S, typename T > static S subtract( const S& s, const T& t ) { S r = s; add( r, t ); return r; }
-    template < typename S, typename T > static S vdivide( const S& s, const T& t ) { S r = s; add( r, t ); return r; }
+    template < typename S, typename T > static S subtract( const S& s, const T& t ) { S r = s; subtract( r, t ); return r; }
+    template < typename S, typename T > static S vdivide( const S& s, const T& t ) { S r = s; vdivide( r, t ); return r; }
     template < typename S, typename T > static S multiply( const S& s, const T& t ) { S r = s; multiply( r, t ); return r; }
+    template < typename S, typename T > static S vmultiply( const S& s, const T& t ) { S r = s; vmultiply( r, t ); return r; }
 
     template < typename S, typename I > static I& index_of( I& i, const S& p, const S& origin, const S& resolution )
     {
@@ -42,16 +51,34 @@ template < std::size_t Size > struct operations
     }
 
     template < typename S, typename I > static I index_of( const S& p, const S& origin, const S& resolution ) { I i; index_of( i, p, origin, resolution ); return i; }
+
+    template < typename S, typename I > static I nearest( const S& p, const S& origin, const S& resolution ) // todo? metaprogram?
+    {
+        const S& s = subtract( p, origin );
+        double m = dot( s, s );
+        unsigned int j = 0;
+        const auto& n = comma::containers::impl::neighbours< I, Size >;
+        for( unsigned int i = 1; m > 0 && i < n.size(); ++i )
+        {
+            const S& r = subtract( vmultiply( resolution, n[i] ), s );
+            double d = dot( r, r );
+            if( d < m ) { m = d; j = i; }
+        }
+        return n[j];
+    }
 };
 
-template <> struct operations< 0 >
+template <> struct operations< 1 >
 {
     template < typename S, typename T > static S& add( S& s, const T& t ) { s[0] += t[0]; return s; }
     template < typename S, typename T > static S& subtract( S& s, const T& t ) { s[0] -= t[0]; return s; }
     template < typename S, typename T > static S& vdivide( S& s, const T& t ) { s[0] /= t[0]; return s; }
     template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[0] *= t; return s; }
+    template < typename S, typename T > static S& vmultiply( S& s, const T& t ) { s[0] *= t[0]; return s; }
+    template < typename S, typename T > static double dot( S& s, const T& t ) { return s[0] * t[0]; }
     template < typename S > static S& fill( S&s, double value ) { s[0] = 0; return s; }
     template < typename S, typename I > static I& index_of( I& i, const S& p, const S& origin, const S& resolution ) { i[0] = index( p[0], origin[0], resolution[0] ); return i; }
+    template < typename S, typename I > static I nearest( const S& p, const S& origin, const S& resolution ) { return p[0] - origin[0] < resolution[0] / 2 ? I{ 0 } : I{ 1 }; }
 };
 
 } } } // namespace comma { namespace containers { impl {
diff --git a/containers/test/array_traits_test.cpp b/containers/test/array_traits_test.cpp
new file mode 100644
index 000000000..4bd699136
--- /dev/null
+++ b/containers/test/array_traits_test.cpp
@@ -0,0 +1,34 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include <array>
+#include <gtest/gtest.h>
+#include "../multidimensional/array.h"
+
+namespace cci = comma::containers::impl; 
+
+TEST( array_traits, operations_nearest )
+{
+    {
+        typedef std::array< double, 1 > point_t;
+        typedef std::array< int, 1 > index_t;
+        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.3}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.5}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.999}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.3}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.5}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.999}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+    }
+    {
+        typedef std::array< double, 2 > point_t;
+        typedef std::array< int, 2 > index_t;
+        { index_t expected{0, 0}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }        
+        { index_t expected{0, 0}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0.1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0.2}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 1}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{1, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+    }
+}
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 2d409e00f..dcae52934 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -1,11 +1,12 @@
 // Copyright (c) 2023 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
-#include <eigen3/Eigen/Core>
 #include "../multidimensional/array.h"
 
 namespace cmd = comma::containers::multidimensional; 
 
+namespace cci = comma::containers::impl; 
+
 TEST( multidimensional_array, impl_index_value )
 {
     EXPECT_EQ( cmd::impl::index< 2 >::value( {0, 0}, {1, 5} ), 0 );

From 499db574fa482504e69bd43b6a0f544fbf335675 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 7 Jun 2023 15:31:48 +1000
Subject: [PATCH 0604/1056] containers: array_traits: operations: norms(),
 weights(): first cut implemented

---
 containers/impl/array_traits.h        | 32 +++++++++++++++++++++++++++
 containers/test/array_traits_test.cpp |  9 ++++++++
 2 files changed, 41 insertions(+)

diff --git a/containers/impl/array_traits.h b/containers/impl/array_traits.h
index 1b0e66876..15b39b3e2 100644
--- a/containers/impl/array_traits.h
+++ b/containers/impl/array_traits.h
@@ -5,6 +5,7 @@
 #pragma once
 
 #include <array>
+#include <cmath>
 
 namespace comma { namespace containers { namespace impl {
 
@@ -18,6 +19,8 @@ template < typename T > inline int index( T p, T origin, T resolution )
     return i;
 }
 
+template < int Base, unsigned int Pow > static constexpr int pow = Base * pow< Base, Pow - 1 >;
+template < int Base > static constexpr int pow< Base, 0 >{1};
 template < typename I, std::size_t Size > static constexpr std::array< I, Size > neighbours; // quick and dirty, for now leaving it to the enthusiasts to implement it using metaprogramming
 template < typename I > static constexpr std::array< I, 2 > neighbours< I, 1 > = {{ {{ 0 }}, {{ 1 }} }};
 template < typename I > static constexpr std::array< I, 4 > neighbours< I, 2 > = {{ {{ 0, 0 }}, {{ 0, 1 }}, {{ 1, 0 }}, {{ 1, 1 }} }};
@@ -66,6 +69,35 @@ template < std::size_t Size > struct operations
         }
         return n[j];
     }
+
+    template < typename S, typename I > static std::array< double, pow< 2, Size > > squared_norms( const S& p, const S& origin, const S& resolution ) // todo? metaprogram?
+    {
+        const S& s = subtract( p, origin );
+        std::array< double, pow< 2, Size > > d;
+        const auto& n = comma::containers::impl::neighbours< I, Size >;
+        for( unsigned int i = 0; i < n.size(); ++i )
+        {
+            const S& r = subtract( vmultiply( resolution, n[i] ), s );
+            d[i] = dot( r, r );
+        }
+        return d;
+    }
+
+    template < typename S, typename I > static std::array< double, pow< 2, Size > > norms( const S& p, const S& origin, const S& resolution )
+    {
+        std::array< double, pow< 2, Size > > d = squared_norms( p, origin, resolution );
+        for( auto& v: d ) { v = std::sqrt( v ); }
+        return d;
+    }
+
+    template < typename S, typename I > static std::array< double, pow< 2, Size > > weights( const S& p, const S& origin, const S& resolution )
+    {
+        std::array< double, pow< 2, Size > > d = norms( p, origin, resolution );
+        double s = 0;
+        for( auto& v: d ) { s += v; }
+        for( auto& v: d ) { v /= s; }
+        return d;
+    }
 };
 
 template <> struct operations< 1 >
diff --git a/containers/test/array_traits_test.cpp b/containers/test/array_traits_test.cpp
index 4bd699136..3b5e4f597 100644
--- a/containers/test/array_traits_test.cpp
+++ b/containers/test/array_traits_test.cpp
@@ -31,4 +31,13 @@ TEST( array_traits, operations_nearest )
         { index_t expected{0, 1}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
         { index_t expected{1, 1}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{1, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
     }
+    {
+        typedef std::array< double, 3 > point_t;
+        typedef std::array< int, 3 > index_t;
+        { index_t expected{0, 0, 0}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 0, 0}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1, 0}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0.7, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0, 1}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 1, 1}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0.7, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+    }
 }

From 1525af88be348041e361b8d564fb7e1cd7167e36 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 7 Jun 2023 15:49:51 +1000
Subject: [PATCH 0605/1056] containers: array_traits moved to multidimensional

---
 containers/CMakeLists.txt                     |  6 +--
 containers/multidimensional/array.h           | 45 +++++++------------
 .../{impl => multidimensional}/array_traits.h |  8 ++--
 containers/multidimensional/map.h             |  2 +-
 containers/test/array_traits_test.cpp         | 44 +++++++++---------
 .../test/multidimensional_array_test.cpp      | 44 +++++++++---------
 6 files changed, 65 insertions(+), 84 deletions(-)
 rename containers/{impl => multidimensional}/array_traits.h (96%)

diff --git a/containers/CMakeLists.txt b/containers/CMakeLists.txt
index 698846fec..52fe741f2 100644
--- a/containers/CMakeLists.txt
+++ b/containers/CMakeLists.txt
@@ -3,17 +3,15 @@ SET( TARGET_NAME comma${PROJECT} )
 
 FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
-FILE( GLOB impl_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/impl/*.h )
 FILE( GLOB multidimensional_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/multidimensional/*.h )
 
-SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} ${multidimensional_includes} )
+SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${multidimensional_includes} )
 
-add_custom_target( ${TARGET_NAME} ${source} ${includes} ${impl_includes} ) # ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_includes} )
+add_custom_target( ${TARGET_NAME} ${source} ${includes} ${multidimensional_includes} ) # ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_includes} )
 #SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 #TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_base )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
-INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
 INSTALL( FILES ${multidimensional_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/multidimensional )
 #INSTALL(
 #    TARGETS ${TARGET_NAME}
diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index c53b57d7e..baab11152 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -6,7 +6,7 @@
 
 #include <array>
 #include "../../base/types.h"
-#include "../impl/array_traits.h"
+#include "array_traits.h"
 
 namespace comma { namespace containers { namespace multidimensional {
 
@@ -191,13 +191,13 @@ class grid: public array< V, D, S >
 namespace impl {
 
 template < unsigned int D, unsigned int I = D >
-struct index
+struct index_traits
 {
     typedef std::array< std::size_t, D > index_type;
-    static unsigned int value( const index_type& i, const index_type& shape ) { return i[ I - 1 ] + index< D, I - 1 >::value( i, shape ) * shape[ I - 1 ]; }
-    static void value( std::size_t j, index_type& i, const index_type& shape ) { i[ I - 1 ] = j % shape[ I - 1 ]; index< D, I - 1 >::value( j / shape[ I - 1 ], i, shape ); }
+    static unsigned int value( const index_type& i, const index_type& shape ) { return i[ I - 1 ] + index_traits< D, I - 1 >::value( i, shape ) * shape[ I - 1 ]; }
+    static void value( std::size_t j, index_type& i, const index_type& shape ) { i[ I - 1 ] = j % shape[ I - 1 ]; index_traits< D, I - 1 >::value( j / shape[ I - 1 ], i, shape ); }
     static index_type value( std::size_t j, const index_type& shape ) { index_type i; value( j, i, shape ); return i; }
-    static std::size_t product( const index_type& i ) { return i[ I - 1 ] * index< D, I - 1 >::product( i ); }
+    static std::size_t product( const index_type& i ) { return i[ I - 1 ] * index_traits< D, I - 1 >::product( i ); }
     template < unsigned int J >
     static std::pair< std::array< std::size_t, J >, std::array< std::size_t, D - J > > split( const index_type& i ) // todo: use metaprogramming, kinda same as product
     {
@@ -210,7 +210,7 @@ struct index
 };
 
 template < unsigned int D >
-struct index< D, 1 >
+struct index_traits< D, 1 >
 {
     typedef std::array< std::size_t, D > index_type;
     static unsigned int value( const index_type& i, const index_type& ) { return i[0]; }
@@ -221,49 +221,34 @@ struct index< D, 1 >
 } // namespace impl {
 
 template < typename V, unsigned int D >
-inline std::size_t slice< V, D >::_index( const typename slice< V, D >::index_type& i ) { return impl::index< D >::value( i, _shape ); }
+inline std::size_t slice< V, D >::_index( const typename slice< V, D >::index_type& i ) { return impl::index_traits< D >::value( i, _shape ); }
 
 template < typename V, unsigned int D >
-inline std::size_t slice< V, D >::_product( const typename slice< V, D >::index_type& i ) { return impl::index< D >::product( i ); }
+inline std::size_t slice< V, D >::_product( const typename slice< V, D >::index_type& i ) { return impl::index_traits< D >::product( i ); }
 
 template < typename V, unsigned int D >
-inline typename slice< V, D >::index_type slice< V, D >::iterator::index() const { return impl::index< D >::value( _i, _shape ); }
+inline typename slice< V, D >::index_type slice< V, D >::iterator::index() const { return impl::index_traits< D >::value( _i, _shape ); }
 
 template < typename V, unsigned int D >
-inline typename slice< V, D >::index_type slice< V, D >::const_iterator::index() const { return impl::index< D >::value( _i, _shape ); }
+inline typename slice< V, D >::index_type slice< V, D >::const_iterator::index() const { return impl::index_traits< D >::value( _i, _shape ); }
 
 template < typename V, unsigned int D >
 template < unsigned int I >
 inline slice< V, D - I > slice< V, D >::at( const std::array< std::size_t, I >& i )
 {
-    auto s = impl::index< D >::template split< I >( _shape );
-    return slice< V, D - I >( s.second, _data + impl::index< I >::value( i, s.first ) * impl::index< D - I >::product( s.second ) );
+    auto s = impl::index_traits< D >::template split< I >( _shape );
+    return slice< V, D - I >( s.second, _data + impl::index_traits< I >::value( i, s.first ) * impl::index_traits< D - I >::product( s.second ) );
 }
 
 template < typename V, unsigned int D >
 template < unsigned int I >
 inline const slice< V, D - I > slice< V, D >::at( const std::array< std::size_t, I >& i ) const
 {
-    auto s = impl::index< D >::template split< I >( _shape );
-    return slice< V, D - I >( s.second, _data + impl::index< I >::value( i, s.first ) * impl::index< D - I >::product( s.second ) );
+    auto s = impl::index_traits< D >::template split< I >( _shape );
+    return slice< V, D - I >( s.second, _data + impl::index_traits< I >::value( i, s.first ) * impl::index_traits< D - I >::product( s.second ) );
 }
 
 template < typename V, unsigned int D, typename S >
-inline array< V, D, S >::array( const index_type& shape, const V& default_value ): _data( impl::index< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
-
-// template < typename V, unsigned int D, typename P, typename Traits, typename S >
-// inline typename interpolated_array< V, D, P, Traits, S >::key_type interpolated_array< V, D, P, Traits, S >::index_of( const typename interpolated_array< V, D, P, Traits, S >::point_type& point )
-// {
-//     point_type diff = Traits::divide( Traits::subtract( _point, _origin ), _resolution ); // todo: move this all to a more generic location; reuse for array and map
-//     key_type index;
-//     for( unsigned int i = 0; i < dimensions; ++i )
-//     {
-//         int d = diff[i];
-//         index[i] = d;
-//         if( diff[i] == d ) { continue; }
-//         index[i] += diff[i] < 0 ? impl::negative_flooring() : ( d == 0 ? 0 : impl::positive_flooring() );
-//     }
-//     return index;
-// }
+inline array< V, D, S >::array( const index_type& shape, const V& default_value ): _data( impl::index_traits< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
 
 } } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/impl/array_traits.h b/containers/multidimensional/array_traits.h
similarity index 96%
rename from containers/impl/array_traits.h
rename to containers/multidimensional/array_traits.h
index 15b39b3e2..8c41f9781 100644
--- a/containers/impl/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -7,7 +7,7 @@
 #include <array>
 #include <cmath>
 
-namespace comma { namespace containers { namespace impl {
+namespace comma { namespace containers { namespace multidimensional { namespace impl {
 
 template < typename T > inline int index( T p, T origin, T resolution )
 {
@@ -60,7 +60,7 @@ template < std::size_t Size > struct operations
         const S& s = subtract( p, origin );
         double m = dot( s, s );
         unsigned int j = 0;
-        const auto& n = comma::containers::impl::neighbours< I, Size >;
+        const auto& n = neighbours< I, Size >;
         for( unsigned int i = 1; m > 0 && i < n.size(); ++i )
         {
             const S& r = subtract( vmultiply( resolution, n[i] ), s );
@@ -74,7 +74,7 @@ template < std::size_t Size > struct operations
     {
         const S& s = subtract( p, origin );
         std::array< double, pow< 2, Size > > d;
-        const auto& n = comma::containers::impl::neighbours< I, Size >;
+        const auto& n = neighbours< I, Size >;
         for( unsigned int i = 0; i < n.size(); ++i )
         {
             const S& r = subtract( vmultiply( resolution, n[i] ), s );
@@ -113,4 +113,4 @@ template <> struct operations< 1 >
     template < typename S, typename I > static I nearest( const S& p, const S& origin, const S& resolution ) { return p[0] - origin[0] < resolution[0] / 2 ? I{ 0 } : I{ 1 }; }
 };
 
-} } } // namespace comma { namespace containers { impl {
+} } } } // namespace comma { namespace containers { namespace multidimensional { namespace impl {
diff --git a/containers/multidimensional/map.h b/containers/multidimensional/map.h
index f9fa9894d..5d4da6def 100644
--- a/containers/multidimensional/map.h
+++ b/containers/multidimensional/map.h
@@ -8,7 +8,7 @@
 #include <unordered_map>
 #include <boost/functional/hash.hpp>
 #include "../../base/types.h"
-#include "../impl/array_traits.h"
+#include "array_traits.h"
 
 namespace comma { namespace containers { namespace multidimensional {
 
diff --git a/containers/test/array_traits_test.cpp b/containers/test/array_traits_test.cpp
index 3b5e4f597..f00e3d077 100644
--- a/containers/test/array_traits_test.cpp
+++ b/containers/test/array_traits_test.cpp
@@ -2,42 +2,42 @@
 
 #include <array>
 #include <gtest/gtest.h>
-#include "../multidimensional/array.h"
+#include "../multidimensional/array_traits.h"
 
-namespace cci = comma::containers::impl; 
+namespace ccmi = comma::containers::multidimensional::impl; 
 
 TEST( array_traits, operations_nearest )
 {
     {
         typedef std::array< double, 1 > point_t;
         typedef std::array< int, 1 > index_t;
-        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
-        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.3}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
-        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.5}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
-        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.999}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
-        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
-        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.3}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
-        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.5}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
-        { index_t i = cci::operations< 1 >::nearest< point_t, index_t >( point_t{0.999}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0.3}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0.5}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0.999}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0.3}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0.5}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0.999}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
     }
     {
         typedef std::array< double, 2 > point_t;
         typedef std::array< int, 2 > index_t;
-        { index_t expected{0, 0}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }        
-        { index_t expected{0, 0}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
-        { index_t expected{0, 0}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0.1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
-        { index_t expected{0, 0}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0.2}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
-        { index_t expected{0, 1}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
-        { index_t expected{0, 1}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
-        { index_t expected{1, 1}; index_t actual = cci::operations< 2 >::nearest< point_t, index_t >( point_t{1, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }        
+        { index_t expected{0, 0}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0.1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0.2}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 1}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{1, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
     }
     {
         typedef std::array< double, 3 > point_t;
         typedef std::array< int, 3 > index_t;
-        { index_t expected{0, 0, 0}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
-        { index_t expected{1, 0, 0}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
-        { index_t expected{0, 1, 0}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0.7, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
-        { index_t expected{0, 0, 1}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
-        { index_t expected{1, 1, 1}; index_t actual = cci::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0.7, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 0, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0.7, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 1, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0.7, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
     }
 }
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index dcae52934..9c1abcb9a 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -5,40 +5,38 @@
 
 namespace cmd = comma::containers::multidimensional; 
 
-namespace cci = comma::containers::impl; 
-
 TEST( multidimensional_array, impl_index_value )
 {
-    EXPECT_EQ( cmd::impl::index< 2 >::value( {0, 0}, {1, 5} ), 0 );
-    EXPECT_EQ( cmd::impl::index< 2 >::value( {0, 1}, {1, 5} ), 1 );
-    EXPECT_EQ( cmd::impl::index< 2 >::value( {0, 4}, {1, 5} ), 4 );
-    EXPECT_EQ( cmd::impl::index< 2 >::value( {1, 0}, {1, 5} ), 5 );
-    EXPECT_EQ( cmd::impl::index< 2 >::value( {1, 1}, {2, 5} ), 6 );
-    EXPECT_EQ( cmd::impl::index< 2 >::value( {1, 2}, {2, 5} ), 7 );
-    EXPECT_EQ( cmd::impl::index< 2 >::value( {1, 2}, {3, 5} ), 7 );
-    EXPECT_EQ( cmd::impl::index< 2 >::value( {2, 2}, {3, 5} ), 12 );
-    EXPECT_EQ( cmd::impl::index< 3 >::value( {0, 0, 0}, {2, 3, 4} ), 0 );
-    EXPECT_EQ( cmd::impl::index< 3 >::value( {0, 0, 3}, {2, 3, 4} ), 3 );
-    EXPECT_EQ( cmd::impl::index< 3 >::value( {0, 1, 3}, {2, 3, 4} ), 7 );
-    EXPECT_EQ( cmd::impl::index< 3 >::value( {1, 2, 3}, {2, 3, 4} ), 3 + 4 * ( 2 + 3 * 1 ) );
-    EXPECT_EQ( cmd::impl::index< 3 >::value( {1, 2, 4}, {2, 3, 4} ), 2 * 3 * 4 );
-    EXPECT_EQ( cmd::impl::index< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {0, 0}, {1, 5} ), 0 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {0, 1}, {1, 5} ), 1 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {0, 4}, {1, 5} ), 4 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {1, 0}, {1, 5} ), 5 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {1, 1}, {2, 5} ), 6 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {1, 2}, {2, 5} ), 7 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {1, 2}, {3, 5} ), 7 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {2, 2}, {3, 5} ), 12 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {0, 0, 0}, {2, 3, 4} ), 0 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {0, 0, 3}, {2, 3, 4} ), 3 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {0, 1, 3}, {2, 3, 4} ), 7 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {1, 2, 3}, {2, 3, 4} ), 3 + 4 * ( 2 + 3 * 1 ) );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {1, 2, 4}, {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
 }
 
 TEST( multidimensional_array, impl_index_product )
 {
-    EXPECT_EQ( cmd::impl::index< 1 >::product( {2} ), 2 );
-    EXPECT_EQ( cmd::impl::index< 2 >::product( {2, 3} ), 6 );
-    EXPECT_EQ( cmd::impl::index< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
-    EXPECT_EQ( cmd::impl::index< 4 >::product( {2, 3, 4, 5} ), 2 * 3 * 4 * 5 );
+    EXPECT_EQ( cmd::impl::index_traits< 1 >::product( {2} ), 2 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::product( {2, 3} ), 6 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( cmd::impl::index_traits< 4 >::product( {2, 3, 4, 5} ), 2 * 3 * 4 * 5 );
 }
 
 TEST( multidimensional_array, impl_index_inverted_value )
 {
     typedef std::array< std::size_t, 3 > array_t;
-    { array_t a{0, 0, 0}; EXPECT_EQ( cmd::impl::index< 3 >::value( 0, {2, 3, 4} ), a ); }
-    { array_t a{0, 0, 1}; EXPECT_EQ( cmd::impl::index< 3 >::value( 1, {2, 3, 4} ), a ); }
-    { array_t a{2, 1, 3}; EXPECT_EQ( cmd::impl::index< 3 >::value( 3 + 4 * ( 1 + 3 * 2 ), {2, 3, 4} ), a ); }
+    { array_t a{0, 0, 0}; EXPECT_EQ( cmd::impl::index_traits< 3 >::value( 0, {2, 3, 4} ), a ); }
+    { array_t a{0, 0, 1}; EXPECT_EQ( cmd::impl::index_traits< 3 >::value( 1, {2, 3, 4} ), a ); }
+    { array_t a{2, 1, 3}; EXPECT_EQ( cmd::impl::index_traits< 3 >::value( 3 + 4 * ( 1 + 3 * 2 ), {2, 3, 4} ), a ); }
     // todo: way more tests
 }
 

From a8921ab18162890dd9d6995281974945b82ad050 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 7 Jun 2023 19:12:23 +1000
Subject: [PATCH 0606/1056] containers: array_traits: interpolation::linear:
 first cut implemented; testing...

---
 containers/multidimensional/array_traits.h | 34 ++++++++++++++++------
 containers/test/array_traits_test.cpp      | 21 +++++++++++++
 2 files changed, 46 insertions(+), 9 deletions(-)

diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
index 8c41f9781..c0b036ab1 100644
--- a/containers/multidimensional/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -6,6 +6,7 @@
 
 #include <array>
 #include <cmath>
+#include <type_traits>
 
 namespace comma { namespace containers { namespace multidimensional { namespace impl {
 
@@ -36,9 +37,13 @@ template < std::size_t Size > struct operations
     template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[ Size - 1 ] *= t; operations< Size - 1 >::multiply( s, t ); return s; }
     template < typename S, typename T > static S& vmultiply( S& s, const T& t ) { s[ Size - 1 ] *= t[ Size - 1 ]; operations< Size - 1 >::vmultiply( s, t ); return s; }
     template < typename S, typename T > static double dot( S& s, const T& t ) { return s[ Size - 1 ] * t[ Size - 1 ] + operations< Size - 1 >::dot( s, t ); }
-    template < typename S > static S& fill( S&s, double value ) { s[ Size - 1 ] = 0; operations< Size - 1 >::fill( s, value ); return s; }
+    template < typename S, typename T > static S& invert( S& s ) { s[ Size - 1 ] = !s[ Size - 1 ]; operations< Size - 1 >::invert( s ); return s; }
+    template < typename S, typename T > static S& mask( S& s, const T& t ) { s[ Size - 1 ] = t[ Size - 1 ] ? t[ Size - 1 ] : s[ Size - 1 ]; operations< Size - 1 >::mask( s, t ); return s; }
+    template < typename S, typename T > static S masked( const S& s, const T& t ) { S m = s; mask( m, t ); return m; }
+    template < typename S > static S& fill( S&s, double value ) { s[ Size - 1 ] = value; operations< Size - 1 >::fill( s, value ); return s; }
     template < typename S > static S filled( double value ) { S s; fill( s, value ); return s; }
     template < typename S > static S zero() { S s; fill( s, 0 ); return s; }
+    template < typename S > static auto product( const S& s ) -> typename std::remove_reference< decltype( s[Size] ) >::type { return s[ Size - 1 ] * operations< Size - 1 >::product( s ); }
 
     template < typename S, typename T > static S add( const S& s, const T& t ) { S r = s; add( r, t ); return r; }
     template < typename S, typename T > static S subtract( const S& s, const T& t ) { S r = s; subtract( r, t ); return r; }
@@ -90,14 +95,22 @@ template < std::size_t Size > struct operations
         return d;
     }
 
-    template < typename S, typename I > static std::array< double, pow< 2, Size > > weights( const S& p, const S& origin, const S& resolution )
+    struct interpolation
     {
-        std::array< double, pow< 2, Size > > d = norms( p, origin, resolution );
-        double s = 0;
-        for( auto& v: d ) { s += v; }
-        for( auto& v: d ) { v /= s; }
-        return d;
-    }
+        struct linear
+        {
+            template < typename S > static std::array< double, pow< 2, Size > > weights( const S& p, const S& origin, const S& resolution )
+            {
+                S s = vdivide( subtract( p, origin ), resolution );
+                S t;
+                subtract( fill( t, 1. ), s );
+                const auto& n = neighbours< std::array< unsigned int, Size >, Size >;
+                std::array< double, pow< 2, Size > > w;
+                for( unsigned int i = 0; i < pow< 2, Size >; ++i ) { w[i] = product( masked( s, n[ pow< 2, Size > - i - 1 ] ) ) * product( masked( t, n[i] ) ); }
+                return w;
+            }
+        };
+    };
 };
 
 template <> struct operations< 1 >
@@ -108,7 +121,10 @@ template <> struct operations< 1 >
     template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[0] *= t; return s; }
     template < typename S, typename T > static S& vmultiply( S& s, const T& t ) { s[0] *= t[0]; return s; }
     template < typename S, typename T > static double dot( S& s, const T& t ) { return s[0] * t[0]; }
-    template < typename S > static S& fill( S&s, double value ) { s[0] = 0; return s; }
+    template < typename S, typename T > static S& invert( S& s ) { s[0] = !s[0]; return s; }
+    template < typename S, typename T > static S& mask( S& s, const T& t ) { s[0] = t[0] ? t[0] : s[0]; return s; }
+    template < typename S > static auto product( const S& s ) -> typename std::remove_reference< decltype( s[0] ) >::type { return s[0]; }
+    template < typename S > static S& fill( S&s, double value ) { s[0] = value; return s; }
     template < typename S, typename I > static I& index_of( I& i, const S& p, const S& origin, const S& resolution ) { i[0] = index( p[0], origin[0], resolution[0] ); return i; }
     template < typename S, typename I > static I nearest( const S& p, const S& origin, const S& resolution ) { return p[0] - origin[0] < resolution[0] / 2 ? I{ 0 } : I{ 1 }; }
 };
diff --git a/containers/test/array_traits_test.cpp b/containers/test/array_traits_test.cpp
index f00e3d077..7a1d30ad8 100644
--- a/containers/test/array_traits_test.cpp
+++ b/containers/test/array_traits_test.cpp
@@ -40,4 +40,25 @@ TEST( array_traits, operations_nearest )
         { index_t expected{0, 0, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
         { index_t expected{1, 1, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0.7, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
     }
+    {
+        typedef std::array< float, 3 > point_t;
+        typedef std::array< float, 3 > index_t;
+        { index_t expected{0, 0, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 0, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0.7, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 1, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0.7, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+    }
+}
+
+TEST( array_traits, interpolation_linear_weights )
+{
+    {
+        typedef std::array< double, 2 > point_t;
+        typedef std::array< double, 4 > weights_t;
+        { weights_t expected{1, 0, 0, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{0, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { weights_t expected{0, 1, 0, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{0, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { weights_t expected{0, 0, 1, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{1, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { weights_t expected{0, 0, 0, 1}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{1, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+    }
 }

From d76db542ac71114091c73015334b78b8f3921adb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 10:49:42 +1000
Subject: [PATCH 0607/1056] containers: array_traits: interpolation::linear:
 more tests added

---
 containers/multidimensional/array_traits.h |  4 +++-
 containers/test/array_traits_test.cpp      |  4 ++++
 math/compare.h                             | 28 ----------------------
 3 files changed, 7 insertions(+), 29 deletions(-)

diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
index c0b036ab1..c3dff96c3 100644
--- a/containers/multidimensional/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -7,6 +7,7 @@
 #include <array>
 #include <cmath>
 #include <type_traits>
+#include "../../math/compare.h"
 
 namespace comma { namespace containers { namespace multidimensional { namespace impl {
 
@@ -44,7 +45,7 @@ template < std::size_t Size > struct operations
     template < typename S > static S filled( double value ) { S s; fill( s, value ); return s; }
     template < typename S > static S zero() { S s; fill( s, 0 ); return s; }
     template < typename S > static auto product( const S& s ) -> typename std::remove_reference< decltype( s[Size] ) >::type { return s[ Size - 1 ] * operations< Size - 1 >::product( s ); }
-
+    template < typename S, typename T, typename Diff > static bool near( const S& s, const T& t, const Diff& epsilon ) { return comma::math::equal( s[ Size - 1 ], t[ Size - 1 ], epsilon ) && operations< Size - 1 >::near( s, t, epsilon ); }
     template < typename S, typename T > static S add( const S& s, const T& t ) { S r = s; add( r, t ); return r; }
     template < typename S, typename T > static S subtract( const S& s, const T& t ) { S r = s; subtract( r, t ); return r; }
     template < typename S, typename T > static S vdivide( const S& s, const T& t ) { S r = s; vdivide( r, t ); return r; }
@@ -124,6 +125,7 @@ template <> struct operations< 1 >
     template < typename S, typename T > static S& invert( S& s ) { s[0] = !s[0]; return s; }
     template < typename S, typename T > static S& mask( S& s, const T& t ) { s[0] = t[0] ? t[0] : s[0]; return s; }
     template < typename S > static auto product( const S& s ) -> typename std::remove_reference< decltype( s[0] ) >::type { return s[0]; }
+    template < typename S, typename T, typename Diff > static bool near( const S& s, const T& t, const Diff& epsilon ) { return comma::math::equal( s[0], t[0], epsilon ); }
     template < typename S > static S& fill( S&s, double value ) { s[0] = value; return s; }
     template < typename S, typename I > static I& index_of( I& i, const S& p, const S& origin, const S& resolution ) { i[0] = index( p[0], origin[0], resolution[0] ); return i; }
     template < typename S, typename I > static I nearest( const S& p, const S& origin, const S& resolution ) { return p[0] - origin[0] < resolution[0] / 2 ? I{ 0 } : I{ 1 }; }
diff --git a/containers/test/array_traits_test.cpp b/containers/test/array_traits_test.cpp
index 7a1d30ad8..6be69a2f3 100644
--- a/containers/test/array_traits_test.cpp
+++ b/containers/test/array_traits_test.cpp
@@ -2,6 +2,7 @@
 
 #include <array>
 #include <gtest/gtest.h>
+#include "../../math/compare.h"
 #include "../multidimensional/array_traits.h"
 
 namespace ccmi = comma::containers::multidimensional::impl; 
@@ -60,5 +61,8 @@ TEST( array_traits, interpolation_linear_weights )
         { weights_t expected{0, 1, 0, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{0, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
         { weights_t expected{0, 0, 1, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{1, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
         { weights_t expected{0, 0, 0, 1}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{1, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { weights_t expected{0.3, 0.7, 0, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{0, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_TRUE( ccmi::operations< 3 >::near( expected, actual, 1e-6 ) ); }
+        { weights_t expected{0.3, 0, 0.7, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{0.7, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_TRUE( ccmi::operations< 3 >::near( expected, actual, 1e-6 ) ); }
+        // todo: way more testing
     }
 }
diff --git a/math/compare.h b/math/compare.h
index b55b62600..d87951abb 100644
--- a/math/compare.h
+++ b/math/compare.h
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 

From 5890e3dbcf874ac2f5f3d8848e198f35d05925de Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 11:50:41 +1000
Subject: [PATCH 0608/1056] math-lookup: in progress...

---
 containers/CMakeLists.txt               | 12 ++--
 containers/applications/CMakeLists.txt  |  7 +++
 containers/applications/math-lookup.cpp | 79 +++++++++++++++++++++++++
 3 files changed, 94 insertions(+), 4 deletions(-)
 create mode 100644 containers/applications/CMakeLists.txt
 create mode 100644 containers/applications/math-lookup.cpp

diff --git a/containers/CMakeLists.txt b/containers/CMakeLists.txt
index 52fe741f2..c809b3809 100644
--- a/containers/CMakeLists.txt
+++ b/containers/CMakeLists.txt
@@ -1,5 +1,5 @@
 SET( PROJECT "containers" )
-SET( TARGET_NAME comma${PROJECT} )
+SET( TARGET_NAME comma_${PROJECT} )
 
 FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
@@ -20,6 +20,10 @@ INSTALL( FILES ${multidimensional_includes} DESTINATION ${comma_INSTALL_INCLUDE_
 #    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
 #)
 
-IF( comma_BUILD_TESTS )
-    ADD_SUBDIRECTORY( test )
-ENDIF( comma_BUILD_TESTS )
+if( comma_BUILD_TESTS )
+    add_subdirectory( test )
+endif( comma_BUILD_TESTS )
+
+if( comma_BUILD_APPLICATIONS )
+    add_subdirectory( applications )
+endif( comma_BUILD_APPLICATIONS )
diff --git a/containers/applications/CMakeLists.txt b/containers/applications/CMakeLists.txt
new file mode 100644
index 000000000..dc4beb661
--- /dev/null
+++ b/containers/applications/CMakeLists.txt
@@ -0,0 +1,7 @@
+set( dir ${SOURCE_CODE_BASE_DIR}/containers/applications )
+
+add_executable( math-lookup math-lookup.cpp ) # todo! should math-lookup be here at all? does it create circular dependencies?
+#add_dependencies( math-lookup comma_containers )
+target_link_libraries( math-lookup ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv )
+set_target_properties( math-lookup PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS math-lookup RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
new file mode 100644
index 000000000..cdd87a7bf
--- /dev/null
+++ b/containers/applications/math-lookup.cpp
@@ -0,0 +1,79 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#include <iostream>
+#include "../../application/command_line_options.h"
+#include "../../csv/stream.h"
+
+void usage( bool verbose )
+{
+    std::cerr << "operations on a multidimensional lookup table" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: cat input.csv | math-lookup <operation> <options>" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations" << std::endl;
+    std::cerr << "    interpolate: output interpolated value for the given input" << std::endl;
+    std::cerr << "    nearest: todo: output table element index and value nearest to the given input" << std::endl;
+    std::cerr << "    query: todo: output table element index and value for the given input" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations" << std::endl;
+    std::cerr << "    interpolate" << std::endl;
+    std::cerr << "        todo" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    nearest" << std::endl;
+    std::cerr << "        todo" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    query" << std::endl;
+    std::cerr << "        todo" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    todo" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << std::endl;
+    exit( 0 );
+}
+
+namespace comma { namespace applications { namespace lookup { namespace operations {
+
+static int interpolate( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )
+{
+    comma::say() << "interpolate: todo" << std::endl;
+    return 1;
+}
+
+static int nearest( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )
+{
+    comma::say() << "nearest: todo" << std::endl;
+    return 1;
+}
+
+static int query( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )
+{
+    comma::say() << "query: todo" << std::endl;
+    return 1;
+}
+
+} } } } // namespace comma { namespace applications { namespace lookup { namespace operations {
+
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        comma::csv::options csv( options );
+        const auto& unnamed = options.unnamed( "--flush,--verbose,-v", "-.*" );
+        if( unnamed.empty() ) { comma::say() << "please specify operation" << std::endl; return 1; }
+        std::string operation = unnamed[0];
+        if( operation == "interpolate" ) { return comma::applications::lookup::operations::interpolate( options, csv, unnamed ); }
+        if( operation == "nearest" ) { return comma::applications::lookup::operations::nearest( options, csv, unnamed ); }
+        if( operation == "query" ) { return comma::applications::lookup::operations::query( options, csv, unnamed ); }
+        comma::say() << "expected operation; got: '" << operation << "'" << std::endl;
+        return 1;
+    }
+    catch( std::exception& ex ) { comma::say() << "caught exception: " << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "caught unknown exception" << std::endl; }
+    return 1;
+}

From f9653756b13b881deab7e82bb2f986788f94b66a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 12:21:57 +1000
Subject: [PATCH 0609/1056] containers::multidimensional::grid::interpolated():
 implemented; debugging...

---
 containers/multidimensional/array.h | 17 ++++++++++++++++-
 1 file changed, 16 insertions(+), 1 deletion(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index baab11152..65042ce75 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -183,6 +183,8 @@ class grid: public array< V, D, S >
 
         const point_type& resolution() const { return _resolution; }
 
+        V interpolated( const point_type& point ) const; // todo: flag/enum or alike for different interpolation types; currently linear only
+
     private:
         point_type _origin;
         point_type _resolution;
@@ -249,6 +251,19 @@ inline const slice< V, D - I > slice< V, D >::at( const std::array< std::size_t,
 }
 
 template < typename V, unsigned int D, typename S >
-inline array< V, D, S >::array( const index_type& shape, const V& default_value ): _data( impl::index_traits< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
+inline array< V, D, S >::array( const typename array< V, D, S >::index_type& shape, const V& default_value ): _data( impl::index_traits< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
+
+template < typename V, unsigned int D, typename P, typename Traits, typename S >
+V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
+{
+    P origin = _resolution;
+    index_type i = index_of( point );
+    Traits::add( Traits::multiply( _resolution, i ), _origin );
+    const auto& weights = Traits::interpolation::linear::weights( point, origin, _resolution );
+    const auto& neighbours = impl::neighbours< index_type, D >;
+    V v = this->operator[]( i ) * weights[0]; // todo?! value traits?!
+    for( unsigned int i = 1; i < weights.size(); ++i ) { v += this->operator[]( Traits::add( neighbours[i], i ) ) * weights[i]; } // todo?! value traits?!
+    return v;
+}
 
 } } } // namespace comma { namespace containers { namespace multidimensional {

From be00bacca2773d4faa0c79a432f1b18bfd21e0e2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 13:15:33 +1000
Subject: [PATCH 0610/1056] containers::multidimensional::grid::interpolated():
 a few fixes; basic tests added

---
 containers/multidimensional/array.h           | 16 ++++++------
 containers/multidimensional/array_traits.h    |  2 +-
 .../test/multidimensional_array_test.cpp      | 25 +++++++++++++++++++
 3 files changed, 34 insertions(+), 9 deletions(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index 65042ce75..f5d7c53bb 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -99,7 +99,7 @@ class slice
         index_type _shape;
         std::size_t _size;
         V* _data;
-        std::size_t _index( const index_type& i );
+        std::size_t _index( const index_type& i ) const;
         static std::size_t _product( const index_type& i );
 };
 
@@ -171,7 +171,7 @@ class grid: public array< V, D, S >
 
         grid( const P& origin, const P& resolution, const index_type& shape, const V& default_value = V() ): base_type( shape, default_value ), _origin( origin ), _resolution( resolution ) {}
 
-        index_type index_of( const point_type& point ) const { return Traits::template index_of< P, index_type >( point, origin, resolution ); }
+        index_type index_of( const point_type& point ) const { return Traits::template index_of< P, index_type >( point, _origin, _resolution ); }
 
         point_type lower_bound( const point_type& point ) const { return Traits::add( _origin + Traits::multiply( _resolution, index_of( point ) ) ); }
 
@@ -223,7 +223,7 @@ struct index_traits< D, 1 >
 } // namespace impl {
 
 template < typename V, unsigned int D >
-inline std::size_t slice< V, D >::_index( const typename slice< V, D >::index_type& i ) { return impl::index_traits< D >::value( i, _shape ); }
+inline std::size_t slice< V, D >::_index( const typename slice< V, D >::index_type& i ) const { return impl::index_traits< D >::value( i, _shape ); }
 
 template < typename V, unsigned int D >
 inline std::size_t slice< V, D >::_product( const typename slice< V, D >::index_type& i ) { return impl::index_traits< D >::product( i ); }
@@ -256,13 +256,13 @@ inline array< V, D, S >::array( const typename array< V, D, S >::index_type& sha
 template < typename V, unsigned int D, typename P, typename Traits, typename S >
 V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
 {
-    P origin = _resolution;
-    index_type i = index_of( point );
-    Traits::add( Traits::multiply( _resolution, i ), _origin );
-    const auto& weights = Traits::interpolation::linear::weights( point, origin, _resolution );
+    P element_origin = _resolution;
+    const index_type i = index_of( point );
+    Traits::add( Traits::vmultiply( element_origin, i ), _origin );
+    const auto& weights = Traits::interpolation::linear::weights( point, element_origin, _resolution );
     const auto& neighbours = impl::neighbours< index_type, D >;
     V v = this->operator[]( i ) * weights[0]; // todo?! value traits?!
-    for( unsigned int i = 1; i < weights.size(); ++i ) { v += this->operator[]( Traits::add( neighbours[i], i ) ) * weights[i]; } // todo?! value traits?!
+    for( unsigned int j = 1; j < weights.size(); ++j ) { v += this->operator[]( Traits::add( i, neighbours[j] ) ) * weights[j]; } // todo?! value traits?!
     return v;
 }
 
diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
index c3dff96c3..f156c222d 100644
--- a/containers/multidimensional/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -32,7 +32,7 @@ template < typename I > static constexpr std::array< I, 16 > neighbours< I, 4 >
 
 template < std::size_t Size > struct operations
 {
-    template < typename S, typename T > static S& add( S& s, const T& t ) { s[ Size - 1 ] += t[ Size - 1 ]; operations< Size - 1 >::multiply( s, t ); return s; }
+    template < typename S, typename T > static S& add( S& s, const T& t ) { s[ Size - 1 ] += t[ Size - 1 ]; operations< Size - 1 >::add( s, t ); return s; }
     template < typename S, typename T > static S& subtract( S& s, const T& t ) { s[ Size - 1 ] -= t[ Size - 1 ]; operations< Size - 1 >::subtract( s, t ); return s; }
     template < typename S, typename T > static S& vdivide( S& s, const T& t ) { s[ Size - 1 ] /= t[ Size - 1 ]; operations< Size - 1 >::vdivide( s, t ); return s; }
     template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[ Size - 1 ] *= t; operations< Size - 1 >::multiply( s, t ); return s; }
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 9c1abcb9a..603e2f9d4 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -184,3 +184,28 @@ TEST( multidimensional_array, slice )
         }
     }
 }
+
+TEST( multidimensional_array, grid_index )
+{
+    {
+        comma::containers::multidimensional::grid< double, 2 > g( {0, 0}, {1, 1}, {2, 3}, 0 );
+        typedef std::array< std::size_t, 2 > index_t;
+        int i = 0;
+        for( auto it = g.begin(); it != g.end(); ++it ) { *it = i++; }
+        { index_t i = {0, 0}; EXPECT_EQ( g.index_of( {0, 0} ), i ); }
+        { index_t i = {0, 1}; EXPECT_EQ( g.index_of( {0, 1.01} ), i ); }
+        // todo: more tests
+    }
+}
+
+TEST( multidimensional_array, grid_interpolate )
+{
+    {
+        comma::containers::multidimensional::grid< double, 2 > g( {0, 0}, {1, 1}, {2, 2}, 0 );
+        g[{0, 0}] = 0; g[{0, 1}] = 1; g[{1, 0}] = 2; g[{1, 1}] = 3;
+        EXPECT_EQ( g.interpolated( {0, 0} ), 0 );
+        EXPECT_EQ( g.interpolated( {0, 1} ), 1 );
+        EXPECT_EQ( g.interpolated( {1, 0} ), 2 );
+        EXPECT_EQ( g.interpolated( {1, 1} ), 3 );
+    }
+}
\ No newline at end of file

From 7d01adaa6623802da4ab3b089e77c403b035ea1d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 13:41:16 +1000
Subject: [PATCH 0611/1056] math-lookup: in progress...

---
 containers/applications/math-lookup.cpp | 32 +++++++++++++++++++++++++
 1 file changed, 32 insertions(+)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index cdd87a7bf..7be8959d6 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -2,9 +2,13 @@
 
 /// @author vsevolod vlaskine
 
+#include <fstream>
 #include <iostream>
 #include "../../application/command_line_options.h"
+#include "../../base/exception.h"
 #include "../../csv/stream.h"
+#include "../../name_value/parser.h"
+#include "../multidimensional/array.h"
 
 void usage( bool verbose )
 {
@@ -36,6 +40,34 @@ void usage( bool verbose )
     exit( 0 );
 }
 
+namespace comma { namespace applications { namespace lookup { namespace operations {
+
+template < typename T, std::size_t D, std::size_t E >
+struct lut
+{
+    struct input { std::array< double, D > point; };
+    typedef std::array< std::size_t, D > index_t;
+    typedef std::array< T, E > value_t;
+    typedef comma::containers::multidimensional::grid< value_t, D > grid_t;
+
+    static grid_t& load( grid_t& g, const std::string& options )
+    {
+        auto csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( options );
+        COMMA_ASSERT_BRIEF( csv.binary(), "lookup table: on file '" << csv.filename << "': only binary files are currently supported" );
+        std::ifstream ifs( csv.filename, std::ios::binary );
+        COMMA_ASSERT_BRIEF( ifs.is_open(), "lookup table: failed to open '" << csv.filename << "'" );
+        std::size_t size = g.data().size() * sizeof( T ) * E;
+        ifs.read( reinterpret_cast< char* >( &g.data()[0] ), size );
+        COMMA_ASSERT_BRIEF( ifs.gcount() > 0, "lookup table: failed to read from '" << csv.filename << "'" );
+        COMMA_ASSERT_BRIEF( std::size_t( ifs.gcount() ) == size, "lookup table: on file '" << csv.filename << "': expected " << size << " bytes; got: " << ifs.gcount() );
+        return g;
+    }
+};
+
+} } } } // namespace comma { namespace applications { namespace lookup { namespace operations {
+
+
+
 namespace comma { namespace applications { namespace lookup { namespace operations {
 
 static int interpolate( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )

From 0de90a3fe152d8215c179fb016d5cfc0b431a7a9 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 15:19:59 +1000
Subject: [PATCH 0612/1056] math-lookup: interpolate: in progress...

---
 containers/applications/CMakeLists.txt  |  2 +-
 containers/applications/math-lookup.cpp | 24 +++++++++++++++++-------
 2 files changed, 18 insertions(+), 8 deletions(-)

diff --git a/containers/applications/CMakeLists.txt b/containers/applications/CMakeLists.txt
index dc4beb661..3274df0d0 100644
--- a/containers/applications/CMakeLists.txt
+++ b/containers/applications/CMakeLists.txt
@@ -2,6 +2,6 @@ set( dir ${SOURCE_CODE_BASE_DIR}/containers/applications )
 
 add_executable( math-lookup math-lookup.cpp ) # todo! should math-lookup be here at all? does it create circular dependencies?
 #add_dependencies( math-lookup comma_containers )
-target_link_libraries( math-lookup ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv )
+target_link_libraries( math-lookup ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_name_value comma_csv )
 set_target_properties( math-lookup PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS math-lookup RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index 7be8959d6..bfc00e514 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -7,6 +7,7 @@
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
+#include "../../csv/traits.h"
 #include "../../name_value/parser.h"
 #include "../multidimensional/array.h"
 
@@ -45,15 +46,14 @@ namespace comma { namespace applications { namespace lookup { namespace operatio
 template < typename T, std::size_t D, std::size_t E >
 struct lut
 {
-    struct input { std::array< double, D > point; };
+    typedef std::array< double, D > point_t;
     typedef std::array< std::size_t, D > index_t;
     typedef std::array< T, E > value_t;
-    typedef comma::containers::multidimensional::grid< value_t, D > grid_t;
+    typedef comma::containers::multidimensional::grid< value_t, D, point_t > grid_t;
+    struct input { std::array< double, D > point; };
 
-    static grid_t& load( grid_t& g, const std::string& options )
+    static grid_t& load( grid_t& g, const comma::csv::options& csv )
     {
-        auto csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( options );
-        COMMA_ASSERT_BRIEF( csv.binary(), "lookup table: on file '" << csv.filename << "': only binary files are currently supported" );
         std::ifstream ifs( csv.filename, std::ios::binary );
         COMMA_ASSERT_BRIEF( ifs.is_open(), "lookup table: failed to open '" << csv.filename << "'" );
         std::size_t size = g.data().size() * sizeof( T ) * E;
@@ -62,16 +62,26 @@ struct lut
         COMMA_ASSERT_BRIEF( std::size_t( ifs.gcount() ) == size, "lookup table: on file '" << csv.filename << "': expected " << size << " bytes; got: " << ifs.gcount() );
         return g;
     }
+
+    template < typename F >
+    int run( const comma::csv::options& lut_csv, F&& f )
+    {
+        grid_t grid;
+        load( grid, lut_csv );
+        return 0;
+    }
 };
 
 } } } } // namespace comma { namespace applications { namespace lookup { namespace operations {
 
-
-
 namespace comma { namespace applications { namespace lookup { namespace operations {
 
 static int interpolate( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )
 {
+    COMMA_ASSERT_BRIEF( unnamed.size() > 1, "please specify lookup table file as: math-lookup <operation> <filename>" );
+    auto lut_csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( unnamed[1] );
+    COMMA_ASSERT_BRIEF( csv.binary(), "lookup table: on file '" << lut_csv.filename << "': only binary files are currently supported" );
+    auto input_format = csv.binary() ? csv.format() : comma::csv::format( options.value< std::string >( "--format", "d" ) );
     comma::say() << "interpolate: todo" << std::endl;
     return 1;
 }

From 32f2c5b71d17e3a6505bdf9bbb7b8a7547ad843f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 17:33:31 +1000
Subject: [PATCH 0613/1056] math-lookup: interpolate: template resolution
 implemented; in progress...

---
 containers/applications/CMakeLists.txt  |  2 +-
 containers/applications/math-lookup.cpp | 79 +++++++++++++++++++++++--
 2 files changed, 74 insertions(+), 7 deletions(-)

diff --git a/containers/applications/CMakeLists.txt b/containers/applications/CMakeLists.txt
index 3274df0d0..a7433d78c 100644
--- a/containers/applications/CMakeLists.txt
+++ b/containers/applications/CMakeLists.txt
@@ -2,6 +2,6 @@ set( dir ${SOURCE_CODE_BASE_DIR}/containers/applications )
 
 add_executable( math-lookup math-lookup.cpp ) # todo! should math-lookup be here at all? does it create circular dependencies?
 #add_dependencies( math-lookup comma_containers )
-target_link_libraries( math-lookup ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_name_value comma_csv )
+target_link_libraries( math-lookup ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_name_value comma_csv comma_string )
 set_target_properties( math-lookup PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS math-lookup RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index bfc00e514..aad4edcfe 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -4,11 +4,13 @@
 
 #include <fstream>
 #include <iostream>
+#include <memory>
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
 #include "../../csv/traits.h"
 #include "../../name_value/parser.h"
+#include "../../visiting/traits.h"
 #include "../multidimensional/array.h"
 
 void usage( bool verbose )
@@ -43,6 +45,9 @@ void usage( bool verbose )
 
 namespace comma { namespace applications { namespace lookup { namespace operations {
 
+template< typename T, std::size_t D >
+struct _array { std::array< T, D > point; };
+
 template < typename T, std::size_t D, std::size_t E >
 struct lut
 {
@@ -50,7 +55,8 @@ struct lut
     typedef std::array< std::size_t, D > index_t;
     typedef std::array< T, E > value_t;
     typedef comma::containers::multidimensional::grid< value_t, D, point_t > grid_t;
-    struct input { std::array< double, D > point; };
+    typedef _array< double, D > input_t;
+    typedef _array< T, D > output_t;
 
     static grid_t& load( grid_t& g, const comma::csv::options& csv )
     {
@@ -63,17 +69,69 @@ struct lut
         return g;
     }
 
-    template < typename F >
-    int run( const comma::csv::options& lut_csv, F&& f )
+    template < typename F > static int run( const std::vector< double >& origin
+                                          , const std::vector< double >& resolution
+                                          , const std::vector< std::size_t >& shape
+                                          , const comma::csv::options& lut_csv
+                                          , F&& f )
     {
-        grid_t grid;
+        point_t o, r;
+        index_t s;
+        std::memcpy( &o[0], &origin[0], D * sizeof( double ) );
+        std::memcpy( &r[0], &resolution[0], D * sizeof( double ) );
+        std::memcpy( &s[0], &shape[0], D * sizeof( std::size_t ) );
+        grid_t grid( o, r, s );
         load( grid, lut_csv );
         return 0;
     }
 };
 
+template < typename T, std::size_t D, typename F > static int run_with_dim( const std::vector< double >& origin
+                                                                          , const std::vector< double >& resolution
+                                                                          , const std::vector< std::size_t >& shape
+                                                                          , const comma::csv::options& lut_csv
+                                                                          , F&& f )
+{
+    switch( lut_csv.format().count() )
+    {
+        case 1: return lut< T, D, 1 >::run( origin, resolution, shape, lut_csv, f );
+        case 2: return lut< T, D, 2 >::run( origin, resolution, shape, lut_csv, f );
+        case 3: return lut< T, D, 3 >::run( origin, resolution, shape, lut_csv, f );
+        case 4: return lut< T, D, 4 >::run( origin, resolution, shape, lut_csv, f );
+        default: COMMA_THROW( comma::exception, "up to 4-dimensional lookup table values currently supported; got: " << lut_csv.format().count() << " dimensions in " << lut_csv.format().string() );
+    }
+    return 1;
+}
+
+template < typename T, typename F > static int run_as( const std::vector< double >& origin
+                                                     , const std::vector< double >& resolution
+                                                     , const std::vector< std::size_t >& shape
+                                                     , const comma::csv::options& lut_csv
+                                                     , F&& f )
+{
+    switch( origin.size() )
+    {
+        case 1: return run_with_dim< T, 1 >( origin, resolution, shape, lut_csv, f );
+        case 2: return run_with_dim< T, 2 >( origin, resolution, shape, lut_csv, f );
+        case 3: return run_with_dim< T, 3 >( origin, resolution, shape, lut_csv, f );
+        case 4: return run_with_dim< T, 4 >( origin, resolution, shape, lut_csv, f );
+        default: COMMA_THROW( comma::exception, "up to 4-dimensional lookup tables currently supported; got: " << origin.size() << " dimensions" );
+    }
+    return 1;
+}
+
 } } } } // namespace comma { namespace applications { namespace lookup { namespace operations {
 
+namespace comma { namespace visiting {
+
+template < typename T, std::size_t D > struct traits< comma::applications::lookup::operations::_array< T, D > >
+{
+    template < typename Key, class Visitor > static void visit( const Key&, comma::applications::lookup::operations::_array< T, D >& p, Visitor& v ) { v.apply( "point", p.point ); }
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::applications::lookup::operations::_array< T, D >& p, Visitor& v ) { v.apply( "point", p.point ); }
+};
+
+} } // namespace comma { namespace visiting {
+
 namespace comma { namespace applications { namespace lookup { namespace operations {
 
 static int interpolate( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )
@@ -81,8 +139,17 @@ static int interpolate( const comma::command_line_options& options, const csv::o
     COMMA_ASSERT_BRIEF( unnamed.size() > 1, "please specify lookup table file as: math-lookup <operation> <filename>" );
     auto lut_csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( unnamed[1] );
     COMMA_ASSERT_BRIEF( csv.binary(), "lookup table: on file '" << lut_csv.filename << "': only binary files are currently supported" );
-    auto input_format = csv.binary() ? csv.format() : comma::csv::format( options.value< std::string >( "--format", "d" ) );
-    comma::say() << "interpolate: todo" << std::endl;
+    const auto& origin = comma::split_as< double >( options.value< std::string >( "--origin,-o" ), ',' );
+    const auto& resolution = comma::split_as< double >( options.value< std::string >( "--resolution,-r" ), ',' );
+    const auto& shape = comma::split_as< std::size_t >( options.value< std::string >( "--shape" ), ',' );
+    COMMA_ASSERT_BRIEF( origin.size() == resolution.size(), "expected --origin and --resolution of the same dimensions; got: " << origin.size() << " and " << resolution.size() );
+    COMMA_ASSERT_BRIEF( origin.size() == shape.size(), "expected --origin and --shape of the same dimensions; got: " << origin.size() << " and " << shape.size() );
+    switch( lut_csv.format().elements()[0].type ) // todo! quick and dirty
+    {
+        case comma::csv::format::float_t: return comma::applications::lookup::operations::run_as< float >( origin, resolution, shape, lut_csv, nullptr );
+        case comma::csv::format::double_t: return comma::applications::lookup::operations::run_as< double >( origin, resolution, shape, lut_csv, nullptr );
+        default: COMMA_THROW( comma::exception, "only float and double as lookup table values are supported; got: '" << unnamed[1] << "'" );
+    }
     return 1;
 }
 

From 3f28dcd0bcfbbf3293e62649b1218d87db9313ec Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 17:54:18 +1000
Subject: [PATCH 0614/1056] math-lookup: interpolate: more template plumbing;
 in progress...

---
 containers/applications/math-lookup.cpp    | 53 +++++++++++++++-------
 containers/multidimensional/array_traits.h |  1 +
 2 files changed, 37 insertions(+), 17 deletions(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index aad4edcfe..fe25e09ac 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -69,10 +69,11 @@ struct lut
         return g;
     }
 
-    template < typename F > static int run( const std::vector< double >& origin
-                                          , const std::vector< double >& resolution
-                                          , const std::vector< std::size_t >& shape
+    template < typename F > static int run( const comma::csv::options& csv
                                           , const comma::csv::options& lut_csv
+                                          , const std::vector< double >& origin
+                                          , const std::vector< double >& resolution
+                                          , const std::vector< std::size_t >& shape                                          
                                           , F&& f )
     {
         point_t o, r;
@@ -82,39 +83,57 @@ struct lut
         std::memcpy( &s[0], &shape[0], D * sizeof( std::size_t ) );
         grid_t grid( o, r, s );
         load( grid, lut_csv );
+        input_t zero;
+        std::memset( &zero.point[0], 0, zero.point.size() * sizeof( T ) );
+        comma::csv::input_stream< input_t > istream( std::cin, csv, zero );
+        // todo! ostream and tied? or just do it by hand for now?
+        while( istream.ready() || std::cin.good() )
+        {
+            const auto& p = istream.read();
+            if( !p ) { break; }
+
+            // todo: process
+            // todo: output using tied; just a stub for debugging for now
+            if( csv.binary() ) { std::cout.write( istream.binary().last(), istream.binary().size() ); }
+            else { std::cout << comma::join( istream.ascii().last(), csv.delimiter ) << std::endl; }
+
+            if( csv.flush ) { std::cout.flush(); }
+        }
         return 0;
     }
 };
 
-template < typename T, std::size_t D, typename F > static int run_with_dim( const std::vector< double >& origin
+template < typename T, std::size_t D, typename F > static int run_with_dim( const comma::csv::options& csv
+                                                                          , const comma::csv::options& lut_csv
+                                                                          , const std::vector< double >& origin
                                                                           , const std::vector< double >& resolution
                                                                           , const std::vector< std::size_t >& shape
-                                                                          , const comma::csv::options& lut_csv
                                                                           , F&& f )
 {
     switch( lut_csv.format().count() )
     {
-        case 1: return lut< T, D, 1 >::run( origin, resolution, shape, lut_csv, f );
-        case 2: return lut< T, D, 2 >::run( origin, resolution, shape, lut_csv, f );
-        case 3: return lut< T, D, 3 >::run( origin, resolution, shape, lut_csv, f );
-        case 4: return lut< T, D, 4 >::run( origin, resolution, shape, lut_csv, f );
+        case 1: return lut< T, D, 1 >::run( csv, lut_csv, origin, resolution, shape, f );
+        case 2: return lut< T, D, 2 >::run( csv, lut_csv, origin, resolution, shape, f );
+        case 3: return lut< T, D, 3 >::run( csv, lut_csv, origin, resolution, shape, f );
+        case 4: return lut< T, D, 4 >::run( csv, lut_csv, origin, resolution, shape, f );
         default: COMMA_THROW( comma::exception, "up to 4-dimensional lookup table values currently supported; got: " << lut_csv.format().count() << " dimensions in " << lut_csv.format().string() );
     }
     return 1;
 }
 
-template < typename T, typename F > static int run_as( const std::vector< double >& origin
+template < typename T, typename F > static int run_as( const comma::csv::options& csv
+                                                     , const comma::csv::options& lut_csv
+                                                     , const std::vector< double >& origin
                                                      , const std::vector< double >& resolution
                                                      , const std::vector< std::size_t >& shape
-                                                     , const comma::csv::options& lut_csv
                                                      , F&& f )
 {
     switch( origin.size() )
     {
-        case 1: return run_with_dim< T, 1 >( origin, resolution, shape, lut_csv, f );
-        case 2: return run_with_dim< T, 2 >( origin, resolution, shape, lut_csv, f );
-        case 3: return run_with_dim< T, 3 >( origin, resolution, shape, lut_csv, f );
-        case 4: return run_with_dim< T, 4 >( origin, resolution, shape, lut_csv, f );
+        case 1: return run_with_dim< T, 1 >( csv, lut_csv, origin, resolution, shape, f );
+        case 2: return run_with_dim< T, 2 >( csv, lut_csv, origin, resolution, shape, f );
+        case 3: return run_with_dim< T, 3 >( csv, lut_csv, origin, resolution, shape, f );
+        case 4: return run_with_dim< T, 4 >( csv, lut_csv, origin, resolution, shape, f );
         default: COMMA_THROW( comma::exception, "up to 4-dimensional lookup tables currently supported; got: " << origin.size() << " dimensions" );
     }
     return 1;
@@ -146,8 +165,8 @@ static int interpolate( const comma::command_line_options& options, const csv::o
     COMMA_ASSERT_BRIEF( origin.size() == shape.size(), "expected --origin and --shape of the same dimensions; got: " << origin.size() << " and " << shape.size() );
     switch( lut_csv.format().elements()[0].type ) // todo! quick and dirty
     {
-        case comma::csv::format::float_t: return comma::applications::lookup::operations::run_as< float >( origin, resolution, shape, lut_csv, nullptr );
-        case comma::csv::format::double_t: return comma::applications::lookup::operations::run_as< double >( origin, resolution, shape, lut_csv, nullptr );
+        case comma::csv::format::float_t: return comma::applications::lookup::operations::run_as< float >( csv, lut_csv, origin, resolution, shape, nullptr );
+        case comma::csv::format::double_t: return comma::applications::lookup::operations::run_as< double >( csv, lut_csv, origin, resolution, shape, nullptr );
         default: COMMA_THROW( comma::exception, "only float and double as lookup table values are supported; got: '" << unnamed[1] << "'" );
     }
     return 1;
diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
index f156c222d..ae1739184 100644
--- a/containers/multidimensional/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -127,6 +127,7 @@ template <> struct operations< 1 >
     template < typename S > static auto product( const S& s ) -> typename std::remove_reference< decltype( s[0] ) >::type { return s[0]; }
     template < typename S, typename T, typename Diff > static bool near( const S& s, const T& t, const Diff& epsilon ) { return comma::math::equal( s[0], t[0], epsilon ); }
     template < typename S > static S& fill( S&s, double value ) { s[0] = value; return s; }
+    template < typename S > static S zero() { S s; fill( s, 0 ); return s; }
     template < typename S, typename I > static I& index_of( I& i, const S& p, const S& origin, const S& resolution ) { i[0] = index( p[0], origin[0], resolution[0] ); return i; }
     template < typename S, typename I > static I nearest( const S& p, const S& origin, const S& resolution ) { return p[0] - origin[0] < resolution[0] / 2 ? I{ 0 } : I{ 1 }; }
 };

From f412ed09a49341fcf1d3fe0286de8ee338102308 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 18:07:36 +1000
Subject: [PATCH 0615/1056] math-lookup: operation functors implemented; in
 progress...

---
 containers/applications/math-lookup.cpp | 24 ++++++++++++++++++++++++
 containers/multidimensional/array.h     | 11 +++++++++++
 2 files changed, 35 insertions(+)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index fe25e09ac..7cb45315e 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -69,6 +69,30 @@ struct lut
         return g;
     }
 
+    static std::pair< index_t, value_t > nearest( const grid_t& g, const point_t& p )
+    {
+        std::pair< index_t, value_t > r;
+        r.first = g.nearest_to( p );
+        r.second = g[r.first];
+        return r;
+    }
+
+    static std::pair< index_t, value_t > query( const grid_t& g, const point_t& p )
+    {
+        std::pair< index_t, value_t > r;
+        r.first = g.index_of( p );
+        r.second = g[r.first];
+        return r;
+    }
+
+    static std::pair< index_t, value_t > interpolate( const grid_t& g, const point_t& p )
+    {
+        std::pair< index_t, value_t > r;
+        r.first = g.index_of( p );
+        r.second = g.interpolated( p );
+        return r;
+    }
+
     template < typename F > static int run( const comma::csv::options& csv
                                           , const comma::csv::options& lut_csv
                                           , const std::vector< double >& origin
diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index f5d7c53bb..cde76d9bc 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -185,6 +185,8 @@ class grid: public array< V, D, S >
 
         V interpolated( const point_type& point ) const; // todo: flag/enum or alike for different interpolation types; currently linear only
 
+        index_type nearest_to( const point_type& point ) const;
+
     private:
         point_type _origin;
         point_type _resolution;
@@ -266,4 +268,13 @@ V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
     return v;
 }
 
+template < typename V, unsigned int D, typename P, typename Traits, typename S >
+typename grid< V, D, P, Traits, S >::index_type grid< V, D, P, Traits, S >::nearest_to( const P& point ) const
+{
+    P element_origin = _resolution;
+    index_type i = index_of( point );
+    Traits::add( Traits::vmultiply( element_origin, i ), _origin );
+    return Traits::add( Traits::nearest( point, element_origin, resolution ), i );
+}
+
 } } } // namespace comma { namespace containers { namespace multidimensional {

From 333cc1d9ac74d99d34e5fb19dd9a1c86f890a4e6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 9 Jun 2023 11:02:40 +1000
Subject: [PATCH 0616/1056] csv: read_as: inlined; method with default values
 added

---
 csv/stream.h | 20 ++++++++++++++------
 1 file changed, 14 insertions(+), 6 deletions(-)

diff --git a/csv/stream.h b/csv/stream.h
index 7400ac4f7..b432fb653 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -40,6 +40,8 @@ template < typename S > class passed;
 /// convenience functions: read input stream into a container that has push_back() method
 template < typename V > V read_as( std::istream& is, const options& o = options() );
 template < typename V > V read_as( const std::string& filename, const options& o = options() );
+template < typename V > V read_as( std::istream& is, const options& o, const typename V::value_type& default_value );
+template < typename V > V read_as( const std::string& filename, const options& o, const typename V::value_type& default_value );
 
 /// ascii csv input stream
 template < typename S >
@@ -493,7 +495,8 @@ inline void passed< S >::write()
     {
         if( is_stdout_ )
         {
-            ::write( 1, is_.binary().last(), is_.binary().size() );
+            auto r = ::write( 1, is_.binary().last(), is_.binary().size() );
+            ( void ) r;
             if( flush ) { ::fflush( stdout ); }
         }
         else
@@ -518,7 +521,8 @@ inline void passed< S >::write( const S& s )
         is_.binary().binary().put( s, &buffer_[0] );
         if( is_stdout_ )
         {
-            ::write( 1, &buffer_[0], is_.binary().size() );
+            auto r = ::write( 1, &buffer_[0], is_.binary().size() );
+            ( void ) r;
             if( flush ) { ::fflush( stdout ); }
         }
         else
@@ -830,9 +834,9 @@ inline void output_stream< S >::append_output( input_stream< T >& is, const S& s
     }
 }*/
 
-template < typename V > V read_as( std::istream& is, const options& o )
+template < typename V > inline V read_as( std::istream& is, const options& o, const typename V::value_type& default_value )
 {
-    input_stream< typename V::value_type > istream( is, o );
+    input_stream< typename V::value_type > istream( is, o, default_value );
     V v;
     while( istream.ready() || is.good() )
     {
@@ -843,12 +847,16 @@ template < typename V > V read_as( std::istream& is, const options& o )
     return v;
 }
 
-template < typename V > V read_as( const std::string& filename, const options& o )
+template < typename V > inline V read_as( const std::string& filename, const options& o, const typename V::value_type& default_value )
 {
     std::ifstream ifs;
     ifs.open( &filename[0], o.binary() ? std::ios_base::in | std::ios_base::binary : std::ios_base::in );
-    if( ifs.is_open() ) { return read_as< V >( ifs, o ); }
+    if( ifs.is_open() ) { return read_as< V >( ifs, o, default_value ); }
     COMMA_THROW( comma::exception, "failed to open '" << filename << "'" );
 }
 
+template < typename V > inline V read_as( const std::string& filename, const options& o ) { return read_as< V >( filename, o, V::value_type() ); }
+
+template < typename V > inline V read_as( std::istream& is, const options& o ) { return read_as< V >( is, o, V::value_type() ); }
+
 } } // namespace comma { namespace csv {

From c2831600f672f20240569f7994ec10579492d0e1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 9 Jun 2023 11:13:43 +1000
Subject: [PATCH 0617/1056] csv::read_as: typo fixed

---
 csv/stream.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/csv/stream.h b/csv/stream.h
index b432fb653..a3de56dab 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -855,8 +855,8 @@ template < typename V > inline V read_as( const std::string& filename, const opt
     COMMA_THROW( comma::exception, "failed to open '" << filename << "'" );
 }
 
-template < typename V > inline V read_as( const std::string& filename, const options& o ) { return read_as< V >( filename, o, V::value_type() ); }
+template < typename V > inline V read_as( const std::string& filename, const options& o ) { return read_as< V >( filename, o, typename V::value_type() ); }
 
-template < typename V > inline V read_as( std::istream& is, const options& o ) { return read_as< V >( is, o, V::value_type() ); }
+template < typename V > inline V read_as( std::istream& is, const options& o ) { return read_as< V >( is, o, typename V::value_type() ); }
 
 } } // namespace comma { namespace csv {

From 268cae85053d817288426930bbcf2664dfd40c0e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 9 Jun 2023 16:21:11 +1000
Subject: [PATCH 0618/1056] csv::read_as( csv::options ) added

---
 csv/stream.h | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/csv/stream.h b/csv/stream.h
index a3de56dab..37403ff71 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -38,6 +38,7 @@ template < typename S, typename T > class tied;
 template < typename S > class passed;
 
 /// convenience functions: read input stream into a container that has push_back() method
+template < typename V > V read_as( const options& o, const typename V::value_type& default_value = typename V::value_type() );
 template < typename V > V read_as( std::istream& is, const options& o = options() );
 template < typename V > V read_as( const std::string& filename, const options& o = options() );
 template < typename V > V read_as( std::istream& is, const options& o, const typename V::value_type& default_value );
@@ -859,4 +860,6 @@ template < typename V > inline V read_as( const std::string& filename, const opt
 
 template < typename V > inline V read_as( std::istream& is, const options& o ) { return read_as< V >( is, o, typename V::value_type() ); }
 
+template < typename V > inline V read_as( const options& o, const typename V::value_type& default_value ) { return read_as< V >( o.filename, o, default_value ); }
+
 } } // namespace comma { namespace csv {

From 285987df7703ca9232f1fe506445133affedbd76 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 8 Jun 2023 19:20:55 +1000
Subject: [PATCH 0619/1056] math-lookup: mainly plumbed through; todo: 1-dim
 support; nearest operation; --help; regression test; in progress...

---
 containers/applications/math-lookup.cpp | 131 ++++++++++++------------
 containers/multidimensional/array.h     |   2 +-
 2 files changed, 68 insertions(+), 65 deletions(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index 7cb45315e..cb139c2f5 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -43,6 +43,25 @@ void usage( bool verbose )
     exit( 0 );
 }
 
+// todo
+// - 1-dimensional: fix
+// - array operators: fix
+// - nearest: fix
+// ! --help
+// - regression test: basics
+
+template< typename T, std::size_t D, typename S >
+std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { COMMA_THROW( comma::exception, "todo" ); }
+
+template< typename T, std::size_t D, typename S >
+std::array< T, D > operator*( const std::array< T, D >& lhs, const S& rhs ) { COMMA_THROW( comma::exception, "todo" ); }
+
+template< typename T, std::size_t D >
+std::array< T, D >& operator+=( std::array< T, D >& lhs, const std::array< T, D >& rhs ) { COMMA_THROW( comma::exception, "todo" ); }
+
+template< typename T, std::size_t D >
+std::array< T, D > operator+( const std::array< T, D >& lhs, const std::array< T, D >& rhs ) { COMMA_THROW( comma::exception, "todo" ); }
+
 namespace comma { namespace applications { namespace lookup { namespace operations {
 
 template< typename T, std::size_t D >
@@ -69,95 +88,96 @@ struct lut
         return g;
     }
 
-    static std::pair< index_t, value_t > nearest( const grid_t& g, const point_t& p )
+    static std::pair< index_t, value_t > interpolate( const grid_t& g, const point_t& p )
     {
         std::pair< index_t, value_t > r;
-        r.first = g.nearest_to( p );
-        r.second = g[r.first];
+        r.first = g.index_of( p );
+        r.second = g.interpolated( p );
         return r;
     }
 
-    static std::pair< index_t, value_t > query( const grid_t& g, const point_t& p )
+    static std::pair< index_t, value_t > nearest( const grid_t& g, const point_t& p )
     {
         std::pair< index_t, value_t > r;
-        r.first = g.index_of( p );
+        r.first = g.nearest_to( p );
         r.second = g[r.first];
         return r;
     }
 
-    static std::pair< index_t, value_t > interpolate( const grid_t& g, const point_t& p )
+    static std::pair< index_t, value_t > query( const grid_t& g, const point_t& p )
     {
         std::pair< index_t, value_t > r;
         r.first = g.index_of( p );
-        r.second = g.interpolated( p );
+        r.second = g[r.first];
         return r;
     }
 
-    template < typename F > static int run( const comma::csv::options& csv
-                                          , const comma::csv::options& lut_csv
-                                          , const std::vector< double >& origin
-                                          , const std::vector< double >& resolution
-                                          , const std::vector< std::size_t >& shape                                          
-                                          , F&& f )
+    static int run( const std::string& operation
+                  , const comma::csv::options& csv
+                  , const comma::csv::options& lut_csv
+                  , const std::vector< double >& origin
+                  , const std::vector< double >& resolution
+                  , const std::vector< std::size_t >& shape )
     {
+        std::pair< index_t, value_t > ( *f )( const grid_t&, const point_t& );
+        if( operation == "interpolate" ) { f = lut< T, D, E >::interpolate; }
+        //else if( operation == "nearest" ) { f = lut< T, D, E >::nearest; }
+        else if( operation == "query" ) { f = lut< T, D, E >::query; }
+        else { COMMA_THROW_BRIEF( comma::exception, "expected operation; got: '" << operation << "'" ); }
         point_t o, r;
         index_t s;
-        std::memcpy( &o[0], &origin[0], D * sizeof( double ) );
-        std::memcpy( &r[0], &resolution[0], D * sizeof( double ) );
-        std::memcpy( &s[0], &shape[0], D * sizeof( std::size_t ) );
+        std::memcpy( &o[0], &origin[0], D * sizeof( double ) ); // quick and dirty
+        std::memcpy( &r[0], &resolution[0], D * sizeof( double ) ); // quick and dirty
+        std::memcpy( &s[0], &shape[0], D * sizeof( std::size_t ) ); // quick and dirty
         grid_t grid( o, r, s );
         load( grid, lut_csv );
         input_t zero;
         std::memset( &zero.point[0], 0, zero.point.size() * sizeof( T ) );
         comma::csv::input_stream< input_t > istream( std::cin, csv, zero );
-        // todo! ostream and tied? or just do it by hand for now?
+        comma::csv::output_stream< std::pair< index_t, value_t > > ostream( std::cout, csv.binary() );
+        auto tied = comma::csv::tied( istream, ostream );
         while( istream.ready() || std::cin.good() )
         {
             const auto& p = istream.read();
             if( !p ) { break; }
-
-            // todo: process
-            // todo: output using tied; just a stub for debugging for now
-            if( csv.binary() ) { std::cout.write( istream.binary().last(), istream.binary().size() ); }
-            else { std::cout << comma::join( istream.ascii().last(), csv.delimiter ) << std::endl; }
-
+            tied.append( f( grid, p->point ) );
             if( csv.flush ) { std::cout.flush(); }
         }
         return 0;
     }
 };
 
-template < typename T, std::size_t D, typename F > static int run_with_dim( const comma::csv::options& csv
-                                                                          , const comma::csv::options& lut_csv
-                                                                          , const std::vector< double >& origin
-                                                                          , const std::vector< double >& resolution
-                                                                          , const std::vector< std::size_t >& shape
-                                                                          , F&& f )
+template < typename T, std::size_t D > static int run_with_dim( const std::string& operation
+                                                              , const comma::csv::options& csv
+                                                              , const comma::csv::options& lut_csv
+                                                              , const std::vector< double >& origin
+                                                              , const std::vector< double >& resolution
+                                                              , const std::vector< std::size_t >& shape )
 {
     switch( lut_csv.format().count() )
     {
-        case 1: return lut< T, D, 1 >::run( csv, lut_csv, origin, resolution, shape, f );
-        case 2: return lut< T, D, 2 >::run( csv, lut_csv, origin, resolution, shape, f );
-        case 3: return lut< T, D, 3 >::run( csv, lut_csv, origin, resolution, shape, f );
-        case 4: return lut< T, D, 4 >::run( csv, lut_csv, origin, resolution, shape, f );
+        case 1: return lut< T, D, 1 >::run( operation, csv, lut_csv, origin, resolution, shape );
+        case 2: return lut< T, D, 2 >::run( operation, csv, lut_csv, origin, resolution, shape );
+        case 3: return lut< T, D, 3 >::run( operation, csv, lut_csv, origin, resolution, shape );
+        case 4: return lut< T, D, 4 >::run( operation, csv, lut_csv, origin, resolution, shape );
         default: COMMA_THROW( comma::exception, "up to 4-dimensional lookup table values currently supported; got: " << lut_csv.format().count() << " dimensions in " << lut_csv.format().string() );
     }
     return 1;
 }
 
-template < typename T, typename F > static int run_as( const comma::csv::options& csv
-                                                     , const comma::csv::options& lut_csv
-                                                     , const std::vector< double >& origin
-                                                     , const std::vector< double >& resolution
-                                                     , const std::vector< std::size_t >& shape
-                                                     , F&& f )
+template < typename T > static int run_as( const std::string& operation
+                                         , const comma::csv::options& csv
+                                         , const comma::csv::options& lut_csv
+                                         , const std::vector< double >& origin
+                                         , const std::vector< double >& resolution
+                                         , const std::vector< std::size_t >& shape )
 {
     switch( origin.size() )
     {
-        case 1: return run_with_dim< T, 1 >( csv, lut_csv, origin, resolution, shape, f );
-        case 2: return run_with_dim< T, 2 >( csv, lut_csv, origin, resolution, shape, f );
-        case 3: return run_with_dim< T, 3 >( csv, lut_csv, origin, resolution, shape, f );
-        case 4: return run_with_dim< T, 4 >( csv, lut_csv, origin, resolution, shape, f );
+        // todo! case 1: return run_with_dim< T, 1 >( operation, csv, lut_csv, origin, resolution, shape );
+        case 2: return run_with_dim< T, 2 >( operation, csv, lut_csv, origin, resolution, shape );
+        case 3: return run_with_dim< T, 3 >( operation, csv, lut_csv, origin, resolution, shape );
+        case 4: return run_with_dim< T, 4 >( operation, csv, lut_csv, origin, resolution, shape );
         default: COMMA_THROW( comma::exception, "up to 4-dimensional lookup tables currently supported; got: " << origin.size() << " dimensions" );
     }
     return 1;
@@ -177,7 +197,7 @@ template < typename T, std::size_t D > struct traits< comma::applications::looku
 
 namespace comma { namespace applications { namespace lookup { namespace operations {
 
-static int interpolate( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )
+static int run( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )
 {
     COMMA_ASSERT_BRIEF( unnamed.size() > 1, "please specify lookup table file as: math-lookup <operation> <filename>" );
     auto lut_csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( unnamed[1] );
@@ -189,25 +209,13 @@ static int interpolate( const comma::command_line_options& options, const csv::o
     COMMA_ASSERT_BRIEF( origin.size() == shape.size(), "expected --origin and --shape of the same dimensions; got: " << origin.size() << " and " << shape.size() );
     switch( lut_csv.format().elements()[0].type ) // todo! quick and dirty
     {
-        case comma::csv::format::float_t: return comma::applications::lookup::operations::run_as< float >( csv, lut_csv, origin, resolution, shape, nullptr );
-        case comma::csv::format::double_t: return comma::applications::lookup::operations::run_as< double >( csv, lut_csv, origin, resolution, shape, nullptr );
+        case comma::csv::format::float_t: return comma::applications::lookup::operations::run_as< float >( unnamed[0], csv, lut_csv, origin, resolution, shape );
+        case comma::csv::format::double_t: return comma::applications::lookup::operations::run_as< double >( unnamed[0], csv, lut_csv, origin, resolution, shape );
         default: COMMA_THROW( comma::exception, "only float and double as lookup table values are supported; got: '" << unnamed[1] << "'" );
     }
     return 1;
 }
 
-static int nearest( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )
-{
-    comma::say() << "nearest: todo" << std::endl;
-    return 1;
-}
-
-static int query( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed )
-{
-    comma::say() << "query: todo" << std::endl;
-    return 1;
-}
-
 } } } } // namespace comma { namespace applications { namespace lookup { namespace operations {
 
 int main( int ac, char** av )
@@ -218,12 +226,7 @@ int main( int ac, char** av )
         comma::csv::options csv( options );
         const auto& unnamed = options.unnamed( "--flush,--verbose,-v", "-.*" );
         if( unnamed.empty() ) { comma::say() << "please specify operation" << std::endl; return 1; }
-        std::string operation = unnamed[0];
-        if( operation == "interpolate" ) { return comma::applications::lookup::operations::interpolate( options, csv, unnamed ); }
-        if( operation == "nearest" ) { return comma::applications::lookup::operations::nearest( options, csv, unnamed ); }
-        if( operation == "query" ) { return comma::applications::lookup::operations::query( options, csv, unnamed ); }
-        comma::say() << "expected operation; got: '" << operation << "'" << std::endl;
-        return 1;
+        return comma::applications::lookup::operations::run( options, csv, unnamed );
     }
     catch( std::exception& ex ) { comma::say() << "caught exception: " << ex.what() << std::endl; }
     catch( ... ) { comma::say() << "caught unknown exception" << std::endl; }
diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index cde76d9bc..2448bc0cb 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -274,7 +274,7 @@ typename grid< V, D, P, Traits, S >::index_type grid< V, D, P, Traits, S >::near
     P element_origin = _resolution;
     index_type i = index_of( point );
     Traits::add( Traits::vmultiply( element_origin, i ), _origin );
-    return Traits::add( Traits::nearest( point, element_origin, resolution ), i );
+    return Traits::add( Traits::template nearest< index_type >( point, const_cast< const P& >( element_origin ), _resolution ), i );
 }
 
 } } } // namespace comma { namespace containers { namespace multidimensional {

From a11ef893543107f3911f4be17dc8f1f1c5f27729 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 9 Jun 2023 19:37:34 +1000
Subject: [PATCH 0620/1056] math-lookup: --help added

---
 containers/applications/math-lookup.cpp | 29 ++++++++++++++-----------
 1 file changed, 16 insertions(+), 13 deletions(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index cb139c2f5..350cc02c6 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -16,26 +16,29 @@
 void usage( bool verbose )
 {
     std::cerr << "operations on a multidimensional lookup table" << std::endl;
+    std::cerr << "up to 4-dimension lookup tables with up to 4-dimension" << std::endl;
+    std::cerr << "values are currently supported; if you need more, just ask" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "usage: cat input.csv | math-lookup <operation> <options>" << std::endl;
+    std::cerr << "usage: cat input.csv | math-lookup <operation> [<lut-filename>] <options>" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
-    std::cerr << "    interpolate: output interpolated value for the given input" << std::endl;
+    std::cerr << "    index: todo: output index for a given input" << std::endl;
+    std::cerr << "    interpolate: todo: output interpolated value for the given input" << std::endl;
     std::cerr << "    nearest: todo: output table element index and value nearest to the given input" << std::endl;
     std::cerr << "    query: todo: output table element index and value for the given input" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "operations" << std::endl;
-    std::cerr << "    interpolate" << std::endl;
-    std::cerr << "        todo" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    nearest" << std::endl;
-    std::cerr << "        todo" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    query" << std::endl;
-    std::cerr << "        todo" << std::endl;
-    std::cerr << std::endl;
     std::cerr << "options" << std::endl;
-    std::cerr << "    todo" << std::endl;
+    std::cerr << "    --origin,-o=<point>; e.g: --origin=0,1,2,3" << std::endl;
+    std::cerr << "    --resolution,-r=<point>; e.g: --resolution=0.5,3,2,3" << std::endl;
+    std::cerr << "    --shape=<point>; e.g: --shape=3,2,5,3, same as in numpy" << std::endl;
+    std::cerr << "                     i.e. shape[0] is the slowest-changing" << std::endl;
+    std::cerr << "                     i.e. expected lookup table memory layout" << std::endl;
+    std::cerr << "                     is rows first" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "input/output options" << std::endl;
+    std::cerr << "    --input-fields; todo: print input fields for an operation to stdout and exit" << std::endl;
+    std::cerr << "    --output-fields; todo: print output fields for an operation to stdout and exit" << std::endl;
+    std::cerr << "    --output-format; todo: print output format for an operation to stdout and exit" << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options" << std::endl;
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;

From 97b01a69ae00bd22d704a7b1fcaa53a99278df04 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 10 Jun 2023 13:48:20 +1000
Subject: [PATCH 0621/1056] csv::read_as(): optional size parameter added

---
 csv/stream.h | 24 ++++++++++++------------
 1 file changed, 12 insertions(+), 12 deletions(-)

diff --git a/csv/stream.h b/csv/stream.h
index 37403ff71..d88776cc5 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -38,11 +38,11 @@ template < typename S, typename T > class tied;
 template < typename S > class passed;
 
 /// convenience functions: read input stream into a container that has push_back() method
-template < typename V > V read_as( const options& o, const typename V::value_type& default_value = typename V::value_type() );
-template < typename V > V read_as( std::istream& is, const options& o = options() );
-template < typename V > V read_as( const std::string& filename, const options& o = options() );
-template < typename V > V read_as( std::istream& is, const options& o, const typename V::value_type& default_value );
-template < typename V > V read_as( const std::string& filename, const options& o, const typename V::value_type& default_value );
+template < typename V > V read_as( const options& o, const typename V::value_type& default_value = typename V::value_type(), std::size_t size = 0 );
+template < typename V > V read_as( std::istream& is, const options& o = options(), std::size_t size = 0 );
+template < typename V > V read_as( const std::string& filename, const options& o = options(), std::size_t size = 0 );
+template < typename V > V read_as( std::istream& is, const options& o, const typename V::value_type& default_value, std::size_t size = 0 );
+template < typename V > V read_as( const std::string& filename, const options& o, const typename V::value_type& default_value, std::size_t size = 0 );
 
 /// ascii csv input stream
 template < typename S >
@@ -835,11 +835,11 @@ inline void output_stream< S >::append_output( input_stream< T >& is, const S& s
     }
 }*/
 
-template < typename V > inline V read_as( std::istream& is, const options& o, const typename V::value_type& default_value )
+template < typename V > inline V read_as( std::istream& is, const options& o, const typename V::value_type& default_value, std::size_t size )
 {
     input_stream< typename V::value_type > istream( is, o, default_value );
     V v;
-    while( istream.ready() || is.good() )
+    for( std::size_t count{0}; ( size == 0 || count < size ) && ( istream.ready() || is.good() ); ++count )
     {
         auto p = istream.read();
         if( !p ) { break; }
@@ -848,18 +848,18 @@ template < typename V > inline V read_as( std::istream& is, const options& o, co
     return v;
 }
 
-template < typename V > inline V read_as( const std::string& filename, const options& o, const typename V::value_type& default_value )
+template < typename V > inline V read_as( const std::string& filename, const options& o, const typename V::value_type& default_value, std::size_t size )
 {
     std::ifstream ifs;
     ifs.open( &filename[0], o.binary() ? std::ios_base::in | std::ios_base::binary : std::ios_base::in );
-    if( ifs.is_open() ) { return read_as< V >( ifs, o, default_value ); }
+    if( ifs.is_open() ) { return read_as< V >( ifs, o, default_value, size ); }
     COMMA_THROW( comma::exception, "failed to open '" << filename << "'" );
 }
 
-template < typename V > inline V read_as( const std::string& filename, const options& o ) { return read_as< V >( filename, o, typename V::value_type() ); }
+template < typename V > inline V read_as( const std::string& filename, const options& o, std::size_t size ) { return read_as< V >( filename, o, typename V::value_type(), size ); }
 
-template < typename V > inline V read_as( std::istream& is, const options& o ) { return read_as< V >( is, o, typename V::value_type() ); }
+template < typename V > inline V read_as( std::istream& is, const options& o, std::size_t size ) { return read_as< V >( is, o, typename V::value_type(), size ); }
 
-template < typename V > inline V read_as( const options& o, const typename V::value_type& default_value ) { return read_as< V >( o.filename, o, default_value ); }
+template < typename V > inline V read_as( const options& o, const typename V::value_type& default_value, std::size_t size ) { return read_as< V >( o.filename, o, default_value, size ); }
 
 } } // namespace comma { namespace csv {

From da10a044816627646e099853f157fb5e8afa355a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Jun 2023 10:32:50 +1000
Subject: [PATCH 0622/1056] math-lookup: trivial compilation error fixed

---
 containers/applications/math-lookup.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index 350cc02c6..291934669 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -138,7 +138,7 @@ struct lut
         std::memset( &zero.point[0], 0, zero.point.size() * sizeof( T ) );
         comma::csv::input_stream< input_t > istream( std::cin, csv, zero );
         comma::csv::output_stream< std::pair< index_t, value_t > > ostream( std::cout, csv.binary() );
-        auto tied = comma::csv::tied( istream, ostream );
+        auto tied = comma::csv::make_tied( istream, ostream );
         while( istream.ready() || std::cin.good() )
         {
             const auto& p = istream.read();

From e281d41e176edccef2f5b41822d0d72c6a69075b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Jun 2023 12:06:24 +1000
Subject: [PATCH 0623/1056] math-lookup: --help improved

---
 containers/applications/math-lookup.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index 291934669..1cd2bc18a 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -19,7 +19,7 @@ void usage( bool verbose )
     std::cerr << "up to 4-dimension lookup tables with up to 4-dimension" << std::endl;
     std::cerr << "values are currently supported; if you need more, just ask" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "usage: cat input.csv | math-lookup <operation> [<lut-filename>] <options>" << std::endl;
+    std::cerr << "usage: cat input.csv | math-lookup <operation> [<lut-filename>[;<lut-csv-options>]] <options>" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
     std::cerr << "    index: todo: output index for a given input" << std::endl;
@@ -204,7 +204,7 @@ static int run( const comma::command_line_options& options, const csv::options&
 {
     COMMA_ASSERT_BRIEF( unnamed.size() > 1, "please specify lookup table file as: math-lookup <operation> <filename>" );
     auto lut_csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( unnamed[1] );
-    COMMA_ASSERT_BRIEF( csv.binary(), "lookup table: on file '" << lut_csv.filename << "': only binary files are currently supported" );
+    COMMA_ASSERT_BRIEF( csv.binary(), "lookup table: on file '" << lut_csv.filename << "': only binary files are currently supported, e.g: 'lut.bin;binary=3f'" );
     const auto& origin = comma::split_as< double >( options.value< std::string >( "--origin,-o" ), ',' );
     const auto& resolution = comma::split_as< double >( options.value< std::string >( "--resolution,-r" ), ',' );
     const auto& shape = comma::split_as< std::size_t >( options.value< std::string >( "--shape" ), ',' );

From 3648031366d12456706a168f6e5675c74bfcd11b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Jun 2023 12:16:10 +1000
Subject: [PATCH 0624/1056] math-lookup: trivial typo fixed

---
 containers/applications/math-lookup.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index 1cd2bc18a..7aa68c71f 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -204,7 +204,7 @@ static int run( const comma::command_line_options& options, const csv::options&
 {
     COMMA_ASSERT_BRIEF( unnamed.size() > 1, "please specify lookup table file as: math-lookup <operation> <filename>" );
     auto lut_csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( unnamed[1] );
-    COMMA_ASSERT_BRIEF( csv.binary(), "lookup table: on file '" << lut_csv.filename << "': only binary files are currently supported, e.g: 'lut.bin;binary=3f'" );
+    COMMA_ASSERT_BRIEF( lut_csv.binary(), "lookup table: on file '" << lut_csv.filename << "': only binary files are currently supported, e.g: 'lut.bin;binary=3f'" );
     const auto& origin = comma::split_as< double >( options.value< std::string >( "--origin,-o" ), ',' );
     const auto& resolution = comma::split_as< double >( options.value< std::string >( "--resolution,-r" ), ',' );
     const auto& shape = comma::split_as< std::size_t >( options.value< std::string >( "--shape" ), ',' );

From 8ef74d7ed82c83a60d624c8355b0a573da3bb652 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Jun 2023 12:23:57 +1000
Subject: [PATCH 0625/1056] math-lookup: array operators implemented

---
 containers/applications/math-lookup.cpp | 16 +++++++---------
 1 file changed, 7 insertions(+), 9 deletions(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index 7aa68c71f..363f4fbd4 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -23,9 +23,9 @@ void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
     std::cerr << "    index: todo: output index for a given input" << std::endl;
-    std::cerr << "    interpolate: todo: output interpolated value for the given input" << std::endl;
+    std::cerr << "    interpolate: output interpolated value for the given input" << std::endl;
     std::cerr << "    nearest: todo: output table element index and value nearest to the given input" << std::endl;
-    std::cerr << "    query: todo: output table element index and value for the given input" << std::endl;
+    std::cerr << "    query: output table element index and value for the given input" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --origin,-o=<point>; e.g: --origin=0,1,2,3" << std::endl;
@@ -48,22 +48,20 @@ void usage( bool verbose )
 
 // todo
 // - 1-dimensional: fix
-// - array operators: fix
 // - nearest: fix
-// ! --help
 // - regression test: basics
 
 template< typename T, std::size_t D, typename S >
-std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { COMMA_THROW( comma::exception, "todo" ); }
+std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] *= rhs; } return lhs; } // quick and dirty; let compiler optimize
 
 template< typename T, std::size_t D, typename S >
-std::array< T, D > operator*( const std::array< T, D >& lhs, const S& rhs ) { COMMA_THROW( comma::exception, "todo" ); }
+std::array< T, D > operator*( const std::array< T, D >& lhs, const S& rhs ) { auto r = lhs; r *= rhs; return r; }
 
 template< typename T, std::size_t D >
-std::array< T, D >& operator+=( std::array< T, D >& lhs, const std::array< T, D >& rhs ) { COMMA_THROW( comma::exception, "todo" ); }
+std::array< T, D >& operator+=( std::array< T, D >& lhs, const std::array< T, D >& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] += rhs[i]; } return lhs; } // quick and dirty; let compiler optimize
 
 template< typename T, std::size_t D >
-std::array< T, D > operator+( const std::array< T, D >& lhs, const std::array< T, D >& rhs ) { COMMA_THROW( comma::exception, "todo" ); }
+std::array< T, D > operator+( const std::array< T, D >& lhs, const std::array< T, D >& rhs ) { auto r = lhs; r += rhs; return r; }
 
 namespace comma { namespace applications { namespace lookup { namespace operations {
 
@@ -124,7 +122,7 @@ struct lut
     {
         std::pair< index_t, value_t > ( *f )( const grid_t&, const point_t& );
         if( operation == "interpolate" ) { f = lut< T, D, E >::interpolate; }
-        //else if( operation == "nearest" ) { f = lut< T, D, E >::nearest; }
+        else if( operation == "nearest" ) { COMMA_THROW_BRIEF( comma::exception, "nearest: todo" ); } //else if( operation == "nearest" ) { f = lut< T, D, E >::nearest; }
         else if( operation == "query" ) { f = lut< T, D, E >::query; }
         else { COMMA_THROW_BRIEF( comma::exception, "expected operation; got: '" << operation << "'" ); }
         point_t o, r;

From 1f86b7855eb2528693c32e9423a99375feccba26 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Jun 2023 14:11:36 +1000
Subject: [PATCH 0626/1056] containers::multidimensional::grid::has() method
 added

---
 containers/multidimensional/array.h | 14 ++++++++++++--
 1 file changed, 12 insertions(+), 2 deletions(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index 2448bc0cb..00d9ce507 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -95,7 +95,7 @@ class slice
 
         const_iterator end() const { return const_iterator( _size, _data + _size, _shape ); }
 
-    private:
+    protected:
         index_type _shape;
         std::size_t _size;
         V* _data;
@@ -152,7 +152,7 @@ class array
 
         const_iterator end() const { return _slice.end(); }
 
-    private:
+    protected:
         storage_type _data;
         slice_type _slice;
 };
@@ -187,6 +187,8 @@ class grid: public array< V, D, S >
 
         index_type nearest_to( const point_type& point ) const;
 
+        bool has( const point_type& point ) const;
+
     private:
         point_type _origin;
         point_type _resolution;
@@ -277,4 +279,12 @@ typename grid< V, D, P, Traits, S >::index_type grid< V, D, P, Traits, S >::near
     return Traits::add( Traits::template nearest< index_type >( point, const_cast< const P& >( element_origin ), _resolution ), i );
 }
 
+template < typename V, unsigned int D, typename P, typename Traits, typename S >
+inline bool grid< V, D, P, Traits, S >::has( const P& point ) const // quick and dirty for now
+{
+    const auto& i = index_of( point );
+    for( unsigned int k = 0; k < D; ++k ) { if( i[k] < 0 || i[k] >= this->shape()[k] ) { return false; } }
+    return true;
+}
+
 } } } // namespace comma { namespace containers { namespace multidimensional {

From 55b2b67328c55a8f845cb0e42abb3b1d85b396e1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Jun 2023 14:11:59 +1000
Subject: [PATCH 0627/1056] math-lookup: interpolate: mostly works; todo:
 corner cases, unit test

---
 containers/applications/math-lookup.cpp | 17 ++++++++++++++++-
 1 file changed, 16 insertions(+), 1 deletion(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index 363f4fbd4..ee6fe720b 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -39,6 +39,7 @@ void usage( bool verbose )
     std::cerr << "    --input-fields; todo: print input fields for an operation to stdout and exit" << std::endl;
     std::cerr << "    --output-fields; todo: print output fields for an operation to stdout and exit" << std::endl;
     std::cerr << "    --output-format; todo: print output format for an operation to stdout and exit" << std::endl;
+    std::cerr << "    --permissive; discard inputs outside lookup table" << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options" << std::endl;
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
@@ -51,6 +52,9 @@ void usage( bool verbose )
 // - nearest: fix
 // - regression test: basics
 
+static bool permissive{false};
+static bool verbose{false};
+
 template< typename T, std::size_t D, typename S >
 std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] *= rhs; } return lhs; } // quick and dirty; let compiler optimize
 
@@ -63,6 +67,9 @@ std::array< T, D >& operator+=( std::array< T, D >& lhs, const std::array< T, D
 template< typename T, std::size_t D >
 std::array< T, D > operator+( const std::array< T, D >& lhs, const std::array< T, D >& rhs ) { auto r = lhs; r += rhs; return r; }
 
+template< typename T, std::size_t D >
+std::ostream& operator<<( std::ostream& os, const std::array< T, D >& rhs ) { std::string d; for( unsigned int i = 0; i < D; ++i ) { os << d << rhs[i]; d = ","; } return os; }
+
 namespace comma { namespace applications { namespace lookup { namespace operations {
 
 template< typename T, std::size_t D >
@@ -141,6 +148,12 @@ struct lut
         {
             const auto& p = istream.read();
             if( !p ) { break; }
+            if( !grid.has( p->point ) ) 
+            {
+                if( permissive ) { comma::saymore() << "discarded input outside grid: " << p->point << std::endl; continue; }
+                comma::say() << "input outside grid: " << p->point << "; use --permissive to discard" << std::endl;
+                return 1;
+            }
             tied.append( f( grid, p->point ) );
             if( csv.flush ) { std::cout.flush(); }
         }
@@ -225,8 +238,10 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         comma::csv::options csv( options );
-        const auto& unnamed = options.unnamed( "--flush,--verbose,-v", "-.*" );
+        const auto& unnamed = options.unnamed( "--flush,--permissive,--verbose,-v", "-.*" );
         if( unnamed.empty() ) { comma::say() << "please specify operation" << std::endl; return 1; }
+        permissive = options.exists( "--permissive" );
+        verbose = options.exists( "--verbose,-v" );
         return comma::applications::lookup::operations::run( options, csv, unnamed );
     }
     catch( std::exception& ex ) { comma::say() << "caught exception: " << ex.what() << std::endl; }

From 489ce006e0b7f9f21d02d6b6e3b762df75c0a8cd Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 14 Jun 2023 15:28:18 +1000
Subject: [PATCH 0628/1056] name_value/ptree visitor: std::size_t used for
 std::array, boost::array traits since std::size_t and unsigned int are
 different types (std::size_t is unsigned long long)

---
 containers/multidimensional/map.h             | 28 +++++++++----------
 .../test/multidimensional_array_test.cpp      |  3 ++
 name_value/ptree.h                            |  4 +--
 3 files changed, 19 insertions(+), 16 deletions(-)

diff --git a/containers/multidimensional/map.h b/containers/multidimensional/map.h
index 5d4da6def..6742c5305 100644
--- a/containers/multidimensional/map.h
+++ b/containers/multidimensional/map.h
@@ -26,7 +26,7 @@ struct array_hash : public std::unary_function< Array, std::size_t >
 };
 
 /// unordered map with array-like keys
-template < typename K, typename V, unsigned int Size, typename P = std::array< K, Size >, typename Traits = impl::operations< Size > >
+template < typename K, typename V, std::size_t Size, typename P = std::array< K, Size >, typename Traits = impl::operations< Size > >
 class map : public std::unordered_map< std::array< comma::int32, Size >, V, array_hash< std::array< comma::int32, Size >, Size > >
 {
     public:
@@ -94,21 +94,21 @@ class map : public std::unordered_map< std::array< comma::int32, Size >, V, arra
         point_type _resolution;
 };
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline map< K, V, Size, P, Traits >::map( const typename map< K, V, Size, P, Traits >::point_type& origin, const typename map< K, V, Size, P, Traits >::point_type& resolution )
     : _origin( origin )
     , _resolution( resolution )
 {
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline map< K, V, Size, P, Traits >::map( const typename map< K, V, Size, P, Traits >::point_type& resolution )
     : _origin( Traits::template zero< P >() )
     , _resolution( resolution )
 {
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::iterator map< K, V, Size, P, Traits >::touch_at( const typename map< K, V, Size, P, Traits >::point_type& point )
 {
     key_type index = index_of( point );
@@ -117,60 +117,60 @@ inline typename map< K, V, Size, P, Traits >::iterator map< K, V, Size, P, Trait
     return this->base_type::insert( std::make_pair( index, mapped_type() ) ).first;
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline std::pair< typename map< K, V, Size, P, Traits >::iterator, bool > map< K, V, Size, P, Traits >::insert( const typename map< K, V, Size, P, Traits >::point_type& point, const typename map< K, V, Size, P, Traits >::mapped_type& value )
 {
     return this->base_type::insert( std::make_pair( index_of( point ), value ) );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::key_type map< K, V, Size, P, Traits >::index_of( const typename map< K, V, Size, P, Traits >::point_type& point, const typename map< K, V, Size, P, Traits >::point_type& origin, const typename map< K, V, Size, P, Traits >::point_type& resolution )
 {
     return Traits::template index_of< P, key_type >( point, origin, resolution );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::key_type map< K, V, Size, P, Traits >::index_of( const typename map< K, V, Size, P, Traits >::point_type& point, const typename map< K, V, Size, P, Traits >::point_type& resolution )
 {
     return index_of( point, Traits::template zero< P >(), resolution );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::key_type map< K, V, Size, P, Traits >::index_of( const typename map< K, V, Size, P, Traits >::point_type& point ) const
 {
     return index_of( point, _origin, _resolution );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::point_type& point )
 {
     index_type i = index_of( point );
     return this->base_type::find( i );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::const_iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::point_type& point ) const
 {
     index_type i = index_of( point );
     return this->base_type::find( i );
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::key_type& index )
 {
     return this->base_type::find( index ); // otherwise strange things happen... debug, when we have time
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline typename map< K, V, Size, P, Traits >::const_iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::key_type& index ) const
 {
     return this->base_type::find( index ); // otherwise strange things happen... debug, when we have time
 }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline const typename map< K, V, Size, P, Traits >::point_type& map< K, V, Size, P, Traits >::origin() const { return _origin; }
 
-template < typename K, typename V, unsigned int Size, typename P, typename Traits >
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
 inline const typename map< K, V, Size, P, Traits >::point_type& map< K, V, Size, P, Traits >::resolution() const { return _resolution; }
 
 } } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 603e2f9d4..391bf0086 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -193,6 +193,9 @@ TEST( multidimensional_array, grid_index )
         int i = 0;
         for( auto it = g.begin(); it != g.end(); ++it ) { *it = i++; }
         { index_t i = {0, 0}; EXPECT_EQ( g.index_of( {0, 0} ), i ); }
+        { index_t i = {0, 1}; EXPECT_EQ( g.index_of( {0, 1} ), i ); }
+        { index_t i = {1, 0}; EXPECT_EQ( g.index_of( {1, 0} ), i ); }
+        { index_t i = {1, 1}; EXPECT_EQ( g.index_of( {1, 1} ), i ); }
         { index_t i = {0, 1}; EXPECT_EQ( g.index_of( {0, 1.01} ), i ); }
         // todo: more tests
     }
diff --git a/name_value/ptree.h b/name_value/ptree.h
index 83d23a722..bef9c81e1 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -126,9 +126,9 @@ struct property_tree // quick and dirty
 
             template < typename K, typename T, typename A > void apply_next( const K& key, std::vector< T, A >& value ) { _apply_to_arraylike( key, value ); }
 
-            template < typename K, typename T, unsigned int Size > void apply_next( const K& key, boost::array< T, Size >& value ) { _apply_to_arraylike( key, value ); }
+            template < typename K, typename T, std::size_t Size > void apply_next( const K& key, boost::array< T, Size >& value ) { _apply_to_arraylike( key, value ); }
 
-            template < typename K, typename T, unsigned int Size > void apply_next( const K& key, std::array< T, Size >& value ) { _apply_to_arraylike( key, value ); }
+            template < typename K, typename T, std::size_t Size > void apply_next( const K& key, std::array< T, Size >& value ) { _apply_to_arraylike( key, value ); }
 
             /// apply to map
             template < typename K, typename L, typename T, typename A >

From 4354b4646849c646b41f93eaa3d280a1b236527c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 14 Jun 2023 16:17:52 +1000
Subject: [PATCH 0629/1056] name_value/test/ptree_test.cpp: test fixed

---
 name_value/test/ptree_test.cpp | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/name_value/test/ptree_test.cpp b/name_value/test/ptree_test.cpp
index 59c27d9ae..b619181ba 100644
--- a/name_value/test/ptree_test.cpp
+++ b/name_value/test/ptree_test.cpp
@@ -359,8 +359,11 @@ TEST( ptree, array )
         std::istringstream iss( s );
         property_tree::from_path_value( iss, ptree );
         from_ptree from_ptree( ptree );
-        boost::array< std::string, 3 > array;
-        try { visiting::apply( from_ptree, array ); EXPECT_TRUE( false ); } catch( ... ) {}
+        boost::array< std::string, 3 > array{ "bye", "moon", "stars" };
+        visiting::apply( from_ptree, array );
+        EXPECT_EQ( array[0], "hello" );
+        EXPECT_EQ( array[1], "world" );
+        EXPECT_EQ( array[2], "stars" );
     }
     {
         boost::property_tree::ptree ptree;

From 88ae453dd1f372f6822e747df3b8beeb6896bcd2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 20 Jun 2023 15:14:05 +1000
Subject: [PATCH 0630/1056] 
 containers::multidimensional::array::interpolated(): debugging...

---
 containers/multidimensional/array.h           | 36 +++++++++++++++----
 containers/multidimensional/array_traits.h    |  4 +--
 .../test/multidimensional_array_test.cpp      | 10 +++---
 3 files changed, 38 insertions(+), 12 deletions(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index 00d9ce507..fee7148ff 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -257,17 +257,41 @@ inline const slice< V, D - I > slice< V, D >::at( const std::array< std::size_t,
 template < typename V, unsigned int D, typename S >
 inline array< V, D, S >::array( const typename array< V, D, S >::index_type& shape, const V& default_value ): _data( impl::index_traits< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
 
+// template < typename V, unsigned int D, typename P, typename Traits, typename S >
+// V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
+// {
+//     P element_origin = _resolution;
+//     const index_type i = index_of( point );
+//     Traits::add( Traits::vmultiply( element_origin, i ), _origin );
+//     const auto& weights = Traits::interpolation::linear::weights( point, element_origin, _resolution );
+//     const auto& neighbours = impl::neighbours< index_type, D >;
+//     V v = this->operator[]( i ) * weights[0]; // todo?! value traits?!
+//     for( unsigned int j = 1; j < weights.size(); ++j ) { v += this->operator[]( Traits::add( i, neighbours[j] ) ) * weights[j]; } // todo?! value traits?!
+//     return v;
+// }
+
 template < typename V, unsigned int D, typename P, typename Traits, typename S >
 V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
 {
-    P element_origin = _resolution;
     const index_type i = index_of( point );
-    Traits::add( Traits::vmultiply( element_origin, i ), _origin );
-    const auto& weights = Traits::interpolation::linear::weights( point, element_origin, _resolution );
+    const P p = Traits::subtract( point, Traits::add( Traits::vmultiply( _resolution, i ), _origin ) );
+    //std::cerr << "==> a: point: " << point[0] << "," << point[1] << " p: " << p[0] << "," << p[1] << " _resolution: " << _resolution[0] << "," << _resolution[1] << std::endl;
     const auto& neighbours = impl::neighbours< index_type, D >;
-    V v = this->operator[]( i ) * weights[0]; // todo?! value traits?!
-    for( unsigned int j = 1; j < weights.size(); ++j ) { v += this->operator[]( Traits::add( i, neighbours[j] ) ) * weights[j]; } // todo?! value traits?!
-    return v;
+    double s = 0;
+    V v = this->operator[]( i ); // todo?! value traits?!
+    for( unsigned int j = 0; j < neighbours.size(); ++j )
+    {
+        P d = Traits::subtract( p, Traits::vmultiply( _resolution, neighbours[j] ) );
+        double n = std::sqrt( Traits::dot( d, d ) );
+        index_type k = Traits::add( i, neighbours[j] );
+        if( math::equal( n, 0 ) ) { return this->operator[]( k ); }
+        double w = 1 / n;
+        s += w;
+        //std::cerr << "==> b: j: " << j << " k: " << k[0] << "," << k[1] << " n: " << n << " w: " << w << std::endl;
+        if( j == 0 ) { v *= w; } else { v += this->operator[]( k ) * w; } // quick and dirty for now
+    }
+    //std::cerr << "==> c: s: " << s << std::endl;
+    return v * ( 1 / s );
 }
 
 template < typename V, unsigned int D, typename P, typename Traits, typename S >
diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
index ae1739184..3061fd2b8 100644
--- a/containers/multidimensional/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -38,9 +38,9 @@ template < std::size_t Size > struct operations
     template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[ Size - 1 ] *= t; operations< Size - 1 >::multiply( s, t ); return s; }
     template < typename S, typename T > static S& vmultiply( S& s, const T& t ) { s[ Size - 1 ] *= t[ Size - 1 ]; operations< Size - 1 >::vmultiply( s, t ); return s; }
     template < typename S, typename T > static double dot( S& s, const T& t ) { return s[ Size - 1 ] * t[ Size - 1 ] + operations< Size - 1 >::dot( s, t ); }
-    template < typename S, typename T > static S& invert( S& s ) { s[ Size - 1 ] = !s[ Size - 1 ]; operations< Size - 1 >::invert( s ); return s; }
     template < typename S, typename T > static S& mask( S& s, const T& t ) { s[ Size - 1 ] = t[ Size - 1 ] ? t[ Size - 1 ] : s[ Size - 1 ]; operations< Size - 1 >::mask( s, t ); return s; }
     template < typename S, typename T > static S masked( const S& s, const T& t ) { S m = s; mask( m, t ); return m; }
+    template < typename S, typename T > static S& logical_not( S& s ) { s[ Size - 1 ] = !s[ Size - 1 ]; operations< Size - 1 >::logical_not( s ); return s; }
     template < typename S > static S& fill( S&s, double value ) { s[ Size - 1 ] = value; operations< Size - 1 >::fill( s, value ); return s; }
     template < typename S > static S filled( double value ) { S s; fill( s, value ); return s; }
     template < typename S > static S zero() { S s; fill( s, 0 ); return s; }
@@ -122,7 +122,7 @@ template <> struct operations< 1 >
     template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[0] *= t; return s; }
     template < typename S, typename T > static S& vmultiply( S& s, const T& t ) { s[0] *= t[0]; return s; }
     template < typename S, typename T > static double dot( S& s, const T& t ) { return s[0] * t[0]; }
-    template < typename S, typename T > static S& invert( S& s ) { s[0] = !s[0]; return s; }
+    template < typename S, typename T > static S& logical_not( S& s ) { s[0] = !s[0]; return s; }
     template < typename S, typename T > static S& mask( S& s, const T& t ) { s[0] = t[0] ? t[0] : s[0]; return s; }
     template < typename S > static auto product( const S& s ) -> typename std::remove_reference< decltype( s[0] ) >::type { return s[0]; }
     template < typename S, typename T, typename Diff > static bool near( const S& s, const T& t, const Diff& epsilon ) { return comma::math::equal( s[0], t[0], epsilon ); }
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 391bf0086..a48b25cf8 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -205,10 +205,12 @@ TEST( multidimensional_array, grid_interpolate )
 {
     {
         comma::containers::multidimensional::grid< double, 2 > g( {0, 0}, {1, 1}, {2, 2}, 0 );
-        g[{0, 0}] = 0; g[{0, 1}] = 1; g[{1, 0}] = 2; g[{1, 1}] = 3;
+        g[{0, 0}] = 0; g[{0, 1}] = 1; g[{1, 0}] = 0; g[{1, 1}] = 1;
         EXPECT_EQ( g.interpolated( {0, 0} ), 0 );
-        EXPECT_EQ( g.interpolated( {0, 1} ), 1 );
-        EXPECT_EQ( g.interpolated( {1, 0} ), 2 );
-        EXPECT_EQ( g.interpolated( {1, 1} ), 3 );
+        EXPECT_EQ( g.interpolated( {0, 0.5} ), 0.5 );
+        EXPECT_EQ( g.interpolated( {0.5, 0.5} ), 0.5 );
+        //EXPECT_EQ( g.interpolated( {0.5, 0} ), 0.5 );
+        //EXPECT_EQ( g.interpolated( {1, 0} ), 2 );
+        //EXPECT_EQ( g.interpolated( {1, 1} ), 3 );
     }
 }
\ No newline at end of file

From f986c9c7967f41a1c812efba170d3bbb8a7a402e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 20 Jun 2023 18:13:28 +1000
Subject: [PATCH 0631/1056] 
 containers::multidimensional::array::interpolated(): seems working

---
 containers/multidimensional/array.h        | 59 +++++++++++-----------
 containers/multidimensional/array_traits.h |  5 +-
 2 files changed, 32 insertions(+), 32 deletions(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index fee7148ff..8667f2fc1 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -257,43 +257,42 @@ inline const slice< V, D - I > slice< V, D >::at( const std::array< std::size_t,
 template < typename V, unsigned int D, typename S >
 inline array< V, D, S >::array( const typename array< V, D, S >::index_type& shape, const V& default_value ): _data( impl::index_traits< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
 
-// template < typename V, unsigned int D, typename P, typename Traits, typename S >
-// V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
-// {
-//     P element_origin = _resolution;
-//     const index_type i = index_of( point );
-//     Traits::add( Traits::vmultiply( element_origin, i ), _origin );
-//     const auto& weights = Traits::interpolation::linear::weights( point, element_origin, _resolution );
-//     const auto& neighbours = impl::neighbours< index_type, D >;
-//     V v = this->operator[]( i ) * weights[0]; // todo?! value traits?!
-//     for( unsigned int j = 1; j < weights.size(); ++j ) { v += this->operator[]( Traits::add( i, neighbours[j] ) ) * weights[j]; } // todo?! value traits?!
-//     return v;
-// }
-
 template < typename V, unsigned int D, typename P, typename Traits, typename S >
 V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
 {
     const index_type i = index_of( point );
-    const P p = Traits::subtract( point, Traits::add( Traits::vmultiply( _resolution, i ), _origin ) );
-    //std::cerr << "==> a: point: " << point[0] << "," << point[1] << " p: " << p[0] << "," << p[1] << " _resolution: " << _resolution[0] << "," << _resolution[1] << std::endl;
+    P element_origin = Traits::add( Traits::vmultiply( _resolution, i ), _origin );
+    const auto& weights = Traits::interpolation::linear::weights( point, element_origin, _resolution );
     const auto& neighbours = impl::neighbours< index_type, D >;
-    double s = 0;
-    V v = this->operator[]( i ); // todo?! value traits?!
-    for( unsigned int j = 0; j < neighbours.size(); ++j )
-    {
-        P d = Traits::subtract( p, Traits::vmultiply( _resolution, neighbours[j] ) );
-        double n = std::sqrt( Traits::dot( d, d ) );
-        index_type k = Traits::add( i, neighbours[j] );
-        if( math::equal( n, 0 ) ) { return this->operator[]( k ); }
-        double w = 1 / n;
-        s += w;
-        //std::cerr << "==> b: j: " << j << " k: " << k[0] << "," << k[1] << " n: " << n << " w: " << w << std::endl;
-        if( j == 0 ) { v *= w; } else { v += this->operator[]( k ) * w; } // quick and dirty for now
-    }
-    //std::cerr << "==> c: s: " << s << std::endl;
-    return v * ( 1 / s );
+    V v = this->operator[]( i ) * weights[0]; // todo?! value traits?!
+    for( unsigned int j = 1; j < weights.size(); ++j ) { v += this->operator[]( Traits::add( i, neighbours[j] ) ) * weights[j]; } // todo?! value traits?!
+    return v;
 }
 
+// template < typename V, unsigned int D, typename P, typename Traits, typename S >
+// V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
+// {
+//     const index_type i = index_of( point );
+//     const P p = Traits::subtract( point, Traits::add( Traits::vmultiply( _resolution, i ), _origin ) );
+//     //std::cerr << "==> a: point: " << point[0] << "," << point[1] << " p: " << p[0] << "," << p[1] << " _resolution: " << _resolution[0] << "," << _resolution[1] << std::endl;
+//     const auto& neighbours = impl::neighbours< index_type, D >;
+//     double s = 0;
+//     V v = this->operator[]( i ); // todo?! value traits?!
+//     for( unsigned int j = 0; j < neighbours.size(); ++j )
+//     {
+//         P d = Traits::subtract( p, Traits::vmultiply( _resolution, neighbours[j] ) );
+//         double n = Traits::dot( d, d ); //double n = std::sqrt( Traits::dot( d, d ) );
+//         index_type k = Traits::add( i, neighbours[j] );
+//         if( math::equal( n, 0 ) ) { return this->operator[]( k ); }
+//         double w = 1 / n;
+//         s += w;
+//         //std::cerr << "==> b: j: " << j << " k: " << k[0] << "," << k[1] << " n: " << n << " w: " << w << std::endl;
+//         if( j == 0 ) { v *= w; } else { v += this->operator[]( k ) * w; } // quick and dirty for now
+//     }
+//     //std::cerr << "==> c: s: " << s << std::endl;
+//     return v * ( 1 / s );
+// }
+
 template < typename V, unsigned int D, typename P, typename Traits, typename S >
 typename grid< V, D, P, Traits, S >::index_type grid< V, D, P, Traits, S >::nearest_to( const P& point ) const
 {
diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
index 3061fd2b8..4fac00e00 100644
--- a/containers/multidimensional/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -100,9 +100,8 @@ template < std::size_t Size > struct operations
     {
         struct linear
         {
-            template < typename S > static std::array< double, pow< 2, Size > > weights( const S& p, const S& origin, const S& resolution )
+            template < typename S > static std::array< double, pow< 2, Size > > weights( const S& s )
             {
-                S s = vdivide( subtract( p, origin ), resolution );
                 S t;
                 subtract( fill( t, 1. ), s );
                 const auto& n = neighbours< std::array< unsigned int, Size >, Size >;
@@ -110,6 +109,8 @@ template < std::size_t Size > struct operations
                 for( unsigned int i = 0; i < pow< 2, Size >; ++i ) { w[i] = product( masked( s, n[ pow< 2, Size > - i - 1 ] ) ) * product( masked( t, n[i] ) ); }
                 return w;
             }
+
+            template < typename S > static std::array< double, pow< 2, Size > > weights( const S& p, const S& origin, const S& resolution ) { return weights( vdivide( subtract( p, origin ), resolution ) ); }
         };
     };
 };

From e86f9402db341fc4e355183d90e27dc30a86ae4a Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Wed, 5 Jul 2023 14:55:12 +1000
Subject: [PATCH 0632/1056] comma::csv::time::from/to_microseconds() exposed as
 first-class citizens

---
 csv/format.cpp | 46 +++++++++++++++++++++++++++++-----------------
 csv/format.h   | 15 ++++++++++-----
 2 files changed, 39 insertions(+), 22 deletions(-)

diff --git a/csv/format.cpp b/csv/format.cpp
index 59f238ff8..c2415b636 100644
--- a/csv/format.cpp
+++ b/csv/format.cpp
@@ -13,7 +13,6 @@
 #include "../base/types.h"
 #include "../string/string.h"
 #include "../csv/format.h"
-#include "impl/epoch.h"
 
 namespace comma { namespace csv {
 
@@ -467,27 +466,13 @@ boost::posix_time::ptime format::traits< boost::posix_time::ptime, format::time
     //::memcpy( &microseconds, buf, sizeof( comma::int64 ) );
 	(void)size;
     comma::int64 microseconds = *reinterpret_cast< const comma::int64* >( buf );
-    if( microseconds == bin_not_a_date_time ) { return boost::posix_time::not_a_date_time; }
-    if( microseconds == bin_time_pos_infin ) { return boost::posix_time::pos_infin; }
-    if( microseconds == bin_time_neg_infin ) { return boost::posix_time::neg_infin; }
-    long seconds = static_cast< long >( microseconds / 1000000 ); // todo: due to bug in boost, will be casted down to int32, but for the dates we use seconds will never overflow, thus, leave it like this now
-    microseconds -= static_cast< comma::int64 >( seconds ) * 1000000;
-    return boost::posix_time::ptime( csv::impl::epoch, boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( static_cast< long >( microseconds ) ) );
+    return comma::csv::time::from_microseconds( microseconds );
 }
 
 void format::traits< boost::posix_time::ptime, format::time >::to_bin( const boost::posix_time::ptime& t, char* buf, std::size_t size )
 {
-    if( t.is_not_a_date_time() ) { *reinterpret_cast< comma::int64* >( buf ) = bin_not_a_date_time; return; }
-    if( t.is_pos_infinity() ) { *reinterpret_cast< comma::int64* >( buf ) = bin_time_pos_infin; return; }
-    if( t.is_neg_infinity() ) { *reinterpret_cast< comma::int64* >( buf ) = bin_time_neg_infin; return; }
 	(void)size;
-    static const boost::posix_time::ptime base( csv::impl::epoch );
-    const boost::posix_time::time_duration duration = t - base;
-    long seconds = duration.total_seconds(); // boost uses long, which is a bug for 32-bit
-    comma::int64 microseconds = static_cast< comma::int64 >( seconds ) * 1000000l;
-    microseconds += ( duration - boost::posix_time::seconds( seconds ) ).total_microseconds();
-    *reinterpret_cast< comma::int64* >( buf ) = microseconds; // ::memcpy( buf, &microseconds, sizeof( comma::int64 ) );
-
+    *reinterpret_cast< comma::int64* >( buf ) = comma::csv::time::to_microseconds(t);
 }
 
 std::string format::traits< std::string, format::fixed_string >::from_bin( const char* buf, std::size_t size )
@@ -502,4 +487,31 @@ void format::traits< std::string, format::fixed_string >::to_bin( const std::str
     if( t.length() < size ) { ::memset( buf + t.length(), 0, size - t.length() ); }
 }
 
+namespace time {
+
+boost::posix_time::ptime from_microseconds(comma::int64 microseconds, boost::gregorian::date epoch)
+{
+    if( microseconds == bin_not_a_date_time ) { return boost::posix_time::not_a_date_time; }
+    if( microseconds == bin_time_pos_infin ) { return boost::posix_time::pos_infin; }
+    if( microseconds == bin_time_neg_infin ) { return boost::posix_time::neg_infin; }
+    long seconds = static_cast< long >( microseconds / 1000000 ); // todo: due to bug in boost, will be casted down to int32, but for the dates we use seconds will never overflow, thus, leave it like this now
+    microseconds -= static_cast< comma::int64 >( seconds ) * 1000000;
+    return boost::posix_time::ptime( epoch, boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( static_cast< long >( microseconds ) ) );
+}
+
+comma::int64 to_microseconds(const boost::posix_time::ptime& t, boost::gregorian::date epoch) // microseconds elapsed from epoch to t; special time values are returned as the bin_* sentinels
+{
+    if( t.is_not_a_date_time() ) { return bin_not_a_date_time; }
+    if( t.is_pos_infinity() ) { return bin_time_pos_infin; }
+    if( t.is_neg_infinity() ) { return bin_time_neg_infin; }
+    const boost::posix_time::ptime base( epoch ); // deliberately not static: a function-local static would freeze the epoch passed on the very first call
+    const boost::posix_time::time_duration duration = t - base;
+    long seconds = duration.total_seconds(); // boost uses long, which is a bug for 32-bit
+    comma::int64 microseconds = static_cast< comma::int64 >( seconds ) * 1000000l; // whole seconds first, widened to 64 bit before scaling
+    microseconds += ( duration - boost::posix_time::seconds( seconds ) ).total_microseconds(); // then the sub-second remainder
+    return microseconds;
+}
+
+} // namespace time {
+
 } } // namespace comma { namespace csv {
diff --git a/csv/format.h b/csv/format.h
index a1063461b..8e27a02fb 100644
--- a/csv/format.h
+++ b/csv/format.h
@@ -30,8 +30,7 @@
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_APPLICATIONS_FORMAT_HEADER_GUARD_
-#define COMMA_CSV_APPLICATIONS_FORMAT_HEADER_GUARD_
+#pragma once
 
 #include <stdlib.h>
 #include <iostream>
@@ -48,12 +47,21 @@
 #include "../visiting/visit.h"
 #include "../visiting/while.h"
 #include "../xpath/xpath.h"
+#include "impl/epoch.h" 
 
 namespace comma { namespace csv {
 
 /// forward declaration
 namespace impl { class to_format; }
 
+namespace time {
+
+boost::posix_time::ptime from_microseconds(comma::int64 microseconds, boost::gregorian::date epoch=csv::impl::epoch);
+
+comma::int64 to_microseconds(const boost::posix_time::ptime& t, boost::gregorian::date epoch=csv::impl::epoch);
+
+} // namespace time {
+
 /// csv to/from bin format
 /// @todo the interface has got real messy; fully refactor!
 class format
@@ -166,7 +174,6 @@ class format
         template < typename T > static std::string value_impl( const T& t );
 };
 
-
 namespace impl {
 
 class to_format
@@ -394,5 +401,3 @@ template <> struct format::traits< std::string, format::fixed_string >
 };
 
 } } // namespace comma { namespace csv {
-
-#endif // #ifndef COMMA_CSV_APPLICATIONS_FORMAT_HEADER_GUARD_

From 9c7061a0184d5989d731217fea572a52c7459e62 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 19 Jul 2023 16:03:04 +1000
Subject: [PATCH 0633/1056] comma-test-run: make "running" message more
 accurate

and reword "started" to "launching"
---
 util/applications/comma-test-run | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 77b377273..7504a61ed 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -786,7 +786,7 @@ function run_single_test()
     # say something so that the user is not guessing what is going on
     (
         flock -x 9
-        message_ "$name: test $counter: $dir: started..."
+        message_ "$name: test $counter: $dir: launching..."
     ) 9>>"$comma_test_run_output_flock"
 
     # do not touch this equilibristics with file descriptors
@@ -806,8 +806,6 @@ function run_single_test()
             error_ "$name: error: no \"test\" script found in any parent directory of $dir"
             result=1
         else
-            message_ "$name: test $counter: $dir: running..."
-
             basedir=$( pwd )
 
             ## Comment out for now: the exact usage to be discussed, it is confusing and can be taken as a sign of error
@@ -823,6 +821,7 @@ function run_single_test()
                     report_end_of_wait
                     local error_files test_failed
                     find . -name out_of_shared_memory | xargs rm -f
+                    message_ "$name: test $counter: $dir: running..."
                     comma_progress_named "$our_stats_progress" "$dir" run_test_with_timeout
                     test_failed=$?
                     comma_locked "$comma_test_run_resources_flock" comma_release_resources "$request" "$comma_test_run_resources_counter" "$worker_id"

From 95a90811c067b645d9110213214ac33bbd3bc9ab Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 27 Jul 2023 10:31:10 +1000
Subject: [PATCH 0634/1056] comma::silent_none() implemented

---
 base/none.h | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/base/none.h b/base/none.h
index 6752d7de3..77ef009fe 100644
--- a/base/none.h
+++ b/base/none.h
@@ -4,6 +4,8 @@
 
 #pragma once
 
+#include <boost/optional.hpp>
+
 namespace comma {
 
 /// convenience type to use e.g. as a "tag" type in template definitions
@@ -11,5 +13,13 @@ namespace comma {
 /// to be a singleton type (see boost/none_t.hpp for details) meaning
 /// that it won't compile for some use cases
 struct none {};
+
+/// a quick fix for annoying boost::optional compilation warning
+/// boost::optional< int > i; // gets compile warning when i first dereferenced
+///                           // even if i is initialized for sure somewhere in the code
+/// boost::optional< int > i{boost::none}; // still same compile warning
+/// boost::optional< int > i = comma::silent_none< int >(); // fine, no warning
+template < typename T >
+inline boost::optional< T > silent_none() { return boost::optional< T >( boost::none ); }
     
 } // namespace comma {

From 64ccd455225c8362eddc7fa98d3caea8e5565628 Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Tue, 8 Aug 2023 18:04:37 +1000
Subject: [PATCH 0635/1056] containers/synchronized/multiqueue.h Added new
 multiqueue for aligning multiple queues by key

---
 containers/synchronized/multiqueue.h          |  52 ++++++
 .../test/synchronized_multiqueue_test.cpp     | 167 ++++++++++++++++++
 2 files changed, 219 insertions(+)
 create mode 100644 containers/synchronized/multiqueue.h
 create mode 100644 containers/test/synchronized_multiqueue_test.cpp

diff --git a/containers/synchronized/multiqueue.h b/containers/synchronized/multiqueue.h
new file mode 100644
index 000000000..85a9aab70
--- /dev/null
+++ b/containers/synchronized/multiqueue.h
@@ -0,0 +1,52 @@
+#include <queue>
+#include <tuple>
+#include <boost/date_time/posix_time/posix_time.hpp>
+
+namespace comma { namespace containers { namespace synchronized {
+
+namespace impl {
+
+template < typename K > struct traits { typedef K diff_type; };
+template <> struct traits< boost::posix_time::ptime > { typedef boost::posix_time::time_duration diff_type; };
+
+}
+
+template < typename K, typename T, typename S >
+class multiqueue
+{
+    public:
+        std::tuple< std::queue< std::pair< K, T > >, std::queue< std::pair< K, S > > > queues;
+
+        multiqueue( typename impl::traits< K >::diff_type max_diff ): _max_diff( max_diff ) {}
+        bool ready() const;
+        void purge();
+
+    private:
+        typename impl::traits< K >::diff_type _max_diff;
+        static typename impl::traits< K >::diff_type _abs_diff(K lhs, K rhs) { return lhs < rhs ? (rhs - lhs) : (lhs - rhs); }
+};
+
+template < typename K, typename T, typename S >
+inline bool multiqueue<K, T, S>::ready() const
+{
+    if( std::get<0>(queues).empty() || std::get<1>(queues).empty() ) { return false; }
+    return _abs_diff( std::get<1>(queues).front().first, std::get<0>(queues).front().first ) <= _max_diff;
+}
+
+template < typename K, typename T, typename S >
+inline void multiqueue<K, T, S>::purge() // pops leading entries of whichever queue lags the other by more than _max_diff; stops as soon as either queue runs empty
+{
+    if( std::get<1>(queues).empty() || std::get<0>(queues).empty() ) { return; } // nothing to compare against
+    while( std::get<0>(queues).front().first - std::get<1>(queues).front().first > _max_diff ) // front of queue 1 is too far behind front of queue 0
+    {
+        std::get<1>(queues).pop();
+        if( std::get<1>(queues).empty() ) { return; } // guard must follow pop(): the loop condition calls front(), which is undefined on an empty queue
+    }
+    while( std::get<1>(queues).front().first - std::get<0>(queues).front().first > _max_diff ) // front of queue 0 is too far behind front of queue 1
+    {
+        std::get<0>(queues).pop();
+        if( std::get<0>(queues).empty() ) { return; } // same guard as in the first loop
+    }
+}
+
+} } } // namespace comma { namespace containers { namespace synchronized {
diff --git a/containers/test/synchronized_multiqueue_test.cpp b/containers/test/synchronized_multiqueue_test.cpp
new file mode 100644
index 000000000..f78cfcf4c
--- /dev/null
+++ b/containers/test/synchronized_multiqueue_test.cpp
@@ -0,0 +1,167 @@
+// Copyright (c) 2023 Mission Systems Pty Ltd
+
+#include <gtest/gtest.h>
+#include "../synchronized/multiqueue.h"
+#include <boost/date_time/posix_time/posix_time.hpp>
+
+TEST( multiqueue, usage ){
+    typedef comma::containers::synchronized::multiqueue< int, int, int > multiqueue_t;
+    multiqueue_t q{ 2 /*timeout*/  };
+
+    EXPECT_EQ( std::get<0>(q.queues).size(), 0 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 0 );
+    EXPECT_EQ( q.ready(), false );
+
+    std::get<0>(q.queues).push( std::make_pair( 0, 1 ) );
+    EXPECT_EQ( std::get<0>(q.queues).front().second, 1 );
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 0 );
+    EXPECT_EQ( q.ready(), false );
+
+    std::get<1>(q.queues).push( std::make_pair( 0, 1 ) );
+    EXPECT_EQ( std::get<1>(q.queues).front().second, 1 );
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+
+    // Purge should only remove items if they are unsynced
+    q.purge();
+    EXPECT_EQ( std::get<0>(q.queues).front().second, 1 );
+    EXPECT_EQ( std::get<1>(q.queues).front().second, 1 );
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+}
+
+TEST( multiqueue, sync_first_to_second ){
+    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    multiqueue_t q{ 2 /*timeout*/  };
+
+    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {0, 0}, {2, 0}, {4, 5} });
+    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
+    EXPECT_EQ( q.ready(), false );
+    q.purge();
+    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q.queues).front().first, 4 );
+    EXPECT_EQ( std::get<1>(q.queues).front().first, 5 );    
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+
+}
+
+TEST( multiqueue, sync_second_to_first ){
+    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    multiqueue_t q{ 2 /*timeout*/  };
+
+    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {1, 0}, {2, 0}, {4, 5} });
+    EXPECT_EQ( q.ready(), false );
+    q.purge();
+    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q.queues).front().first, 5 );
+    EXPECT_EQ( std::get<1>(q.queues).front().first, 4 );    
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+
+}
+
+TEST( multiqueue, empty_list_before_sync ){
+    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    multiqueue_t q{ 2 /*timeout*/ };
+    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {0, 0}, {1, 0}, {2, 5} });
+    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q.queues).size(), 0 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( q.ready(), false );
+}
+
+TEST( multiqueue, max_time_offset ){
+    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    multiqueue_t q{ 2 /*timeout*/ };
+    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {3, 5} });
+    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q.queues).front().first, 3 );
+    EXPECT_EQ( std::get<1>(q.queues).front().first, 5 );        
+    EXPECT_EQ( q.ready(), true );
+}
+
+TEST( multiqueue, floating_point_error ){
+    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    {
+    multiqueue_t q{ 2 /*timeout*/ };
+    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {3.000001, 5} });
+    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
+    EXPECT_NEAR( std::get<0>(q.queues).front().first, 3.000001, 1e-6 );
+    EXPECT_EQ( std::get<1>(q.queues).front().first, 5 );        
+    EXPECT_EQ( q.ready(), true );
+    }
+    {
+    multiqueue_t q{ 2 /*timeout*/ };
+    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {2.999999, 5} });
+    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q.queues).size(), 0 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q.queues).front().first, 5 );        
+    EXPECT_EQ( q.ready(), false );
+    }
+    {
+    multiqueue_t q{ 2 /*timeout*/ };
+    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {3.000001, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q.queues).front().first, 5 );
+    EXPECT_NEAR( std::get<1>(q.queues).front().first, 3.000001, 1e-6 );
+    EXPECT_EQ( q.ready(), true );
+    }
+    {
+    multiqueue_t q{ 2 /*timeout*/ };
+    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {2.999999, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 0 );
+    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q.queues).front().first, 5 );
+    EXPECT_EQ( q.ready(), false );
+    }    
+}
+
+TEST( multiqueue, type_difference ){
+    typedef comma::containers::synchronized::multiqueue< float, int, double > multiqueue_t;
+    multiqueue_t q{ 2 /*timeout*/ };
+    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {0, 1} });
+    std::get<1>(q.queues) = std::queue< std::pair< float, double > >({ {0, 1.0} });
+}
+
+TEST( multiqueue, boost_time ){
+    typedef comma::containers::synchronized::multiqueue< boost::posix_time::ptime, double, double > multiqueue_t;
+    multiqueue_t q{boost::posix_time::seconds( 2 /*timeout*/  ) };
+
+    boost::posix_time::ptime t( boost::gregorian::date( 2023, 1, 1 ) );
+    std::get<0>(q.queues) = std::queue< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
+    std::get<1>(q.queues) = std::queue< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
+    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
+    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+}

From 10f0beac3c7a0ff887b629cf556b38e4df7900f4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 9 Aug 2023 17:17:28 +1000
Subject: [PATCH 0636/1056] csv-shape: split: first cut implemented; basic
 tests done

---
 csv/applications/csv-shape.cpp    | 104 ++++++++++++++++--------------
 csv/test/csv-shape/split/expected |  18 ++++++
 csv/test/csv-shape/split/input    |   5 ++
 3 files changed, 78 insertions(+), 49 deletions(-)
 create mode 100644 csv/test/csv-shape/split/expected
 create mode 100644 csv/test/csv-shape/split/input

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index e346a6186..4f679ee9b 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -1,31 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2023 Vsevolod Vlaskine
 
 /// @author dewey nguyen
 
@@ -51,12 +25,12 @@ static void usage( bool verbose=false )
     std::cerr << "                 last input record concatenated with the first record (hence, 'loop')" << std::endl;
     std::cerr << "                 this mode always uses the sliding window for overlapping groups" << std::endl;
     std::cerr << "    repeat:      repeat input given number of times, e.g. csv-shape repeat --size 5" << std::endl;
+    std::cerr << "    split:       csv-only: split line at n-th field, e.g. csv-shape split --size 4" << std::endl;
     std::cerr << std::endl;
     std::cerr << "Usage: cat data.csv | csv-shape <operation> [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --expected-records; output the expected records for given --size and --step, and exit" << std::endl;
-    std::cerr << "    --help,-h;  see this usage message" << std::endl;
     std::cerr << "    --size,-n=<num>; number of input records in each grouping, range: 2 and above" << std::endl;
     std::cerr << "    --step=<num>; default=1; relative offset of the records to be concatenated" << std::endl;
     std::cerr << "    --verbose,-v: more output to stderr, shows examples with --help,-h" << std::endl;
@@ -70,7 +44,15 @@ static void usage( bool verbose=false )
     std::cerr << "   loop" << std::endl;
     std::cerr << "      --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
     std::cerr << "      --reverse; output records in reverse order (e.g. b,a)" << std::endl;
+    std::cerr << "   split" << std::endl;
+    std::cerr << "      --repeat; e.g: echo 0,1,2,3,4,5 | csv-shape split -n 2 will output: 0,1 and 2,3,4,5" << std::endl;
+    std::cerr << "                     echo 0,1,2,3,4,5 | csv-shape split -n 2 --repeat will output: 0,1, then 2,3, then 4,5" << std::endl;
+    std::cerr << "      --size,-n=<n>; e.g. echo 0,1,2,3,4,5| csv-shape split -n 3 will output" << std::endl;
+    std::cerr << "                     two lines: 0,1,2 and 3,4,5" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << "examples" << std::endl;
     if( verbose )
     {
         std::cerr << "examples" << std::endl;
@@ -84,36 +66,34 @@ static void usage( bool verbose=false )
         std::cerr << "          input records 1 to 5 create the first output record, input records 2 to 6 create the second record, input records 3 to 7 create the third record, and so forth" << std::endl;
         std::cerr << "              seq 1 10 | csv-shape concatenate -n 5 --sliding-window" << std::endl;
         std::cerr << std::endl;
-        std::cerr << "csv options" << std::endl;
-        std::cerr << comma::csv::options::usage() << std::endl;
     }
     else
     {
-        std::cerr << "examples: run csv-shape --help --verbose for more..." << std::endl;
+        std::cerr << "    run csv-shape --help --verbose for more..." << std::endl;
     }
     exit( 0 );
 }
 
 // There is nothing to do in this case - binary data
-static void simple_binary_pass_through(const comma::csv::format& f, bool flush=false)
+static void _binary_pass_through(const comma::csv::format& f, bool flush=false)
 {
     std::vector< char > buffer( f.size(), '\0' );
     while( std::cin.good() && !std::cin.eof() )
     {
-        if( std::cin.read( &buffer[0], buffer.size() ) ) {
+        if( std::cin.read( &buffer[0], buffer.size() ) )
+        {
             std::cout.write( &buffer[0], buffer.size() );
             if( flush ) { std::cout.flush(); }
         }
     }
 }
 
-bool is_binary;
+static bool is_binary;
 
-class concatenate_
+class _concatenate
 {
 public:
-
-    concatenate_()
+    _concatenate()
         : use_sliding_window_(false)
         , bidirectional_(false)
         , reverse_(false)
@@ -133,7 +113,7 @@ class concatenate_
         use_sliding_window_ = ( looping_ || options.exists("--sliding-window,-w") );
         reverse_ = options.exists("--reverse");
         bidirectional_ = options.exists("--bidirectional");
-        if( !use_sliding_window_ && is_binary ) { simple_binary_pass_through(csv.format(), csv.flush); return 0; };
+        if( !use_sliding_window_ && is_binary ) { _binary_pass_through( csv.format(), csv.flush ); return 0; };
         size_ = looping_ ? options.value("--size,-n", 2) : options.value< comma::uint32 >("--size,-n");
         step_ = options.value( "--step",1 );
         if( size_ < 2 ) { std::cerr <<  comma::verbose.app_name() << ": expected --size,-n= value to be greater than 1" << std::endl; return 1; }
@@ -231,20 +211,20 @@ class concatenate_
 
 namespace comma { namespace visiting {
 
-template <> struct traits< concatenate_::input_t >
+template <> struct traits< _concatenate::input_t >
 {
-    template < typename K, typename V > static void visit( const K&, const concatenate_::input_t& p, V& v ) { v.apply("block", p.block); }
-    template < typename K, typename V > static void visit( const K&, concatenate_::input_t& p, V& v ) { v.apply("block", p.block); }
+    template < typename K, typename V > static void visit( const K&, const _concatenate::input_t& p, V& v ) { v.apply("block", p.block); }
+    template < typename K, typename V > static void visit( const K&, _concatenate::input_t& p, V& v ) { v.apply("block", p.block); }
 };
 
 } } // namespace comma { namespace visiting {
 
-static int repeat_( const comma::command_line_options& options, const comma::csv::options& csv )
+static int _repeat( const comma::command_line_options& options, const comma::csv::options& csv )
 {
     unsigned int size = options.value< unsigned int >( "--size,-n" );
     if( csv.binary() )
     {
-        typedef concatenate_::input_t input_t; // quick and dirty
+        typedef _concatenate::input_t input_t; // quick and dirty
         comma::csv::input_stream< input_t > is( std::cin, csv ); // quick and dirty, will be slow on ascii
         while( is.ready() || ( std::cin.good() && !std::cin.eof() ) )
         {
@@ -267,22 +247,48 @@ static int repeat_( const comma::command_line_options& options, const comma::csv
     return 0;
 }
 
+static int _split( const comma::command_line_options& options, const comma::csv::options& csv )
+{
+    if( csv.binary() ) { _binary_pass_through( csv.format(), csv.flush ); return 0; };
+    unsigned int size = options.value< unsigned int >( "--size,-n" );
+    bool repeat = options.exists( "--repeat" );
+    while( std::cin.good() && !std::cin.eof() )
+    {
+        std::string line;
+        std::getline( std::cin, line );
+        const auto& s = comma::strip( line );
+        if( s.empty() ) { continue; }
+        unsigned int p{0};
+        for( unsigned int i{0}, c{0}; i < s.size(); ++i )
+        {
+            if( s[i] == csv.delimiter ) { ++c; }
+            if( c < size ) { continue; }
+            std::cout << s.substr( p, i - p ) << std::endl;
+            p = i + 1;
+            c = 0;
+            if( !repeat ) { break; }
+        }
+        if( p < s.size() ) { std::cout << s.substr( p ) << std::endl; }
+    }
+    return 0;
+}
+
 int main( int ac, char** av )
 {
     try
     {
         comma::command_line_options options( ac, av, usage );
-        std::vector< std::string > unnamed = options.unnamed( "--size,-n,--sliding-window,-w,--step,--verbose,-v", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--expected-records,--repeat,--sliding-window,-w,--verbose,-v", "-.*" );
         comma::csv::options csv( options );
         csv.full_xpath = false;
-        if (csv.fields.empty()) { csv.fields="a"; }
+        if( csv.fields.empty() ) { csv.fields="a"; }
         is_binary = csv.binary();
         if( unnamed.empty() ) { std::cerr << comma::verbose.app_name() << ": please specify operations" << std::endl; exit( 1 ); }
         std::string operation = unnamed[0];
-        if( operation == "concatenate" || operation == "loop" ) { return concatenate_().run(options, csv); }
-        if( operation == "repeat" ) { return repeat_( options, csv ); }
-        std::cerr << comma::verbose.app_name() << ": operation not supported or unknown: '" << operation << '\'' << std::endl;
-        return 1;
+        if( operation == "concatenate" || operation == "loop" ) { return _concatenate().run( options, csv ); }
+        if( operation == "repeat" ) { return _repeat( options, csv ); }
+        if( operation == "split" ) { return _split( options, csv ); }
+        std::cerr << comma::verbose.app_name() << ": expected operation; got: '" << operation << '\'' << std::endl;
     }
     catch( std::exception& ex ) { std::cerr << "csv-shape: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-shape: unknown exception" << std::endl; }
diff --git a/csv/test/csv-shape/split/expected b/csv/test/csv-shape/split/expected
new file mode 100644
index 000000000..d2b7aa428
--- /dev/null
+++ b/csv/test/csv-shape/split/expected
@@ -0,0 +1,18 @@
+split[0]/output/line[0]="1,2"
+split[0]/output/line[1]="3,4,5,6"
+split[0]/status=0
+split[1]/output/line[0]="1,2,3"
+split[1]/output/line[1]="4,5,6"
+split[1]/status=0
+split[2]/output/line[0]="1,2,3,4"
+split[2]/output/line[1]="5,6"
+split[2]/status=0
+split[3]/output/line[0]="1,2"
+split[3]/output/line[1]="3,4"
+split[3]/output/line[2]="5,6"
+split[3]/status=0
+split[4]/output/line[0]="1,2"
+split[4]/output/line[1]="3"
+split[4]/output/line[2]="4,5"
+split[4]/output/line[3]="6"
+split[4]/status=0
diff --git a/csv/test/csv-shape/split/input b/csv/test/csv-shape/split/input
new file mode 100644
index 000000000..244e91155
--- /dev/null
+++ b/csv/test/csv-shape/split/input
@@ -0,0 +1,5 @@
+split[0]="echo 1,2,3,4,5,6 | csv-shape split -n 2"
+split[1]="echo 1,2,3,4,5,6 | csv-shape split -n 3"
+split[2]="echo 1,2,3,4,5,6 | csv-shape split -n 4"
+split[3]="echo 1,2,3,4,5,6 | csv-shape split -n 2 --repeat"
+split[4]="( echo 1,2,3; echo; echo 4,5,6 ) | csv-shape split -n 2 --repeat"

From ba33f6a873a0fb898cee6f950788a65887bd198c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Aug 2023 13:14:37 +1000
Subject: [PATCH 0637/1056] command_line_options: optional bash completion
 added to constructor

---
 application/command_line_options.cpp | 5 +++--
 application/command_line_options.h   | 2 +-
 2 files changed, 4 insertions(+), 3 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 72021fff4..dd3410429 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -40,14 +40,15 @@ void command_line_options::_init_verbose( bool v, const std::string& path )
     comma::application::detail::verbose = v;
 }
 
-command_line_options::command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage )
+command_line_options::command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage, boost::function< void( int, char** ) > bash_completion )
 {
     argv_.resize( argc );
     for( int i = 0; i < argc; ++i ) { argv_[i] = argv[i]; }
     _fill_map( argv_ );
     bool v = exists("--verbose,-v");
     _init_verbose( v, argv[0] );
-    if( usage && exists( "--help,-h" ) ) { usage( v ); exit( 1 ); }
+    if( bash_completion && exists( "--bash-completion" ) ) { bash_completion( argc, argv ); exit( 0 ); }
+    if( usage && exists( "--help,-h" ) ) { usage( v ); exit( 0 ); }
 }
 
 command_line_options::command_line_options( const std::vector< std::string >& argv, boost::function< void( bool ) > usage )
diff --git a/application/command_line_options.h b/application/command_line_options.h
index b4b9380ca..a7613c3e8 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -39,7 +39,7 @@ class command_line_options
         /// constructor
         /// if --help,-h present, call usage()
         /// if --verbose,-v present, call usage( verbose )
-        command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage = NULL );
+        command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage = NULL, boost::function< void( int, char** ) > bash_completion = NULL );
 
         /// constructor
         /// if --help,-h present, call usage()

From d45efee3877af9abf0d3b90f4551be02d70d4ef2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Aug 2023 18:24:48 +1000
Subject: [PATCH 0638/1056] containers/multidimensional/array: compilation
 problem (on some systems): ugly patch implemented for now

---
 containers/applications/math-lookup.cpp    | 16 ++++++++--------
 containers/multidimensional/array_traits.h | 12 ++++++++++++
 2 files changed, 20 insertions(+), 8 deletions(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index ee6fe720b..14e3c8a62 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -55,17 +55,17 @@ void usage( bool verbose )
 static bool permissive{false};
 static bool verbose{false};
 
-template< typename T, std::size_t D, typename S >
-std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] *= rhs; } return lhs; } // quick and dirty; let compiler optimize
+// template< typename T, std::size_t D, typename S >
+// std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] *= rhs; } return lhs; } // quick and dirty; let compiler optimize
 
-template< typename T, std::size_t D, typename S >
-std::array< T, D > operator*( const std::array< T, D >& lhs, const S& rhs ) { auto r = lhs; r *= rhs; return r; }
+// template< typename T, std::size_t D, typename S >
+// std::array< T, D > operator*( const std::array< T, D >& lhs, const S& rhs ) { auto r = lhs; r *= rhs; return r; }
 
-template< typename T, std::size_t D >
-std::array< T, D >& operator+=( std::array< T, D >& lhs, const std::array< T, D >& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] += rhs[i]; } return lhs; } // quick and dirty; let compiler optimize
+// template< typename T, std::size_t D >
+// std::array< T, D >& operator+=( std::array< T, D >& lhs, const std::array< T, D >& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] += rhs[i]; } return lhs; } // quick and dirty; let compiler optimize
 
-template< typename T, std::size_t D >
-std::array< T, D > operator+( const std::array< T, D >& lhs, const std::array< T, D >& rhs ) { auto r = lhs; r += rhs; return r; }
+// template< typename T, std::size_t D >
+// std::array< T, D > operator+( const std::array< T, D >& lhs, const std::array< T, D >& rhs ) { auto r = lhs; r += rhs; return r; }
 
 template< typename T, std::size_t D >
 std::ostream& operator<<( std::ostream& os, const std::array< T, D >& rhs ) { std::string d; for( unsigned int i = 0; i < D; ++i ) { os << d << rhs[i]; d = ","; } return os; }
diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
index 4fac00e00..4122d7358 100644
--- a/containers/multidimensional/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -9,6 +9,18 @@
 #include <type_traits>
 #include "../../math/compare.h"
 
+template< typename T, std::size_t D, typename S >
+inline std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] *= rhs; } return lhs; } // quick and dirty; let compiler optimize
+
+template< typename T, std::size_t D, typename S >
+inline std::array< T, D > operator*( const std::array< T, D >& lhs, const S& rhs ) { auto r = lhs; r *= rhs; return r; }
+
+template< typename T, std::size_t D >
+inline std::array< T, D >& operator+=( std::array< T, D >& lhs, const std::array< T, D >& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] += rhs[i]; } return lhs; } // quick and dirty; let compiler optimize
+
+template< typename T, std::size_t D >
+inline std::array< T, D > operator+( const std::array< T, D >& lhs, const std::array< T, D >& rhs ) { auto r = lhs; r += rhs; return r; }
+
 namespace comma { namespace containers { namespace multidimensional { namespace impl {
 
 template < typename T > inline int index( T p, T origin, T resolution )

From c970c87bccdb0ae5ce28aa8fcd2c7853bc1b99f5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Aug 2023 18:34:09 +1000
Subject: [PATCH 0639/1056] CMakeFiles/check.c++.standard.cmake: default c++
 standard set to 14

---
 CMakeFiles/check.c++.standard.cmake | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CMakeFiles/check.c++.standard.cmake b/CMakeFiles/check.c++.standard.cmake
index 5e42f46d0..1f4b01b82 100644
--- a/CMakeFiles/check.c++.standard.cmake
+++ b/CMakeFiles/check.c++.standard.cmake
@@ -1,7 +1,7 @@
     SET( CXX_STANDARDS "0x;11;14;17" CACHE STRING "list of known c++ standards" )
     MARK_AS_ADVANCED( FORCE CXX_STANDARDS )
     STRING( REGEX REPLACE ";" "," CXX_STANDARDS_READABLE "${CXX_STANDARDS}" )
-    SET( CXX_STANDARD_DEFAULT "11" CACHE STRING "default c++ standard to use" )
+    SET( CXX_STANDARD_DEFAULT "14" CACHE STRING "default c++ standard to use" )
     MARK_AS_ADVANCED( FORCE CXX_STANDARD_DEFAULT )
     SET( CXX_STANDARD_TO_USE "${CXX_STANDARD_DEFAULT}" CACHE STRING "c++ standard to use (one of ${CXX_STANDARDS_READABLE})" )
     SET_PROPERTY( CACHE CXX_STANDARD_TO_USE PROPERTY STRINGS ${CXX_STANDARDS} )

From 1bd9e9de495b1bbe959060568c5b3dfa0e3de40f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 30 Aug 2023 13:36:20 +1000
Subject: [PATCH 0640/1056] python: comma.dictionary.parents(): in progress...

---
 python/comma/dictionary/__init__.py |  2 +-
 python/comma/dictionary/util.py     | 19 ++++++++++++++++++-
 2 files changed, 19 insertions(+), 2 deletions(-)

diff --git a/python/comma/dictionary/__init__.py b/python/comma/dictionary/__init__.py
index 8fab06d41..fa16bc6a1 100644
--- a/python/comma/dictionary/__init__.py
+++ b/python/comma/dictionary/__init__.py
@@ -1,3 +1,3 @@
 # Copyright (c) 2023 Vsevolod Vlaskine
 
-from .util import at, has, leaves, set
+from .util import at, has, leaves, parents, set
diff --git a/python/comma/dictionary/util.py b/python/comma/dictionary/util.py
index b6bc49eb8..da5b93f97 100644
--- a/python/comma/dictionary/util.py
+++ b/python/comma/dictionary/util.py
@@ -99,7 +99,7 @@ def _set( d, p ):
 
 def leaves( d, path=None ):
     '''
-    iterator through the leaf items of a nested dictionary or list, yields path-value pairs
+    generator of the leaf items of a nested dictionary or list, yields path-value pairs
 
     example
     -------
@@ -113,3 +113,20 @@ def leaves( d, path=None ):
         for i, value in enumerate(d): yield from leaves( value, f'{path}[{i}]' )
     else:
         yield path[1:] if path and path[0] == '/' else path, d
+
+def parents( d, path, parent_field_name=None, root=None ):
+    '''
+    generator of parents of a given path
+
+    todo: usage semantics and examples
+    todo: unit test
+    '''
+    if root is None: root = ''
+    if parent_field_name is None or not has( d, f'{path}/{parent_field_name}' ):
+        p = os.path.dirname( path )
+        if p == root: yield p
+        else: yield from parents( d, p )
+    else:
+        p = at( d, f'{path}/{parent_field_name}' )
+        if p == '': yield p
+        else: yield from parents( d, f'{root}{p}' if p[0] == '/' else f'{os.path.dirname( path )}/{p}', parent_field_name, root )
\ No newline at end of file

From 7fe414ba9044a07b29ea58c620f93c7c26a23f01 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 30 Aug 2023 18:13:52 +1000
Subject: [PATCH 0641/1056] python: comma.dictionary.parents(): first ugly-ish
 cut tested

---
 .../comma/dictionary/test/test_dictionary.py  | 13 +++-
 python/comma/dictionary/util.py               | 76 ++++++++++---------
 2 files changed, 51 insertions(+), 38 deletions(-)

diff --git a/python/comma/dictionary/test/test_dictionary.py b/python/comma/dictionary/test/test_dictionary.py
index 07f0037d2..ea3605de0 100644
--- a/python/comma/dictionary/test/test_dictionary.py
+++ b/python/comma/dictionary/test/test_dictionary.py
@@ -47,10 +47,14 @@ def test_dictionary_at():
     assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[2]/g', no_throw=True) == 6
 
 def test_dictionary_has():
-    d = { 'a': { 'b': { 'c': { 'd': 1 } } } }
+    d = { 'a': { 'b': { 'c': { 'd': 1 } }, 'e': [ 2, { 'f': 3 } ] } }
     assert dictionary.has( d, 'a/b/c' )
     assert dictionary.has( d, 'a.b.c', delimiter = '.' )
     assert dictionary.has( d, 'a/b/c/d' )
+    # assert dictionary.has( d, 'a/b/e' ) # todo: support arrays
+    # assert dictionary.has( d, 'a/b/e[0]' ) # todo: support arrays
+    # assert dictionary.has( d, 'a/b/e[1]' ) # todo: support arrays
+    # assert dictionary.has( d, 'a/b/e[1]/f' ) # todo: support arrays
     assert not dictionary.has( d, 'x' )
     assert not dictionary.has( d, 'x/y' )
     assert not dictionary.has( d, 'a/z' )
@@ -69,6 +73,13 @@ def test_dictionary_leaves():
     assert list( dictionary.leaves( {} ) ) == []
     assert list( dictionary.leaves( [] ) ) == []
 
+def test_dictionary_parents():
+    assert list( dictionary.parents( { 'a': { 'b': { 'c': {} } } }, 'a/b/c' ) ) == ['a/b', 'a']
+    assert list( dictionary.parents( { 'a': { 'b': [ 5, { 'c': 6 } ] } }, 'a/b[1]/c' ) ) == ['a/b[1]', 'a']
+    assert list( dictionary.parents( { 'a': { 'b': [ 5, { 'c': 6 } ] } }, 'a/b[1]/c', parent='parent' ) ) == ['a/b[1]', 'a']
+    with pytest.raises( KeyError ): dictionary.at( {}, 'a/b/c' )
+    assert list( dictionary.parents( { 'a': { 'parent': 'd', 'b': [ 5, { 'c': { 'parent': '/a/b[0]' } } ], 'd': 3 } }, 'a/b[1]/c', parent='parent' ) ) == ['a/b[0]', 'a', 'd']
+
 def test_dictionary_set():
     d = {}
     dictionary.set( d, 'a/b/c', 5 )
diff --git a/python/comma/dictionary/util.py b/python/comma/dictionary/util.py
index da5b93f97..affdbe51b 100644
--- a/python/comma/dictionary/util.py
+++ b/python/comma/dictionary/util.py
@@ -3,7 +3,7 @@
 made for convenience, not for performance
 '''
 
-import copy, functools, typing
+import copy, functools, os, sys, typing
 
 def at( d, path, delimiter = '/', no_throw = False, full = False ): # todo: default=...
     '''
@@ -30,7 +30,8 @@ def at( d, path, delimiter = '/', no_throw = False, full = False ): # todo: defa
         [ 8, 9, 10 ]
         >>> comma.dictionary.at( d, 'e[2][1]' )
         10
-        >>> comma.dictionary.at( d, 'e[1][1:]' )
+        >>> comma.dictionary.at( d, 'e[1][1:]' )
+                
         [ 9, 10 ]
         >>> e = [1, 2, {'a': 3} ]
         >>> comma.dictionary.at( e, '[2]/a' )
@@ -72,31 +73,6 @@ def has( d, path, delimiter = '/' ):
     p = path.split( delimiter ) if isinstance( path, str ) else path
     return functools.reduce( lambda d, k: ( d[k[1]] if k[0] + 1 < len( p ) else True ) if isinstance( d, dict ) and k[1] in d else False, enumerate( p ), d )
 
-def set( d, path, value, delimiter = '/' ):
-    '''
-    assign value to a nested dictionary/list element
-    
-    examples
-    --------
-        >>> d = { "a": { "b": 1, "c": [ 2, 3 ], "d": { "e": 4 } } }
-        >>> comma.dictionary.set( d, 'a/b/c[1]', 5 )
-        todo
-    '''
-    def _set( d, p ):
-        s = p[0].split( '[', 1 )
-        if len( p ) == 1:
-            if len( s ) == 1: d[p[0]] = value
-            else: exec( f'd[{s[1]} = value' if s[0] == '' else f'd["{s[0]}"][{s[1]} = value', { 'd': d, 'value': value } )
-        else:
-            if len( s ) == 1:
-                if not p[0] in d: d[p[0]] = {}
-                _set( d[p[0]], p[ 1: ] )
-            else:
-                if ( len( s ) == 1 or s[0] != '' ) and not s[0] in d: raise KeyError( f'on path {path}: {s[0]} not found' )
-                _set( eval( f'd[{s[1]}' if s[0] == '' else f'd["{s[0]}"][{s[1]}', { 'd': d } ), p[1:])
-    _set( d, path.split( delimiter ) )
-    return d
-
 def leaves( d, path=None ):
     '''
     generator of the leaf items of a nested dictionary or list, yields path-value pairs
@@ -114,19 +90,45 @@ def leaves( d, path=None ):
     else:
         yield path[1:] if path and path[0] == '/' else path, d
 
-def parents( d, path, parent_field_name=None, root=None ):
+def parents( d, path, parent=None ):
     '''
     generator of parents of a given path
 
     todo: usage semantics and examples
     todo: unit test
     '''
-    if root is None: root = ''
-    if parent_field_name is None or not has( d, f'{path}/{parent_field_name}' ):
-        p = os.path.dirname( path )
-        if p == root: yield p
-        else: yield from parents( d, p )
-    else:
-        p = at( d, f'{path}/{parent_field_name}' )
-        if p == '': yield p
-        else: yield from parents( d, f'{root}{p}' if p[0] == '/' else f'{os.path.dirname( path )}/{p}', parent_field_name, root )
\ No newline at end of file
+    p = path
+    while p not in [ '', '/' ]:
+        if parent is None:
+            p = os.path.dirname( p )
+        else:
+            q = at( d, f'{p}/{parent}', no_throw=True )
+            if q in [ '', '/' ]: break
+            if q is None: p = os.path.dirname( p )
+            else: p = q[1:] if q[0] == '/' else f'{os.path.dirname( p )}/{q}'
+        if p not in [ '', '/' ]: yield p[1:] if p[0] == '/' else p # quick and dirty
+
+def set( d, path, value, delimiter = '/' ):
+    '''
+    assign value to a nested dictionary/list element
+    
+    examples
+    --------
+        >>> d = { "a": { "b": 1, "c": [ 2, 3 ], "d": { "e": 4 } } }
+        >>> comma.dictionary.set( d, 'a/b/c[1]', 5 )
+        todo
+    '''
+    def _set( d, p ):
+        s = p[0].split( '[', 1 )
+        if len( p ) == 1:
+            if len( s ) == 1: d[p[0]] = value
+            else: exec( f'd[{s[1]} = value' if s[0] == '' else f'd["{s[0]}"][{s[1]} = value', { 'd': d, 'value': value } )
+        else:
+            if len( s ) == 1:
+                if not p[0] in d: d[p[0]] = {}
+                _set( d[p[0]], p[ 1: ] )
+            else:
+                if ( len( s ) == 1 or s[0] != '' ) and not s[0] in d: raise KeyError( f'on path {path}: {s[0]} not found' )
+                _set( eval( f'd[{s[1]}' if s[0] == '' else f'd["{s[0]}"][{s[1]}', { 'd': d } ), p[1:])
+    _set( d, path.split( delimiter ) )
+    return d
\ No newline at end of file

From 8c397434abe9b68bb6e0aeea7463495fab050b1b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 11 Sep 2023 16:10:06 +1000
Subject: [PATCH 0642/1056] comma::name_value::ptree::from: bug patched

---
 name_value/ptree.h | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/name_value/ptree.h b/name_value/ptree.h
index bef9c81e1..43af5e60a 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -217,11 +217,16 @@ struct property_tree // quick and dirty
                     for( boost::property_tree::ptree::const_assoc_iterator j = t->ordered_begin(); j != t->not_found(); ++j, ++i )
                     {
                         cur_ = j->second;
-                        //std::size_t index = j->first == "" ? i : boost::lexical_cast< std::size_t >( j->first ); // way quick and dirty
+                        std::size_t index = i; // super-quick and dirty for now
+                        if( j->first != "" )
+                        {
+                            try { index = boost::lexical_cast< std::size_t >( j->first ); }
+                            catch( ... ) { index = i; }
+                        }
                         //if( index >= t->size() ) { COMMA_THROW( comma::exception, "expected index less than " << t->size() << "; got: " << index ); }
                         visiting::do_while<    !boost::is_fundamental< typename A::value_type >::value
                                             && !boost::is_same< typename A::value_type, boost::posix_time::ptime >::value
-                                            && !boost::is_same< typename A::value_type, std::string >::value >::visit( "", value[i], *this );
+                                            && !boost::is_same< typename A::value_type, std::string >::value >::visit( "", value[index], *this );
                     }
                     cur_ = parent;
                 }

From c7510398fff6cdb959686305f3f5a440a5caac39 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 13 Sep 2023 20:57:03 +1000
Subject: [PATCH 0643/1056] math-lookup: --help: typo fixed

---
 containers/applications/math-lookup.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index 14e3c8a62..d41783eeb 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -16,7 +16,7 @@
 void usage( bool verbose )
 {
     std::cerr << "operations on a multidimensional lookup table" << std::endl;
-    std::cerr << "up to 4-dimension lookup tables with up to 4-dimension" << std::endl;
+    std::cerr << "lookup tables with up to 4-dimension" << std::endl;
     std::cerr << "values are currently supported; if you need more, just ask" << std::endl;
     std::cerr << std::endl;
     std::cerr << "usage: cat input.csv | math-lookup <operation> [<lut-filename>[;<lut-csv-options>]] <options>" << std::endl;

From 1b6910453b05003a54838b2efac63e2feeb4c2ac Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 19 Sep 2023 14:32:27 +1000
Subject: [PATCH 0644/1056] name-value-convert: --to dot: first cut implemented

---
 .../applications/name-value-convert.cpp       | 49 ++++++++++++++++++-
 name_value/ptree.cpp                          | 35 ++++++++++---
 name_value/ptree.h                            |  3 ++
 3 files changed, 79 insertions(+), 8 deletions(-)

diff --git a/name_value/applications/name-value-convert.cpp b/name_value/applications/name-value-convert.cpp
index f8caf56d2..6a3b2aa66 100644
--- a/name_value/applications/name-value-convert.cpp
+++ b/name_value/applications/name-value-convert.cpp
@@ -3,6 +3,7 @@
 /// @author vsevolod vlaskine
 
 #include <iostream>
+#include <map>
 #include <boost/bind.hpp>
 #include <boost/function.hpp>
 #include <boost/property_tree/info_parser.hpp>
@@ -26,7 +27,7 @@ static void usage( bool verbose = false )
     std::cerr << std::endl;
     std::cerr << "data options" << std::endl;
     std::cerr << "    --from <format>: input format; if this options is omitted, input format will be guessed; formats: json, xml, path-value/pv" << std::endl;
-    std::cerr << "    --to <format>: output format; formats: ini, json, xml, path-value (pv); default: path-value" << std::endl;
+    std::cerr << "    --to <format>: output format; formats: ini, json, xml, path-value (pv), dot; default: path-value" << std::endl;
     std::cerr << "    --path=[<path>]; output data at a given path in the input" << std::endl;
     std::cerr << "                     multiple instances of --path supported" << std::endl;
     std::cerr << "                     regex expression support: todo" << std::endl;
@@ -38,6 +39,7 @@ static void usage( bool verbose = false )
     std::cerr << "    json: json data" << std::endl;
     std::cerr << "    xml: xml data" << std::endl;
     std::cerr << "    path-value: path=value-style data; e.g. x/a=1,x/b=2,y=3" << std::endl;
+    std::cerr << "    dot: as graphviz dot language, see: https://graphviz.org/doc/info/lang.html" << std::endl;
     std::cerr << std::endl;
     std::cerr << "name/path-value options" << std::endl;
     std::cerr << "    --equal-sign,-e=<equal sign>: default '='" << std::endl;
@@ -66,6 +68,19 @@ static void usage( bool verbose = false )
     std::cerr << "    --linewise,-l: if present, treat each input line as a record" << std::endl;
     std::cerr << "                   if absent, treat all of the input as one record" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "examples" << std::endl;
+    if( verbose )
+    {
+        std::cerr << "dot" << std::endl;
+        std::cerr << "    sudo apt install graphviz" << std::endl;
+        std::cerr << "    { echo a/b/c=hello; echo a/c/d=world; } | name-value-convert --to dot | dot -Tsvg > test.svg" << std::endl;
+        std::cerr << "    eog test.svg" << std::endl;
+    }
+    else
+    {
+        std::cerr << "    run: name-value-convert --help --verbose for more..." << std::endl;
+    }
+    std::cerr << std::endl;
     exit( 0 );
 }
 
@@ -81,7 +96,7 @@ static path_mode indices_mode = comma::property_tree::disabled;
 static bool use_index = true;
 static comma::property_tree::path_value::check_repeated_paths check_type( comma::property_tree::path_value::no_check );
 
-enum Types { ini, info, json, xml, path_value, void_t };
+enum Types { ini, info, json, xml, path_value, dot, void_t };
 
 template < Types Type > struct traits {};
 
@@ -130,6 +145,34 @@ template <> struct traits< path_value > // quick and dirty
     }
 };
 
+template <> struct traits< dot > // graphviz dot: output only; every path element becomes a node, every parent/child pair an edge
+{
+    static void input( std::istream& is, boost::property_tree::ptree& ptree ) { COMMA_THROW_BRIEF( comma::exception, "--from dot: not implemented (and most likely never will)" ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode mode )
+    { 
+        const auto& pv = comma::property_tree::to_path_value( ptree, comma::xpath(), mode ); // todo: optional root
+        std::map< std::string, std::pair< std::string, std::string > > nodes; // full path -> ( label, value ); super-quick and dirty; ordered: slower, but neater output
+        std::set< std::string > edges; // a set, since paths sharing a prefix would otherwise repeat the same edge
+        os << "digraph callgraph {" << std::endl;
+        for( const auto& p: pv )
+        {
+            if( p.first.elements.empty() ) { continue; } // elements[0] below would be undefined behaviour on an empty path
+            std::string q = p.first.elements[0].to_string(); // q accumulates the path from the root down to the current element
+            nodes.insert( std::make_pair( q, std::make_pair( q, p.first.elements.size() == 1 ? p.second : std::string() ) ) );
+            for( unsigned int i = 1; i < p.first.elements.size(); ++i )
+            {
+                auto s = p.first.elements[i].to_string();
+                edges.insert( "\"" + q + "\" -> \"" + q + "/" + s + "\"" );
+                q += "/" + s;
+                nodes.insert( std::make_pair( q, std::make_pair( s, i + 1 == p.first.elements.size() ? p.second : std::string() ) ) ); // only the last element of a path carries the value
+            }
+        }
+        for( const auto& n: nodes ) { os << "    \"" << n.first << "\" [label=\"" << n.second.first << ( n.second.second.empty() ? std::string() : ( ":\n" + n.second.second ) ) << "\"]" << std::endl; }
+        for( const auto& e: edges ) { os << "    " << e << std::endl; }
+        os << "}" << std::endl;
+    }
+};
+
 void ( * input )( std::istream& is, boost::property_tree::ptree& ptree );
 void ( * output )( std::ostream& is, const boost::property_tree::ptree& ptree, const path_mode );
 
@@ -162,6 +205,7 @@ int main( int ac, char** av )
             else if( *from == "json" ) { input = &traits< json >::input; }
             else if( *from == "xml" ) { input = &traits< xml >::input; }
             else if( *from == "path-value" || *from == "pv" ) { input = &traits< path_value >::input; }
+            else if( *from == "dot" ) { input = &traits< dot >::input; }
             else { std::cerr << "name-value-convert: expected --from format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
         }
         else
@@ -174,6 +218,7 @@ int main( int ac, char** av )
         else if( to == "json" ) { output = &traits< json >::output; }
         else if( to == "xml" ) { output = &traits< xml >::output; }
         else if( to == "path-value" || to == "pv" ) { output = &traits< path_value >::output; }
+        else if( to == "dot" ) { output = &traits< dot >::output; }
         else { std::cerr << "name-value-convert: expected --to format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
         if( use_index )
         {
diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index 78f9454d5..15ac3a896 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -125,7 +125,8 @@ static void ptree_output_value_( std::ostream& os, const std::string& value, boo
     if( quoted ) { os << '"' << value << '"'; } else { os << value; }
 }
 
-static void ptree_to_path_value_string_impl( std::ostream& os
+static void ptree_to_path_value_string_impl( std::ostream* os
+                                           , std::vector< std::pair< xpath, std::string > >& pv // todo! refactor! super-quick and dirty for now
                                            , boost::property_tree::ptree::const_iterator i
                                            , bool is_begin
                                            , xpath& path
@@ -138,7 +139,8 @@ static void ptree_to_path_value_string_impl( std::ostream& os
 {
     if( i->second.begin() == i->second.end() )
     {
-        ptree_output_value_( os, i->second.get_value< std::string >(), is_begin, display_path / i->first, equal_sign, delimiter, root, unquote_numbers );
+        if( os ) { ptree_output_value_( *os, i->second.get_value< std::string >(), is_begin, display_path / i->first, equal_sign, delimiter, root, unquote_numbers ); }
+        else { pv.push_back( std::make_pair( display_path / i->first, i->second.get_value< std::string >() ) ); }
     }
     else
     {
@@ -148,16 +150,19 @@ static void ptree_to_path_value_string_impl( std::ostream& os
         if( v ) // quick and dirty
         {
             const std::string& stripped = comma::strip( *v );
-            if( !stripped.empty() )  { ptree_output_value_( os, stripped, is_begin, display_path, equal_sign, delimiter, root, unquote_numbers );  }
+            if( !stripped.empty() )
+            { 
+                if( os ) { ptree_output_value_( *os, stripped, is_begin, display_path, equal_sign, delimiter, root, unquote_numbers ); }
+                else { pv.push_back( std::make_pair( display_path, stripped ) ); }
+            }
         }
-
         comma::uint32 index=0;
         for( boost::property_tree::ptree::const_iterator j = i->second.begin(); j != i->second.end(); ++j )
         {
             // Test if it is json array data, if so all keys are empty. If so display indices in path if requested
             if( mode == property_tree::without_brackets && j->first.empty()  ) { display_path /= boost::lexical_cast< std::string >( index++ ); }
             else if( mode == property_tree::with_brackets && j->first.empty() ) { display_path.elements.back().index = index++; }
-            ptree_to_path_value_string_impl( os, j, is_begin, path, display_path, mode, equal_sign, delimiter, root, unquote_numbers );
+            ptree_to_path_value_string_impl( os, pv, j, is_begin, path, display_path, mode, equal_sign, delimiter, root, unquote_numbers );
             if( mode == property_tree::without_brackets && j->first.empty() ) { display_path = display_path.head(); }
             is_begin = false;
         }
@@ -172,6 +177,23 @@ namespace comma {
 
 void property_tree::to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode mode, char equal_sign, char delimiter, const xpath& root, bool const unquote_numbers )
 {
+    std::vector< std::pair< xpath, std::string > > dummy; // quick and dirty
+    for( boost::property_tree::ptree::const_iterator i = ptree.begin(); i != ptree.end(); ++i )
+    {
+        // display_path is the modified key path showing array indices, if array exists within e.g abc[0]/xyz[0]
+        // But the actual path to the value is many empty keys under abc and abc/xyz
+        // Boost: "JSON arrays are mapped to nodes. Each element is a child node with an empty name.
+        //         If a node has both named and unnamed child nodes, it cannot be mapped to a JSON representation."
+        // http://www.boost.org/doc/libs/1_41_0/doc/html/boost_propertytree/parsers.html#boost_propertytree.parsers.json_parser
+        xpath path;
+        xpath display_path;
+        impl::ptree_to_path_value_string_impl( &os, dummy, i, i == ptree.begin(), path, display_path, mode, equal_sign, delimiter, root.to_string(), unquote_numbers ); // quick and dirty
+    }
+}
+
+std::vector< std::pair< xpath, std::string > > property_tree::to_path_value( const boost::property_tree::ptree& ptree, const xpath& root, path_mode mode )
+{
+    std::vector< std::pair< xpath, std::string > > pv; // quick and dirty
     for( boost::property_tree::ptree::const_iterator i = ptree.begin(); i != ptree.end(); ++i )
     {
         // display_path is the modified key path showing array indices, if array exists within e.g abc[0]/xyz[0]
@@ -181,8 +203,9 @@ void property_tree::to_path_value( std::ostream& os, const boost::property_tree:
         // http://www.boost.org/doc/libs/1_41_0/doc/html/boost_propertytree/parsers.html#boost_propertytree.parsers.json_parser
         xpath path;
         xpath display_path;
-        impl::ptree_to_path_value_string_impl( os, i, i == ptree.begin(), path, display_path, mode, equal_sign, delimiter, root.to_string(), unquote_numbers ); // quick and dirty
+        impl::ptree_to_path_value_string_impl( nullptr, pv, i, i == ptree.begin(), path, display_path, mode, '=', ',', root.to_string(), true ); // quick and dirty
     }
+    return pv;
 }
 
 void property_tree::from_path_value( std::istream& is, boost::property_tree::ptree& ptree, property_tree::path_value::check_repeated_paths check_type, char equal_sign, char delimiter, bool use_index )
diff --git a/name_value/ptree.h b/name_value/ptree.h
index 43af5e60a..1417368d4 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -42,6 +42,9 @@ struct property_tree // quick and dirty
     /// write as path-value to output stream
     static void to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode indices_mode = disabled, char equal_sign = '=', char delimiter = ',', const xpath& root = xpath(), bool const unquote_numbers = false );
 
+    /// return path-value pairs
+    static std::vector< std::pair< xpath, std::string > > to_path_value( const boost::property_tree::ptree& ptree, const xpath& root = xpath(), path_mode indices_mode = with_brackets );
+
     /// convert boost parameter tree into path=value-style string (equal sign and delimiter have to be escaped)
     static std::string to_path_value_string( const boost::property_tree::ptree& ptree, path_mode mode=disabled, char equal_sign = '=', char delimiter = ',', bool const unquote_numbers = false );
     

From f00c1e6ef56e42be150f684388e1ef123fa53518 Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Tue, 19 Sep 2023 17:12:25 +1000
Subject: [PATCH 0645/1056] dynamic/shared_library: added

---
 CMakeLists.txt                |  1 +
 dynamic/CMakeLists.txt        | 14 +++++++++
 dynamic/shared_library.h      | 57 +++++++++++++++++++++++++++++++++++
 dynamic/test/CMakeLists.txt   | 13 ++++++++
 dynamic/test/include_test.cpp | 21 +++++++++++++
 5 files changed, 106 insertions(+)
 create mode 100644 dynamic/CMakeLists.txt
 create mode 100644 dynamic/shared_library.h
 create mode 100644 dynamic/test/CMakeLists.txt
 create mode 100644 dynamic/test/include_test.cpp

diff --git a/CMakeLists.txt b/CMakeLists.txt
index fff280f40..0532f2b19 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -305,6 +305,7 @@ ADD_SUBDIRECTORY( containers )
 ADD_SUBDIRECTORY( csv )
 ADD_SUBDIRECTORY( dispatch )
 ADD_SUBDIRECTORY( doc )
+ADD_SUBDIRECTORY( dynamic ) 
 ADD_SUBDIRECTORY( io )
 ADD_SUBDIRECTORY( math )
 ADD_SUBDIRECTORY( name_value )
diff --git a/dynamic/CMakeLists.txt b/dynamic/CMakeLists.txt
new file mode 100644
index 000000000..c5d406906
--- /dev/null
+++ b/dynamic/CMakeLists.txt
@@ -0,0 +1,14 @@
+SET( PROJECT "dynamic" )
+SET( TARGET_NAME comma_${PROJECT} )
+
+FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp )
+FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h )
+SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
+ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} )
+ADD_DEPENDENCIES( ${TARGET_NAME} comma_base )
+
+INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+
+IF( comma_BUILD_TESTS )
+    ADD_SUBDIRECTORY( test )
+ENDIF( comma_BUILD_TESTS )
diff --git a/dynamic/shared_library.h b/dynamic/shared_library.h
new file mode 100644
index 000000000..632c947c6
--- /dev/null
+++ b/dynamic/shared_library.h
@@ -0,0 +1,57 @@
+// Copyright (c) 2023 Mission Systems Pty Ltd
+
+/// @authors aspen eyers, vsevolod vlaskine
+
+#pragma once 
+#include <dlfcn.h>
+#include <memory>
+#include <string>
+#include <vector>
+#include "../base/exception.h"
+
+namespace comma { namespace dynamic {
+
+/// thin wrapper around a dlopen() handle; the handle is closed in the destructor
+/// NOTE(review): the class is copyable; destroying a copy would dlclose() the same handle again
+class shared_library
+{
+    public:
+        /// open lib, trying it in each of additional_directories first, then lib as given
+        shared_library( const std::string& lib, std::vector<std::string> additional_directories={} );
+
+        ~shared_library() { if( handle_ ) { dlclose(handle_); } }
+
+        /// look up library_symbol, call it as T*(*)(Args...) with args, return the pointer it returns
+        template < typename T, typename... Args >
+        T* make( const std::string& library_symbol, Args... args ) const;
+
+    private:
+        void* handle_ = nullptr; // null until a dlopen() succeeds: the constructor tests it before the first assignment
+        std::string lib_;
+};
+
+inline shared_library::shared_library( const std::string& lib, std::vector<std::string> link_directories )
+: lib_(lib)
+{
+    // sanitise_search_directories_: make sure every non-empty directory ends with '/'
+    for (auto& dir : link_directories) { if( !dir.empty() && dir.back() != '/' ) { dir += '/'; } }
+    for (const auto& dir : link_directories) {
+        handle_ = dlopen( (dir+lib).c_str(), RTLD_LAZY);
+        if( handle_ ) { break; }
+    }
+    // no directory worked (or none given): try lib as given and leave the lookup to dlopen()
+    if( !handle_ ) { handle_ = dlopen(lib.c_str(), RTLD_LAZY); }
+    COMMA_ASSERT( handle_, "Shared library loading failed: could not open library: \"" + lib + "\"" );
+}
+
+template < typename T, typename... Args >
+inline T* shared_library::make( const std::string& library_symbol, Args... args ) const
+{
+    T* (*create_)(Args...) = reinterpret_cast<T*(*)(Args...)>(dlsym(handle_, library_symbol.c_str()));
+    COMMA_ASSERT( create_, "Shared library loading failed: could not find "+library_symbol+" symbol; on library: \"" + lib_ + "\"");
+    T* object = create_(args...);
+    // no dlclose() here: the factory lives in the library, which has to stay loaded; the destructor closes the handle once
+    return object;
+}
+
+} } // namespace comma { namespace dynamic {
diff --git a/dynamic/test/CMakeLists.txt b/dynamic/test/CMakeLists.txt
new file mode 100644
index 000000000..68a7da156
--- /dev/null
+++ b/dynamic/test/CMakeLists.txt
@@ -0,0 +1,13 @@
+set( KIT dynamic )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/dynamic/test/include_test.cpp b/dynamic/test/include_test.cpp
new file mode 100644
index 000000000..a639a5d34
--- /dev/null
+++ b/dynamic/test/include_test.cpp
@@ -0,0 +1,21 @@
+
+// Copyright (c) 2023 aspen eyers
+
+#include <gtest/gtest.h>
+#include "../shared_library.h"
+#include "../../base/exception.h"
+
+namespace comma {
+
+TEST( string, join ) // NOTE(review): suite/test name looks copied from a string test; nothing here exercises comma::dynamic
+{
+    // empty body: presumably the point is only that shared_library.h compiles when included -- TODO confirm
+}
+
+} // namespace comma {
+
+int main( int argc, char* argv[] )
+{    
+    ::testing::InitGoogleTest(&argc, argv);
+    return RUN_ALL_TESTS();
+}

From 3d1ff4056d803eb149f52b28c6206c5e3666edc7 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 19 Sep 2023 19:07:01 +1000
Subject: [PATCH 0646/1056] property_tree::as< T >(): first cut implemented

---
 name_value/ptree.h             | 17 ++++++++++++++++-
 name_value/test/ptree_test.cpp |  6 ++++++
 2 files changed, 22 insertions(+), 1 deletion(-)

diff --git a/name_value/ptree.h b/name_value/ptree.h
index 1417368d4..6e463e970 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -22,6 +22,7 @@
 #include "../base/types.h"
 #include "../string/string.h"
 #include "../xpath/xpath.h"
+#include "../visiting/apply.h"
 #include "../visiting/visit.h"
 #include "../visiting/while.h"
 
@@ -53,6 +54,10 @@ struct property_tree // quick and dirty
     
     /// get value as string from an xpath like a/b[5]/c/d[3]=4 on ptree
     static boost::optional< std::string > get( const boost::property_tree::ptree& ptree, const xpath& path, bool use_index = true );
+
+    /// return value of a given type
+    template < typename T >
+    static boost::optional< T > as( const boost::property_tree::ptree& ptree, const xpath& path, bool use_index = true, bool permissive = true );
     
     /// get subtree
     static boost::optional< boost::property_tree::ptree& > get_tree( boost::property_tree::ptree& ptree, const xpath& path, bool use_index = true );
@@ -315,5 +320,15 @@ class to_ptree
         template < typename T > static T value_( T v ) { return v; }
 };
 
-} // namespace comma
+template < typename T > // deserialise the subtree found at path into a T; boost::none if get_tree() finds no such subtree
+boost::optional< T > property_tree::as( const boost::property_tree::ptree& ptree, const xpath& path, bool use_index, bool permissive )
+{
+    auto p = property_tree::get_tree( ptree, path, use_index );
+    if( !p ) { return boost::none; }
+    comma::from_ptree from_ptree( *p, xpath(), permissive ); // visitor rooted at the subtree itself, hence the empty xpath
+    T t{}; // value-initialise, so that any member the visitor does not assign is not left indeterminate
+    comma::visiting::apply( from_ptree ).to( t );
+    return t;
+}
 
+} // namespace comma
diff --git a/name_value/test/ptree_test.cpp b/name_value/test/ptree_test.cpp
index b619181ba..d4335a2e1 100644
--- a/name_value/test/ptree_test.cpp
+++ b/name_value/test/ptree_test.cpp
@@ -152,6 +152,12 @@ TEST( ptree, basics )
         EXPECT_TRUE( !t.world );
         EXPECT_TRUE( !t1.world );
         EXPECT_EQ( t.nested->moon, t1.nested->moon );
+
+        comma::name_value::impl::write_json( std::cerr, tree1 );
+        auto a = property_tree::as< nested_type >( tree1, "test_type/nested" );
+        EXPECT_TRUE( a );
+        EXPECT_EQ( a->moon, t.nested->moon );
+        // todo! way more tests
     }
     {
         boost::property_tree::ptree ptree;

From 6739f79f768d4cce45c78eb42c25633b550d7016 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 19 Sep 2023 19:08:43 +1000
Subject: [PATCH 0647/1056] property_tree::as< T >(): todo comments added

---
 name_value/ptree.h | 1 +
 1 file changed, 1 insertion(+)

diff --git a/name_value/ptree.h b/name_value/ptree.h
index 6e463e970..c49d5feaa 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -56,6 +56,7 @@ struct property_tree // quick and dirty
     static boost::optional< std::string > get( const boost::property_tree::ptree& ptree, const xpath& path, bool use_index = true );
 
     /// return value of a given type
+    /// todo! support non-class types and time
     template < typename T >
     static boost::optional< T > as( const boost::property_tree::ptree& ptree, const xpath& path, bool use_index = true, bool permissive = true );
     

From 73f5a518681383ba33244476bc8e009c672977a2 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 21 Sep 2023 14:37:29 +1000
Subject: [PATCH 0648/1056] comma-progress: brushed up help and examples

---
 util/applications/comma-progress.cpp | 107 +++++++++++++++++++--------
 1 file changed, 75 insertions(+), 32 deletions(-)

diff --git a/util/applications/comma-progress.cpp b/util/applications/comma-progress.cpp
index c9e0b86d7..1e10392b3 100644
--- a/util/applications/comma-progress.cpp
+++ b/util/applications/comma-progress.cpp
@@ -85,37 +85,82 @@ template < > struct traits< impl_::log > {
     
 } } // namespace comma { namespace visiting { 
 
-
-static void usage( bool verbose=false )
+static void usage( bool verbose )
 {
-    std::cerr << std::endl;
-    std::cerr << "cat progress.csv | " << name() << " [<options>] > stat.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "Example: cat progress.csv | comma-progress --elapsed | comma-progress --ratio run_all/application"  << std::endl;
-    std::cerr << "         In this example, every 'ratio' value is compared against time of run_all/application, instead" << std::endl;
-    std::cerr << "         of total time." << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "modes" << std::endl;
-    std::cerr << "    These are mutually exclusive." << std::endl;
-    std::cerr << "    <no option>: Outputs path value for input data: " << comma::join( comma::csv::names< impl_::log >(), ',' )  << std::endl;
-    std::cerr << "                 Output format is 'path/{begin,end}=<ISO timestamp>'" << std::endl;
-    std::cerr << "    --elapsed [ --from-path-value|--from-pv ]" << std::endl;
-    std::cerr << "                 Outputs path value with 'elapsed' time, input data format: " << comma::join( comma::csv::names< impl_::log >(), ',' )  << std::endl;
-    std::cerr << "                 If '--from-path-value|--from-pv' is given, it takes inputs from outputs of < no option >" << std::endl;
-    std::cerr << "                 Output format is 'path/elapsed=<duration in second>'" << std::endl;
-    std::cerr << "    --sum [--mean] [--count] [--ratio ] [-P|--percentage] " << std::endl;
-    std::cerr << "                 Outputs path value with summed 'elapsed' time, taking input data from --elapsed mode." << std::endl;
-    std::cerr << "                 Elapsed duration is duration sum of runs with the same <path> key, where one application was called multiple times." << std::endl;
-    std::cerr << "                 Output format is '<path>/elapsed=<duration in second>'" << std::endl;
-    std::cerr << "                 --mean  adds '<path>/mean=< mean duration in second >' for items that ran more than once - duplicated elapsed path/keys." << std::endl;
-    std::cerr << "                 --mean  adds '<path>/count=< occurances of <path>/elapsed >', where mean=( elapsed / count )." << std::endl;
-    std::cerr << "                 --ratio adds '<path>/ratio=< ratio to total time or time of [path] if given >', " << std::endl;
-    std::cerr << "                 --ratio with -P|--percentage, a percentage is the value for <path>/ratio, rounded to 3 decimal places." << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --help,-h:   Print this message.." << std::endl;
-    std::cerr << std::endl;
+    std::cerr << "\nsummarise timestamped elapsed time data";
+    std::cerr << "\n";
+    std::cerr << "\nusage: cat progress.csv | " << name() << " [<options>] > stat.csv";
+    std::cerr << "\n";
+    std::cerr << "\noptions:";
+    std::cerr << "\n    --help,-h:     display this help message and exit";
+    std::cerr << "\n    --verbose,-v:  more output";
+    std::cerr << "\n    --elapsed:     output path value with elapsed time";
+    std::cerr << "\n    --sum          output path value with summed elapsed time";
+    std::cerr << "\n";
+    std::cerr << "\nelapsed options:";
+    std::cerr << "\n    --from-path-value,--from-pv: take input from output of <no option>";
+    std::cerr << "\n";
+    std::cerr << "\nsum options:";
+    std::cerr << "\n    --count:          adds number of occurances of <path> (requires --mean)";
+    std::cerr << "\n    --mean:           adds mean duration for duplicate paths";
+    std::cerr << "\n    --percentage,-P:  express --ratio as a percentage";
+    std::cerr << "\n    --ratio [<path>]: adds ratio to total time or time of [path] if given";
+    std::cerr << "\n";
+    std::cerr << "\nmodes:";
+    std::cerr << "\n    with no option comma-progress takes " << comma::join( comma::csv::names< impl_::log >(), ',' ) << " and converts to";
+    std::cerr << "\n    path-value format of 'path/{begin,end}=<ISO timestamp>'";
+    std::cerr << "\n";
+    std::cerr << "\n    --elapsed";
+    std::cerr << "\n        input data format: " << comma::join( comma::csv::names< impl_::log >(), ',' );
+    std::cerr << "\n        output format: 'path/elapsed=<duration in second>'";
+    std::cerr << "\n        if --from-path-value is given input format is <no option> output";
+    std::cerr << "\n";
+    std::cerr << "\n    --sum";
+    std::cerr << "\n        input: data in format from --elapsed mode";
+    std::cerr << "\n        output: path-value with summed 'elapsed' time";
+    std::cerr << "\n        elapsed duration sums of runs with the same <path>";
+    std::cerr << "\n        additional accumlation stats can be added with --mean, --count, --ratio";
+    std::cerr << "\n        options in the format <path>/<stat>=<value>";
+    std::cerr << "\n";
+    if( verbose )
+    {
+        std::cerr << "\nexamples:";
+        std::cerr << "\n    --- create input data ---";
+        std::cerr << "\n    cat <<-EOF > data.csv";
+        std::cerr << "\n\t20230101T120000,main,begin";
+        std::cerr << "\n\t20230101T120100,sub_a,begin";
+        std::cerr << "\n\t20230101T120200,sub_a,end";
+        std::cerr << "\n\t20230101T120200,sub_b,begin";
+        std::cerr << "\n\t20230101T120600,sub_b,end";
+        std::cerr << "\n\t20230101T120600,sub_a,begin";
+        std::cerr << "\n\t20230101T120800,sub_a,end";
+        std::cerr << "\n\t20230101T121000,main,end";
+        std::cerr << "\n\tEOF";
+        std::cerr << "\n";
+        std::cerr << "\n    --- create path/value data ---";
+        std::cerr << "\n    cat data.csv | comma-progress";
+        std::cerr << "\n";
+        std::cerr << "\n    --- calculate elapsed times ---";
+        std::cerr << "\n    cat data.csv | comma-progress --elapsed";
+        std::cerr << "\n    cat data.csv | comma-progress | comma-progress --elapsed --from-path-value";
+        std::cerr << "\n";
+        std::cerr << "\n    --- sum up repeated entries ---";
+        std::cerr << "\n    cat data.csv | comma-progress --elapsed > elapsed.csv";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --mean";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --mean --count";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --ratio";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --ratio --percentage";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --ratio main/sub_b";
+    }
+    else
+    {
+        std::cerr << "\nsee comma-progress --help --verbose for examples";
+    }
+    std::cerr << "\n" << std::endl;
     exit( 1 );
 }
+
 static const std::string start = "begin";
 static const std::string finished = "end";
 
@@ -306,12 +351,10 @@ void process_begin_end( L get_log, O output )
 
 int main( int ac, char** av )
 {
-    comma::command_line_options options( ac, av );
-    
-    if( options.exists( "-h,--help" ) ) { usage(); }
-    
     try
     {
+        comma::command_line_options options( ac, av, usage );
+
         if( options.exists( "--sum" ) )
         {
             

From 69f0a984805940e9918a8ec2164f97fe0f94c611 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 21 Sep 2023 16:04:04 +1000
Subject: [PATCH 0649/1056] added comma-profile-graph-example

---
 util/examples/comma-profile-graph-example | 55 +++++++++++++++++++++++
 1 file changed, 55 insertions(+)
 create mode 100755 util/examples/comma-profile-graph-example

diff --git a/util/examples/comma-profile-graph-example b/util/examples/comma-profile-graph-example
new file mode 100755
index 000000000..fc47cc709
--- /dev/null
+++ b/util/examples/comma-profile-graph-example
@@ -0,0 +1,55 @@
+#!/bin/bash
+# example: time nested bash functions with comma-progress-util, then draw the timings with graphviz dot
+
+scriptname=$( basename "$0" )
+
+source "$( type -p comma-progress-util )" || { echo "$scriptname: cannot source 'comma-progress-util'" >&2; exit 1; }
+
+elapsed_csv=elapsed.csv
+profile_svg=profile.svg
+
+function usage()
+{
+    cat <<EOF
+
+usage: $scriptname <make|view>
+
+make - create profile data in $elapsed_csv
+view - visualise $elapsed_csv in $profile_svg
+
+EOF
+}
+
+# run function $1 under comma_progress_named, which gets the data file and the function name twice
+# (presumably once as the label and once as the command to run -- TODO confirm against comma-progress-util)
+function profile() { local fn=$1; comma_progress_named "$elapsed_csv" "$fn" "$fn"; }
+
+# toy call tree to be profiled; the sleeps stand in for real work
+function func_a() { profile func_b; profile func_d; sleep 1.5; }
+function func_b() { local i; for i in {0..2}; do profile func_c; done; sleep 0.1; }
+function func_c() { sleep 0.4; }
+function func_d() { sleep 0.2; }
+function func_e() { profile func_b; }
+function func_f() { profile func_d; }
+
+function make()
+{
+    rm -f "$elapsed_csv" # discard profile data from a previous run
+    profile func_a
+    profile func_e
+    profile func_f
+}
+
+function view()
+{
+    comma-progress --elapsed < "$elapsed_csv" | comma-profile-graph | dot -Tsvg > "$profile_svg"
+    eog "$profile_svg"
+}
+
+[[ $1 == "-h" || $1 == "--help" ]] && { usage; exit 1; }
+
+case $1 in
+    make) make ;;
+    view) view ;;
+    *)    usage
+esac

From 5ac90d387d9657e2cad675682d9d46031d4b3e06 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 25 Sep 2023 11:22:47 +1000
Subject: [PATCH 0650/1056] io-topics: on_demand: value check improved

---
 io/applications/io-topics | 30 ++----------------------------
 1 file changed, 2 insertions(+), 28 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index b68b86e83..64575a367 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -1,34 +1,8 @@
 #!/bin/bash
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
 # Copyright (c) 2020 Vsevolod Vlaskine
 # All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 scriptname=$( basename $0 )
 
@@ -320,7 +294,7 @@ function publish_command()
     [[ -n "$topic_secondary_address" ]] || { [[ -z "$topic_secondary_port" ]] || topic_secondary_address="tcp:$topic_secondary_port"; }
     [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
     if [[ -n "$topic_multiplier" ]]; then multiplier="--multiplier $topic_multiplier"; else unset multiplier; fi
-    if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
+    if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand -- "
     if [[ -z "$topic_input" ]]; then cmd+="$topic_command"
     else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
@@ -334,7 +308,7 @@ function cat_command()
     local ignore_command=$2
     (( ignore_command )) || [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
     set_topic_address
-    if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
+    if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     if [[ -n "$topic_flush" ]]; then flush_option="--flush"; else unset flush_option; fi # todo! make flush default?!
     if [[ -n "$topic_connect_attempts" ]]; then connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
     if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi

From d102adea9aeff369d19abfcad08bcefdd77d6cf6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 5 Oct 2023 20:50:56 +1100
Subject: [PATCH 0651/1056] io::publisher::accept(): return vector of new
 streams instead of just count

---
 io/applications/io-publish.cpp |  6 +++++-
 io/impl/publisher.cpp          | 36 +++++-----------------------------
 io/impl/publisher.h            | 33 ++-----------------------------
 io/publisher.cpp               |  2 +-
 io/publisher.h                 | 34 ++------------------------------
 5 files changed, 15 insertions(+), 96 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 1ad5e92c1..437e40d40 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -263,7 +263,11 @@ class publish
                 transaction_t t( publishers_ );
                 for( unsigned int i = 0; i < t->size(); ++i )
                 {
-                    if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) ) { ( *t )[i]->accept(); }
+                    if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) )
+                    {
+                        const auto& streams = ( *t )[i]->accept();
+
+                    }
                 }
                 handle_sizes_( t );
                 if( has_primary_clients_ )
diff --git a/io/impl/publisher.cpp b/io/impl/publisher.cpp
index f155e77b8..6b91b5682 100644
--- a/io/impl/publisher.cpp
+++ b/io/impl/publisher.cpp
@@ -1,31 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author cedric wohlleber
 
@@ -280,17 +254,17 @@ void publisher::close()
 
 void publisher::disconnect_all() { while( streams_.begin() != streams_.end() ) { remove_( streams_.begin() ); } }
 
-unsigned int publisher::accept()
+std::vector< io::ostream* > publisher::accept()
 {
-    if( !acceptor_ ) { return 0; }
-    unsigned int count = 0;
+    std::vector< io::ostream* > streams;
+    if( !acceptor_ ) { return streams; }
     while( true ) // while( streams_.size() < maxSize ?
     {
         io::ostream* s = acceptor_->accept();
-        if( s == NULL ) { return count; }
+        if( s == NULL ) { return streams; }
+        streams.push_back( s );
         streams_.insert( boost::shared_ptr< io::ostream >( s ) );
         select_.write().add( *s );
-        ++count;
     }
 }
 
diff --git a/io/impl/publisher.h b/io/impl/publisher.h
index 4540ec79d..7a16f0a02 100644
--- a/io/impl/publisher.h
+++ b/io/impl/publisher.h
@@ -1,36 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author cedric wohlleber
 
-#ifndef COMMA_IO_IMPL_PUBLISHER_H_
-#define COMMA_IO_IMPL_PUBLISHER_H_
+#pragma once
 
 #include <set>
 #include <boost/scoped_ptr.hpp>
@@ -87,7 +60,7 @@ class publisher
 
         std::size_t size() const;
 
-        unsigned int accept();
+        std::vector< io::ostream* > accept();
         
         const io::impl::acceptor& acceptor() const { return *acceptor_; }
 
@@ -103,5 +76,3 @@ class publisher
 };
 
 } } } // namespace comma { namespace io { namespace impl {
-
-#endif // #ifndef COMMA_IO_IMPL_PUBLISHER_H_
diff --git a/io/publisher.cpp b/io/publisher.cpp
index 2bf0d01bd..3ce8a265b 100644
--- a/io/publisher.cpp
+++ b/io/publisher.cpp
@@ -40,7 +40,7 @@ publisher::~publisher() { delete pimpl_; }
 
 std::size_t publisher::write( const char* buf, std::size_t size, bool do_accept ) { return pimpl_->write( buf, size, do_accept ); }
 
-unsigned int publisher::accept() { return pimpl_->accept(); }
+std::vector< io::ostream* > publisher::accept() { return pimpl_->accept(); }
 
 void publisher::close() { pimpl_->close(); }
 
diff --git a/io/publisher.h b/io/publisher.h
index 564011028..caa536f8a 100644
--- a/io/publisher.h
+++ b/io/publisher.h
@@ -1,37 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_IO_PUBLISHER_H_
-#define COMMA_IO_PUBLISHER_H_
+#pragma once
 
 #include <stdlib.h>
 #include <string>
@@ -84,7 +56,7 @@ class publisher : public boost::noncopyable
 
         /// accept waiting clients, non-blocking
         /// @return number of clients accepted
-        unsigned int accept();
+        std::vector< io::ostream* > accept();
         
         /// return acceptor file descriptor
         file_descriptor acceptor_file_descriptor() const;
@@ -94,5 +66,3 @@ class publisher : public boost::noncopyable
 };
 
 } } // namespace comma { namespace io {
-
-#endif // #ifndef COMMA_IO_PUBLISHER_H_

From d0eca13cf08e7f7f26ddbe448ffcee52cf810e08 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 6 Oct 2023 01:08:42 +1100
Subject: [PATCH 0652/1056] io-publish: --cache-size: in progress...

---
 io/applications/io-publish.cpp | 41 +++++++++-------------------------
 1 file changed, 11 insertions(+), 30 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 437e40d40..5bf277c39 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // Copyright (c) 2020 Vsevolod Vlaskine
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @authors cedric wohlleber, vsevolod vlaskine, dave jennings
 
@@ -34,6 +7,7 @@
 #include <signal.h>
 #include <sys/wait.h>
 #include <unistd.h>
+#include <deque>
 #include <memory>
 #include <boost/bind.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
@@ -68,6 +42,8 @@ static void usage( bool verbose = false )
     std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
     std::cerr << std::endl;
     std::cerr << "stream options" << std::endl;
+    std::cerr << "    --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects, the" << std::endl;
+    std::cerr << "                                         the cached records will be sent to it once connected (todo)" << std::endl;
     std::cerr << "    --size,-s: binary input; packet size" << std::endl;
     std::cerr << "    --multiplier,-m: multiplier for packet size, default is 1. The actual packet size will be m * s" << std::endl;
     std::cerr << "    --no-discard: if present, do blocking write to every open stream" << std::endl;
@@ -119,7 +95,6 @@ static void usage( bool verbose = false )
     std::cerr << "    io-publish tcp:1234 --size 24000 --on-demand --exec \"camera-cat arg1 arg2\"" << std::endl;
     std::cerr << "    io-publish tcp:1234 --size 24000 --on-demand -- camera-cat arg1 arg2" << std::endl;
     std::cerr << std::endl;
-    std::cerr << std::endl;
     exit( 0 );
 }
 
@@ -142,12 +117,14 @@ class publish
                , bool discard
                , bool flush
                , bool output_number_of_clients
-               , bool update_no_clients )
+               , bool update_no_clients
+               , unsigned int cache_size )
             : discard_( discard )
             , flush_( flush )
             , buffer_( packet_size, '\0' )
             , packet_size_( packet_size )
             , output_number_of_clients_( output_number_of_clients )
+            , cache_size_( cache_size )
             , update_no_clients_( update_no_clients )
             , got_first_client_ever_( false )
             , sizes_( endpoints.size(), 0 )
@@ -298,6 +275,7 @@ class publish
         std::string buffer_;
         unsigned int packet_size_;
         bool output_number_of_clients_;
+        unsigned int cache_size_;
         bool update_no_clients_;
         bool got_first_client_ever_;
         std::vector< unsigned int > sizes_;
@@ -305,6 +283,7 @@ class publish
         unsigned int num_clients_;
         boost::scoped_ptr< boost::thread > acceptor_thread_;
         bool is_shutdown_;
+        std::deque< std::string > cache_;
 };
 
 class command
@@ -364,6 +343,7 @@ int main( int ac, char** av )
         comma::command_line_options options( head, usage );
         const std::vector< std::string >& names = options.unnamed( "--no-discard,--verbose,-v,--no-flush,--output-number-of-clients,--clients,--exit-on-no-clients,-e,--on-demand", "-.+" );
         if( names.empty() ) { std::cerr << "io-publish: please specify at least one stream; use '-' for stdout" << std::endl; return 1; }
+        options.assert_mutually_exclusive( "--cache-size,--cache", "--on-demand" );
         const boost::array< comma::signal_flag::signals, 2 > signals = { { comma::signal_flag::sigint, comma::signal_flag::sigterm } };
         comma::signal_flag is_shutdown( signals );
         bool on_demand = options.exists( "--on-demand" );
@@ -373,7 +353,8 @@ int main( int ac, char** av )
                  , !options.exists( "--no-discard" )
                  , !options.exists( "--no-flush" )
                  , options.exists( "--output-number-of-clients,--clients" )
-                 , exit_on_no_clients || on_demand );
+                 , exit_on_no_clients || on_demand
+                 , options.value( "--cache-size,--cache", 0 ) );
         std::string exec_command = options.value< std::string >( "--exec", "" );
         if( !tail.empty() )
         {

From 7d3f70e537a6080a8e32311861fff700ba6dd632 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 6 Oct 2023 01:17:46 +1100
Subject: [PATCH 0653/1056] io-publish: --cache-size: first cut implemented;
 debugging...

---
 io/applications/io-publish.cpp | 14 +++++++++++++-
 io/stream.h                    | 32 +-------------------------------
 2 files changed, 14 insertions(+), 32 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 5bf277c39..6521c04a9 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -183,6 +183,11 @@ class publish
                 if( !input.good() ) { return false; }
             }
             transaction_t t( publishers_ );
+            if( cache_size_ > 0 )
+            {
+                cache_.push_back( buffer_ );
+                if( cache_.size() > cache_size_ ) { cache_.pop_front(); }
+            }
             for( auto& p: *t ) { if( p ) { p->write( &buffer_[0], buffer_.size(), false ); } } // for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
             return handle_sizes_( t );
         }
@@ -243,7 +248,14 @@ class publish
                     if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) )
                     {
                         const auto& streams = ( *t )[i]->accept();
-
+                        for( unsigned int i = 0; i < cache_.size(); ++i )
+                        {
+                            for( auto s: streams )
+                            { 
+                                ( *s )->write( &buffer_[0], buffer_.size() );
+                                if( flush_ ) { ( *s )->flush(); }
+                            }
+                        }
                     }
                 }
                 handle_sizes_( t );
diff --git a/io/stream.h b/io/stream.h
index 9948e9bf9..3e6b59b07 100644
--- a/io/stream.h
+++ b/io/stream.h
@@ -1,37 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_IO_STREAM_H_
-#define COMMA_IO_STREAM_H_
+#pragma once
 
 #include <iostream>
 #include <string>
@@ -138,5 +110,3 @@ struct iostream : public stream< std::iostream >
 };
 
 } } // namespace comma { namespace io {
-
-#endif

From c4b9818e48cda45a77f7dd78a3774441e3f60263 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 6 Oct 2023 01:30:56 +1100
Subject: [PATCH 0654/1056] io-topics: cache_size added to publish config

---
 io/applications/io-topics | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 64575a367..a21b02869 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -187,6 +187,7 @@ function publish_topic_fields_help()
     cat <<eof
 address;           passed verbatim to io-publish, port attribute will be ignored
 binary;            for binary data, binary format of data, overrides size
+cache_size;        same meaning as io-publish --cache-size
 command;           command for the publisher to run
 input;             input topic for publish command to read on stdin
 multiplier;        passed to io-publish
@@ -295,7 +296,8 @@ function publish_command()
     [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
     if [[ -n "$topic_multiplier" ]]; then multiplier="--multiplier $topic_multiplier"; else unset multiplier; fi
     if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
-    local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand -- "
+    if [[ -n "$topic_cache_size" ]]; then cache_size=$topic_cache_size; else unset cache_size; fi
+    local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand $cache_size -- "
     if [[ -z "$topic_input" ]]; then cmd+="$topic_command"
     else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
     verbose "$cmd"
@@ -308,7 +310,8 @@ function cat_command()
     local ignore_command=$2
     (( ignore_command )) || [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
     set_topic_address
-    if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
+    if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi # todo? remove? is it even used anywhere?
+    if [[ -n "$topic_cache_size" ]]; then cache_size=$topic_cache_size; else unset cache_size; fi
     if [[ -n "$topic_flush" ]]; then flush_option="--flush"; else unset flush_option; fi # todo! make flush default?!
     if [[ -n "$topic_connect_attempts" ]]; then connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
     if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi

From 2d275dfa23b22871fef9549700b7bb009510ae2d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 6 Oct 2023 01:31:54 +1100
Subject: [PATCH 0655/1056] io-topics: cache_size: typo fixed

---
 io/applications/io-topics | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index a21b02869..c845e8ba5 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -296,7 +296,7 @@ function publish_command()
     [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
     if [[ -n "$topic_multiplier" ]]; then multiplier="--multiplier $topic_multiplier"; else unset multiplier; fi
     if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
-    if [[ -n "$topic_cache_size" ]]; then cache_size=$topic_cache_size; else unset cache_size; fi
+    if [[ -n "$topic_cache_size" ]]; then cache_size="--cache-size=$topic_cache_size"; else unset cache_size; fi
     local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand $cache_size -- "
     if [[ -z "$topic_input" ]]; then cmd+="$topic_command"
     else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi

From 9d33532caaae58057be998ec6ef45992412d2b70 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 6 Oct 2023 17:47:06 +1100
Subject: [PATCH 0656/1056] io-publish: typo fixed

---
 io/applications/io-publish.cpp | 9 +++------
 1 file changed, 3 insertions(+), 6 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 6521c04a9..bfda6798b 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -248,13 +248,10 @@ class publish
                     if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) )
                     {
                         const auto& streams = ( *t )[i]->accept();
-                        for( unsigned int i = 0; i < cache_.size(); ++i )
+                        for( auto s: streams )
                         {
-                            for( auto s: streams )
-                            { 
-                                ( *s )->write( &buffer_[0], buffer_.size() );
-                                if( flush_ ) { ( *s )->flush(); }
-                            }
+                            for( const auto& c: cache_ ) { ( *s )->write( &c[0], c.size() ); }
+                            if( flush_ ) { ( *s )->flush(); }
                         }
                     }
                 }

From e93b52738910f525a2ebcd5bab910935b4880a32 Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Mon, 25 Sep 2023 15:03:43 +1000
Subject: [PATCH 0657/1056] dynamic/shared_library.h: dlclose - dereference and
 subsequent destruction of the shared object moved to the destructor.

---
 dynamic/shared_library.h | 2 --
 1 file changed, 2 deletions(-)

diff --git a/dynamic/shared_library.h b/dynamic/shared_library.h
index 632c947c6..3a0f7db25 100644
--- a/dynamic/shared_library.h
+++ b/dynamic/shared_library.h
@@ -49,8 +49,6 @@ inline T* shared_library::make( const std::string& library_symbol, Args... args
 
     T* object = create_(args...);
 
-    dlclose(handle_);
-
     return object;
 }
 

From 5035f88a51c088b77bf32f6b00282c92fe676698 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Sat, 30 Sep 2023 23:32:11 +1000
Subject: [PATCH 0658/1056] name-value-permute.cpp: include
 boost/math/special_functions.hpp

for boost::math::isfinite()

for some reason in Boost 1.80 this is no longer brought in by the other
include files
---
 name_value/applications/name-value-permute.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/name_value/applications/name-value-permute.cpp b/name_value/applications/name-value-permute.cpp
index 43148e1a7..743e39e6d 100644
--- a/name_value/applications/name-value-permute.cpp
+++ b/name_value/applications/name-value-permute.cpp
@@ -31,6 +31,7 @@
 #include <fstream>
 #include <boost/lexical_cast.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
+#include <boost/math/special_functions.hpp>
 #include "../../base/exception.h"
 #include "../../application/command_line_options.h"
 #include "../../string/split.h"

From 16dbf451581a41ed113d5cca2eb03832d88d4de4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 19 Oct 2023 05:37:20 +1100
Subject: [PATCH 0659/1056] io-cat: --head: first cut added

---
 io/applications/io-cat.cpp | 32 +++++++++++++++++++++++++++++---
 1 file changed, 29 insertions(+), 3 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 03a6a6dd4..006f9b1bf 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -66,6 +66,10 @@ void usage( bool verbose = false )
     std::cerr << "options" << std::endl;
     std::cerr << "    --exit-on-first-closed,-e: exit, if one of the streams finishes" << std::endl;
     std::cerr << "    --flush,--unbuffered,-u: flush output" << std::endl;
+    std::cerr << "    --head=[<n>]; output first <n> records and exit without waiting for record n+1" << std::endl;
+    std::cerr << "                  a workaround for sparse input fed into: io-cat ... | head -n10, which" << std::endl;
+    std::cerr << "                  not exit until io-cat receives record 11" << std::endl;
+    std::cerr << "                  instead run: io-cat ... --head=10 (use --flush if you don't want buffering" << std::endl;
     std::cerr << "    --round-robin=[<number of packets>]: todo: only for multiple inputs: read not more" << std::endl;
     std::cerr << "                                         than <number of packets> from an input at once," << std::endl;
     std::cerr << "                                         before checking other inputs" << std::endl;
@@ -302,6 +306,26 @@ static bool try_connect( boost::ptr_vector< stream >& streams, comma::io::select
     exit( 1 );
 }
 
+static bool _write( const comma::command_line_options& options, const std::vector< char >& buffer, unsigned int bytes_read )
+{
+    static unsigned int head = options.value( "--head", 0 );
+    static unsigned int size = options.value( "--size,-s", 0 );
+    static unsigned int count = 0;
+    if( head == 0 ) { std::cout.write( &buffer[0], bytes_read ); return true; }
+    if( size == 0 )
+    {
+        std::cout.write( &buffer[0], bytes_read );
+        ++count;
+    }
+    else
+    {
+        unsigned int n = std::min( bytes_read / size, head - count );
+        std::cout.write( &buffer[0], n * size );
+        count += n;
+    }
+    return count < head;
+}
+
 int main( int argc, char** argv )
 {
     #ifdef WIN32
@@ -325,12 +349,14 @@ int main( int argc, char** argv )
         permissive = options.exists( "--permissive" );
         const std::vector< std::string >& unnamed = options.unnamed( "--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
         #ifdef WIN32
-        if( size || unnamed.size() == 1 ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        //if( size || unnamed.size() == 1 ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        if( size ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
         if( unnamed.empty() ) { std::cerr << "io-cat: please specify at least one source" << std::endl; return 1; }
         boost::ptr_vector< stream > streams;
         comma::io::select select;
-        for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size || unnamed.size() == 1 ) ); }
+        // for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size || unnamed.size() == 1 ) ); }
+        for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 ) ); }
         const unsigned int max_count = size ? ( size > 65536u ? 1 : 65536u / size ) : 0;
         std::vector< char > buffer( size ? size * max_count : 65536u );        
         unsigned int round_robin_count = unnamed.size() > 1 ? options.value( "--round-robin", 0 ) : 0;
@@ -362,7 +388,7 @@ int main( int argc, char** argv )
                     if( bytes_read == 0 ) { break; }
                     done = false;
                     if( size && bytes_read % size != 0 ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): expected " << size << " byte(s), got only " << ( bytes_read % size ) << std::endl; return 1; }
-                    std::cout.write( &buffer[0], bytes_read );
+                    if( !_write( options, buffer, bytes_read ) ) { done = true; break; }
                     if( !std::cout.good() ) { done = true; break; }
                     if( unbuffered ) { std::cout.flush(); }
                     if( round_robin_count )

From becaf13d8e95d7765963ba4d3d9766bf8f66fd90 Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Fri, 29 Sep 2023 14:20:06 +1000
Subject: [PATCH 0660/1056] dynamic/shared_library: Expand tests to cover
 object lifetime expectations

---
 dynamic/shared_library.h                     | 14 ++++----
 dynamic/test/CMakeLists.txt                  |  6 +++-
 dynamic/test/include_test.cpp                | 37 ++++++++++++++++++--
 dynamic/test/shared_library_test_classes.cpp |  1 +
 dynamic/test/shared_library_test_classes.h   |  7 ++++
 dynamic/test/shared_library_test_detail.h    | 34 ++++++++++++++++++
 6 files changed, 90 insertions(+), 9 deletions(-)
 create mode 100644 dynamic/test/shared_library_test_classes.cpp
 create mode 100644 dynamic/test/shared_library_test_classes.h
 create mode 100644 dynamic/test/shared_library_test_detail.h

diff --git a/dynamic/shared_library.h b/dynamic/shared_library.h
index 3a0f7db25..cf890d0ec 100644
--- a/dynamic/shared_library.h
+++ b/dynamic/shared_library.h
@@ -15,7 +15,9 @@ class shared_library
     public:
         shared_library( const std::string& lib, std::vector<std::string> additional_directories={} );
 
-        ~shared_library() { dlclose(handle_); }
+        ~shared_library() { 
+            dlclose(handle_); 
+        }
 
         template < typename T, typename... Args >
         T* make( const std::string& library_symbol, Args... args ) const;
@@ -31,24 +33,24 @@ inline shared_library::shared_library( const std::string& lib, std::vector<std::
 {
     // sanitise_search_directories_
     for (auto& dir : link_directories) { if( dir.back() != '/' ) { dir += std::string("/"); } }
-
     for (const auto& dir : link_directories) {
-        handle_ = dlopen( (dir+"/"+lib).c_str(), RTLD_LAZY);
+        handle_ = dlopen( (dir+lib).c_str(), RTLD_LAZY);
         if( handle_ ) { break; }
     }
-    
     if( !handle_ ) handle_ = dlopen(&lib[0], RTLD_LAZY);
+    COMMA_ASSERT( !dlerror(), "Shared library loading failed: could not open library: \"" + lib + "\"");
     COMMA_ASSERT( handle_, "Shared library loading failed: could not open library: \"" + lib + "\"" );
 }
 
 template < typename T, typename... Args >
 inline T* shared_library::make( const std::string& library_symbol, Args... args ) const
 {
-    T* (*create_)(Args...) = reinterpret_cast<T*(*)(Args...)>(dlsym(handle_, &library_symbol[0]));
+    auto symbol = dlsym(handle_, library_symbol.c_str());
+    COMMA_ASSERT( symbol, "Shared library loading failed: could not find "+library_symbol+" symbol; on library: \"" + lib_ + "\"");
+    T* (*create_)(Args...) = reinterpret_cast<T*(*)(Args...)>(symbol);
     COMMA_ASSERT( create_, "Shared library loading failed: could not find "+library_symbol+" symbol; on library: \"" + lib_ + "\"");
 
     T* object = create_(args...);
-
     return object;
 }
 
diff --git a/dynamic/test/CMakeLists.txt b/dynamic/test/CMakeLists.txt
index 68a7da156..1353ef27e 100644
--- a/dynamic/test/CMakeLists.txt
+++ b/dynamic/test/CMakeLists.txt
@@ -1,8 +1,12 @@
 set( KIT dynamic )
 file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
 set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+
+add_library( comma_dynamic_test_classes SHARED shared_library_test_classes.cpp )
+target_compile_definitions(comma_dynamic_test_classes PRIVATE DYNAMICLIB_EXPORTS)
+
 add_executable( ${test_name} ${source} )
-target_link_libraries( ${test_name} comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread )
+target_link_libraries( ${test_name} comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread ${CMAKE_DL_LIBS} )
 add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
 if( INSTALL_TESTS )
     install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
diff --git a/dynamic/test/include_test.cpp b/dynamic/test/include_test.cpp
index a639a5d34..b72a4ed0f 100644
--- a/dynamic/test/include_test.cpp
+++ b/dynamic/test/include_test.cpp
@@ -5,13 +5,46 @@
 #include "../shared_library.h"
 #include "../../base/exception.h"
 
+#include "shared_library_test_detail.h"
+#include <dlfcn.h>
+
 namespace comma {
 
-TEST( string, join )
+TEST( initialise, no_args )
+{
+    comma::dynamic::shared_library library( "libcomma_dynamic_test_classes.so", {"/home/aspen/src/comma/build/lib"} );
+    comma::dynamic::test::point* p = library.make<comma::dynamic::test::point>( "comma_dynamic_test_create_simple" );
+}
+
+
+TEST( initialise, args )
 {
-  
+    comma::dynamic::test::point* p;
+    {
+    comma::dynamic::shared_library library( "libcomma_dynamic_test_classes.so", {"/home/aspen/src/comma/build/lib"} );
+    p = library.make<comma::dynamic::test::point, float, float, float>( "comma_dynamic_test_create_point", 1.0, 2.0, 3.0 );
+    }
+    EXPECT_EQ( p->x, 1.0 );
+    EXPECT_EQ( p->y, 2.0 );
+    EXPECT_EQ( p->z, 3.0 );
 }
 
+TEST( initialise, polymorphic )
+{
+    comma::dynamic::test::polymorphic_point* p;
+    {
+    comma::dynamic::shared_library library( "libcomma_dynamic_test_classes.so", {"/home/aspen/src/comma/build/lib"} );
+    p = library.make<comma::dynamic::test::polymorphic_point, float, float, float>( "comma_dynamic_test_create_polymorphic_point", 1.0, 2.0, 3.0 );
+    }
+
+    // This will cause a seg fault!
+    EXPECT_EQ( p->get_x(), 1.0 );
+    EXPECT_EQ( p->get_y(), 2.0 );
+    EXPECT_EQ( p->get_z(), 3.0 );
+}
+
+
+
 } // namespace comma {
 
 int main( int argc, char* argv[] )
diff --git a/dynamic/test/shared_library_test_classes.cpp b/dynamic/test/shared_library_test_classes.cpp
new file mode 100644
index 000000000..2f931c638
--- /dev/null
+++ b/dynamic/test/shared_library_test_classes.cpp
@@ -0,0 +1 @@
+#include "shared_library_test_classes.h"
diff --git a/dynamic/test/shared_library_test_classes.h b/dynamic/test/shared_library_test_classes.h
new file mode 100644
index 000000000..a91dba1fa
--- /dev/null
+++ b/dynamic/test/shared_library_test_classes.h
@@ -0,0 +1,7 @@
+#pragma once 
+#include "shared_library_test_detail.h"
+#define DYNAMICLIB_API
+
+extern "C" DYNAMICLIB_API comma::dynamic::test::simple comma_dynamic_test_create_simple(){ return comma::dynamic::test::simple(); }
+extern "C" DYNAMICLIB_API comma::dynamic::test::point comma_dynamic_test_create_point(float x, float y, float z){ return comma::dynamic::test::point(x, y, z); }
+extern "C" DYNAMICLIB_API comma::dynamic::test::polymorphic_point comma_dynamic_test_create_polymorphic_point(float x, float y, float z){ return comma::dynamic::test::polymorphic_point(x, y, z); }
diff --git a/dynamic/test/shared_library_test_detail.h b/dynamic/test/shared_library_test_detail.h
new file mode 100644
index 000000000..f8eadf39d
--- /dev/null
+++ b/dynamic/test/shared_library_test_detail.h
@@ -0,0 +1,34 @@
+#pragma once
+#include <string>
+
+namespace comma { namespace dynamic { namespace test {
+
+class simple{
+    std::string name{"hello world"};
+};
+
+class point{
+    public:
+        point() : x(0), y(0), z(0) {}
+        point(float x, float y, float z) : x(x), y(y), z(z) {}
+        float x;
+        float y;
+        float z;
+};
+
+class polymorphic_point {
+public:
+    polymorphic_point() : x(0), y(0), z(0) {}
+    polymorphic_point(float x, float y, float z) : x(x), y(y), z(z) {}
+    virtual ~polymorphic_point() {}
+    virtual float get_x() const { return x; }
+    virtual float get_y() const { return y; }
+    virtual float get_z() const { return z; }
+
+private:
+    float x;
+    float y;
+    float z;
+};
+
+} } } // namespace comma { namespace dynamic { namespace test {

From 8e2e5f88d61495ff7cc726aab58981a7a060e0cc Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Fri, 29 Sep 2023 18:23:41 +1000
Subject: [PATCH 0661/1056] dynamic/shared_library/test: adding new cases and
 trying to make less room for user error (dynamic libs are painful with a lack
 of type checking & tend to seg fault...)

---
 dynamic/shared_library.h                   |  4 +---
 dynamic/test/include_test.cpp              | 27 +++++++++++++++-------
 dynamic/test/shared_library_test_classes.h |  6 ++---
 3 files changed, 23 insertions(+), 14 deletions(-)

diff --git a/dynamic/shared_library.h b/dynamic/shared_library.h
index cf890d0ec..436ee82ad 100644
--- a/dynamic/shared_library.h
+++ b/dynamic/shared_library.h
@@ -15,9 +15,7 @@ class shared_library
     public:
         shared_library( const std::string& lib, std::vector<std::string> additional_directories={} );
 
-        ~shared_library() { 
-            dlclose(handle_); 
-        }
+        ~shared_library() { dlclose(handle_); }
 
         template < typename T, typename... Args >
         T* make( const std::string& library_symbol, Args... args ) const;
diff --git a/dynamic/test/include_test.cpp b/dynamic/test/include_test.cpp
index b72a4ed0f..dd696fcd0 100644
--- a/dynamic/test/include_test.cpp
+++ b/dynamic/test/include_test.cpp
@@ -13,17 +13,15 @@ namespace comma {
 TEST( initialise, no_args )
 {
     comma::dynamic::shared_library library( "libcomma_dynamic_test_classes.so", {"/home/aspen/src/comma/build/lib"} );
-    comma::dynamic::test::point* p = library.make<comma::dynamic::test::point>( "comma_dynamic_test_create_simple" );
+    auto p = library.make< comma::dynamic::test::simple >( "comma_dynamic_test_create_simple" );
 }
 
 
 TEST( initialise, args )
 {
     comma::dynamic::test::point* p;
-    {
     comma::dynamic::shared_library library( "libcomma_dynamic_test_classes.so", {"/home/aspen/src/comma/build/lib"} );
     p = library.make<comma::dynamic::test::point, float, float, float>( "comma_dynamic_test_create_point", 1.0, 2.0, 3.0 );
-    }
     EXPECT_EQ( p->x, 1.0 );
     EXPECT_EQ( p->y, 2.0 );
     EXPECT_EQ( p->z, 3.0 );
@@ -31,16 +29,29 @@ TEST( initialise, args )
 
 TEST( initialise, polymorphic )
 {
-    comma::dynamic::test::polymorphic_point* p;
-    {
     comma::dynamic::shared_library library( "libcomma_dynamic_test_classes.so", {"/home/aspen/src/comma/build/lib"} );
-    p = library.make<comma::dynamic::test::polymorphic_point, float, float, float>( "comma_dynamic_test_create_polymorphic_point", 1.0, 2.0, 3.0 );
-    }
+    auto p = library.make< comma::dynamic::test::polymorphic_point, float, float, float>( "comma_dynamic_test_create_polymorphic_point", 1.0, 2.0, 3.0 );
+    EXPECT_EQ( p->get_x(), 1.0 );
+    EXPECT_EQ( p->get_y(), 2.0 );
+    EXPECT_EQ( p->get_z(), 3.0 );
+}
+
 
-    // This will cause a seg fault!
+TEST( initialise, vector )
+{
+    std::vector<comma::dynamic::shared_library*> libraries;
+    libraries.emplace_back( new comma::dynamic::shared_library( "libcomma_dynamic_test_classes.so", {"/home/aspen/src/comma/build/lib"} ) );
+    auto p = libraries.back()->make< comma::dynamic::test::polymorphic_point, float, float, float>( "comma_dynamic_test_create_polymorphic_point", 1.0, 2.0, 3.0 );
     EXPECT_EQ( p->get_x(), 1.0 );
     EXPECT_EQ( p->get_y(), 2.0 );
     EXPECT_EQ( p->get_z(), 3.0 );
+
+}
+
+TEST( initialise, failure_case )
+{
+    comma::dynamic::shared_library library( "libcomma_dynamic_test_classes.so", {"/home/aspen/src/comma/build/lib"} );
+    EXPECT_THROW({library.make< comma::dynamic::test::simple >( "non_existant_symbol" ); }, comma::exception);
 }
 
 
diff --git a/dynamic/test/shared_library_test_classes.h b/dynamic/test/shared_library_test_classes.h
index a91dba1fa..dbb456dc6 100644
--- a/dynamic/test/shared_library_test_classes.h
+++ b/dynamic/test/shared_library_test_classes.h
@@ -2,6 +2,6 @@
 #include "shared_library_test_detail.h"
 #define DYNAMICLIB_API
 
-extern "C" DYNAMICLIB_API comma::dynamic::test::simple comma_dynamic_test_create_simple(){ return comma::dynamic::test::simple(); }
-extern "C" DYNAMICLIB_API comma::dynamic::test::point comma_dynamic_test_create_point(float x, float y, float z){ return comma::dynamic::test::point(x, y, z); }
-extern "C" DYNAMICLIB_API comma::dynamic::test::polymorphic_point comma_dynamic_test_create_polymorphic_point(float x, float y, float z){ return comma::dynamic::test::polymorphic_point(x, y, z); }
+extern "C" DYNAMICLIB_API comma::dynamic::test::simple* comma_dynamic_test_create_simple(){ return new comma::dynamic::test::simple(); }
+extern "C" DYNAMICLIB_API comma::dynamic::test::point* comma_dynamic_test_create_point(float x, float y, float z){ return new comma::dynamic::test::point(x, y, z); }
+extern "C" DYNAMICLIB_API comma::dynamic::test::polymorphic_point* comma_dynamic_test_create_polymorphic_point(float x, float y, float z){ return new comma::dynamic::test::polymorphic_point(x, y, z); }

From f5fcd7a270ccd01dfc2e8096a41b9cce72e81d14 Mon Sep 17 00:00:00 2001
From: aspen <aspen@aspen>
Date: Sat, 30 Sep 2023 01:20:43 +1000
Subject: [PATCH 0662/1056] dynamic/shared_library: Fixed the way that the
 dynamic library errors are handled.

---
 dynamic/shared_library.h | 17 +++++++++++------
 1 file changed, 11 insertions(+), 6 deletions(-)

diff --git a/dynamic/shared_library.h b/dynamic/shared_library.h
index 436ee82ad..5761b2ea4 100644
--- a/dynamic/shared_library.h
+++ b/dynamic/shared_library.h
@@ -29,21 +29,26 @@ class shared_library
 inline shared_library::shared_library( const std::string& lib, std::vector<std::string> link_directories )
 : lib_(lib)
 {
+    char* error;
     // sanitise_search_directories_
     for (auto& dir : link_directories) { if( dir.back() != '/' ) { dir += std::string("/"); } }
     for (const auto& dir : link_directories) {
-        handle_ = dlopen( (dir+lib).c_str(), RTLD_LAZY);
-        if( handle_ ) { break; }
+        std::string link_lib = (dir+lib).c_str();
+        handle_ = dlopen( &link_lib[0], RTLD_LAZY);
+        error = dlerror();
+        if( error == NULL ){ break; } 
     }
-    if( !handle_ ) handle_ = dlopen(&lib[0], RTLD_LAZY);
-    COMMA_ASSERT( !dlerror(), "Shared library loading failed: could not open library: \"" + lib + "\"");
-    COMMA_ASSERT( handle_, "Shared library loading failed: could not open library: \"" + lib + "\"" );
+    if( error != NULL ) handle_ = dlopen(&lib[0], RTLD_LAZY);
+    COMMA_ASSERT( error == NULL, error );
 }
 
 template < typename T, typename... Args >
 inline T* shared_library::make( const std::string& library_symbol, Args... args ) const
 {
-    auto symbol = dlsym(handle_, library_symbol.c_str());
+    char* error;
+    auto symbol = dlsym(handle_, &library_symbol[0]);
+    COMMA_ASSERT( error == NULL, error );
+    if( symbol == nullptr ) { std::cerr << dlerror() << std::endl; }
     COMMA_ASSERT( symbol, "Shared library loading failed: could not find "+library_symbol+" symbol; on library: \"" + lib_ + "\"");
     T* (*create_)(Args...) = reinterpret_cast<T*(*)(Args...)>(symbol);
     COMMA_ASSERT( create_, "Shared library loading failed: could not find "+library_symbol+" symbol; on library: \"" + lib_ + "\"");

From ce5e0b625c9f053804a8bf704af21ca036f617da Mon Sep 17 00:00:00 2001
From: aspen <aspen@aspen>
Date: Sat, 30 Sep 2023 01:21:11 +1000
Subject: [PATCH 0663/1056] dynamic/shared_library: fixed incorrect variable
 name

---
 dynamic/shared_library.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/dynamic/shared_library.h b/dynamic/shared_library.h
index 5761b2ea4..38c3246d8 100644
--- a/dynamic/shared_library.h
+++ b/dynamic/shared_library.h
@@ -13,7 +13,7 @@ namespace comma { namespace dynamic {
 class shared_library
 {
     public:
-        shared_library( const std::string& lib, std::vector<std::string> additional_directories={} );
+        shared_library( const std::string& lib, std::vector<std::string> link_directories={} );
 
         ~shared_library() { dlclose(handle_); }
 

From a125b0a05b5cb0a30d8bf40626bdc161285bbfa9 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 20 Oct 2023 18:38:08 +1100
Subject: [PATCH 0664/1056] io-cat: --head: made behaviour more consistent

---
 io/applications/io-cat.cpp | 9 +++++----
 1 file changed, 5 insertions(+), 4 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 006f9b1bf..3e9ee3543 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -347,16 +347,17 @@ int main( int argc, char** argv )
         double connect_period_seconds = options.value( "--connect-period", 1.0 );
         connect_period = boost::posix_time::milliseconds( static_cast<unsigned int>(std::floor( connect_period_seconds * 1000 ) ));
         permissive = options.exists( "--permissive" );
+        bool has_head = options.exists( "--head" );
         const std::vector< std::string >& unnamed = options.unnamed( "--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
         #ifdef WIN32
-        //if( size || unnamed.size() == 1 ) { _setmode( _fileno( stdout ), _O_BINARY ); }
-        if( size ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        if( size || ( unnamed.size() == 1 && !has_head ) ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        //if( size ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
         if( unnamed.empty() ) { std::cerr << "io-cat: please specify at least one source" << std::endl; return 1; }
         boost::ptr_vector< stream > streams;
         comma::io::select select;
-        // for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size || unnamed.size() == 1 ) ); }
-        for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 ) ); }
+        for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 || ( unnamed.size() == 1 && !has_head ) ) ); }
+        //for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 ) ); }
         const unsigned int max_count = size ? ( size > 65536u ? 1 : 65536u / size ) : 0;
         std::vector< char > buffer( size ? size * max_count : 65536u );        
         unsigned int round_robin_count = unnamed.size() > 1 ? options.value( "--round-robin", 0 ) : 0;

From 8fc720283932950067d30061714034f2c63b6180 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Oct 2023 11:38:04 +1100
Subject: [PATCH 0665/1056] csv/examples/application: placeholder created; in
 progress...

---
 csv/examples/application/CMakeLists.txt       |  6 ++++
 .../comma-csv-sample-application.cpp          | 36 +++++++++++++++++++
 2 files changed, 42 insertions(+)
 create mode 100644 csv/examples/application/CMakeLists.txt
 create mode 100644 csv/examples/application/comma-csv-sample-application.cpp

diff --git a/csv/examples/application/CMakeLists.txt b/csv/examples/application/CMakeLists.txt
new file mode 100644
index 000000000..040ae9416
--- /dev/null
+++ b/csv/examples/application/CMakeLists.txt
@@ -0,0 +1,6 @@
+project( comma-csv-sample-application )
+cmake_minimum_required(VERSION 3.20)
+set_property( CACHE CMAKE_BUILD_TYPE PROPERTY STRINGS "Debug" "Release" "RelWithDebInfo" "MinSizeRel" )
+find_package( comma REQUIRED PATHS "/usr/local/CMakeFiles" )
+add_executable( comma-csv-sample-application comma-csv-sample-application.cpp )
+target_link_libraries( comma-csv-sample-application ${comma_ALL_LIBRARIES} )
diff --git a/csv/examples/application/comma-csv-sample-application.cpp b/csv/examples/application/comma-csv-sample-application.cpp
new file mode 100644
index 000000000..103c5eaf5
--- /dev/null
+++ b/csv/examples/application/comma-csv-sample-application.cpp
@@ -0,0 +1,36 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+#include <exception>
+#include <iostream>
+#include <comma/application/command_line_options.h>
+#include <comma/csv/stream.h>
+#include <comma/visiting/traits.h>
+
+static void usage( bool verbose )
+{
+    std::cerr << std::endl;
+    std::cerr << "todo" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --input-fields" << std::endl;
+    std::cerr << "    --output-fields" << std::endl;
+    std::cerr << "    --output-format" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << std::endl;
+}
+
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        
+        return 0;
+    }
+    catch( const std::exception& e ) { std::cerr << av[0] << ": " << e.what() << std::endl; }
+    catch( ... ) { std::cerr << av[0] << ": unknown exception" << std::endl; }
+    return 1;
+}
\ No newline at end of file

From d88904d13666396b8ba1df9aa2e149f631f22382 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Oct 2023 12:39:01 +1100
Subject: [PATCH 0666/1056] csv/examples/application:
 comma-csv-sample-application-append: first cut implemented

---
 csv/examples/application/CMakeLists.txt       |  10 +-
 .../comma-csv-sample-application-append.cpp   | 121 ++++++++++++++++++
 .../comma-csv-sample-application.cpp          |  36 ------
 3 files changed, 126 insertions(+), 41 deletions(-)
 create mode 100644 csv/examples/application/comma-csv-sample-application-append.cpp
 delete mode 100644 csv/examples/application/comma-csv-sample-application.cpp

diff --git a/csv/examples/application/CMakeLists.txt b/csv/examples/application/CMakeLists.txt
index 040ae9416..f01196561 100644
--- a/csv/examples/application/CMakeLists.txt
+++ b/csv/examples/application/CMakeLists.txt
@@ -1,6 +1,6 @@
-project( comma-csv-sample-application )
-cmake_minimum_required(VERSION 3.20)
-set_property( CACHE CMAKE_BUILD_TYPE PROPERTY STRINGS "Debug" "Release" "RelWithDebInfo" "MinSizeRel" )
+project( comma-csv-sample-application-append )
+cmake_minimum_required( VERSION 3.1 )
+add_compile_options( -std=c++14 )
 find_package( comma REQUIRED PATHS "/usr/local/CMakeFiles" )
-add_executable( comma-csv-sample-application comma-csv-sample-application.cpp )
-target_link_libraries( comma-csv-sample-application ${comma_ALL_LIBRARIES} )
+add_executable( comma-csv-sample-application-append comma-csv-sample-application-append.cpp )
+target_link_libraries( comma-csv-sample-application-append ${comma_ALL_LIBRARIES} )
diff --git a/csv/examples/application/comma-csv-sample-application-append.cpp b/csv/examples/application/comma-csv-sample-application-append.cpp
new file mode 100644
index 000000000..b92b7dc6f
--- /dev/null
+++ b/csv/examples/application/comma-csv-sample-application-append.cpp
@@ -0,0 +1,121 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+#include <exception>
+#include <iostream>
+#include <comma/application/command_line_options.h>
+#include <comma/csv/stream.h>
+#include <comma/string/string.h>
+#include <comma/visiting/traits.h>
+
+static void usage( bool verbose )
+{
+    std::cerr << std::endl;
+    std::cerr << "todo" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --input-fields; print input fields to stdout and exit" << std::endl;
+    std::cerr << "    --output-fields; print output fields to stdout and exit" << std::endl;
+    std::cerr << "    --output-format; print output format to stdout and exit" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << std::endl;
+}
+
+namespace comma { namespace csv { namespace examples { namespace application {
+
+struct input
+{
+    struct nested { double d{0}; };
+    unsigned int a{0};
+    double b{0};
+    nested c;
+};
+
+struct output
+{
+    unsigned int count{0};
+    double result{0};
+};
+
+} } } } // namespace comma { namespace csv { namespace examples { namespace application {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::csv::examples::application::input::nested >
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input::nested& p, Visitor& v )
+    {
+        v.apply( "d", p.d );
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input::nested& p, Visitor& v )
+    {
+        v.apply( "d", p.d );
+    }
+};
+
+template <> struct traits< comma::csv::examples::application::input >
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input& p, Visitor& v )
+    {
+        v.apply( "a", p.a );
+        v.apply( "b", p.b );
+        v.apply( "c", p.c );
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input& p, Visitor& v )
+    {
+        v.apply( "a", p.a );
+        v.apply( "b", p.b );
+        v.apply( "c", p.c );
+    }
+};
+
+template <> struct traits< comma::csv::examples::application::output >
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::output& p, Visitor& v )
+    {
+        v.apply( "count", p.count );
+        v.apply( "result", p.result );
+    }
+};
+
+} } // namespace comma { namespace visiting {
+
+static comma::csv::examples::application::output& populate_output( const comma::csv::examples::application::input& input
+                                                                 , comma::csv::examples::application::output& output )
+{
+    ++output.count;
+    output.result = input.a + input.b * input.c.d;
+    return output;
+}
+
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        comma::csv::options csv( options );
+        typedef comma::csv::examples::application::input input_t;
+        typedef comma::csv::examples::application::output output_t;
+        if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< input_t >(), ',' ) << std::endl; return 0; }
+        if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< output_t >(), ',' ) << std::endl; return 0; }
+        if( options.exists( "--output-format" ) ) { std::cout << comma::csv::format::value< output_t >() << std::endl; return 0; }
+        comma::csv::input_stream< comma::csv::examples::application::input > is( std::cin, csv );
+        comma::csv::output_stream< comma::csv::examples::application::output > os( std::cout, csv.binary() );
+        auto tied = comma::csv::make_tied( is, os );
+        comma::csv::examples::application::output output;
+        while( is.ready() || std::cin.good() )
+        {
+            auto p = is.read();
+            if( !p ) { break; }
+            tied.append( populate_output( *p, output ) );
+        }
+        return 0;
+    }
+    catch( const std::exception& e ) { std::cerr << av[0] << ": " << e.what() << std::endl; }
+    catch( ... ) { std::cerr << av[0] << ": unknown exception" << std::endl; }
+    return 1;
+}
\ No newline at end of file
diff --git a/csv/examples/application/comma-csv-sample-application.cpp b/csv/examples/application/comma-csv-sample-application.cpp
deleted file mode 100644
index 103c5eaf5..000000000
--- a/csv/examples/application/comma-csv-sample-application.cpp
+++ /dev/null
@@ -1,36 +0,0 @@
-// Copyright (c) 2023 Vsevolod Vlaskine
-// All rights reserved.
-
-#include <exception>
-#include <iostream>
-#include <comma/application/command_line_options.h>
-#include <comma/csv/stream.h>
-#include <comma/visiting/traits.h>
-
-static void usage( bool verbose )
-{
-    std::cerr << std::endl;
-    std::cerr << "todo" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --input-fields" << std::endl;
-    std::cerr << "    --output-fields" << std::endl;
-    std::cerr << "    --output-format" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "csv options" << std::endl;
-    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
-    std::cerr << std::endl;
-}
-
-int main( int ac, char** av )
-{
-    try
-    {
-        comma::command_line_options options( ac, av, usage );
-        
-        return 0;
-    }
-    catch( const std::exception& e ) { std::cerr << av[0] << ": " << e.what() << std::endl; }
-    catch( ... ) { std::cerr << av[0] << ": unknown exception" << std::endl; }
-    return 1;
-}
\ No newline at end of file

From 3eb70474d81e9eb4184887dab31ce951cf3ac676 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Oct 2023 12:44:24 +1100
Subject: [PATCH 0667/1056] csv/examples/application:
 comma-csv-sample-application-append: examples added

---
 .../application/comma-csv-sample-application-append.cpp  | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/csv/examples/application/comma-csv-sample-application-append.cpp b/csv/examples/application/comma-csv-sample-application-append.cpp
index b92b7dc6f..c257702cc 100644
--- a/csv/examples/application/comma-csv-sample-application-append.cpp
+++ b/csv/examples/application/comma-csv-sample-application-append.cpp
@@ -21,6 +21,15 @@ static void usage( bool verbose )
     std::cerr << "csv options" << std::endl;
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
     std::cerr << std::endl;
+    std::cerr << "examples" << std::endl;
+    std::cerr << "    ascii" << std::endl;
+    std::cerr << "        ( echo 1,2,3; echo 4,5,6 ) | ./comma-csv-sample-application-append" << std::endl;
+    std::cerr << "    binary" << std::endl;
+    std::cerr << "        ( echo 1,2,3; echo 4,5,6 ) \\" << std::endl;
+    std::cerr << "            | csv-to-bin 3ui \\" << std::endl;
+    std::cerr << "            | ./comma-csv-sample-application-append --binary 3ui" << std::endl;
+    std::cerr << "            | csv-from-bin 3ui,ui,d" << std::endl;
+    std::cerr << std::endl;
 }
 
 namespace comma { namespace csv { namespace examples { namespace application {

From a1a95c03f4e946ffd6112f0089a89f41b702328a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Oct 2023 13:12:29 +1100
Subject: [PATCH 0668/1056] csv/examples/application:
 comma-csv-sample-application-emplace: first cut implemented

---
 csv/examples/application/CMakeLists.txt       |   4 +-
 .../comma-csv-sample-application-append.cpp   |   5 +-
 .../comma-csv-sample-application-emplace.cpp  | 107 ++++++++++++++++++
 3 files changed, 114 insertions(+), 2 deletions(-)
 create mode 100644 csv/examples/application/comma-csv-sample-application-emplace.cpp

diff --git a/csv/examples/application/CMakeLists.txt b/csv/examples/application/CMakeLists.txt
index f01196561..daca46063 100644
--- a/csv/examples/application/CMakeLists.txt
+++ b/csv/examples/application/CMakeLists.txt
@@ -1,6 +1,8 @@
-project( comma-csv-sample-application-append )
+project( comma-csv-sample-application )
 cmake_minimum_required( VERSION 3.1 )
 add_compile_options( -std=c++14 )
 find_package( comma REQUIRED PATHS "/usr/local/CMakeFiles" )
 add_executable( comma-csv-sample-application-append comma-csv-sample-application-append.cpp )
 target_link_libraries( comma-csv-sample-application-append ${comma_ALL_LIBRARIES} )
+add_executable( comma-csv-sample-application-emplace comma-csv-sample-application-emplace.cpp )
+target_link_libraries( comma-csv-sample-application-emplace ${comma_ALL_LIBRARIES} )
diff --git a/csv/examples/application/comma-csv-sample-application-append.cpp b/csv/examples/application/comma-csv-sample-application-append.cpp
index c257702cc..6e9537058 100644
--- a/csv/examples/application/comma-csv-sample-application-append.cpp
+++ b/csv/examples/application/comma-csv-sample-application-append.cpp
@@ -11,7 +11,10 @@
 static void usage( bool verbose )
 {
     std::cerr << std::endl;
-    std::cerr << "todo" << std::endl;
+    std::cerr << "example: read csv/binary fixed-width data on stdin, calculate some result" << std::endl;
+    std::cerr << "         append to input, output to stdout" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: cat values.csv | ./comma-csv-sample-application-append [<options>] > result.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --input-fields; print input fields to stdout and exit" << std::endl;
diff --git a/csv/examples/application/comma-csv-sample-application-emplace.cpp b/csv/examples/application/comma-csv-sample-application-emplace.cpp
new file mode 100644
index 000000000..1b8320df3
--- /dev/null
+++ b/csv/examples/application/comma-csv-sample-application-emplace.cpp
@@ -0,0 +1,107 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+#include <exception>
+#include <iostream>
+#include <comma/application/command_line_options.h>
+#include <comma/csv/stream.h>
+#include <comma/string/string.h>
+#include <comma/visiting/traits.h>
+
+static void usage( bool verbose )
+{
+    std::cerr << std::endl;
+    std::cerr << "example: read csv/binary fixed-width data on stdin, calculate some result" << std::endl;
+    std::cerr << "         update input values emplace, output to stdout" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: cat values.csv | ./comma-csv-sample-application-append [<options>] > result.csv" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --input-fields; print input fields to stdout and exit" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "examples" << std::endl;
+    std::cerr << "    ascii" << std::endl;
+    std::cerr << "        ( echo 1,2; echo 3,4 ) | ./comma-csv-sample-application-emplace" << std::endl;
+    std::cerr << "    binary" << std::endl;
+    std::cerr << "        ( echo 1,2; echo 3,4 ) \\" << std::endl;
+    std::cerr << "            | csv-to-bin 2ui \\" << std::endl;
+    std::cerr << "            | ./comma-csv-sample-application-emplace --binary 2ui \\" << std::endl;
+    std::cerr << "            | csv-from-bin 2ui" << std::endl;
+    std::cerr << std::endl;
+}
+
+namespace comma { namespace csv { namespace examples { namespace application {
+
+struct input
+{
+    struct nested { double c{0}; };
+    double a{0};
+    nested b;
+};
+
+} } } } // namespace comma { namespace csv { namespace examples { namespace application {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::csv::examples::application::input::nested >
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input::nested& p, Visitor& v )
+    {
+        v.apply( "c", p.c );
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input::nested& p, Visitor& v )
+    {
+        v.apply( "c", p.c );
+    }
+};
+
+template <> struct traits< comma::csv::examples::application::input >
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input& p, Visitor& v )
+    {
+        v.apply( "a", p.a );
+        v.apply( "b", p.b );
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input& p, Visitor& v )
+    {
+        v.apply( "a", p.a );
+        v.apply( "b", p.b );
+    }
+};
+
+} } // namespace comma { namespace visiting {
+
+static comma::csv::examples::application::input updated( const comma::csv::examples::application::input& input )
+{
+    auto r = input;
+    r.a = input.a + input.b.c;
+    return r;
+}
+
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        comma::csv::options csv( options );
+        typedef comma::csv::examples::application::input input_t;
+        if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< input_t >(), ',' ) << std::endl; return 0; }
+        comma::csv::input_stream< comma::csv::examples::application::input > is( std::cin, csv );
+        auto passed = comma::csv::make_passed( is, std::cout, csv.flush );
+        while( is.ready() || std::cin.good() )
+        {
+            auto p = is.read();
+            if( !p ) { break; }
+            passed.write( updated( *p ) );
+        }
+        return 0;
+    }
+    catch( const std::exception& e ) { std::cerr << av[0] << ": " << e.what() << std::endl; }
+    catch( ... ) { std::cerr << av[0] << ": unknown exception" << std::endl; }
+    return 1;
+}
\ No newline at end of file

From 9b6d101a18ca354eec12be2f258b6ab349fd6ecb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Oct 2023 13:27:12 +1100
Subject: [PATCH 0669/1056] csv::make_passed() implemented

---
 .../application/comma-csv-sample-application-emplace.cpp       | 2 +-
 csv/stream.h                                                   | 3 +++
 2 files changed, 4 insertions(+), 1 deletion(-)

diff --git a/csv/examples/application/comma-csv-sample-application-emplace.cpp b/csv/examples/application/comma-csv-sample-application-emplace.cpp
index 1b8320df3..63a2e7ff6 100644
--- a/csv/examples/application/comma-csv-sample-application-emplace.cpp
+++ b/csv/examples/application/comma-csv-sample-application-emplace.cpp
@@ -14,7 +14,7 @@ static void usage( bool verbose )
     std::cerr << "example: read csv/binary fixed-width data on stdin, calculate some result" << std::endl;
     std::cerr << "         update input values emplace, output to stdout" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "usage: cat values.csv | ./comma-csv-sample-application-append [<options>] > result.csv" << std::endl;
+    std::cerr << "usage: cat values.csv | ./comma-csv-sample-application-emplace [<options>] > result.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --input-fields; print input fields to stdout and exit" << std::endl;
diff --git a/csv/stream.h b/csv/stream.h
index d88776cc5..b1e92116a 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -436,6 +436,9 @@ class passed
         bool is_stdout_;
 };
 
+template < typename S >
+inline passed< S > make_passed( const input_stream< S >& is, std::ostream& os, bool flush = false ) { return passed< S >( is, os, flush ); }
+ 
 template < typename S >
 inline passed< S >::passed( const input_stream< S >& is, std::ostream& os, bool flush ) : is_( is ), os_( os ), flush( flush )
 {

From 732a2ad4e83231d7c27c5531790d6f13c37cd607 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Oct 2023 13:39:17 +1100
Subject: [PATCH 0670/1056] csv/examples/application:
 comma-csv-sample-application-append: --no-append implemented

---
 .../application/comma-csv-sample-application-append.cpp      | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/csv/examples/application/comma-csv-sample-application-append.cpp b/csv/examples/application/comma-csv-sample-application-append.cpp
index 6e9537058..5b72a30fb 100644
--- a/csv/examples/application/comma-csv-sample-application-append.cpp
+++ b/csv/examples/application/comma-csv-sample-application-append.cpp
@@ -20,6 +20,7 @@ static void usage( bool verbose )
     std::cerr << "    --input-fields; print input fields to stdout and exit" << std::endl;
     std::cerr << "    --output-fields; print output fields to stdout and exit" << std::endl;
     std::cerr << "    --output-format; print output format to stdout and exit" << std::endl;
+    std::cerr << "    --no-append; do not output stdin records to stdout, output only result" << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options" << std::endl;
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
@@ -118,12 +119,14 @@ int main( int ac, char** av )
         comma::csv::input_stream< comma::csv::examples::application::input > is( std::cin, csv );
         comma::csv::output_stream< comma::csv::examples::application::output > os( std::cout, csv.binary() );
         auto tied = comma::csv::make_tied( is, os );
+        bool append = !options.exists( "--no-append" );
         comma::csv::examples::application::output output;
         while( is.ready() || std::cin.good() )
         {
             auto p = is.read();
             if( !p ) { break; }
-            tied.append( populate_output( *p, output ) );
+            if( append ) { tied.append( populate_output( *p, output ) ); }
+            else { os.write( populate_output( *p, output ) ); }
         }
         return 0;
     }

From a52da5561e105ec2a0373d2dd70d66ded73b3877 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Oct 2023 17:23:05 +1100
Subject: [PATCH 0671/1056] csv/examples: application renamed to applications

---
 csv/examples/{application => applications}/CMakeLists.txt         | 0
 .../comma-csv-sample-application-append.cpp                       | 0
 .../comma-csv-sample-application-emplace.cpp                      | 0
 3 files changed, 0 insertions(+), 0 deletions(-)
 rename csv/examples/{application => applications}/CMakeLists.txt (100%)
 rename csv/examples/{application => applications}/comma-csv-sample-application-append.cpp (100%)
 rename csv/examples/{application => applications}/comma-csv-sample-application-emplace.cpp (100%)

diff --git a/csv/examples/application/CMakeLists.txt b/csv/examples/applications/CMakeLists.txt
similarity index 100%
rename from csv/examples/application/CMakeLists.txt
rename to csv/examples/applications/CMakeLists.txt
diff --git a/csv/examples/application/comma-csv-sample-application-append.cpp b/csv/examples/applications/comma-csv-sample-application-append.cpp
similarity index 100%
rename from csv/examples/application/comma-csv-sample-application-append.cpp
rename to csv/examples/applications/comma-csv-sample-application-append.cpp
diff --git a/csv/examples/application/comma-csv-sample-application-emplace.cpp b/csv/examples/applications/comma-csv-sample-application-emplace.cpp
similarity index 100%
rename from csv/examples/application/comma-csv-sample-application-emplace.cpp
rename to csv/examples/applications/comma-csv-sample-application-emplace.cpp

From 60d342a740909dd23731a53879c810d7f4d43ab5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 31 Oct 2023 10:31:43 +1100
Subject: [PATCH 0672/1056] csv/examples/applications:
 comma-csv-sample-application-append: made more meaningful

---
 csv/examples/applications/CMakeLists.txt      |  1 +
 .../comma-csv-sample-application-append.cpp   | 55 ++++++++++---------
 2 files changed, 30 insertions(+), 26 deletions(-)

diff --git a/csv/examples/applications/CMakeLists.txt b/csv/examples/applications/CMakeLists.txt
index daca46063..1445ca4c6 100644
--- a/csv/examples/applications/CMakeLists.txt
+++ b/csv/examples/applications/CMakeLists.txt
@@ -1,6 +1,7 @@
 project( comma-csv-sample-application )
 cmake_minimum_required( VERSION 3.1 )
 add_compile_options( -std=c++14 )
+find_package( Boost REQUIRED COMPONENTS thread filesystem system date_time iostreams program_options regex )
 find_package( comma REQUIRED PATHS "/usr/local/CMakeFiles" )
 add_executable( comma-csv-sample-application-append comma-csv-sample-application-append.cpp )
 target_link_libraries( comma-csv-sample-application-append ${comma_ALL_LIBRARIES} )
diff --git a/csv/examples/applications/comma-csv-sample-application-append.cpp b/csv/examples/applications/comma-csv-sample-application-append.cpp
index 5b72a30fb..5693b57e5 100644
--- a/csv/examples/applications/comma-csv-sample-application-append.cpp
+++ b/csv/examples/applications/comma-csv-sample-application-append.cpp
@@ -1,6 +1,7 @@
 // Copyright (c) 2023 Vsevolod Vlaskine
 // All rights reserved.
 
+#include <cmath>
 #include <exception>
 #include <iostream>
 #include <comma/application/command_line_options.h>
@@ -11,7 +12,8 @@
 static void usage( bool verbose )
 {
     std::cerr << std::endl;
-    std::cerr << "example: read csv/binary fixed-width data on stdin, calculate some result" << std::endl;
+    std::cerr << "example: read csv/binary fixed-width data on stdin (angle and factor)" << std::endl;
+    std::cerr << "         count input records, calculate sin and cos of angle, and sign of factor" << std::endl;
     std::cerr << "         append to input, output to stdout" << std::endl;
     std::cerr << std::endl;
     std::cerr << "usage: cat values.csv | ./comma-csv-sample-application-append [<options>] > result.csv" << std::endl;
@@ -27,7 +29,7 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    ascii" << std::endl;
-    std::cerr << "        ( echo 1,2,3; echo 4,5,6 ) | ./comma-csv-sample-application-append" << std::endl;
+    std::cerr << "        ( echo 45,20; echo 30,-10 ) | ./comma-csv-sample-application-append" << std::endl;
     std::cerr << "    binary" << std::endl;
     std::cerr << "        ( echo 1,2,3; echo 4,5,6 ) \\" << std::endl;
     std::cerr << "            | csv-to-bin 3ui \\" << std::endl;
@@ -40,49 +42,47 @@ namespace comma { namespace csv { namespace examples { namespace application {
 
 struct input
 {
-    struct nested { double d{0}; };
-    unsigned int a{0};
-    double b{0};
-    nested c;
+    double angle{0};
+    double factor{0};
 };
 
 struct output
 {
+    struct trigonometric_t
+    {
+        double sin;
+        double cos;
+    };
     unsigned int count{0};
-    double result{0};
+    trigonometric_t trigonometric;
+    double factor_sign{0};
 };
 
 } } } } // namespace comma { namespace csv { namespace examples { namespace application {
 
 namespace comma { namespace visiting {
 
-template <> struct traits< comma::csv::examples::application::input::nested >
+template <> struct traits< comma::csv::examples::application::input >
 {
-    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input::nested& p, Visitor& v )
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input& p, Visitor& v )
     {
-        v.apply( "d", p.d );
+        v.apply( "angle", p.angle );
+        v.apply( "factor", p.factor );
     }
 
-    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input::nested& p, Visitor& v )
+    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input& p, Visitor& v )
     {
-        v.apply( "d", p.d );
+        v.apply( "angle", p.angle );
+        v.apply( "factor", p.factor );
     }
 };
 
-template <> struct traits< comma::csv::examples::application::input >
+template <> struct traits< comma::csv::examples::application::output::trigonometric_t >
 {
-    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input& p, Visitor& v )
-    {
-        v.apply( "a", p.a );
-        v.apply( "b", p.b );
-        v.apply( "c", p.c );
-    }
-
-    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input& p, Visitor& v )
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::output::trigonometric_t& p, Visitor& v )
     {
-        v.apply( "a", p.a );
-        v.apply( "b", p.b );
-        v.apply( "c", p.c );
+        v.apply( "sin", p.sin );
+        v.apply( "cos", p.cos );
     }
 };
 
@@ -91,7 +91,8 @@ template <> struct traits< comma::csv::examples::application::output >
     template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::output& p, Visitor& v )
     {
         v.apply( "count", p.count );
-        v.apply( "result", p.result );
+        v.apply( "trigonometric", p.trigonometric );
+        v.apply( "factor_sign", p.factor_sign );
     }
 };
 
@@ -101,7 +102,9 @@ static comma::csv::examples::application::output& populate_output( const comma::
                                                                  , comma::csv::examples::application::output& output )
 {
     ++output.count;
-    output.result = input.a + input.b * input.c.d;
+    output.trigonometric.sin = std::sin( input.angle * M_PI / 180 );
+    output.trigonometric.cos = std::cos( input.angle * M_PI / 180 );
+    output.factor_sign = input.factor > 0 ? 1 : input.factor < 0 ? -1 : 0;
     return output;
 }
 

From 2c0decad25ed181db39b1094e93b69740362196b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 31 Oct 2023 10:38:52 +1100
Subject: [PATCH 0673/1056] csv/examples/applications:
 comma-csv-sample-application-append: example fixed

---
 .../comma-csv-sample-application-append.cpp        | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/csv/examples/applications/comma-csv-sample-application-append.cpp b/csv/examples/applications/comma-csv-sample-application-append.cpp
index 5693b57e5..f56e7f75e 100644
--- a/csv/examples/applications/comma-csv-sample-application-append.cpp
+++ b/csv/examples/applications/comma-csv-sample-application-append.cpp
@@ -31,10 +31,10 @@ static void usage( bool verbose )
     std::cerr << "    ascii" << std::endl;
     std::cerr << "        ( echo 45,20; echo 30,-10 ) | ./comma-csv-sample-application-append" << std::endl;
     std::cerr << "    binary" << std::endl;
-    std::cerr << "        ( echo 1,2,3; echo 4,5,6 ) \\" << std::endl;
-    std::cerr << "            | csv-to-bin 3ui \\" << std::endl;
-    std::cerr << "            | ./comma-csv-sample-application-append --binary 3ui" << std::endl;
-    std::cerr << "            | csv-from-bin 3ui,ui,d" << std::endl;
+    std::cerr << "        ( echo 45,20; echo 30,-10 ) \\" << std::endl;
+    std::cerr << "            | csv-to-bin 2d \\" << std::endl;
+    std::cerr << "            | ./comma-csv-sample-application-append --binary 2d \\" << std::endl;
+    std::cerr << "            | csv-from-bin 2d,ui,3d" << std::endl;
     std::cerr << std::endl;
 }
 
@@ -119,11 +119,11 @@ int main( int ac, char** av )
         if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< input_t >(), ',' ) << std::endl; return 0; }
         if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< output_t >(), ',' ) << std::endl; return 0; }
         if( options.exists( "--output-format" ) ) { std::cout << comma::csv::format::value< output_t >() << std::endl; return 0; }
-        comma::csv::input_stream< comma::csv::examples::application::input > is( std::cin, csv );
-        comma::csv::output_stream< comma::csv::examples::application::output > os( std::cout, csv.binary() );
+        comma::csv::input_stream< input_t > is( std::cin, csv );
+        comma::csv::output_stream< output_t > os( std::cout, csv.binary() );
         auto tied = comma::csv::make_tied( is, os );
         bool append = !options.exists( "--no-append" );
-        comma::csv::examples::application::output output;
+        output_t output;
         while( is.ready() || std::cin.good() )
         {
             auto p = is.read();

From b6f85b6376da5e172787292a342f8d009914fac3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 8 Nov 2023 15:14:39 +1100
Subject: [PATCH 0674/1056] csv-join: --discard-id: ascii support implemented;
 binary: in progress...

---
 csv/applications/csv-join.cpp | 59 +++++++++++++++++------------------
 1 file changed, 29 insertions(+), 30 deletions(-)

diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index 302e5300b..def07a6fb 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -1,31 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -107,8 +81,12 @@ static void usage( bool more )
         std::cerr << "        block. If no block field is given the entire input is considered to be" << std::endl;
         std::cerr << "        one block. Blocks are required to be contiguous in the input stream." << std::endl;
     }
+    else
+    {
+        std::cerr << "    run csv-join --help --verbose for more..." << std::endl;
+    }
     std::cerr << std::endl;
-    std::cerr << "Examples (try them):" << std::endl;
+    std::cerr << "examples (try them)" << std::endl;
     std::cerr << "    on the following data file:" << std::endl;
     std::cerr << "        echo 1,1,2,hello > data.csv" << std::endl;
     std::cerr << "        echo 1,2,3,hello >> data.csv" << std::endl;
@@ -136,7 +114,6 @@ static void usage( bool more )
     std::cerr << "        <input:3>" << std::endl;
     std::cerr << "        <input:3>" << std::endl;
     std::cerr << std::endl;
-    std::cerr << std::endl;
     exit( 0 );
 }
 
@@ -149,8 +126,10 @@ static bool not_matching;
 static bool matching;
 static bool flag_matching;
 static bool swap_output;
+static bool filter_id_fields_discard;
 static comma::csv::options stdin_csv;
 static comma::csv::options filter_csv;
+static std::vector< unsigned int > filter_id_fields_flags; // quick and dirty
 boost::scoped_ptr< comma::io::istream > filter_transport;
 static comma::uint32 block = 0;
 static boost::optional< double > radius;
@@ -305,6 +284,20 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
     static typename traits< K, Strict >::map filter_map;
     static input< K > default_input;
 
+    static std::string make_output_string( const std::vector< std::string >& values ) // todo? something like comma::join( values, drop )?
+    {
+        if( filter_id_fields_flags.empty() ) { return comma::join( values, stdin_csv.delimiter ); }
+        std::string s;
+        std::string delimiter;
+        unsigned int i = 0;
+        for( ; i < std::min( filter_id_fields_flags.size(), values.size() ); ++i )
+        {
+            if( filter_id_fields_flags[i] == 0 ) { s += delimiter + values[i]; delimiter = std::string( 1, stdin_csv.delimiter ); }
+        }
+        for( ; i < values.size(); ++i ) { s += delimiter + values[i]; delimiter = std::string( 1, stdin_csv.delimiter ); }
+        return s;
+    }
+
     static void read_filter_block()
     {
         static comma::csv::input_stream< input< K > > filter_stream( **filter_transport, filter_csv, default_input );
@@ -326,7 +319,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
             }
             else
             {
-                d.push_back( comma::join( filter_stream.ascii().last(), stdin_csv.delimiter ) );
+                d.push_back( make_output_string( filter_stream.ascii().last() ) );
             }
             if( verbose ) { ++count; if( count % 10000 == 0 ) { std::cerr << "csv-join: reading block " << block << "; loaded " << count << " point" << ( count == 1 ? "" : "s" ) << "; hash map size: " << filter_map.size() << std::endl; } }
             //if( ( *filter_transport )->good() && !( *filter_transport )->eof() ) { break; }
@@ -340,6 +333,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
     {
         std::vector< std::string > v = comma::split( stdin_csv.fields, ',' );
         std::vector< std::string > w = comma::split( filter_csv.fields, ',' );
+        if( filter_id_fields_discard ) { filter_id_fields_flags.resize( w.size(), 0 ); }
         bool got_state = false;
         bool got_next_state = false;
         std::size_t filter_state_index;
@@ -348,6 +342,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
             if( w[k] == "state" ) { got_state = true; filter_state_index = k; continue; }
             if( w[k] == "next_state" ) { got_next_state = true; continue; }
         }
+        if( ( got_state || got_next_state ) && filter_id_fields_discard ) { std::cerr << "csv-join: --discard-id and 'state' or 'next_state' are mutually exclusive" << std::endl; return 1; } // reject early: --discard-id is not supported together with 'state'/'next_state' filter fields
         bool is_state_machine = got_state && got_next_state;
         std::size_t default_input_keys_count = 0;
         bool no_stdin_key_fields = true;
@@ -360,9 +355,11 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
             {
                 if( is_state_machine && ( w[k] == "state" || w[k] == "next_state" ) ) { no_filter_key_fields = false; continue; }
                 if( !w[k].empty() && w[k] != "block" ) { no_filter_key_fields = false; }
+                if( filter_id_fields_discard && w[k] == "block" ) { filter_id_fields_flags[k] = 1; }
                 if( v[i] != w[k] ) { continue; }
                 v[i] = "keys[" + boost::lexical_cast< std::string >( default_input_keys_count ) + "]";
                 w[k] = "keys[" + boost::lexical_cast< std::string >( default_input_keys_count ) + "]";
+                if( filter_id_fields_discard ) { filter_id_fields_flags[k] = 1; }
                 ++default_input_keys_count;
             }
         }
@@ -500,12 +497,14 @@ int main( int ac, char** av )
         radius = options.optional< double >( "--radius,--epsilon" );
         nearest = options.exists( "--nearest" );
         swap_output = options.exists( "--output-swap,--swap-output,--swap" );
+        filter_id_fields_discard = options.exists( "--discard-id-fields,--discard-id" );
         if( nearest && !radius ) { std::cerr << "csv-join: if using --nearest, please specify --radius" << std::endl; return 1; }
         options.assert_mutually_exclusive( "--matching,--not-matching,--flag-matching,--swap-output,--swap,--output-swap" );
         options.assert_mutually_exclusive( "--radius,--epsilon,--first-matching" );
         options.assert_mutually_exclusive( "--radius,--epsilon,--string,-s,--double,--time" );
+        options.assert_mutually_exclusive( "--matching,--not-matching", "--discard-id-fields,--discard-id" );
         stdin_csv = comma::csv::options( options );
-        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap,--output-swap,--nearest", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap,--output-swap,--nearest,--discard-id-fields,--discard-id", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-join: please specify the second source" << std::endl; return 1; }
         if( unnamed.size() > 1 ) { std::cerr << "csv-join: expected one file or stream to join, got " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
         comma::name_value::parser parser( "filename", ';', '=', false );

From c2a28338d7631c6c3ef317797394e1ce9d6c767f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 8 Nov 2023 15:23:30 +1100
Subject: [PATCH 0675/1056] csv-join: --discard-id: ascii support implemented;
 binary: in progress...

---
 csv/applications/csv-join.cpp | 25 ++++++++++++++++++-------
 1 file changed, 18 insertions(+), 7 deletions(-)

diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index def07a6fb..6c9948d25 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -137,7 +137,7 @@ static boost::optional< double > radius;
 static void hash_combine_( std::size_t& seed, boost::posix_time::ptime key )
 {
     static_assert( sizeof( boost::posix_time::ptime ) == 8, "expected time of size 8" );
-    boost::hash_combine( seed, *reinterpret_cast< const long long* >( &key ) );
+    boost::hash_combine( seed, *reinterpret_cast< const comma::uint64* >( &key ) );
 }
 
 template < typename K > static void hash_combine_( std::size_t& seed, K key ) { boost::hash_combine( seed, key ); }
@@ -284,7 +284,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
     static typename traits< K, Strict >::map filter_map;
     static input< K > default_input;
 
-    static std::string make_output_string( const std::vector< std::string >& values ) // todo? something like comma::join( values, drop )?
+    static std::string make_output( const std::vector< std::string >& values ) // todo? something like comma::join( values, drop )?
     {
         if( filter_id_fields_flags.empty() ) { return comma::join( values, stdin_csv.delimiter ); }
         std::string s;
@@ -298,6 +298,17 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         return s;
     }
 
+    static std::string make_output( const char* values ) // quick and dirty for now
+    {
+        if( filter_id_fields_flags.empty() )
+        {
+            std::string s( filter_csv.format().size() );
+            ::memcpy( &s[0], values, filter_csv.format().size() );
+            return s;
+        }
+        COMMA_THROW( comma::exception, "--drop-id: binary support: todo" );
+    }
+
     static void read_filter_block()
     {
         static comma::csv::input_stream< input< K > > filter_stream( **filter_transport, filter_csv, default_input );
@@ -319,7 +330,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
             }
             else
             {
-                d.push_back( make_output_string( filter_stream.ascii().last() ) );
+                d.push_back( make_output( filter_stream.ascii().last() ) );
             }
             if( verbose ) { ++count; if( count % 10000 == 0 ) { std::cerr << "csv-join: reading block " << block << "; loaded " << count << " point" << ( count == 1 ? "" : "s" ) << "; hash map size: " << filter_map.size() << std::endl; } }
             //if( ( *filter_transport )->good() && !( *filter_transport )->eof() ) { break; }
@@ -342,7 +353,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
             if( w[k] == "state" ) { got_state = true; filter_state_index = k; continue; }
             if( w[k] == "next_state" ) { got_next_state = true; continue; }
         }
-        if( ( got_state || got_next_state ) && filter_id_fields_discard ) { std::cerr << "csv-join: --discard-id and 'state' or 'next_field' are mutually exclusive" << std::endl; return 1; }
+        if( ( got_state || got_next_state ) && filter_id_fields_discard ) { std::cerr << "csv-join: --drop-id and 'state' or 'next_field' are mutually exclusive" << std::endl; return 1; }
         bool is_state_machine = got_state && got_next_state;
         std::size_t default_input_keys_count = 0;
         bool no_stdin_key_fields = true;
@@ -497,14 +508,14 @@ int main( int ac, char** av )
         radius = options.optional< double >( "--radius,--epsilon" );
         nearest = options.exists( "--nearest" );
         swap_output = options.exists( "--output-swap,--swap-output,--swap" );
-        filter_id_fields_discard = options.exists( "--discard-id-fields,--discard-id" );
+        filter_id_fields_discard = options.exists( "--drop-id-fields,--drop-id" );
         if( nearest && !radius ) { std::cerr << "csv-join: if using --nearest, please specify --radius" << std::endl; return 1; }
         options.assert_mutually_exclusive( "--matching,--not-matching,--flag-matching,--swap-output,--swap,--output-swap" );
         options.assert_mutually_exclusive( "--radius,--epsilon,--first-matching" );
         options.assert_mutually_exclusive( "--radius,--epsilon,--string,-s,--double,--time" );
-        options.assert_mutually_exclusive( "--matching,--not-matching", "--discard-id-fields,--discard-id" );
+        options.assert_mutually_exclusive( "--matching,--not-matching", "--drop-id-fields,--drop-id" );
         stdin_csv = comma::csv::options( options );
-        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap,--output-swap,--nearest,--discard-id-fields,--discard-id", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap,--output-swap,--nearest,--drop-id-fields,--drop-id", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-join: please specify the second source" << std::endl; return 1; }
         if( unnamed.size() > 1 ) { std::cerr << "csv-join: expected one file or stream to join, got " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
         comma::name_value::parser parser( "filename", ';', '=', false );

From 475e3dcd1818c8d59cffb68b889902f2299ad2df Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 8 Nov 2023 16:44:01 +1100
Subject: [PATCH 0676/1056] csv-join: --drop-id: first cut implemented; unit
 test: todo...

---
 csv/applications/csv-bin-cut.cpp | 59 ++++++++----------------------
 csv/applications/csv-join.cpp    | 62 +++++++++++++++++++++-----------
 2 files changed, 56 insertions(+), 65 deletions(-)

diff --git a/csv/applications/csv-bin-cut.cpp b/csv/applications/csv-bin-cut.cpp
index b95315d14..3fbc2c9b1 100644
--- a/csv/applications/csv-bin-cut.cpp
+++ b/csv/applications/csv-bin-cut.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author dmitry mikhin
 
@@ -289,7 +262,8 @@ namespace {
         // - check for read errors / end of input
         // - write the buffer to stdout
         std::streampos record_start = 0;
-        if ( skip_ ) {
+        if ( skip_ )
+        {
             ifs.seekg( 0, std::ios_base::end );
             std::streampos fsize = ifs.tellg();
             unsigned int nrecords = fsize / irecord_size_;
@@ -307,7 +281,8 @@ namespace {
                 std::streamoff off = fields_[i].input_offset - ( i == 0 ? 0 : fields_[i - 1].input_offset + fields_[i - 1].size );
                 ifs.seekg( off, std::ios_base::cur );
                 ifs.read( &obuf_[ fields_[i].offset ], fields_[i].size );
-                if ( ifs.eof() ) {
+                if ( ifs.eof() )
+                {
                     if ( i == 0 ) { break; }
                     std::cerr << "csv-bin-cut: encountered eof mid-record in '" << fname << "'" << std::endl; exit( 1 );
                 }
@@ -332,12 +307,16 @@ namespace {
     int seeker::process( const std::vector< std::string > & files )
     {
         if ( files.empty() ) { return read_all( std::cin ); }
-        for ( std::vector< std::string >::const_iterator ifile = files.begin(); ifile < files.end(); ++ifile ) {
-            if ( count_max_ >= 0 && count_ >= count_max_ ) { return 0; }
-            if ( *ifile == "-" ) {
+        for ( std::vector< std::string >::const_iterator ifile = files.begin(); ifile < files.end(); ++ifile )
+        {
+            if( count_max_ >= 0 && count_ >= count_max_ ) { return 0; }
+            if( *ifile == "-" )
+            {
                 int rv = read_all( std::cin );
                 if ( rv != 0 ) { return rv; }
-            } else {
+            }
+            else
+            {
                 std::ifstream ifs( &( *ifile )[0], std::ifstream::binary );
                 if ( !ifs.is_open() ) { std::cerr << "csv-bin-cut: cannot open '" << *ifile << "' for reading" << std::endl; exit( 1 ); }
                 int rv = ( force_read_ ? read_all( ifs ) : read_fields( ifs, *ifile ) );
@@ -365,26 +344,16 @@ int main( int ac, char** av )
         {
             if( files.size() == 1 && files[0] != "-" ) // deprecated, left for backward compatibility
             {
-                try
-                {
-                    csv.format( comma::csv::format( files[0] ) );
-                    files.clear();
-                }
-                catch ( comma::exception & )
-                {
-                    // it's not a format string
-                }
+                try { csv.format( comma::csv::format( files[0] ) ); files.clear(); }
+                catch ( comma::exception & ) {} // it's not a format string
             }
         }
         if( !csv.binary() ) { std::cerr << "csv-bin-cut: please specify --binary" << std::endl; exit( 1 ); }
-
         const std::vector< field >& fields = setup_fields( options, csv );
-
         unsigned int skip = options.value< unsigned int >( "--skip", 0 );
         long int count_max = options.value< long int >( "--count", -1 );
         bool flush = options.exists( "--flush" );
         bool force_read = options.exists( "--read-all,--force-read" );
-
         seeker seek( fields, csv, skip, count_max, flush, force_read );
         return seek.process( files );
     }
diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index 6c9948d25..ae615b280 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -41,6 +41,7 @@ static void usage( bool more )
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
+    std::cerr << "    --drop-id-fields,--drop-id; remove id and block fields from filter output (same as if you did csv-join|csv-shuffle)" << std::endl;
     std::cerr << "    --first-matching: output only the first matching record (a bit of hack for now, but we needed it)" << std::endl;
     std::cerr << "    --flag-matching: output all records, with 1 appended to matching records and 0 appended to not-matching records" << std::endl;
     std::cerr << "    --matching: output only matching records from stdin" << std::endl;
@@ -114,6 +115,12 @@ static void usage( bool more )
     std::cerr << "        <input:3>" << std::endl;
     std::cerr << "        <input:3>" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "    --drop-id (same would work in binary as well)" << std::endl;
+    std::cerr << "        > echo 0,1,2,3 | csv-join --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y'" << std::endl;
+    std::cerr << "        0,1,2,3,1,A,B,3" << std::endl;
+    std::cerr << "        > echo 0,1,2,3 | csv-join --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y' --drop-id" << std::endl;
+    std::cerr << "        0,1,2,3,A,B" << std::endl;
+    std::cerr << std::endl;
     exit( 0 );
 }
 
@@ -126,10 +133,12 @@ static bool not_matching;
 static bool matching;
 static bool flag_matching;
 static bool swap_output;
-static bool filter_id_fields_discard;
 static comma::csv::options stdin_csv;
 static comma::csv::options filter_csv;
-static std::vector< unsigned int > filter_id_fields_flags; // quick and dirty
+static bool filter_id_fields_discard; // todo: super-quick and dirty, put in a separate class
+static std::vector< unsigned int > filter_id_fields_flags; // todo: super-quick and dirty, put in a separate class
+static std::vector< std::pair< unsigned int, unsigned int > > filter_id_fields_offsets; // todo: super-quick and dirty, put in a separate class
+static unsigned int filter_id_fields_size{0}; // todo: super-quick and dirty, put in a separate class
 boost::scoped_ptr< comma::io::istream > filter_transport;
 static comma::uint32 block = 0;
 static boost::optional< double > radius;
@@ -284,7 +293,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
     static typename traits< K, Strict >::map filter_map;
     static input< K > default_input;
 
-    static std::string make_output( const std::vector< std::string >& values ) // todo? something like comma::join( values, drop )?
+    static std::string make_output( const std::vector< std::string >& values ) // todo? implement something like comma::join( values, drop )?
     {
         if( filter_id_fields_flags.empty() ) { return comma::join( values, stdin_csv.delimiter ); }
         std::string s;
@@ -298,15 +307,27 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         return s;
     }
 
-    static std::string make_output( const char* values ) // quick and dirty for now
+    static std::string make_output( const char* values ) // todo? quick and dirty for now; use csv::binary? or implement something like csv::format::drop_fields...?
     {
+        std::string s( filter_csv.format().size() - filter_id_fields_size, '\0' );
         if( filter_id_fields_flags.empty() )
         {
-            std::string s( filter_csv.format().size() );
             ::memcpy( &s[0], values, filter_csv.format().size() );
-            return s;
         }
-        COMMA_THROW( comma::exception, "--drop-id: binary support: todo" );
+        else
+        {
+            char* p = &s[0];
+            unsigned int t = 0;
+            for( const auto& e: filter_id_fields_offsets ) // todo: quick and dirty, watch performance
+            {
+                unsigned int c = e.first - t;
+                std::memcpy( p, values + t, c );
+                p += c;
+                t = e.first + e.second;
+            }
+            std::memcpy( p, values + t, filter_csv.format().size() - t ); // todo: quick and dirty, watch performance
+        }
+        return s;
     }
 
     static void read_filter_block()
@@ -320,18 +341,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         static comma::signal_flag is_shutdown( comma::signal_flag::hard );
         while( last->block == block && !is_shutdown )
         {
-            typename traits< K, Strict >::map::mapped_type& d = filter_map[ *last ];
-            if( filter_stream.is_binary() )
-            {
-                typename traits< K, Strict >::map::mapped_type& d = filter_map[ *last ];
-                d.push_back( std::string() );
-                d.back().resize( filter_csv.format().size() );
-                ::memcpy( &d.back()[0], filter_stream.binary().last(), filter_csv.format().size() );
-            }
-            else
-            {
-                d.push_back( make_output( filter_stream.ascii().last() ) );
-            }
+            filter_map[ *last ].push_back( filter_stream.is_binary() ? make_output( filter_stream.binary().last() ) : make_output( filter_stream.ascii().last() ) );
             if( verbose ) { ++count; if( count % 10000 == 0 ) { std::cerr << "csv-join: reading block " << block << "; loaded " << count << " point" << ( count == 1 ? "" : "s" ) << "; hash map size: " << filter_map.size() << std::endl; } }
             //if( ( *filter_transport )->good() && !( *filter_transport )->eof() ) { break; }
             last = filter_stream.read();
@@ -374,6 +384,18 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
                 ++default_input_keys_count;
             }
         }
+        if( filter_csv.binary() ) // todo: super-quick and dirty; move all the --drop-id stuff to a class
+        {
+            for( unsigned int i = 0; i < filter_id_fields_flags.size(); ++i )
+            {
+                if( filter_id_fields_flags[i] )
+                { 
+                    const auto& e = filter_csv.format().offset( i );
+                    filter_id_fields_offsets.push_back( { e.offset, e.size } );
+                    filter_id_fields_size += e.size;
+                }
+            }
+        }
         bool do_full_join = no_stdin_key_fields && no_filter_key_fields;
         if( default_input_keys_count == 0 && !do_full_join ) { std::cerr << "csv-join: please specify at least one common key; fields: " << stdin_csv.fields << "; filter fields: " << filter_csv.fields << std::endl; return 1; }
         //if( default_input_keys_count == 0 ) { std::cerr << "csv-join: please specify at least one common key; fields: " << stdin_csv.fields << "; filter fields: " << filter_csv.fields << std::endl; return 1; }
@@ -459,7 +481,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
                         if( is_state_machine ) { state = it->first.next_state; }
                         if( flag_matching ) { char match = 1; std::cout.write( &match, 1 ); break; }
                         if( matching ) { break; }
-                        std::cout.write( &( it->second[i][0] ), filter_csv.format().size() );
+                        std::cout.write( &( it->second[i][0] ), it->second[i].size() );
                         if( swap_output ) { std::cout.write( stdin_stream.binary().last(), stdin_csv.format().size() ); }
                         std::cout.flush();
                     }

From e1681b61d4863e208d7c683b35f5d2e188d432ed Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 9 Nov 2023 12:35:34 +1100
Subject: [PATCH 0677/1056] csv/test/csv-join/drop-id: basic ascii tests added

---
 csv/test/csv-join/drop-id/expected | 9 +++++++++
 csv/test/csv-join/drop-id/input    | 8 ++++++++
 2 files changed, 17 insertions(+)
 create mode 100644 csv/test/csv-join/drop-id/expected
 create mode 100644 csv/test/csv-join/drop-id/input

diff --git a/csv/test/csv-join/drop-id/expected b/csv/test/csv-join/drop-id/expected
new file mode 100644
index 000000000..d0b50fdbb
--- /dev/null
+++ b/csv/test/csv-join/drop-id/expected
@@ -0,0 +1,9 @@
+drop_id/ascii[0]/output="0,1,2,3,A,B,C"
+drop_id/ascii[1]/output="0,1,2,3,A,B,C"
+drop_id/ascii[2]/output="0,1,2,3,A,B,C"
+drop_id/ascii[3]/output="0,1,2,3,A,B,C"
+drop_id/ascii[4]/output="0,1,2,3,A,B"
+drop_id/ascii[5]/output="0,1,2,3,A,B"
+drop_id/ascii[6]/output/line[0]="a,1,b,3,A,B"
+drop_id/ascii[6]/output/line[1]="c,1,d,3,A,B"
+
diff --git a/csv/test/csv-join/drop-id/input b/csv/test/csv-join/drop-id/input
new file mode 100644
index 000000000..790aedd69
--- /dev/null
+++ b/csv/test/csv-join/drop-id/input
@@ -0,0 +1,8 @@
+drop_id/ascii[0]="echo 0,1,2,3 | csv-join --drop-id --fields ,x <( echo 1,A,B,C )';fields=x'"
+drop_id/ascii[1]="echo 0,1,2,3 | csv-join --drop-id --fields ,x <( echo 1,A,B,C )';fields=x,,,'"
+drop_id/ascii[2]="echo 0,1,2,3 | csv-join --drop-id --fields ,x <( echo A,1,B,C )';fields=,x'"
+drop_id/ascii[3]="echo 0,1,2,3 | csv-join --drop-id --fields ,,,x <( echo A,B,C,3 )';fields=,,,x'"
+
+drop_id/ascii[4]="echo 0,1,2,3 | csv-join --drop-id --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y'"
+drop_id/ascii[5]="echo 0,1,2,3 | csv-join --drop-id --fields ,x,,y <( echo 3,A,B,1 )';fields=y,,,x'"
+drop_id/ascii[6]="( echo a,1,b,3; echo c,1,d,3 ) | csv-join --drop-id --fields ,x,,y <( echo 3,A,B,1 )';fields=y,,,x'"

From 44e168a6d38550792c5d61045b11c58498a631be Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 9 Nov 2023 12:42:39 +1100
Subject: [PATCH 0678/1056] csv/test/csv-join/drop-id: basic binary tests added

---
 csv/test/csv-join/drop-id/expected | 7 +++++++
 csv/test/csv-join/drop-id/input    | 8 +++++++-
 2 files changed, 14 insertions(+), 1 deletion(-)

diff --git a/csv/test/csv-join/drop-id/expected b/csv/test/csv-join/drop-id/expected
index d0b50fdbb..5a8109c1a 100644
--- a/csv/test/csv-join/drop-id/expected
+++ b/csv/test/csv-join/drop-id/expected
@@ -7,3 +7,10 @@ drop_id/ascii[5]/output="0,1,2,3,A,B"
 drop_id/ascii[6]/output/line[0]="a,1,b,3,A,B"
 drop_id/ascii[6]/output/line[1]="c,1,d,3,A,B"
 
+drop_id/binary[0]/output="0,1,2,3,111,222,333"
+drop_id/binary[1]/output="0,1,2,3,111,222"
+drop_id/binary[2]/output="0,1,2,3,111,222"
+drop_id/binary[3]/output="0,1,2,3,111,222"
+drop_id/binary[4]/output="0,1,2,3,111,222"
+drop_id/binary[5]/output/line[0]="111,1,222,3,111,222"
+drop_id/binary[5]/output/line[1]="333,1,444,3,111,222"
diff --git a/csv/test/csv-join/drop-id/input b/csv/test/csv-join/drop-id/input
index 790aedd69..864b7d21c 100644
--- a/csv/test/csv-join/drop-id/input
+++ b/csv/test/csv-join/drop-id/input
@@ -2,7 +2,13 @@ drop_id/ascii[0]="echo 0,1,2,3 | csv-join --drop-id --fields ,x <( echo 1,A,B,C
 drop_id/ascii[1]="echo 0,1,2,3 | csv-join --drop-id --fields ,x <( echo 1,A,B,C )';fields=x,,,'"
 drop_id/ascii[2]="echo 0,1,2,3 | csv-join --drop-id --fields ,x <( echo A,1,B,C )';fields=,x'"
 drop_id/ascii[3]="echo 0,1,2,3 | csv-join --drop-id --fields ,,,x <( echo A,B,C,3 )';fields=,,,x'"
-
 drop_id/ascii[4]="echo 0,1,2,3 | csv-join --drop-id --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y'"
 drop_id/ascii[5]="echo 0,1,2,3 | csv-join --drop-id --fields ,x,,y <( echo 3,A,B,1 )';fields=y,,,x'"
 drop_id/ascii[6]="( echo a,1,b,3; echo c,1,d,3 ) | csv-join --drop-id --fields ,x,,y <( echo 3,A,B,1 )';fields=y,,,x'"
+
+drop_id/binary[0]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x --binary=4ui <( echo 1,111,222,333 | csv-to-bin ui,d,ui,d )';fields=x;binary=ui,d,ui,d' | csv-from-bin 4ui,d,ui,d"
+drop_id/binary[1]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 1,111,222,3 | csv-to-bin ui,d,ui,ul )';fields=x,,,y;binary=ui,d,ui,ul' | csv-from-bin 4ui,d,ui"
+drop_id/binary[2]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 1,111,3,222 | csv-to-bin ui,d,ui,ul )';fields=x,,y,;binary=ui,d,ui,ul' | csv-from-bin 4ui,d,ul"
+drop_id/binary[3]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 3,111,1,222 | csv-to-bin ui,d,ui,ul )';fields=y,,x,;binary=ui,d,ui,ul' | csv-from-bin 4ui,d,ul"
+drop_id/binary[4]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 111,3,1,222 | csv-to-bin ui,d,ui,ul )';fields=,y,x,;binary=ui,d,ui,ul' | csv-from-bin 4ui,ui,ul"
+drop_id/binary[5]="( echo 111,1,222,3; echo 333,1,444,3 ) | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 111,3,1,222 | csv-to-bin ui,d,ui,ul )';fields=,y,x,;binary=ui,d,ui,ul' | csv-from-bin 4ui,ui,ul"

From f8d7a3dd1638e567083110c464d2afb5ee16b5f0 Mon Sep 17 00:00:00 2001
From: aspen <aspen@aspen>
Date: Wed, 15 Nov 2023 17:55:58 +1100
Subject: [PATCH 0679/1056] csv-random example added

---
 csv/applications/csv-random.cpp | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 0344550f7..68c492caa 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -117,6 +117,14 @@ static void usage( bool verbose )
     std::cerr << '\n';
     std::cerr << "\ncsv options:";
     std::cerr << comma::csv::options::usage( "", verbose ) << std::endl;
+    std::cerr << "\nexamples";
+    std::cerr << "\n    generate three floating point random samples from gaussian distribution";
+    std::cerr << "\n        csv-random make --distribution gaussian 0,10 --type 3f";
+    std::cerr << "\n        csv-random make --distribution gaussian 0,10 --type 3f \\";
+    std::cerr << "\n            | csv-paste line-number - \\";
+    std::cerr << "\n            | csv-blocks group --fields scalar --span 1000 \\";
+    std::cerr << "\n            | csv-shuffle --fields=id,x,y,z,block --output-fields=id,block,x,y,z";
+    std::cerr << "\n\n";
     exit( 0 );
 }
 

From aa84d893163d3df737339040098567bfd4258350 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 16 Nov 2023 12:54:46 +1100
Subject: [PATCH 0680/1056] comma-test-run: --max-parallel: -P alias removed
 since it did not work anyway (decided to not debug for now); --parallel: -p
 alias added

---
 util/applications/comma-test-run | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 7504a61ed..708099572 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -75,14 +75,14 @@ function description_resources()
     cat <<EOF
 --estimate-resources; in serial mode, accumulates performance data using comma-top into 'output/performance.csv' files;
   note: file may be empty for very short tests
---max-parallel,-P=[<N>]; run up to N tests in parallel; default: $max_parallel
+--max-parallel=[<N>]; run up to N tests in parallel; default: $max_parallel
 --max-memory-main=[<N>]; limit on main memory, in MB; default: $max_memory_main
 --max-memory-shared=[<N>]; limit on shared memory, in MB; default: $max_memory_shared
 --max-wait-time=[<time>]; maximal time to wait for available CPUs before failing a test, default: ${max_wait_time}
 --max-run-time=[<time>]; maximal time to wait for a test completion before failing it by force, default: ${max_run_time}
 --max-resources=[<file>]; specify limits for all resources in path-value format; see config files in verbose help;
   explicit options above have precedence
---parallel; run tests in parallel; default: run serially
+--parallel,-p; run tests in parallel; default: run serially
 EOF
 }
 

From b5d34822dc14aaf7dfd5dfda5c240c196323b471 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 17 Nov 2023 14:56:16 +1100
Subject: [PATCH 0681/1056] io::istream, ostream, iostream::usage() implemented

---
 io/stream.cpp | 50 ++++++++++++++++++++++----------------------------
 io/stream.h   |  5 ++++-
 2 files changed, 26 insertions(+), 29 deletions(-)

diff --git a/io/stream.cpp b/io/stream.cpp
index 74d63aae9..78ec7042e 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// All rights reserved
 
 /// @author vsevolod vlaskine
 
@@ -43,6 +16,7 @@
 
 #include <fcntl.h>
 #include <fstream>
+#include <sstream>
 #include <vector>
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/ip/udp.hpp>
@@ -387,6 +361,26 @@ stream< S >::stream( const std::string& name, mode::value m, mode::blocking_valu
     }
 }
 
+namespace impl {
+
+static std::string usage( const std::string& what, const std::string& dash, unsigned int indent )
+{
+    std::string i( ' ', indent );
+    std::ostringstream oss;
+    oss << i << "<" << what << ">" << std::endl;
+    oss << i << "    '-': " << dash << std::endl;
+    oss << i << "    <path>: path to the input file or named pipe" << std::endl;
+    oss << i << "    local:<path>: local linux socket" << std::endl;
+    oss << i << "    tcp:<address>:<port>: tcp socket (not really required, but comes for free)" << std::endl;
+    return oss.str();
+}
+
+} // namespace impl {
+
+std::string istream::usage( unsigned int indent ) { return impl::usage( "input", "stdin", indent ); }
+std::string ostream::usage( unsigned int indent ) { return impl::usage( "output", "stdout", indent ); }
+std::string iostream::usage( unsigned int indent ) { return impl::usage( "input/output", "n/a", indent ); }
+
 template class stream< std::istream >;
 template class stream< std::ostream >;
 template class stream< std::iostream >;
diff --git a/io/stream.h b/io/stream.h
index 3e6b59b07..9c028fd01 100644
--- a/io/stream.h
+++ b/io/stream.h
@@ -1,5 +1,5 @@
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
+// All rights reserved
 
 /// @author vsevolod vlaskine
 
@@ -93,6 +93,7 @@ struct istream : public stream< std::istream >
     istream( const std::string& name, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
     istream( std::istream* s, io::file_descriptor fd, mode::value mode, boost::function< void() > close );
     istream( std::istream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close );
+    static std::string usage( unsigned int indent = 0 );
 };
 
 /// output stream owner
@@ -101,12 +102,14 @@ struct ostream : public stream< std::ostream >
     ostream( const std::string& name, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
     ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, boost::function< void() > close );
     ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close );
+    static std::string usage( unsigned int indent = 0 );
 };
 
 /// input/output stream owner
 struct iostream : public stream< std::iostream >
 {
     iostream( const std::string& name, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
+    static std::string usage( unsigned int indent = 0 );
 };
 
 } } // namespace comma { namespace io {

From b2158f6b4155c9fa826e2a56090f255ca4dce85e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 17 Nov 2023 15:03:25 +1100
Subject: [PATCH 0682/1056] io::istream, ostream, iostream::usage(): bug fixed,
 works now

---
 io/stream.cpp | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/io/stream.cpp b/io/stream.cpp
index 78ec7042e..d94b213d9 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -365,13 +365,13 @@ namespace impl {
 
 static std::string usage( const std::string& what, const std::string& dash, unsigned int indent )
 {
-    std::string i( ' ', indent );
+    std::string i( indent, ' ' );
     std::ostringstream oss;
     oss << i << "<" << what << ">" << std::endl;
-    oss << i << "    '-': " << dash << std::endl;
-    oss << i << "    <path>: path to the input file or named pipe" << std::endl;
-    oss << i << "    local:<path>: local linux socket" << std::endl;
-    oss << i << "    tcp:<address>:<port>: tcp socket (not really required, but comes for free)" << std::endl;
+    oss << i << "    '-'                  : " << dash << std::endl;
+    oss << i << "    <path>               : path to input file or named pipe" << std::endl;
+    oss << i << "    local:<path>         : local linux socket" << std::endl;
+    oss << i << "    tcp:<address>:<port> : tcp socket" << std::endl;
     return oss.str();
 }
 

From 4f92a21af5375582e159443f88e68ee9b25d6834 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 23 Nov 2023 14:57:05 +1100
Subject: [PATCH 0683/1056] math::exponential_moving_average: first cut
 implemented

---
 math/exponential_moving_average.h | 57 +++++++++++++++++++++++++++++++
 math/interval.h                   | 27 ---------------
 2 files changed, 57 insertions(+), 27 deletions(-)
 create mode 100644 math/exponential_moving_average.h

diff --git a/math/exponential_moving_average.h b/math/exponential_moving_average.h
new file mode 100644
index 000000000..5423d25d5
--- /dev/null
+++ b/math/exponential_moving_average.h
@@ -0,0 +1,57 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include "../base/exception.h"
+#include "../base/none.h"
+#include "../base/types.h"
+
+namespace comma { namespace math {
+
+template < typename T >
+class exponential_moving_average
+{
+    public:
+        typedef T value_type;
+
+        exponential_moving_average( double alpha = 0.5, comma::uint64 initial_count = 1 );
+
+        template < typename S >
+        exponential_moving_average& operator+=( const S& lhs );
+
+        const T& operator()() const { if( _count > 0 ) { return _value; } COMMA_THROW( comma::exception, "no values provided yet" ); }
+
+        comma::uint64 count() const { return _count; }
+
+    private:
+        double _alpha{0.5};
+        comma::uint64 _initial_count{1};
+        comma::uint64 _count{0};
+        T _value;
+};
+
+
+template < typename T >
+inline exponential_moving_average< T >::exponential_moving_average( double alpha, comma::uint64 initial_count )
+    : _alpha( alpha )
+    , _initial_count( initial_count )
+{
+}
+
+// todo! better casting, otherwise it does not work well on integral-like values (e.g. integers or boost::posix_time::time_duration)
+template < typename T >
+template < typename S >
+inline exponential_moving_average< T >& exponential_moving_average< T >::operator+=( const S& t )
+{
+    if( _count == 0 ) { _value = T( t ); }
+    else if( _count < _initial_count ) { _value = ( _value * _count + T( t ) ) * 1. / ( _count + 1 ); }
+    else { _value = _value * ( 1. - _alpha ) + T( t ) * _alpha; }
+    ++_count;
+    return *this;
+}
+
+
+} } // namespace comma { namespace math {
diff --git a/math/interval.h b/math/interval.h
index 23f491601..5fbec8d23 100644
--- a/math/interval.h
+++ b/math/interval.h
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 

From 49ef375a48d854b61982cc2f107a5b6fa14efabc Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 23 Nov 2023 15:55:24 +1100
Subject: [PATCH 0684/1056] timing::stats: first cut implemented

---
 CMakeLists.txt                    | 35 +++++++++++----------
 math/exponential_moving_average.h |  2 --
 timing/CMakeLists.txt             |  9 ++++++
 timing/stats.h                    | 52 +++++++++++++++++++++++++++++++
 visiting/CMakeLists.txt           |  1 -
 5 files changed, 79 insertions(+), 20 deletions(-)
 create mode 100644 timing/CMakeLists.txt
 create mode 100644 timing/stats.h

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 0532f2b19..df647e220 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -188,7 +188,7 @@ include_directories( ${GTEST_INCLUDE_DIRS} )
     # todo: maybe else clause is actually the right way to do things
 #    IF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
 #        FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/googletest/googletest DOC "source code of gtest" ) # FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/gtest DOC "source code of gtest" )
-#        ADD_SUBDIRECTORY( ${GTest_SOURCE_DIR} gtest )
+#        add_subdirectory( ${GTest_SOURCE_DIR} gtest )
 #        INCLUDE_DIRECTORIES( src ${GTest_SOURCE_DIR}/include ${GTest_SOURCE_DIR} )
 #        SET( GTEST_BOTH_LIBRARIES gtest gtest_main )
 #    ELSE( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
@@ -298,22 +298,23 @@ install( FILES ${comma_PACKAGE_CMAKEFILES} DESTINATION ${comma_INSTALL_PACKAGE_D
 #-----------------------------------------------------------------------------
 # add sources
 
-ADD_SUBDIRECTORY( application )
-ADD_SUBDIRECTORY( base )
-ADD_SUBDIRECTORY( bash )
-ADD_SUBDIRECTORY( containers )
-ADD_SUBDIRECTORY( csv )
-ADD_SUBDIRECTORY( dispatch )
-ADD_SUBDIRECTORY( doc )
-ADD_SUBDIRECTORY( dynamic ) 
-ADD_SUBDIRECTORY( io )
-ADD_SUBDIRECTORY( math )
-ADD_SUBDIRECTORY( name_value )
-ADD_SUBDIRECTORY( packed )
-ADD_SUBDIRECTORY( string )
-ADD_SUBDIRECTORY( sync )
-ADD_SUBDIRECTORY( util )
-ADD_SUBDIRECTORY( visiting )
+add_subdirectory( application )
+add_subdirectory( base )
+add_subdirectory( bash )
+add_subdirectory( containers )
+add_subdirectory( csv )
+add_subdirectory( dispatch )
+add_subdirectory( doc )
+add_subdirectory( dynamic ) 
+add_subdirectory( io )
+add_subdirectory( math )
+add_subdirectory( name_value )
+add_subdirectory( packed )
+add_subdirectory( string )
+add_subdirectory( sync )
+add_subdirectory( timing )
+add_subdirectory( util )
+add_subdirectory( visiting )
 add_subdirectory( web )
 if( comma_BUILD_XML )
     add_subdirectory( xml )
diff --git a/math/exponential_moving_average.h b/math/exponential_moving_average.h
index 5423d25d5..c38792a54 100644
--- a/math/exponential_moving_average.h
+++ b/math/exponential_moving_average.h
@@ -33,7 +33,6 @@ class exponential_moving_average
         T _value;
 };
 
-
 template < typename T >
 inline exponential_moving_average< T >::exponential_moving_average( double alpha, comma::uint64 initial_count )
     : _alpha( alpha )
@@ -53,5 +52,4 @@ inline exponential_moving_average< T >& exponential_moving_average< T >::operato
     return *this;
 }
 
-
 } } // namespace comma { namespace math {
diff --git a/timing/CMakeLists.txt b/timing/CMakeLists.txt
new file mode 100644
index 000000000..3fe24051e
--- /dev/null
+++ b/timing/CMakeLists.txt
@@ -0,0 +1,9 @@
+SET( PROJECT "timing" )
+SET( TARGET_NAME comma_${PROJECT} )
+
+FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
+FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
+SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
+ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} )
+
+INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
diff --git a/timing/stats.h b/timing/stats.h
new file mode 100644
index 000000000..84d186e0c
--- /dev/null
+++ b/timing/stats.h
@@ -0,0 +1,52 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <chrono>
+#include "../math/exponential_moving_average.h"
+
+namespace comma { namespace timing {
+
+class stats
+{
+    public:
+        stats( double ema_alpha = 0.5, comma::uint64 ema_initial_count = 1 ): _ema( ema_alpha, ema_initial_count ) {}
+
+        stats& operator++() { return operator+=( std::chrono::system_clock::now() ); }
+
+        stats& operator+=( const std::chrono::time_point< std::chrono::system_clock >& t );
+
+        comma::uint64 count() const { return _ema.count(); }
+
+        double rate() const { return 1. / _ema(); }
+
+        double ema() const { return _ema(); }
+
+        double min() const { return _min; }
+
+        double max() const { return _max; }
+
+    private:
+        std::chrono::time_point< std::chrono::system_clock > _t;
+        math::exponential_moving_average< double > _ema;
+        double _min{0};
+        double _max{0};
+};
+
+inline stats& stats::operator+=( const std::chrono::time_point< std::chrono::system_clock >& t ) // todo: move to cpp file
+{
+    if( _t.time_since_epoch() > std::chrono::seconds( 0 ) )
+    {
+        double d = double( std::chrono::duration_cast< std::chrono::microseconds >( t - _t ).count() ) / 1000000;
+        if( _ema.count() == 0 ) { _min = _max = d; }
+        else { if( d < _min ) { _min = d; } else if( d > _max ) { _max = d; } }
+        _ema += double( std::chrono::duration_cast< std::chrono::microseconds >( t - _t ).count() ) / 1000000; // quick and dirty for now
+    }
+    _t = t;
+    return *this;
+}
+
+} } // namespace comma { namespace timing {
diff --git a/visiting/CMakeLists.txt b/visiting/CMakeLists.txt
index bb08d565b..32339a5ba 100644
--- a/visiting/CMakeLists.txt
+++ b/visiting/CMakeLists.txt
@@ -7,7 +7,6 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
-INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/Visitors )
                                            
 IF( comma_BUILD_TESTS )
     ADD_SUBDIRECTORY( test )

From 0c3b7390f105dd4bc663aac5fbf312f6d66fcab2 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 23 Nov 2023 16:29:51 +1100
Subject: [PATCH 0685/1056] timing::stats::print(): first cut implemented

---
 timing/stats.h | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/timing/stats.h b/timing/stats.h
index 84d186e0c..e53bb074a 100644
--- a/timing/stats.h
+++ b/timing/stats.h
@@ -6,6 +6,8 @@
 #pragma once
 
 #include <chrono>
+#include <iostream>
+#include <string>
 #include "../math/exponential_moving_average.h"
 
 namespace comma { namespace timing {
@@ -29,6 +31,8 @@ class stats
 
         double max() const { return _max; }
 
+        void print( unsigned int count = 1, std::ostream& os = std::cerr, const std::string& prefix = "" );
+
     private:
         std::chrono::time_point< std::chrono::system_clock > _t;
         math::exponential_moving_average< double > _ema;
@@ -49,4 +53,9 @@ inline stats& stats::operator+=( const std::chrono::time_point< std::chrono::sys
     return *this;
 }
 
+inline void stats::print( unsigned int c, std::ostream& os, const std::string& prefix )
+{
+    if( count() > 0 && count() % c == 0 ) { os << ( prefix.empty() ? std::string() : ( prefix + ": " ) ) << "rate: " << rate() << "Hz" << " intervals: min: " << _min << " max: " << _max << " mean: " << _ema() << " count: " << _ema.count() << std::endl; }
+}
+
 } } // namespace comma { namespace timing {

From 1f82313521834c6f71046a24ca564f40cf909fdc Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 23 Nov 2023 20:46:41 +1100
Subject: [PATCH 0686/1056] timing::stats::output(...): brushed up, output as
 name-value pairs; todo: output start time, frigging hate chrono!

---
 timing/stats.h | 47 +++++++++++++++++++++++++++++++++++++++--------
 1 file changed, 39 insertions(+), 8 deletions(-)

diff --git a/timing/stats.h b/timing/stats.h
index e53bb074a..8f3dd1dee 100644
--- a/timing/stats.h
+++ b/timing/stats.h
@@ -15,11 +15,15 @@ namespace comma { namespace timing {
 class stats
 {
     public:
-        stats( double ema_alpha = 0.5, comma::uint64 ema_initial_count = 1 ): _ema( ema_alpha, ema_initial_count ) {}
+        typedef std::chrono::time_point< std::chrono::system_clock > time_type;
+
+        typedef decltype( time_type() - time_type() ) duration_type;
+
+        stats( double ema_alpha = 0.5, comma::uint64 ema_initial_count = 1 ): _ema( ema_alpha, ema_initial_count ), _previous( std::chrono::system_clock::now() ) {}
 
         stats& operator++() { return operator+=( std::chrono::system_clock::now() ); }
 
-        stats& operator+=( const std::chrono::time_point< std::chrono::system_clock >& t );
+        stats& operator+=( const time_type& t );
 
         comma::uint64 count() const { return _ema.count(); }
 
@@ -31,18 +35,30 @@ class stats
 
         double max() const { return _max; }
 
-        void print( unsigned int count = 1, std::ostream& os = std::cerr, const std::string& prefix = "" );
+        void output( std::ostream& os = std::cerr, const std::string& prefix = "" );
+    
+        void output( unsigned int count = 1, std::ostream& os = std::cerr, const std::string& prefix = "" );
+
+        void output_every( const stats::duration_type& d, std::ostream& os = std::cerr, const std::string& prefix = "" );
+
+        double elapsed() const { return double( std::chrono::duration_cast< std::chrono::microseconds >( _t - _start ).count() ) / 1000000; }
 
     private:
-        std::chrono::time_point< std::chrono::system_clock > _t;
+        time_type _start;
+        time_type _t;
+        time_type _previous;
         math::exponential_moving_average< double > _ema;
         double _min{0};
         double _max{0};
 };
 
-inline stats& stats::operator+=( const std::chrono::time_point< std::chrono::system_clock >& t ) // todo: move to cpp file
+inline stats& stats::operator+=( const stats::time_type& t ) // todo: move to cpp file
 {
-    if( _t.time_since_epoch() > std::chrono::seconds( 0 ) )
+    if( _t.time_since_epoch() == std::chrono::seconds( 0 ) )
+    {
+        _start = t;
+    }
+    else
     {
         double d = double( std::chrono::duration_cast< std::chrono::microseconds >( t - _t ).count() ) / 1000000;
         if( _ema.count() == 0 ) { _min = _max = d; }
@@ -53,9 +69,24 @@ inline stats& stats::operator+=( const std::chrono::time_point< std::chrono::sys
     return *this;
 }
 
-inline void stats::print( unsigned int c, std::ostream& os, const std::string& prefix )
+inline void stats::output( std::ostream& os, const std::string& prefix )
 {
-    if( count() > 0 && count() % c == 0 ) { os << ( prefix.empty() ? std::string() : ( prefix + ": " ) ) << "rate: " << rate() << "Hz" << " intervals: min: " << _min << " max: " << _max << " mean: " << _ema() << " count: " << _ema.count() << std::endl; }
+    // freaking hate chrono! os << prefix << "start=" << _start << ";elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
+    os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
 }
 
+inline void stats::output( unsigned int c, std::ostream& os, const std::string& prefix )
+{
+    if( count() > 0 && count() % c == 0 ) { output( os, prefix ); }
+}
+
+inline void stats::output_every( const stats::duration_type& d, std::ostream& os, const std::string& prefix )
+{
+    auto now = std::chrono::system_clock::now();
+    if( ( now - _previous ) < d ) { return; }
+    output( os, prefix );
+    _previous = now;
+}
+
+
 } } // namespace comma { namespace timing {

From c5ee2e283f9101489b1d1a8f128071dcf8cc6155 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 24 Nov 2023 10:54:45 +1100
Subject: [PATCH 0687/1056] timing::stats::touch() implemented

---
 timing/stats.h | 16 ++++++++++------
 1 file changed, 10 insertions(+), 6 deletions(-)

diff --git a/timing/stats.h b/timing/stats.h
index 8f3dd1dee..97d7a3986 100644
--- a/timing/stats.h
+++ b/timing/stats.h
@@ -19,11 +19,15 @@ class stats
 
         typedef decltype( time_type() - time_type() ) duration_type;
 
-        stats( double ema_alpha = 0.5, comma::uint64 ema_initial_count = 1 ): _ema( ema_alpha, ema_initial_count ), _previous( std::chrono::system_clock::now() ) {}
+        stats( double ema_alpha = 0.5, comma::uint64 ema_initial_count = 1 ): _ema( ema_alpha, ema_initial_count ), _previous_output_time( std::chrono::system_clock::now() ) {}
+
+        stats& operator+=( const time_type& t );
 
         stats& operator++() { return operator+=( std::chrono::system_clock::now() ); }
 
-        stats& operator+=( const time_type& t );
+        stats& touch( const time_type& t ) { _t = t; return *this; }
+
+        stats& touch() { return touch( std::chrono::system_clock::now() ); }
 
         comma::uint64 count() const { return _ema.count(); }
 
@@ -46,7 +50,7 @@ class stats
     private:
         time_type _start;
         time_type _t;
-        time_type _previous;
+        time_type _previous_output_time;
         math::exponential_moving_average< double > _ema;
         double _min{0};
         double _max{0};
@@ -54,7 +58,7 @@ class stats
 
 inline stats& stats::operator+=( const stats::time_type& t ) // todo: move to cpp file
 {
-    if( _t.time_since_epoch() == std::chrono::seconds( 0 ) )
+    if( _start.time_since_epoch() == std::chrono::seconds( 0 ) )
     {
         _start = t;
     }
@@ -83,9 +87,9 @@ inline void stats::output( unsigned int c, std::ostream& os, const std::string&
 inline void stats::output_every( const stats::duration_type& d, std::ostream& os, const std::string& prefix )
 {
     auto now = std::chrono::system_clock::now();
-    if( ( now - _previous ) < d ) { return; }
+    if( ( now - _previous_output_time ) < d ) { return; }
     output( os, prefix );
-    _previous = now;
+    _previous_output_time = now;
 }
 
 
From 38ecea23cbad37420771e58b93f8c4dc8c09fb5a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 24 Nov 2023 12:00:07 +1100
Subject: [PATCH 0688/1056] timing::stats::output(): made more robust

---
 timing/stats.h | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/timing/stats.h b/timing/stats.h
index 97d7a3986..5b22a53cc 100644
--- a/timing/stats.h
+++ b/timing/stats.h
@@ -76,7 +76,8 @@ inline stats& stats::operator+=( const stats::time_type& t ) // todo: move to cp
 inline void stats::output( std::ostream& os, const std::string& prefix )
 {
     // freaking hate chrono! os << prefix << "start=" << _start << ";elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
-    os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
+    if( _ema.count() == 0 ) { os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=nan;intervals/min=nan;intervals/max=nan;intervals/mean=nan" << std::endl; }
+    else { os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl; }
 }
 
 inline void stats::output( unsigned int c, std::ostream& os, const std::string& prefix )

From 4805654a8ec8049e90a4c586333372abb6a35898 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 1 Dec 2023 18:57:49 +1100
Subject: [PATCH 0689/1056] timing: turned into a library; traits and csv
 output implemented

---
 CMakeLists.txt        |  4 ++-
 timing/CMakeLists.txt | 15 +++++++--
 timing/stats.cpp      | 72 +++++++++++++++++++++++++++++++++++++++++++
 timing/stats.h        | 54 +++++---------------------------
 timing/traits.h       | 24 +++++++++++++++
 5 files changed, 120 insertions(+), 49 deletions(-)
 create mode 100644 timing/stats.cpp
 create mode 100644 timing/traits.h

diff --git a/CMakeLists.txt b/CMakeLists.txt
index df647e220..06d2e2c66 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -254,7 +254,9 @@ SET( comma_ALL_LIBRARIES
         debug comma_xpath-d
         optimized comma_xpath
         debug comma_name_value-d
-        optimized comma_name_value )
+        optimized comma_name_value
+        debug comma_timing-d
+        optimized comma_timing )
 
 if(WIN32)
     set( comma_ALL_EXTERNAL_LIBRARIES Ws2_32.lib )
diff --git a/timing/CMakeLists.txt b/timing/CMakeLists.txt
index 3fe24051e..3029a3fc4 100644
--- a/timing/CMakeLists.txt
+++ b/timing/CMakeLists.txt
@@ -1,9 +1,20 @@
 SET( PROJECT "timing" )
 SET( TARGET_NAME comma_${PROJECT} )
 
+SET( PROJECT "timing" )
+SET( TARGET_NAME comma_${PROJECT} )
+
 FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
-SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
-ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} )
+SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
+ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
+target_link_libraries( ${TARGET_NAME} comma_csv comma_name_value comma_string )
+SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+INSTALL(
+    TARGETS ${TARGET_NAME}
+    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
+    LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
+    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
+)
diff --git a/timing/stats.cpp b/timing/stats.cpp
new file mode 100644
index 000000000..66174c1dc
--- /dev/null
+++ b/timing/stats.cpp
@@ -0,0 +1,72 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#include "../csv/ascii.h" // quick and dirty
+#include "../name_value/ptree.h"
+#include "../timing/stats.h"
+#include "../timing/traits.h"
+
+namespace comma { namespace timing {
+
+stats& stats::operator+=( const stats::time_type& t ) // todo: move to cpp file
+{
+    if( _start.time_since_epoch() == std::chrono::seconds( 0 ) )
+    {
+        _start = t;
+    }
+    else
+    {
+        double d = double( std::chrono::duration_cast< std::chrono::microseconds >( t - _t ).count() ) / 1000000;
+        if( _ema.count() == 0 ) { _min = _max = d; }
+        else { if( d < _min ) { _min = d; } else if( d > _max ) { _max = d; } }
+        _ema += double( std::chrono::duration_cast< std::chrono::microseconds >( t - _t ).count() ) / 1000000; // quick and dirty for now
+    }
+    _t = t;
+    return *this;
+}
+
+double stats::elapsed() const
+{ 
+    return double( std::chrono::duration_cast< std::chrono::microseconds >( _t - _start ).count() ) / 1000000;
+}
+
+void stats::output( std::ostream& os, const std::string& prefix, bool csv ) // todo: template on prefix
+{
+    // freaking hate chrono! os << prefix << "start=" << _start << ";elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
+    auto p = os.precision();
+    os.setf( std::ios::fixed, std::ios::floatfield );
+    os << std::setprecision( 6 ) << prefix;
+    std::cerr << std::setprecision( 6 );
+    if( csv )
+    {
+        static comma::csv::ascii< stats > ascii;
+        os << ascii.put( *this ) << std::endl;
+    }
+    else
+    {
+        boost::property_tree::ptree t;
+        to_ptree to( t );
+        visiting::apply( to, *this );
+        comma::property_tree::to_path_value( os, t, comma::property_tree::disabled, '=', ';', xpath(), true );
+        os << std::endl;
+        //os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
+    }
+    os << std::setprecision( p ); // todo! not excetion-safe
+}
+
+void stats::output( unsigned int c, std::ostream& os, const std::string& prefix, bool csv )
+{
+    if( count() > 0 && count() % c == 0 ) { output( os, prefix, csv ); }
+}
+
+void stats::output_every( const stats::duration_type& d, std::ostream& os, const std::string& prefix, bool csv )
+{
+    auto now = std::chrono::system_clock::now();
+    if( ( now - _previous_output_time ) < d ) { return; }
+    output( os, prefix, csv );
+    _previous_output_time = now;
+}
+
+} } // namespace comma { namespace timing {
diff --git a/timing/stats.h b/timing/stats.h
index 5b22a53cc..4b0865815 100644
--- a/timing/stats.h
+++ b/timing/stats.h
@@ -31,67 +31,29 @@ class stats
 
         comma::uint64 count() const { return _ema.count(); }
 
-        double rate() const { return 1. / _ema(); }
+        double rate() const { return _ema.count() > 0 ? 1. / _ema() : 0; }
 
-        double ema() const { return _ema(); }
+        double ema() const { return _ema.count() > 0 ? _ema() : 0; }
 
         double min() const { return _min; }
 
         double max() const { return _max; }
 
-        void output( std::ostream& os = std::cerr, const std::string& prefix = "" );
-    
-        void output( unsigned int count = 1, std::ostream& os = std::cerr, const std::string& prefix = "" );
+        double elapsed() const;
 
-        void output_every( const stats::duration_type& d, std::ostream& os = std::cerr, const std::string& prefix = "" );
+        void output( std::ostream& os = std::cerr, const std::string& prefix = "", bool csv = false );
+    
+        void output( unsigned int count = 1, std::ostream& os = std::cerr, const std::string& prefix = "", bool csv = false );
 
-        double elapsed() const { return double( std::chrono::duration_cast< std::chrono::microseconds >( _t - _start ).count() ) / 1000000; }
+        void output_every( const stats::duration_type& d, std::ostream& os = std::cerr, const std::string& prefix = "", bool csv = false );
 
     private:
+        math::exponential_moving_average< double > _ema;
         time_type _start;
         time_type _t;
         time_type _previous_output_time;
-        math::exponential_moving_average< double > _ema;
         double _min{0};
         double _max{0};
 };
 
-inline stats& stats::operator+=( const stats::time_type& t ) // todo: move to cpp file
-{
-    if( _start.time_since_epoch() == std::chrono::seconds( 0 ) )
-    {
-        _start = t;
-    }
-    else
-    {
-        double d = double( std::chrono::duration_cast< std::chrono::microseconds >( t - _t ).count() ) / 1000000;
-        if( _ema.count() == 0 ) { _min = _max = d; }
-        else { if( d < _min ) { _min = d; } else if( d > _max ) { _max = d; } }
-        _ema += double( std::chrono::duration_cast< std::chrono::microseconds >( t - _t ).count() ) / 1000000; // quick and dirty for now
-    }
-    _t = t;
-    return *this;
-}
-
-inline void stats::output( std::ostream& os, const std::string& prefix )
-{
-    // freaking hate chrono! os << prefix << "start=" << _start << ";elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
-    if( _ema.count() == 0 ) { os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=nan;intervals/min=nan;intervals/max=nan;intervals/mean=nan" << std::endl; }
-    else { os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl; }
-}
-
-inline void stats::output( unsigned int c, std::ostream& os, const std::string& prefix )
-{
-    if( count() > 0 && count() % c == 0 ) { output( os, prefix ); }
-}
-
-inline void stats::output_every( const stats::duration_type& d, std::ostream& os, const std::string& prefix )
-{
-    auto now = std::chrono::system_clock::now();
-    if( ( now - _previous_output_time ) < d ) { return; }
-    output( os, prefix );
-    _previous_output_time = now;
-}
-
-
 } } // namespace comma { namespace timing {
diff --git a/timing/traits.h b/timing/traits.h
new file mode 100644
index 000000000..83b82cae6
--- /dev/null
+++ b/timing/traits.h
@@ -0,0 +1,24 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#include "../timing/stats.h"
+#include "../visiting/traits.h"
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::timing::stats > // quick and dirty
+{
+    template < typename Key, class Visitor > static void visit( const Key& k, const comma::timing::stats& p, Visitor& v )
+    {
+        v.apply( "elapsed", p.elapsed() );
+        v.apply( "count", p.count() );
+        v.apply( "rate", p.rate() );
+        v.apply( "min", p.min() );
+        v.apply( "max", p.max() );
+        v.apply( "mean", p.ema() );
+    }
+};
+
+} } // namespace comma { namespace visiting {

From e666d1c3108df8f709d9254f63b0c20543931a66 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 4 Dec 2023 10:26:08 +1100
Subject: [PATCH 0690/1056] timing/stats: name-value output: hacked for now;
 todo: make to_ptree configurable by precision

---
 timing/stats.cpp | 14 ++++++++------
 1 file changed, 8 insertions(+), 6 deletions(-)

diff --git a/timing/stats.cpp b/timing/stats.cpp
index 66174c1dc..f31b44031 100644
--- a/timing/stats.cpp
+++ b/timing/stats.cpp
@@ -46,12 +46,14 @@ void stats::output( std::ostream& os, const std::string& prefix, bool csv ) // t
     }
     else
     {
-        boost::property_tree::ptree t;
-        to_ptree to( t );
-        visiting::apply( to, *this );
-        comma::property_tree::to_path_value( os, t, comma::property_tree::disabled, '=', ';', xpath(), true );
-        os << std::endl;
-        //os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
+        // todo! fix! to_ptree: eventually calls ptree.put() which does lexical cast at very high precision
+        //                      the solution: parametrize on precision and/or provide translator for putting value (or getting)
+        // boost::property_tree::ptree t;
+        // to_ptree to( t );
+        // visiting::apply( to, *this );
+        // comma::property_tree::to_path_value( os, t, comma::property_tree::disabled, '=', ';', xpath(), true );
+        // os << std::endl;
+        os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
     }
     os << std::setprecision( p ); // todo! not excetion-safe
 }

From 239c9301214d75e2e0d85a59c9eb3f5067ac7ed4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 5 Dec 2023 12:47:49 +1100
Subject: [PATCH 0691/1056] timing::stats: minor bug fixed

---
 timing/stats.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/timing/stats.cpp b/timing/stats.cpp
index f31b44031..773dc5dc6 100644
--- a/timing/stats.cpp
+++ b/timing/stats.cpp
@@ -53,7 +53,7 @@ void stats::output( std::ostream& os, const std::string& prefix, bool csv ) // t
         // visiting::apply( to, *this );
         // comma::property_tree::to_path_value( os, t, comma::property_tree::disabled, '=', ';', xpath(), true );
         // os << std::endl;
-        os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
+        os << prefix << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << ema() << std::endl;
     }
     os << std::setprecision( p ); // todo! not excetion-safe
 }

From 243ed5c6a566d434f09cd1f68808683377d510b6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 5 Dec 2023 20:17:25 +1100
Subject: [PATCH 0692/1056] a bunch of compilation warnings fixed

---
 application/command_line_options.cpp |  14 ++--
 csv/applications/csv-calc.cpp        | 104 ++++++++++-----------------
 csv/applications/csv-calc.new.cpp    |  51 ++++---------
 csv/applications/csv-units.cpp       |  45 +++---------
 csv/format.h                         |  31 ++------
 csv/test/binary_test.cpp             |  34 ++-------
 6 files changed, 76 insertions(+), 203 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index dd3410429..9df064ad1 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -7,7 +7,7 @@
 #include <sstream>
 #include <set>
 #include <unordered_map>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include <boost/config/warning_disable.hpp>
 //#include "boost/filesystem.hpp"
 #include "boost/iostreams/stream.hpp"
@@ -239,12 +239,12 @@ namespace impl {
         description_t d;
         bool r = boost::spirit::qi::phrase_parse( s.begin()
                                                 , s.end()
-                                                ,      name[ boost::bind( push_back_, boost::ref( d.names ), _1 ) ]
-                                                    >> *( ',' >> name[ boost::bind( push_back_, boost::ref( d.names ), _1 ) ] )
-                                                    >> -( '=' >> ( value[ boost::bind( got_value, boost::ref( d ), _1 ) ]
-                                                                | optional_value[ boost::bind( got_optional_value, boost::ref( d ), _1 ) ] ) )
-                                                    >> -( ';' >> default_value[ boost::bind( got_default_value, boost::ref( d ), _1 ) ] )
-                                                    >> -( ';' >> *( ascii::space ) >> help[ boost::bind( set_, boost::ref( d.help ), _1 ) ] )
+                                                ,      name[ boost::bind( push_back_, boost::ref( d.names ), boost::placeholders::_1 ) ]
+                                                    >> *( ',' >> name[ boost::bind( push_back_, boost::ref( d.names ), boost::placeholders::_1 ) ] )
+                                                    >> -( '=' >> ( value[ boost::bind( got_value, boost::ref( d ), boost::placeholders::_1 ) ]
+                                                                | optional_value[ boost::bind( got_optional_value, boost::ref( d ), boost::placeholders::_1 ) ] ) )
+                                                    >> -( ';' >> default_value[ boost::bind( got_default_value, boost::ref( d ), boost::placeholders::_1 ) ] )
+                                                    >> -( ';' >> *( ascii::space ) >> help[ boost::bind( set_, boost::ref( d.help ), boost::placeholders::_1 ) ] )
                                                     >> qi::eoi
                                                 , ascii::space );
         if( !r ) { COMMA_THROW( comma::exception, "invalid option description: \"" << s << "\"" ); }
diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 82f7979fc..00cac2faa 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // Copyright (c) 2020 Vsevolod Vlaskine
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -41,7 +14,7 @@
 #include <map>
 #include <type_traits>
 #include <unordered_set>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include <boost/function.hpp>
 #include <boost/optional.hpp>
 #include <boost/ptr_container/ptr_vector.hpp>
@@ -50,6 +23,7 @@
 #include <boost/date_time/posix_time/posix_time_types.hpp>
 #include "../../application/verbose.h"
 #include "../../base/exception.h"
+#include "../../base/none.h"
 #include "../../csv/format.h"
 #include "../../csv/options.h"
 #include "../../string/string.h"
@@ -217,8 +191,8 @@ class Values
         std::vector< comma::csv::format::element > input_elements_;
         std::vector< comma::csv::format::element > elements_;
         std::vector< char > buffer_;
-        boost::optional< unsigned int > block_index_;
-        boost::optional< unsigned int > id_index_;
+        boost::optional< unsigned int > block_index_{ comma::silent_none< unsigned int >() };
+        boost::optional< unsigned int > id_index_{ comma::silent_none< unsigned int >() };
         comma::csv::format::element block_element_;
         comma::csv::format::element id_element_;
         unsigned int block_;
@@ -264,15 +238,15 @@ class Values
                 block_element_ = input_format_.offset( *block_index_ );
                 switch( block_element_.type )
                 {
-                    case comma::csv::format::char_t: block_from_bin_ = boost::bind( &Values::from_bin_< char >, _1 ); break;
-                    case comma::csv::format::int8: block_from_bin_ = boost::bind( &Values::from_bin_< char >, _1 ); break;
-                    case comma::csv::format::uint8: block_from_bin_ = boost::bind( &Values::from_bin_< unsigned char >, _1 ); break;
-                    case comma::csv::format::int16: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int16 >, _1 ); break;
-                    case comma::csv::format::uint16: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint16 >, _1 ); break;
-                    case comma::csv::format::int32: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int32 >, _1 ); break;
-                    case comma::csv::format::uint32: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint32 >, _1 ); break;
-                    case comma::csv::format::int64: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int64 >, _1 ); break;
-                    case comma::csv::format::uint64: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint64 >, _1 ); break;
+                    case comma::csv::format::char_t: block_from_bin_ = boost::bind( &Values::from_bin_< char >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::int8: block_from_bin_ = boost::bind( &Values::from_bin_< char >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::uint8: block_from_bin_ = boost::bind( &Values::from_bin_< unsigned char >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::int16: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int16 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::uint16: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint16 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::int32: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int32 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::uint32: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint32 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::int64: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int64 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::uint64: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint64 >, boost::placeholders::_1 ); break;
                     default: COMMA_THROW( comma::exception, "expected integer for block id, got format " << input_format_.string() );
                 }
             }
@@ -281,15 +255,15 @@ class Values
                 id_element_ = input_format_.offset( *id_index_ );
                 switch( id_element_.type )
                 {
-                    case comma::csv::format::char_t: id_from_bin_ = boost::bind( &Values::from_bin_< char >, _1 ); break;
-                    case comma::csv::format::int8: id_from_bin_ = boost::bind( &Values::from_bin_< char >, _1 ); break;
-                    case comma::csv::format::uint8: id_from_bin_ = boost::bind( &Values::from_bin_< unsigned char >, _1 ); break;
-                    case comma::csv::format::int16: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int16 >, _1 ); break;
-                    case comma::csv::format::uint16: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint16 >, _1 ); break;
-                    case comma::csv::format::int32: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int32 >, _1 ); break;
-                    case comma::csv::format::uint32: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint32 >, _1 ); break;
-                    case comma::csv::format::int64: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int64 >, _1 ); break;
-                    case comma::csv::format::uint64: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint64 >, _1 ); break;
+                    case comma::csv::format::char_t: id_from_bin_ = boost::bind( &Values::from_bin_< char >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::int8: id_from_bin_ = boost::bind( &Values::from_bin_< char >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::uint8: id_from_bin_ = boost::bind( &Values::from_bin_< unsigned char >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::int16: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int16 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::uint16: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint16 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::int32: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int32 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::uint32: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint32 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::int64: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int64 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::uint64: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint64 >, boost::placeholders::_1 ); break;
                     default: COMMA_THROW( comma::exception, "expected integer for block id, got format " << input_format_.string() );
                 }
             }
@@ -456,7 +430,7 @@ namespace Operations
     class Min : public base
     {
         public:
-            void reset() { min_ = boost::optional< T >(); }
+            void reset() { min_ = comma::silent_none< T >(); }
             void push( const char* buf )
             {
                 const T& t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -468,14 +442,14 @@ namespace Operations
             friend class Centre< T, F >;
             friend class Diameter< T, F >;
             friend class Radius< T, F >;
-            boost::optional< T > min_;
+            boost::optional< T > min_{ comma::silent_none< T >() };
     };
 
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
     class Max : public base
     {
         public:
-            void reset() { max_ = boost::optional< T >(); }
+            void reset() { max_ = comma::silent_none< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -487,14 +461,14 @@ namespace Operations
             friend class Centre< T, F >;
             friend class Diameter< T, F >;
             friend class Radius< T, F >;
-            boost::optional< T > max_;
+            boost::optional< T > max_{ comma::silent_none< T >() };
     };
 
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
     class Sum : public base
     {
         public:
-            void reset() { sum_ = boost::optional< T >(); }
+            void reset() { sum_ = comma::silent_none< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -503,7 +477,7 @@ namespace Operations
             void calculate( char* buf ) { if( sum_ ) { comma::csv::format::traits< T, F >::to_bin( *sum_, buf ); } }
             base* clone() const { return new Sum< T, F >( *this ); }
         private:
-            boost::optional< T > sum_;
+            boost::optional< T > sum_{ comma::silent_none< T >() };
     };
 
     template < comma::csv::format::types_enum F >
@@ -558,7 +532,7 @@ namespace Operations
             void calculate( char* buf ) { if( count_ > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( *mean_ ), buf ); } }
             base* clone() const { return new Mean< T, F >( *this ); }
         private:
-            boost::optional< typename result_traits< T >::type > mean_;
+            boost::optional< typename result_traits< T >::type > mean_{ comma::silent_none< typename result_traits< T >::type >() };
             std::size_t count_;
     };
 
@@ -588,7 +562,7 @@ namespace Operations
                 if( values_.empty() ) { return; }
                 std::size_t count = values_.size();
                 comma::verbose << "calculating " << percentile_*100 << "th percentile using ";
-                T value;
+                T value = comma::csv::format::traits< T, F >::zero();
                 typename std::multiset< T >::iterator it = values_.begin();
                 switch( method_ )
                 {
@@ -776,7 +750,7 @@ namespace Operations
             void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_{ comma::silent_none< T >() };
             bool sample_;
     };
 
@@ -797,7 +771,7 @@ namespace Operations
             void reset() { stddev_.reset(); first_ = boost::none; }
         private:
             Stddev< double, F > stddev_;
-            boost::optional<boost::posix_time::ptime> first_;
+            boost::optional< boost::posix_time::ptime > first_{ comma::silent_none< boost::posix_time::ptime >() };
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -819,7 +793,7 @@ namespace Operations
             void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_{ comma::silent_none< T >() };
             bool sample_;
     };
 
@@ -840,7 +814,7 @@ namespace Operations
             void reset() { variance_.reset(); first_ = boost::none; }
         private:
             Variance< double, F > variance_;
-            boost::optional< boost::posix_time::ptime > first_;
+            boost::optional< boost::posix_time::ptime > first_{ comma::silent_none< boost::posix_time::ptime >() };
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -872,7 +846,7 @@ namespace Operations
             void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 3 > moments_;
-            boost::optional< T > first_;
+            boost::optional< T > first_{ comma::silent_none< T >() };
             bool sample_;
     };
 
@@ -893,7 +867,7 @@ namespace Operations
             void reset() { skew_.reset(); first_ = boost::none; }
         private:
             Skew< double, F > skew_;
-            boost::optional< boost::posix_time::ptime > first_;
+            boost::optional< boost::posix_time::ptime > first_{ comma::silent_none< boost::posix_time::ptime >() };
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -936,7 +910,7 @@ namespace Operations
             void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 4 > moments_;
-            boost::optional< T > first_;
+            boost::optional< T > first_{ comma::silent_none< T >() };
             bool sample_;
             bool excess_;
     };
@@ -958,7 +932,7 @@ namespace Operations
             void reset() { kurtosis_.reset(); first_ = boost::none; }
         private:
             Kurtosis< double, F > kurtosis_;
-            boost::optional< boost::posix_time::ptime > first_;
+            boost::optional< boost::posix_time::ptime > first_{ comma::silent_none< boost::posix_time::ptime >() };
     };
     
     template < typename T > struct Diff
@@ -1311,7 +1285,7 @@ int main( int ac, char** av )
             operations_parameters[i].type = Operations::from_name( p[0] );
             if( p.size() == 2 ){ operations_parameters[i].options = comma::split( p[1], ':' ); }
         }
-        boost::optional< comma::csv::format > format;
+        boost::optional< comma::csv::format > format = { comma::silent_none< comma::csv::format >() };
         if( csv.binary() ) { format = csv.format(); }
         else if( options.exists( "--format" ) ) { format = comma::csv::format( options.value< std::string >( "--format" ) ); }
         boost::scoped_ptr< ascii_input > ascii;
diff --git a/csv/applications/csv-calc.new.cpp b/csv/applications/csv-calc.new.cpp
index 00d590c6d..84642d4b4 100644
--- a/csv/applications/csv-calc.new.cpp
+++ b/csv/applications/csv-calc.new.cpp
@@ -1,32 +1,7 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+/// @author vsevolod vlaskine
 
 #include <string.h>
 #include <algorithm>
@@ -36,7 +11,7 @@
 #include <string>
 #include <vector>
 #include <boost/array.hpp>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include <boost/function.hpp>
 #include "../../application/command_line_options.h"
 #include "../../base/types.h"
@@ -357,7 +332,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //             {
 //                 get_< R >( *result_ ).push_back( R() );
 //                 bound_functors< T > b( boost::bind( f.reset, boost::ref( get_< R >( *result_ ).back() ) )
-//                                      , boost::bind( f.update, boost::ref( get_< R >( *result_ ).back(), _1 ) )
+//                                      , boost::bind( f.update, boost::ref( get_< R >( *result_ ).back(), boost::placeholders::_1 ) )
 //                                      , boost::bind( f.finalize, boost::ref( get_< R >( *result_ ).back() ) ) );
 //                 get_< T >().push_back( b );
 //             }
@@ -382,7 +357,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef T type;
 //     typedef T result_type;
 //     static void apply( result_type& lhs, const T& rhs ) { if( rhs < lhs ) { lhs = rhs; } }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &min::apply, _1, _2 ), std::numeric_limits< T >::max() ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &min::apply, boost::placeholders::_1, _2 ), std::numeric_limits< T >::max() ); }
 // };
 // 
 // template <> struct min< std::string >
@@ -390,7 +365,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef std::string type;
 //     typedef std::string result_type;
 //     static void apply( result_type&, const std::string& ) {}
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &min::apply, _1, _2 ) ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &min::apply, boost::placeholders::_1, _2 ) ); }
 // };
 // 
 // template <> struct min< boost::posix_time::ptime >
@@ -398,7 +373,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef boost::posix_time::ptime type;
 //     typedef boost::posix_time::ptime result_type;
 //     static void apply( boost::posix_time::ptime& lhs, const boost::posix_time::ptime& rhs ) { if( lhs.is_not_a_date_time() || rhs < lhs ) { lhs = rhs; } }
-//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &min::apply, _1, _2 ) ); }
+//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &min::apply, boost::placeholders::_1, _2 ) ); }
 // };
 // 
 // template < typename T > struct max
@@ -406,7 +381,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef T type;
 //     typedef T result_type;
 //     static void apply( result_type& lhs, const T& rhs ) { if( lhs < rhs ) { lhs = rhs; } }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &max::apply, _1, _2 ), std::numeric_limits< T >::min() ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &max::apply, boost::placeholders::_1, _2 ), std::numeric_limits< T >::min() ); }
 // };
 // 
 // template <> struct max< std::string >
@@ -414,7 +389,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef std::string type;
 //     typedef std::string result_type;
 //     static void apply( result_type& lhs, const std::string& rhs ) { if( lhs < rhs ) { lhs = rhs; } }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &max::apply, _1, _2 ) ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &max::apply, boost::placeholders::_1, _2 ) ); }
 // };
 // 
 // template <> struct min< boost::posix_time::ptime >
@@ -422,7 +397,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef boost::posix_time::ptime type;
 //     typedef boost::posix_time::ptime result_type;
 //     static void apply( boost::posix_time::ptime& lhs, const boost::posix_time::ptime& rhs ) { if( lhs.is_not_a_date_time() || rhs < lhs ) { lhs = rhs; } }
-//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &max::apply, _1, _2 ) ); }
+//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &max::apply, boost::placeholders::_1, _2 ) ); }
 // };
 // 
 // template < typename T > struct size
@@ -430,7 +405,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef T type;
 //     typedef double result_type;
 //     static void apply( result_type& lhs, const T& rhs ) { ++rhs; }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &size::apply, _1, _2 ), 0 ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &size::apply, boost::placeholders::_1, _2 ), 0 ); }
 // };
 // 
 // template < typename T > struct sum
@@ -438,7 +413,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef T type;
 //     typedef T result_type;
 //     static void apply( result_type& lhs, const T& rhs ) { lhs += rhs; }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &sum::apply, _1, _2 ), 0 ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &sum::apply, boost::placeholders::_1, _2 ), 0 ); }
 // };
 // 
 // template <> struct sum< std::string >
@@ -446,7 +421,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef std::string type;
 //     typedef std::string result_type;
 //     static void apply( result_type&, const std::string& ) {}
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &sum::apply, _1, _2 ) ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &sum::apply, boost::placeholders::_1, _2 ) ); }
 // };
 // 
 // template <> struct sum< boost::posix_time::ptime >
@@ -454,7 +429,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef boost::posix_time::ptime type;
 //     typedef boost::posix_time::ptime result_type;
 //     static void apply( boost::posix_time::ptime&, const boost::posix_time::ptime& ) {}
-//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &sum::apply, _1, _2 ) ); }
+//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &sum::apply, boost::placeholders::_1, _2 ) ); }
 // };
 // 
 // } // namespace operations {
diff --git a/csv/applications/csv-units.cpp b/csv/applications/csv-units.cpp
index c46bfd541..701b2bc0f 100644
--- a/csv/applications/csv-units.cpp
+++ b/csv/applications/csv-units.cpp
@@ -1,38 +1,11 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 /// @author kai huang
 
 #include <iostream>
 #include <boost/array.hpp>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include <boost/optional.hpp>
 #include <boost/unordered/unordered_map.hpp>
 
@@ -338,14 +311,14 @@ namespace units {
             map[metres][feet] = cast< length_t, imperial_us_length_t >;
             map[metres][nautical_miles] = cast< length_t, nautical_mile_t >;
             map[metres][statute_miles] = cast< length_t, statute_mile_t >;
-            map[hours][minutes] = boost::bind( &scale, _1, 60.0 );
-            map[hours][seconds] = boost::bind( &scale, _1, 3600.0 );
-            map[minutes][seconds] = boost::bind( &scale, _1, 60.0 );
-            map[minutes][hours] = boost::bind( &scale, _1, 1.0 / 60.0 );
-            map[seconds][hours] = boost::bind( &scale, _1, 1.0 / 3600.0 );
-            map[seconds][minutes] = boost::bind( &scale, _1, 1.0 / 60.0 );
-            map[percent][fraction] = boost::bind( &scale, _1, 0.01 );
-            map[fraction][percent] = boost::bind( &scale, _1, 100.0 );
+            map[hours][minutes] = boost::bind( &scale, boost::placeholders::_1, 60.0 );
+            map[hours][seconds] = boost::bind( &scale, boost::placeholders::_1, 3600.0 );
+            map[minutes][seconds] = boost::bind( &scale, boost::placeholders::_1, 60.0 );
+            map[minutes][hours] = boost::bind( &scale, boost::placeholders::_1, 1.0 / 60.0 );
+            map[seconds][hours] = boost::bind( &scale, boost::placeholders::_1, 1.0 / 3600.0 );
+            map[seconds][minutes] = boost::bind( &scale, boost::placeholders::_1, 1.0 / 60.0 );
+            map[percent][fraction] = boost::bind( &scale, boost::placeholders::_1, 0.01 );
+            map[fraction][percent] = boost::bind( &scale, boost::placeholders::_1, 100.0 );
         }
         return map[from][to];
     }
diff --git a/csv/format.h b/csv/format.h
index 8e27a02fb..7bd874db4 100644
--- a/csv/format.h
+++ b/csv/format.h
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -85,6 +58,7 @@ class format
             //static void to_bin( const T& t, char* buf, std::size_t size = sizeof( T ) ) { ::memcpy( buf, &t, sizeof( T ) ); }
             static T from_bin( const char* buf, std::size_t size = sizeof( T ) ) { (void)size; return *reinterpret_cast< const T* >( buf ); }
             static void to_bin( const T& t, char* buf, std::size_t size = sizeof( T ) ) { (void)size; *reinterpret_cast< T* >( buf ) = t; }
+            static T zero() { return 0; }
         };
 
         /// struct containing offsets
@@ -381,6 +355,7 @@ template <> struct format::traits< boost::posix_time::ptime, format::long_time >
     static const char* as_string() { return "lt"; }
     static boost::posix_time::ptime from_bin( const char* buf, std::size_t size = 12 );
     static void to_bin( const boost::posix_time::ptime& t, char* buf, std::size_t size = 12 );
+    static boost::posix_time::ptime zero() { return boost::posix_time::ptime(); }
 };
 
 template <> struct format::traits< boost::posix_time::ptime, format::time >
@@ -390,6 +365,7 @@ template <> struct format::traits< boost::posix_time::ptime, format::time >
     static const char* as_string() { return "t"; }
     static boost::posix_time::ptime from_bin( const char* buf, std::size_t size = 8 );
     static void to_bin( const boost::posix_time::ptime& t, char* buf, std::size_t size = 8 );
+    static boost::posix_time::ptime zero() { return boost::posix_time::ptime(); }
 };
 
 template <> struct format::traits< std::string, format::fixed_string >
@@ -398,6 +374,7 @@ template <> struct format::traits< std::string, format::fixed_string >
     static const char* as_string() { return type_to_enum< std::string >::as_string(); }
     static std::string from_bin( const char* buf, std::size_t size );
     static void to_bin( const std::string& t, char* buf, std::size_t size );
+    static std::string zero() { return std::string(); }
 };
 
 } } // namespace comma { namespace csv {
diff --git a/csv/test/binary_test.cpp b/csv/test/binary_test.cpp
index f61d4b50d..87cd46bb4 100644
--- a/csv/test/binary_test.cpp
+++ b/csv/test/binary_test.cpp
@@ -1,34 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 #include <gtest/gtest.h>
+#include <array>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include "../../csv/binary.h"
 #include "../../csv/format.h"
@@ -309,11 +283,11 @@ static void test_binary_cast( const char* format, T t, S expected )
 {
     comma::csv::binary< test_cast< T > > bt( format );
     comma::csv::binary< test_cast< S > > bs( format );
-    char buf[16] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 }; // just to trash it
+    std::string buf = "abcdefghijklmnop"; // just to trash it
     test_cast< T > vt( t );
     test_cast< S > vs;
-    bt.put( vt, buf );
-    bs.get( vs, buf );
+    bt.put( vt, &buf[0] );
+    bs.get( vs, &buf[0] );
     test_traits< T >::expect_equal( vs.value, expected );
 }
 

From 8dba10aa3dac9c764934efa9cef895497245f3ed Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 7 Dec 2023 14:27:53 +1100
Subject: [PATCH 0693/1056] base/exception.h: COMMA_ASSERT_BRIEF,
 COMMA_THROW_BRIEF_IF: condition is not passed to the user for readability

---
 base/exception.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/base/exception.h b/base/exception.h
index ea1f91b3a..1a2746c15 100644
--- a/base/exception.h
+++ b/base/exception.h
@@ -49,11 +49,11 @@ namespace comma {
 
 #define COMMA_ASSERT( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW( comma::exception, "condition: '" << #condition << "' is false; " << strmessage ); } }
 
-#define COMMA_ASSERT_BRIEF( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW_BRIEF( comma::exception, "condition: '" << #condition << "' is false; " << strmessage ); } }
+#define COMMA_ASSERT_BRIEF( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW_BRIEF( comma::exception, strmessage ); } }
 
 #define COMMA_THROW_IF( condition, strmessage ) { if( condition ) { COMMA_THROW( comma::exception, "throw because condition: '" << #condition << "' is true; " << strmessage ); } }
 
-#define COMMA_THROW_BRIEF_IF( condition, strmessage ) { if( condition ) { COMMA_THROW_BRIEF( comma::exception, "throw because condition: '" << #condition << "' is true; " << strmessage ); } }
+#define COMMA_THROW_BRIEF_IF( condition, strmessage ) { if( condition ) { COMMA_THROW_BRIEF( comma::exception, strmessage ); } }
 
 class exception : public std::runtime_error
 {

From 08b81e82c21427755eedb38be5cd0bbe63b7c165 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 7 Dec 2023 19:51:04 +1100
Subject: [PATCH 0694/1056] packed: compilation warnings fixed

---
 packed/bits.h          | 18 +++++++++---------
 packed/detail/endian.h |  3 ++-
 2 files changed, 11 insertions(+), 10 deletions(-)

diff --git a/packed/bits.h b/packed/bits.h
index c8d049de1..1d9b6b7bf 100644
--- a/packed/bits.h
+++ b/packed/bits.h
@@ -7,6 +7,7 @@
 
 #include <limits>
 #include <string.h>
+#include <memory>
 #include <type_traits>
 #include <boost/type_traits.hpp>
 #include "../packed/field.h"
@@ -31,17 +32,17 @@ struct bits : public packed::field< bits< B, Default >, B, sizeof( typename comm
     bits( integer_type v ) { operator=( v ); }
     bits( type t ) : base_type( t ) {}
 
-    static type default_value() { static const integer_type d = Default; type t; ::memcpy( &t, &d, size ); return t; }
+    static type default_value() { static const integer_type d = Default; type t; std::memcpy( ( char* )( &t ), ( const char* )( &d ), size ); return t; }
 
-    static void pack( char* storage, type value ) { ::memcpy( storage, &value, size ); }
+    static void pack( char* storage, type value ) { std::memcpy( storage, ( const char* )( &value ), size ); }
 
-    static type unpack( const char* storage ) { type t; ::memcpy( &t, storage, size ); return t; }
+    static type unpack( const char* storage ) { type t; std::memcpy( ( char* )( &t ), storage, size ); return t; }
 
     const bits& operator=( const bits& rhs ) { return base_type::operator=( rhs ); }
 
     const bits& operator=( type rhs ) { return base_type::operator=( rhs ); }
 
-    const bits& operator=( integer_type rhs ) { type t; ::memcpy( &t, &rhs, size ); return base_type::operator=( t ); }
+    const bits& operator=( integer_type rhs ) { type t; std::memcpy( ( char* )( &t ), &rhs, size ); return base_type::operator=( t ); }
 
     type& fields() { return *( reinterpret_cast< type* >( this ) ); }
 
@@ -83,18 +84,17 @@ struct reversed_bits : public packed::field< reversed_bits< B, Default >, B, siz
     reversed_bits( integer_type v ) { operator=( v ); }
     reversed_bits( type t ) : base_type( t ) {}
 
-    static type default_value() { static const integer_type d = Default; type t; ::memcpy( &t, &d, size ); return t; }
+    static type default_value() { static const integer_type d = Default; type t; std::memcpy( ( char* )( &t ), ( const char* )( &d ), size ); return t; }
 
-    static void pack( char* storage, type t ) { integer_type v; ::memcpy( &v, &t, size ); reverse_bits( v ); ::memcpy( storage, &v, size ); }
+    static void pack( char* storage, type t ) { integer_type v; std::memcpy( &v, &t, size ); reverse_bits( v ); std::memcpy( storage, ( const char* )( &v ), size ); }
 
-    static type unpack( const char* storage ) { integer_type v; ::memcpy( &v, storage, size ); reverse_bits( v ); type t; ::memcpy( &t, &v, size ); return t; }
+    static type unpack( const char* storage ) { integer_type v; std::memcpy( &v, storage, size ); reverse_bits( v ); type t; std::memcpy( ( char* )( &t ), ( const char* )( &v ), size ); return t; }
 
     const reversed_bits& operator=( const reversed_bits& rhs ) { return base_type::operator=( rhs ); }
 
     const reversed_bits& operator=( type rhs ) { return base_type::operator=( rhs ); }
 
-    const reversed_bits& operator=( integer_type rhs ) { type t; ::memcpy( &t, &rhs, size ); return base_type::operator=( t ); }
-
+    const reversed_bits& operator=( integer_type rhs ) { type t; std::memcpy( ( char* )( &t ), ( const char* )( &rhs ), size ); return base_type::operator=( t ); }
 };
 
 } } // namespace comma { namespace packed {
diff --git a/packed/detail/endian.h b/packed/detail/endian.h
index 8f3832d48..9b4d81cea 100644
--- a/packed/detail/endian.h
+++ b/packed/detail/endian.h
@@ -100,7 +100,8 @@ struct endian : public packed::field< endian< Endianness, Size, Signed, Floating
         uint_of_same_size i = ( !Floating && Signed && ( storage[ Endianness == little ? size - 1 : 0 ] & 0x80 ) ) ? -1 : 0;
         ::memcpy( reinterpret_cast< char * >( &i ) + ( Endianness == little ? 0 : sizeof( uint_of_same_size ) - size ), storage, size );
         i = convert< Endianness >::to_host( i );
-        return *( reinterpret_cast< type* >( &i ) );
+        const type* p = reinterpret_cast< type* >( &i );
+        return *p;
     }
 
     const endian& operator=( const endian& rhs ) { return base_type::operator=( rhs ); }

From 49f1d2c8101020e49c53ba0d4a16f330ba0cdf1f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 7 Dec 2023 19:55:27 +1100
Subject: [PATCH 0695/1056] packed/bits.h: include fixed

---
 packed/bits.h | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/packed/bits.h b/packed/bits.h
index 1d9b6b7bf..5de90bb1b 100644
--- a/packed/bits.h
+++ b/packed/bits.h
@@ -5,9 +5,8 @@
 
 #pragma once
 
+#include <cstring>
 #include <limits>
-#include <string.h>
-#include <memory>
 #include <type_traits>
 #include <boost/type_traits.hpp>
 #include "../packed/field.h"

From 66e002ad86d7c05f07e63d8fd020da4d384f557c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 7 Dec 2023 20:01:38 +1100
Subject: [PATCH 0696/1056] boost/bind includes fixed

---
 io/applications/io-publish.cpp                 | 2 +-
 io/impl/publisher.cpp                          | 2 +-
 io/stream.cpp                                  | 2 +-
 name_value/applications/name-value-convert.cpp | 2 --
 name_value/applications/name-value-get.cpp     | 2 --
 sync/test/lazy_test.cpp                        | 2 +-
 6 files changed, 4 insertions(+), 8 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index bfda6798b..826b6e3a5 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -9,7 +9,7 @@
 #include <unistd.h>
 #include <deque>
 #include <memory>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/iostreams/device/file_descriptor.hpp>
 #include <boost/iostreams/stream.hpp>
diff --git a/io/impl/publisher.cpp b/io/impl/publisher.cpp
index 6b91b5682..b8d0e0c50 100644
--- a/io/impl/publisher.cpp
+++ b/io/impl/publisher.cpp
@@ -12,7 +12,7 @@
 
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include <boost/filesystem/operations.hpp>
 #include <boost/lexical_cast.hpp>
 #include "../../base/exception.h"
diff --git a/io/stream.cpp b/io/stream.cpp
index d94b213d9..a17208b53 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -21,7 +21,7 @@
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/ip/udp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include <boost/filesystem.hpp>
 #include <boost/filesystem/operations.hpp>
 #include <boost/lexical_cast.hpp>
diff --git a/name_value/applications/name-value-convert.cpp b/name_value/applications/name-value-convert.cpp
index 6a3b2aa66..d38aaaca8 100644
--- a/name_value/applications/name-value-convert.cpp
+++ b/name_value/applications/name-value-convert.cpp
@@ -4,8 +4,6 @@
 
 #include <iostream>
 #include <map>
-#include <boost/bind.hpp>
-#include <boost/function.hpp>
 #include <boost/property_tree/info_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
 #include <boost/property_tree/json_parser.hpp>
diff --git a/name_value/applications/name-value-get.cpp b/name_value/applications/name-value-get.cpp
index 9991008ff..91ccc79cc 100644
--- a/name_value/applications/name-value-get.cpp
+++ b/name_value/applications/name-value-get.cpp
@@ -3,8 +3,6 @@
 /// @author vsevolod vlaskine
 
 #include <iostream>
-#include <boost/bind.hpp>
-#include <boost/function.hpp>
 #include <boost/property_tree/info_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
 #include <boost/property_tree/json_parser.hpp>
diff --git a/sync/test/lazy_test.cpp b/sync/test/lazy_test.cpp
index 49de0cfd3..5ae86f9d8 100644
--- a/sync/test/lazy_test.cpp
+++ b/sync/test/lazy_test.cpp
@@ -28,7 +28,7 @@
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <gtest/gtest.h>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include "../lazy.h"
 
 namespace comma { namespace sync { namespace test {

From 398343814fb735708f2738b48d565c03eb1860da Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Fri, 8 Dec 2023 12:07:19 +1100
Subject: [PATCH 0697/1056] system/package/cpack/examples: new
 make-debian-package example

locally builds a debian package for comma in an isolated build folder
---
 .../cpack/examples/make-debian-package        | 37 +++++++++++++++++++
 1 file changed, 37 insertions(+)
 create mode 100755 system/package/cpack/examples/make-debian-package

diff --git a/system/package/cpack/examples/make-debian-package b/system/package/cpack/examples/make-debian-package
new file mode 100755
index 000000000..7ab533b10
--- /dev/null
+++ b/system/package/cpack/examples/make-debian-package
@@ -0,0 +1,37 @@
+#!/bin/bash
+
+package_root=$HOME/src/comma
+build_root=$HOME/src/comma_build
+
+mkdir -p $build_root/comma
+cd $build_root/comma
+cmake $package_root \
+    -DCMAKE_INSTALL_PREFIX=$package_root/debian/tmp/usr \
+    -DCMAKE_BUILD_TYPE=Release \
+    -DBUILD_SHARED_LIBS=ON \
+    -DBUILD_PYTHON_PACKAGES=OFF \
+    -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
+    -DBUILD_TESTS=OFF \
+    -DINSTALL_BASH_COMPLETION=OFF \
+    -DINSTALL_TESTS=OFF \
+    -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
+    -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake/comma \
+    -Dcomma_INSTALL_RUN_POST_INSTALL=OFF \
+    -Dcomma_BUILD_XML=OFF \
+    -Dcomma_BUILD_ZEROMQ=OFF \
+    -Dcomma_build_io_rabbit_cat=OFF
+make -j
+sudo make install
+
+mkdir -p $build_root/comma/debian/tmp/usr/lib
+mkdir -p $build_root/comma/debian/tmp/DEBIAN
+
+# Copy installed lib files, and debian configuration files to our build directory for packaging
+cp -r $build_root/comma/lib/x86_64-linux-gnu debian/tmp/usr/lib
+rsync -r $package_root/debian/* debian/
+
+# Generate the control file
+dpkg-gencontrol -pcomma
+
+# Build the package
+dpkg --build debian/tmp $build_root/comma

From 72a377f04ce88b33675e6572328598a2c1f1fafd Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 8 Dec 2023 12:23:37 +1100
Subject: [PATCH 0698/1056] system/package: examples moved out of cpack
 directory

---
 .../{cpack => }/examples/make-debian-package  | 24 ++++++++++---------
 .../{cpack => }/examples/package-python       |  0
 2 files changed, 13 insertions(+), 11 deletions(-)
 rename system/package/{cpack => }/examples/make-debian-package (60%)
 rename system/package/{cpack => }/examples/package-python (100%)

diff --git a/system/package/cpack/examples/make-debian-package b/system/package/examples/make-debian-package
similarity index 60%
rename from system/package/cpack/examples/make-debian-package
rename to system/package/examples/make-debian-package
index 7ab533b10..130499574 100755
--- a/system/package/cpack/examples/make-debian-package
+++ b/system/package/examples/make-debian-package
@@ -1,12 +1,14 @@
 #!/bin/bash
 
-package_root=$HOME/src/comma
-build_root=$HOME/src/comma_build
-
-mkdir -p $build_root/comma
-cd $build_root/comma
-cmake $package_root \
-    -DCMAKE_INSTALL_PREFIX=$package_root/debian/tmp/usr \
+home=$1
+[[ -n "$home" ]] || { echo "usage: $0 <dir>" >&2; exit 1; }
+cd $home/src
+git clone https://gitlab.com/orthographic/comma.git
+build_dir=$home/src/comma/build
+mkdir -p $build_dir
+cd $build_dir
+cmake $home/src/comma \
+    -DCMAKE_INSTALL_PREFIX=$home/src/comma/debian/tmp/usr \
     -DCMAKE_BUILD_TYPE=Release \
     -DBUILD_SHARED_LIBS=ON \
     -DBUILD_PYTHON_PACKAGES=OFF \
@@ -23,15 +25,15 @@ cmake $package_root \
 make -j
 sudo make install
 
-mkdir -p $build_root/comma/debian/tmp/usr/lib
-mkdir -p $build_root/comma/debian/tmp/DEBIAN
+mkdir -p $build_dir/debian/tmp/usr/lib
+mkdir -p $build_dir/debian/tmp/DEBIAN
 
 # Copy installed lib files, and debian configuration files to our build directory for packaging
-cp -r $build_root/comma/lib/x86_64-linux-gnu debian/tmp/usr/lib
+cp -r $build_dir/lib/x86_64-linux-gnu $build_dir/debian/tmp/usr/lib
 rsync -r $package_root/debian/* debian/
 
 # Generate the control file
 dpkg-gencontrol -pcomma
 
 # Build the package
-dpkg --build debian/tmp $build_root/comma
+dpkg --build $build_dir/debian/tmp $build_dir
diff --git a/system/package/cpack/examples/package-python b/system/package/examples/package-python
similarity index 100%
rename from system/package/cpack/examples/package-python
rename to system/package/examples/package-python

From ec6ea682173f11f526aa2fd77cdac58d4d08113d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 8 Dec 2023 13:20:59 +1100
Subject: [PATCH 0699/1056] system/package/examples/make-debian-package: works;
 trying a bit more cleanup...

---
 system/package/examples/make-debian-package | 17 +++++++++++------
 1 file changed, 11 insertions(+), 6 deletions(-)

diff --git a/system/package/examples/make-debian-package b/system/package/examples/make-debian-package
index 130499574..94272fc1f 100755
--- a/system/package/examples/make-debian-package
+++ b/system/package/examples/make-debian-package
@@ -1,7 +1,9 @@
 #!/bin/bash
 
 home=$1
-[[ -n "$home" ]] || { echo "usage: $0 <dir>" >&2; exit 1; }
+[[ -n "$home" ]] || { echo "usage: $0 <packaging-dir>" >&2; exit 1; }
+home=$( realpath $home )
+mkdir -p $home/src
 cd $home/src
 git clone https://gitlab.com/orthographic/comma.git
 build_dir=$home/src/comma/build
@@ -23,17 +25,20 @@ cmake $home/src/comma \
     -Dcomma_BUILD_ZEROMQ=OFF \
     -Dcomma_build_io_rabbit_cat=OFF
 make -j
-sudo make install
+make install -j
 
+# make vodoo debian directories
 mkdir -p $build_dir/debian/tmp/usr/lib
 mkdir -p $build_dir/debian/tmp/DEBIAN
 
-# Copy installed lib files, and debian configuration files to our build directory for packaging
+# copy installed lib files (because for some reason comma cmake does not install libraries at the right place; todo: fix!)
 cp -r $build_dir/lib/x86_64-linux-gnu $build_dir/debian/tmp/usr/lib
-rsync -r $package_root/debian/* debian/
 
-# Generate the control file
+# copy debian configuration files to our build directory for packaging
+cp -r $home/src/comma/debian/* $build_dir/debian
+
+# generate the control file
 dpkg-gencontrol -pcomma
 
-# Build the package
+# build the package
 dpkg --build $build_dir/debian/tmp $build_dir

From c0e809f7f2ffd0150efad104f23b08f24ba3b61d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 8 Dec 2023 14:06:56 +1100
Subject: [PATCH 0700/1056] system/package/examples/make-debian-package: done
 for now

---
 system/package/examples/make-debian-package | 15 ++++++---------
 1 file changed, 6 insertions(+), 9 deletions(-)

diff --git a/system/package/examples/make-debian-package b/system/package/examples/make-debian-package
index 94272fc1f..359217e87 100755
--- a/system/package/examples/make-debian-package
+++ b/system/package/examples/make-debian-package
@@ -9,8 +9,11 @@ git clone https://gitlab.com/orthographic/comma.git
 build_dir=$home/src/comma/build
 mkdir -p $build_dir
 cd $build_dir
+
+# if you want the library path to be lib/x86_64-linux-gnu
+# see target build in src/comma/debian/rules
 cmake $home/src/comma \
-    -DCMAKE_INSTALL_PREFIX=$home/src/comma/debian/tmp/usr \
+    -DCMAKE_INSTALL_PREFIX=$build_dir/debian/tmp/usr \
     -DCMAKE_BUILD_TYPE=Release \
     -DBUILD_SHARED_LIBS=ON \
     -DBUILD_PYTHON_PACKAGES=OFF \
@@ -18,8 +21,6 @@ cmake $home/src/comma \
     -DBUILD_TESTS=OFF \
     -DINSTALL_BASH_COMPLETION=OFF \
     -DINSTALL_TESTS=OFF \
-    -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
-    -Dcomma_INSTALL_PACKAGE_DIR=lib/x86_64-linux-gnu/cmake/comma \
     -Dcomma_INSTALL_RUN_POST_INSTALL=OFF \
     -Dcomma_BUILD_XML=OFF \
     -Dcomma_BUILD_ZEROMQ=OFF \
@@ -27,15 +28,11 @@ cmake $home/src/comma \
 make -j
 make install -j
 
-# make vodoo debian directories
-mkdir -p $build_dir/debian/tmp/usr/lib
+# make vodoo debian directory
 mkdir -p $build_dir/debian/tmp/DEBIAN
 
-# copy installed lib files (because for some reason comma cmake does not install libraries at the right place; todo: fix!)
-cp -r $build_dir/lib/x86_64-linux-gnu $build_dir/debian/tmp/usr/lib
-
 # copy debian configuration files to our build directory for packaging
-cp -r $home/src/comma/debian/* $build_dir/debian
+cp -r $home/src/comma/debian/control $home/src/comma/debian/changelog $home/src/comma/debian/copyright $build_dir/debian
 
 # generate the control file
 dpkg-gencontrol -pcomma

From f0931dab9f53588698e068f02b4fc5bbce98721d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Dec 2023 12:19:26 +1100
Subject: [PATCH 0701/1056] timing::from_seconds_since_epoch(): first cut
 implemented

---
 csv/impl/epoch.h | 36 +++---------------------------------
 timing/epoch.cpp | 17 +++++++++++++++++
 timing/epoch.h   | 17 +++++++++++++++++
 3 files changed, 37 insertions(+), 33 deletions(-)
 create mode 100644 timing/epoch.cpp
 create mode 100644 timing/epoch.h

diff --git a/csv/impl/epoch.h b/csv/impl/epoch.h
index a428e3bb1..6b5dff0f4 100644
--- a/csv/impl/epoch.h
+++ b/csv/impl/epoch.h
@@ -1,44 +1,14 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_IMPL_EPOCH_H_
-#define COMMA_CSV_IMPL_EPOCH_H_
+#pragma once
 
-#include <boost/date_time/posix_time/posix_time.hpp>
+#include "../../timing/epoch.h"
 
 namespace comma { namespace csv { namespace impl {
 
-static const boost::gregorian::date epoch( 1970, 1, 1 );
+static const boost::gregorian::date epoch = comma::timing::epoch;
 
 } } } // namespace comma { namespace csv { namespace impl {
-
-#endif // #ifndef COMMA_CSV_IMPL_EPOCH_H_
diff --git a/timing/epoch.cpp b/timing/epoch.cpp
new file mode 100644
index 000000000..4fc3cd1bf
--- /dev/null
+++ b/timing/epoch.cpp
@@ -0,0 +1,17 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#include "epoch.h"
+
+namespace comma { namespace timing {
+
+boost::posix_time::ptime from_seconds_since_epoch( double seconds, boost::gregorian::date e )
+{
+    long long s = seconds;
+    int microseconds = ::ceil( ( seconds - s ) * 1000000 - 0.5 ); //int microseconds = ::round( ( d - seconds ) * 1000000 ); // although ::round() is slow, have to round, since lexical cast has floating point jitter, e.g. try: boost::lexical_cast< double >( "1369179610.752231000" );
+    return boost::posix_time::ptime( e, boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( microseconds ) );
+}
+
+} } // namespace comma { namespace timing {
diff --git a/timing/epoch.h b/timing/epoch.h
new file mode 100644
index 000000000..8592e5678
--- /dev/null
+++ b/timing/epoch.h
@@ -0,0 +1,17 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <boost/date_time/posix_time/posix_time.hpp>
+
+namespace comma { namespace timing {
+
+const boost::gregorian::date epoch( 1970, 1, 1 );
+
+boost::posix_time::ptime from_seconds_since_epoch( double seconds, boost::gregorian::date e = timing::epoch );
+
+} } // namespace comma { namespace timing {
+

From 7b31a1f8ce4ab8c22acee37efb87a08f79090f93 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Dec 2023 13:19:26 +1100
Subject: [PATCH 0702/1056] timing::duration::from_seconds(): first cut
 implemented

---
 timing/duration.cpp | 17 +++++++++++++++++
 timing/duration.h   | 15 +++++++++++++++
 timing/epoch.cpp    |  5 ++---
 3 files changed, 34 insertions(+), 3 deletions(-)
 create mode 100644 timing/duration.cpp
 create mode 100644 timing/duration.h

diff --git a/timing/duration.cpp b/timing/duration.cpp
new file mode 100644
index 000000000..a46a0ca3f
--- /dev/null
+++ b/timing/duration.cpp
@@ -0,0 +1,17 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#include "duration.h"
+
+namespace comma { namespace timing { namespace duration {
+
+boost::posix_time::time_duration from_seconds( double seconds )
+{
+    long long s = seconds;
+    int microseconds = ::ceil( ( seconds - s ) * 1000000 - 0.5 ); //int microseconds = ::round( ( d - seconds ) * 1000000 ); // although ::round() is slow, have to round, since lexical cast has floating point jitter, e.g. try: boost::lexical_cast< double >( "1369179610.752231000" );
+    return boost::posix_time::time_duration( boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( microseconds ) );
+}
+
+} } } // namespace comma { namespace timing { namespace duration {
diff --git a/timing/duration.h b/timing/duration.h
new file mode 100644
index 000000000..9a0e1edd6
--- /dev/null
+++ b/timing/duration.h
@@ -0,0 +1,15 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <boost/date_time/posix_time/posix_time.hpp>
+
+namespace comma { namespace timing { namespace duration {
+
+boost::posix_time::time_duration from_seconds( double seconds );
+
+} } } // namespace comma { namespace timing { namespace duration {
+
diff --git a/timing/epoch.cpp b/timing/epoch.cpp
index 4fc3cd1bf..4fe492da4 100644
--- a/timing/epoch.cpp
+++ b/timing/epoch.cpp
@@ -3,15 +3,14 @@
 
 /// @author vsevolod vlaskine
 
+#include "duration.h"
 #include "epoch.h"
 
 namespace comma { namespace timing {
 
 boost::posix_time::ptime from_seconds_since_epoch( double seconds, boost::gregorian::date e )
 {
-    long long s = seconds;
-    int microseconds = ::ceil( ( seconds - s ) * 1000000 - 0.5 ); //int microseconds = ::round( ( d - seconds ) * 1000000 ); // although ::round() is slow, have to round, since lexical cast has floating point jitter, e.g. try: boost::lexical_cast< double >( "1369179610.752231000" );
-    return boost::posix_time::ptime( e, boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( microseconds ) );
+    return boost::posix_time::ptime( e, duration::from_seconds( seconds ) );
 }
 
 } } // namespace comma { namespace timing {

From 3058703f391e10f9c49fe49f3e8a30c59b5ed97b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 15 Dec 2023 15:14:03 +1100
Subject: [PATCH 0703/1056] timing: typo fixed

---
 timing/duration.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/timing/duration.cpp b/timing/duration.cpp
index a46a0ca3f..17e082d29 100644
--- a/timing/duration.cpp
+++ b/timing/duration.cpp
@@ -11,7 +11,7 @@ boost::posix_time::time_duration from_seconds( double seconds )
 {
     long long s = seconds;
     int microseconds = ::ceil( ( seconds - s ) * 1000000 - 0.5 ); //int microseconds = ::round( ( d - seconds ) * 1000000 ); // although ::round() is slow, have to round, since lexical cast has floating point jitter, e.g. try: boost::lexical_cast< double >( "1369179610.752231000" );
-    return boost::posix_time::time_duration( boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( microseconds ) );
+    return boost::posix_time::time_duration( boost::posix_time::seconds( s ) + boost::posix_time::microseconds( microseconds ) );
 }
 
 } } } // namespace comma { namespace timing { namespace duration {

From 595f7b1ef1393c23e8d06b86cd705cd357991b5e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 20 Dec 2023 10:57:31 +1100
Subject: [PATCH 0704/1056] csv::make_output_options renamed to
 csv::options::make_same_kind; delimiter, quote, and precision copied

---
 csv/options.h | 21 ++++++++++++---------
 1 file changed, 12 insertions(+), 9 deletions(-)

diff --git a/csv/options.h b/csv/options.h
index a94c95ecf..bcc0fd8b4 100644
--- a/csv/options.h
+++ b/csv/options.h
@@ -10,12 +10,6 @@
 
 namespace comma { namespace csv {
 
-class options;
-
-/// convenience method: make output options from input options (propagate binary setting, flush); todo? add more parameters?
-template < typename T >
-static options make_output_options( const options& input_options );
-
 /// a helper class to extract csv-related command line options
 class options
 {
@@ -29,6 +23,11 @@ class options
         /// constructor
         options( const comma::command_line_options& options, const std::string& defaultFields = "", bool full_xpath = true );
 
+        /// make options from input options (propagate binary setting, flush, delimiter, etc)
+        /// typical use: make output stream options compatible with the input stream options
+        template < typename T >
+        static options make_same_kind( const options& rhs );
+
         /// return usage to incorporate into application usage
         static std::string usage( const std::string& default_fields = "", bool verbose = true );
 
@@ -98,11 +97,15 @@ class options
 };
 
 template < typename T >
-inline options make_output_options( const options& input_options )
+inline options options::make_same_kind( const options& rhs )
 {
     options o;
-    o.flush = input_options.flush;
-    if( input_options.binary() ) { o.format( format::value< T >() ); }
+    o.flush = rhs.flush;
+    o.delimiter = rhs.delimiter;
+    o.flush = rhs.flush;
+    o.precision = rhs.precision;
+    o.quote = rhs.quote;
+    if( rhs.binary() ) { o.format( format::value< T >() ); }
     return o;
 }
 

From adf3e2138d64a086b6bc91622a11f412ae8e7704 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Jan 2024 13:36:11 +1100
Subject: [PATCH 0705/1056] string: comma::replace() implemented; csv::options:
 constructor with field name aliases implemented and tested

---
 csv/options.cpp           | 16 +++++++++++-----
 csv/options.h             |  8 ++++++--
 csv/test/options_test.cpp | 36 +++++++++++++++++++++++++++++++++++-
 string/string.cpp         | 14 ++++++++++++++
 string/string.h           |  4 ++++
 5 files changed, 70 insertions(+), 8 deletions(-)

diff --git a/csv/options.cpp b/csv/options.cpp
index f6f494e8c..16733f020 100644
--- a/csv/options.cpp
+++ b/csv/options.cpp
@@ -49,10 +49,14 @@ bool options::binary() const { return static_cast< bool >( format_ ); }
 
 namespace impl {
 
-inline static void init( comma::csv::options& csv_options, const comma::command_line_options& options, const std::string& defaultFields, bool full_xpath )
+static void init( comma::csv::options& csv_options
+                , const comma::command_line_options& options
+                , const std::string& default_fields
+                , bool full_xpath
+                , const std::unordered_map< std::string, std::string >& field_aliases )
 {
     csv_options.full_xpath = full_xpath;
-    csv_options.fields = options.value( "--fields,-f", defaultFields );
+    csv_options.fields = comma::replace( options.value( "--fields,-f", default_fields ), field_aliases );
     if( options.exists( "--binary,-b" ) )
     {
         boost::optional< std::string > format = options.optional< std::string >( "--binary,-b" );
@@ -75,11 +79,13 @@ inline static void init( comma::csv::options& csv_options, const comma::command_
 
 } // namespace impl {
 
-options::options() : full_xpath( true ), delimiter( ',' ), precision( 12 ), quote( '"' ), flush( false ) {}
+options::options(): full_xpath( true ), delimiter( ',' ), precision( 12 ), quote( '"' ), flush( false ) {}
 
-options::options( int argc, char** argv, const std::string& defaultFields, bool full_xpath ) { impl::init( *this, comma::command_line_options( argc, argv ), defaultFields, full_xpath ); }
+options::options( int argc, char** argv, const std::string& default_fields, bool full_xpath ): options( comma::command_line_options( argc, argv ), default_fields, full_xpath ) {}
 
-options::options( const comma::command_line_options& options, const std::string& defaultFields, bool full_xpath ) { impl::init( *this, options, defaultFields, full_xpath ); }
+options::options( const comma::command_line_options& options, const std::string& default_fields, bool full_xpath ) { impl::init( *this, options, default_fields, full_xpath, {} ); }
+
+options::options( const comma::command_line_options& options, const std::unordered_map< std::string, std::string >& field_aliases, const std::string& default_fields ) { impl::init( *this, options, default_fields, true, field_aliases ); }
 
 std::string options::usage( const std::string& default_fields, bool verbose )
 {
diff --git a/csv/options.h b/csv/options.h
index bcc0fd8b4..bb4e79154 100644
--- a/csv/options.h
+++ b/csv/options.h
@@ -4,6 +4,7 @@
 
 #pragma once
 
+#include <unordered_map>
 #include <boost/optional.hpp>
 #include "../application/command_line_options.h"
 #include "format.h"
@@ -18,10 +19,13 @@ class options
         options();
 
         /// constructor
-        options( int argc, char** argv, const std::string& defaultFields = "", bool full_xpath = true );
+        options( int argc, char** argv, const std::string& default_fields = "", bool full_xpath = true );
 
         /// constructor
-        options( const comma::command_line_options& options, const std::string& defaultFields = "", bool full_xpath = true );
+        options( const comma::command_line_options& options, const std::string& default_fields = "", bool full_xpath = true );
+
+        /// constructor
+        options( const comma::command_line_options& options, const std::unordered_map< std::string, std::string >& field_aliases, const std::string& default_fields = "" );
 
         /// make options from input options (propagate binary setting, flush, delimiter, etc)
         /// typical use: make output stream options compatible with the input stream options
diff --git a/csv/test/options_test.cpp b/csv/test/options_test.cpp
index 8e13dd614..7d02c244b 100644
--- a/csv/test/options_test.cpp
+++ b/csv/test/options_test.cpp
@@ -28,6 +28,7 @@
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <gtest/gtest.h>
+#include "../../application/command_line_options.h"
 #include "../../csv/options.h"
 
 namespace comma {
@@ -98,5 +99,38 @@ TEST( options, has_paths )
         EXPECT_FALSE( csv.has_some_of_paths( "c" ) );
     }
 }
-    
+
+TEST( options, aliases )
+{
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "" } ), std::unordered_map< std::string, std::string >() );
+        EXPECT_EQ( csv.fields, "" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "" } ), { { "b", "x/y/b" } }, "a,b,b" );
+        EXPECT_EQ( csv.fields, "a,x/y/b,x/y/b" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=a,b,c" } ), std::unordered_map< std::string, std::string >() );
+        EXPECT_EQ( csv.fields, "a,b,c" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=,b,c" } ), { { "b", "x/y/b" } } );
+        EXPECT_EQ( csv.fields, ",x/y/b,c" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=a,b," } ), { { "b", "x/y/b" } } );
+        EXPECT_EQ( csv.fields, "a,x/y/b," );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=a,,b" } ), { { "b", "x/y/b" } } );
+        EXPECT_EQ( csv.fields, "a,,x/y/b" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=a,b,c" } ), { { "b", "x/y/b" } } );
+        EXPECT_EQ( csv.fields, "a,x/y/b,c" );
+    }
+    // todo: more tests
+}
+
 } // namespace comma {
diff --git a/string/string.cpp b/string/string.cpp
index 25b3b0a28..d75bb7ecc 100644
--- a/string/string.cpp
+++ b/string/string.cpp
@@ -139,4 +139,18 @@ std::string common_front( const std::string& s, const std::string& t, char delim
     return s.substr( 0, i );
 }
 
+std::string replace( const std::string& s, const std::unordered_map< std::string, std::string >& aliases )
+{
+    if( aliases.empty() ) { return s; }
+    auto v = comma::split( s, ',', true );
+    std::string f, comma;
+    for( const auto& e: v )
+    {
+        auto i = aliases.find( e );
+        f += comma + ( i == aliases.end() ? e : i->second );
+        comma = ",";
+    }
+    return f;
+}
+
 } // namespace comma {
diff --git a/string/string.h b/string/string.h
index 89dd93a44..0849c2d6c 100644
--- a/string/string.h
+++ b/string/string.h
@@ -7,6 +7,7 @@
 #include <stdlib.h>
 #include <sstream>
 #include <string>
+#include <unordered_map>
 #include <vector>
 #include "../string/split.h"
 
@@ -44,6 +45,9 @@ std::string join( const A& a, std::size_t size, char delimiter );
 template < typename A >
 inline std::string join( const A& a, char delimiter ) { return join( a, a.size(), delimiter ); }
 
+/// convenience function, somewhat overfit: split, replace aliased entries, join
+std::string replace( const std::string& s, const std::unordered_map< std::string, std::string >& aliases );
+
 template < typename A >
 inline std::string join( const A& a, std::size_t size, char delimiter )
 {

From 277094d0113961960a09933d9478c17ef2f940ba Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 10 Jan 2024 14:33:26 +1100
Subject: [PATCH 0706/1056] csv::leaves() implemented

---
 csv/names.h             | 29 +++++++++++++++++++++--------
 csv/test/names_test.cpp |  8 ++++++++
 2 files changed, 29 insertions(+), 8 deletions(-)

diff --git a/csv/names.h b/csv/names.h
index fdc4af7df..4d379f48c 100644
--- a/csv/names.h
+++ b/csv/names.h
@@ -4,6 +4,9 @@
 
 #pragma once
 
+#include <algorithm>
+#include <vector>
+#include <unordered_map>
 #include "../csv/impl/to_names.h"
 #include "../string/string.h"
 #include "../visiting/apply.h"
@@ -13,20 +16,20 @@ namespace comma { namespace csv {
 
 /// the most generic way: return default column names for
 /// a given sample and given subtree in comma-separated xpaths
-template < typename S >
-std::vector< std::string > names( const std::string& paths, bool useFullxpath = true, const S& sample = S() );
+template < typename S > std::vector< std::string > names( const std::string& paths, bool useFullxpath = true, const S& sample = S() );
 
 /// return default column names for a given sample and given subtree in comma-separated xpaths
-template < typename S >
-std::vector< std::string > names( const char* paths, bool useFullxpath = true, const S& sample = S() ) { return names( std::string( paths ), useFullxpath, sample ); }
+template < typename S > std::vector< std::string > names( const char* paths, bool useFullxpath = true, const S& sample = S() ) { return names( std::string( paths ), useFullxpath, sample ); }
 
 /// return default column names for a given sample
-template < typename S >
-std::vector< std::string > names( bool useFullxpath, const S& sample = S() ) { return names( "", useFullxpath, sample ); }
+template < typename S > std::vector< std::string > names( bool useFullxpath, const S& sample = S() ) { return names( "", useFullxpath, sample ); }
 
 /// return default column names for a given sample, use full xpath
-template < typename S >
-std::vector< std::string > names( const S& sample = S() ) { return names( true, sample ); }
+template < typename S > std::vector< std::string > names( const S& sample = S() ) { return names( true, sample ); }
+
+template < typename S > std::unordered_map< std::string, std::string > leaves( const std::string& paths, const S& sample = S() );
+template < typename S > std::unordered_map< std::string, std::string > leaves( const char* paths, const S& sample = S() ) { return leaves( std::string( paths ), sample ); }
+template < typename S > std::unordered_map< std::string, std::string > leaves( const S& sample = S() ) { return leaves( "", sample ); }
 
 /// return true, if all the fields from subset present in fields
 /// @todo make a generic subset application
@@ -55,4 +58,14 @@ inline std::vector< std::string > names( const std::string& paths, bool useFullx
     return r;
 }
 
+template < typename S >
+inline std::unordered_map< std::string, std::string > leaves( const std::string& paths, const S& sample )
+{
+    const auto& flat = names< S >( paths, false, sample );
+    const auto& full = names< S >( paths, true, sample );
+    std::unordered_map< std::string, std::string > m;
+    std::transform( flat.begin(), flat.end(), full.begin(), std::inserter( m, m.end() ), []( const std::string& k, const std::string& v ) { return std::make_pair( k, v ); } );
+    return m;
+}
+
 } } // namespace comma { namespace csv {
diff --git a/csv/test/names_test.cpp b/csv/test/names_test.cpp
index 07a41f975..26649b597 100644
--- a/csv/test/names_test.cpp
+++ b/csv/test/names_test.cpp
@@ -245,6 +245,14 @@ TEST( csv, names )
     EXPECT_EQ( join( names< test_struct >( ",,,,no-such-field,,," ), ',' ), ",,,,no-such-field,,," );
 }
 
+TEST( csv, leaves )
+{
+    {
+        std::unordered_map< std::string, std::string > m{ { "A", "D/A" }, { "X", "D/B/X" }, { "Y", "D/B/Y" } };
+        EXPECT_EQ( leaves< test_struct >( "D" ), m );
+    }
+}
+
 TEST( csv, names_optional_element )
 {
     EXPECT_EQ( join( names< struct_with_optional_element >(), ',' ), "x,nested/X,nested/Y" );

From 6f27b3fb29ff02a602db2a34118d01a0c16f964c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Jan 2024 13:47:14 +1100
Subject: [PATCH 0707/1056] io-cat: --sources-ordered: implemented; todo: fix
 default case, update --help...

---
 io/applications/io-cat.cpp | 23 +++++++++++++++++------
 1 file changed, 17 insertions(+), 6 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 3e9ee3543..3972725f8 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -215,7 +215,7 @@ class any_stream : public stream
         
         bool empty() const { return !connected() || closed_ || available_() == 0; }
         
-        bool eof() const { return !( *istream_ )->good() || ( *istream_ )->eof(); }
+        bool eof() const { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
         
         void close() { closed_ = true; ( *istream_ ).close(); }
         
@@ -226,7 +226,8 @@ class any_stream : public stream
         void connect()
         {
             if( istream_ ) { return; }
-            istream_.reset( new comma::io::istream( address_, comma::io::mode::binary, comma::io::mode::non_blocking ) );
+            auto blocking_mode = false ? comma::io::mode::non_blocking : comma::io::mode::blocking; // todo? expose on command line?
+            istream_.reset( new comma::io::istream( address_, comma::io::mode::binary, blocking_mode ) );
             if( ( *istream_ )() != &std::cin ) { return; }
             std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
             std::cin.tie( NULL ); // std::cin is tied to std::cout by default
@@ -262,8 +263,16 @@ static unsigned int connect_max_attempts;
 static boost::posix_time::time_duration connect_period;
 static bool permissive;
 
-static bool ready( const boost::ptr_vector< stream >& streams, comma::io::select& select, bool connected_all_we_could )
+static bool ready( const boost::ptr_vector< stream >& streams, comma::io::select& select, bool connected_all_we_could, bool ordered )
 {
+    if( ordered )
+    {
+        select.check();
+        bool r{connected_all_we_could};
+        for( unsigned int i = 0; i < streams.size() && r; ++i ) { r = streams[i].closed() || select.read().ready( streams[i].fd() ); }
+        if( !r ) { boost::this_thread::sleep( boost::posix_time::milliseconds( 10 ) ); } // quick and dirty
+        return r;
+    }
     for( unsigned int i = 0; i < streams.size(); ++i ) { if( !streams[i].empty() ) { select.check(); return true; } }
     if( !select.read()().empty() ) { return select.wait( boost::posix_time::seconds( 1 ) ) > 0; }
     if( connected_all_we_could ) { return true; }
@@ -340,15 +349,17 @@ int main( int argc, char** argv )
         comma::signal_flag is_shutdown;
         verbose = options.exists( "--verbose,-v" );
         unsigned int size = options.value( "--size,-s", 0 );
+        bool ordered = options.exists( "--sources-ordered,--ordered" );
         bool unbuffered = options.exists( "--flush,--unbuffered,-u" );
         bool exit_on_first_closed = options.exists( "--exit-on-first-closed,-e" );
+        options.assert_mutually_exclusive( "--sources-ordered,--ordered", "--permissive" );
         std::string connect_max_attempts_string = options.value< std::string >( "--connect-max-attempts,--connect-attempts,--attempts,--max-attempts", "1" );
         connect_max_attempts = connect_max_attempts_string == "unlimited" ? 0 : boost::lexical_cast< unsigned int >( connect_max_attempts_string );
         double connect_period_seconds = options.value( "--connect-period", 1.0 );
         connect_period = boost::posix_time::milliseconds( static_cast<unsigned int>(std::floor( connect_period_seconds * 1000 ) ));
         permissive = options.exists( "--permissive" );
         bool has_head = options.exists( "--head" );
-        const std::vector< std::string >& unnamed = options.unnamed( "--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
+        const std::vector< std::string >& unnamed = options.unnamed( "--sources-ordered,--ordered,--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
         #ifdef WIN32
         if( size || ( unnamed.size() == 1 && !has_head ) ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         //if( size ) { _setmode( _fileno( stdout ), _O_BINARY ); }
@@ -365,7 +376,7 @@ int main( int argc, char** argv )
         {
             if( is_shutdown ) { if( verbose ) { std::cerr << "io-cat: received signal" << std::endl; }; break; }
             bool connected_all_we_could = try_connect( streams, select );
-            if( !ready( streams, select, connected_all_we_could ) ) { continue; }
+            if( !ready( streams, select, connected_all_we_could, ordered ) ) { continue; }
             done = true;
             for( unsigned int i = 0; i < streams.size(); ++i )
             {
@@ -373,7 +384,7 @@ int main( int argc, char** argv )
                 if( streams[i].closed() ) { continue; }
                 bool ready = select.read().ready( streams[i].fd() );
                 bool empty = streams[i].empty();
-                if( empty && ( streams[i].eof() || ready ) )
+                if( empty && ( ready || streams[i].eof() ) )
                 { 
                     if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << unnamed[i] << "): closed" << std::endl; }
                     select.read().remove( streams[i].fd() );

From adda83625b1d312e0de54c45a951b5de1dbad12b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Jan 2024 14:10:10 +1100
Subject: [PATCH 0708/1056] io-cat: --sources-ordered: default case: fixed;
 todo: test, update --help...

---
 io/applications/io-cat.cpp | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 3972725f8..440509f7d 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -116,7 +116,7 @@ class stream
     public:
         stream( const std::string& address ): address_( address ) {}
         virtual ~stream() {}
-        virtual unsigned int read_available( std::vector< char >& buffer, unsigned int max_count ) = 0;
+        virtual unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking ) = 0;
         virtual comma::io::file_descriptor fd() const = 0;
         virtual bool eof() const = 0;
         virtual bool empty() const = 0;
@@ -150,7 +150,7 @@ class udp_stream : public stream
         
         comma::io::file_descriptor fd() const { return socket_->native_handle(); }
         
-        unsigned int read_available( std::vector< char >& buffer, unsigned int )
+        unsigned int read_available( std::vector< char >& buffer, unsigned int, bool )
         {
             boost::system::error_code error;
             std::size_t size = socket_->receive( boost::asio::buffer( buffer ), 0, error );
@@ -188,10 +188,10 @@ class any_stream : public stream
         
         comma::io::file_descriptor fd() const { return ( *istream_ ).fd(); }
         
-        unsigned int read_available( std::vector< char >& buffer, unsigned int max_count )
+        unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking )
         {
             std::size_t available = available_();
-            if( available == 0 ) { return 0; }
+            if( !blocking && available == 0 ) { return 0; }
             if( binary_ )
             {
                 unsigned int count = size_ ? available / size_ : 0;
@@ -396,7 +396,7 @@ int main( int argc, char** argv )
                 unsigned int countdown = round_robin_count;
                 while( !streams[i].eof() ) // todo? check is_shutdown here as well?
                 {
-                    unsigned int bytes_read = streams[i].read_available( buffer, countdown ? countdown : max_count );
+                    unsigned int bytes_read = streams[i].read_available( buffer, countdown ? countdown : max_count, ordered );
                     if( bytes_read == 0 ) { break; }
                     done = false;
                     if( size && bytes_read % size != 0 ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): expected " << size << " byte(s), got only " << ( bytes_read % size ) << std::endl; return 1; }

From a63a7b73726fc6470b3c870d997cc567dfaf0f18 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Jan 2024 14:56:49 +1100
Subject: [PATCH 0709/1056] io-cat: --sources-ordered: renamed to --blocking,
 documented in --help; todo: unit test

---
 io/applications/io-cat.cpp | 48 ++++++++++++++++++++++++++++++--------
 1 file changed, 38 insertions(+), 10 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 440509f7d..9a4cdd941 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -66,19 +66,47 @@ void usage( bool verbose = false )
     std::cerr << "options" << std::endl;
     std::cerr << "    --exit-on-first-closed,-e: exit, if one of the streams finishes" << std::endl;
     std::cerr << "    --flush,--unbuffered,-u: flush output" << std::endl;
+    std::cerr << "    --verbose,-v: more output" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "output order options" << std::endl;
+    std::cerr << "    --blocking: blocking read on each source in order sources appear on command line" << std::endl;
+    std::cerr << "                output modes" << std::endl;
+    std::cerr << "                    default:     output all records from the first source, then all" << std::endl;
+    std::cerr << "                                 records from the seconds source, etc" << std::endl;
+    std::cerr << "                    round robin: output <n> records from the first source, then <n>" << std::endl;
+    std::cerr << "                                 records from the seconds source, etc; note that if" << std::endl;
+    std::cerr << "                                 the number of records in a source is not divisible by <n>" << std::endl;
+    std::cerr << "                                 then the last records groups may contain fewer than <n>" << std::endl;
+    std::cerr << "                                 records" << std::endl;
+    std::cerr << "                attention: if you want full control over record ordering, use --blocking" << std::endl;
+    std::cerr << "                           when using subshells or sockets as io-cat inputs " << std::endl;
+    if( verbose )
+    {
+        std::cerr << "                           io-cat will open such inputs, but they may not be immediately" << std::endl;
+        std::cerr << "                           ready for reading, which may lead to records being read from sources" << std::endl;
+        std::cerr << "                           out of order;  use --blocking to avoid this problem" << std::endl;
+        std::cerr << "                           e.g. in the following command without --blocking one subshell may" << std::endl;
+        std::cerr << "                           start slightly earlier than the other and thus likely to output" << std::endl;
+        std::cerr << "                           not what you expect or want - add --blocking to fix that:" << std::endl;
+        std::cerr << "                               io-cat --round-robin=1 \\" << std::endl;
+        std::cerr << "                                      <( csv-paste line-number value=a | head -n100 ) \\" << std::endl;
+        std::cerr << "                                      <( csv-paste line-number value=b | head -n100 )" << std::endl;
+    }
+    else
+    {
+        std::cerr << "                           run io-cat --help --verbose for more details" << std::endl;
+    }
     std::cerr << "    --head=[<n>]; output first <n> records and exit without waiting for record n+1" << std::endl;
     std::cerr << "                  a workaround for sparse input fed into: io-cat ... | head -n10, which" << std::endl;
     std::cerr << "                  not exit until io-cat receives record 11" << std::endl;
     std::cerr << "                  instead run: io-cat ... --head=10 (use --flush if you don't want buffering" << std::endl;
-    std::cerr << "    --round-robin=[<number of packets>]: todo: only for multiple inputs: read not more" << std::endl;
+    std::cerr << "    --round-robin=[<number of packets>]: only for multiple inputs: read not more" << std::endl;
     std::cerr << "                                         than <number of packets> from an input at once," << std::endl;
     std::cerr << "                                         before checking other inputs" << std::endl;
     std::cerr << "                                         if not specified, read from each input" << std::endl;
     std::cerr << "                                         all available data" << std::endl;
     std::cerr << "                                         ignored for udp streams, where one full udp" << std::endl;
     std::cerr << "                                         packet at a time is always read" << std::endl;
-    std::cerr << "    --size,-s=[<size>]: packet size, if binary data (required only for multiple sources)" << std::endl;
-    std::cerr << "    --verbose,-v: more output" << std::endl;
     std::cerr << std::endl;
     std::cerr << "connect options" << std::endl;
     std::cerr << "    --connect-max-attempts,--connect-attempts,--attempts,--max-attempts=<n>; default=1; number of attempts to reconnect or 'unlimited'" << std::endl;
@@ -263,9 +291,9 @@ static unsigned int connect_max_attempts;
 static boost::posix_time::time_duration connect_period;
 static bool permissive;
 
-static bool ready( const boost::ptr_vector< stream >& streams, comma::io::select& select, bool connected_all_we_could, bool ordered )
+static bool ready( const boost::ptr_vector< stream >& streams, comma::io::select& select, bool connected_all_we_could, bool blocking )
 {
-    if( ordered )
+    if( blocking )
     {
         select.check();
         bool r{connected_all_we_could};
@@ -349,17 +377,17 @@ int main( int argc, char** argv )
         comma::signal_flag is_shutdown;
         verbose = options.exists( "--verbose,-v" );
         unsigned int size = options.value( "--size,-s", 0 );
-        bool ordered = options.exists( "--sources-ordered,--ordered" );
+        bool blocking = options.exists( "--blocking" );
         bool unbuffered = options.exists( "--flush,--unbuffered,-u" );
         bool exit_on_first_closed = options.exists( "--exit-on-first-closed,-e" );
-        options.assert_mutually_exclusive( "--sources-ordered,--ordered", "--permissive" );
+        options.assert_mutually_exclusive( "--blocking", "--permissive" );
         std::string connect_max_attempts_string = options.value< std::string >( "--connect-max-attempts,--connect-attempts,--attempts,--max-attempts", "1" );
         connect_max_attempts = connect_max_attempts_string == "unlimited" ? 0 : boost::lexical_cast< unsigned int >( connect_max_attempts_string );
         double connect_period_seconds = options.value( "--connect-period", 1.0 );
         connect_period = boost::posix_time::milliseconds( static_cast<unsigned int>(std::floor( connect_period_seconds * 1000 ) ));
         permissive = options.exists( "--permissive" );
         bool has_head = options.exists( "--head" );
-        const std::vector< std::string >& unnamed = options.unnamed( "--sources-ordered,--ordered,--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
+        const std::vector< std::string >& unnamed = options.unnamed( "--blocking,--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
         #ifdef WIN32
         if( size || ( unnamed.size() == 1 && !has_head ) ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         //if( size ) { _setmode( _fileno( stdout ), _O_BINARY ); }
@@ -376,7 +404,7 @@ int main( int argc, char** argv )
         {
             if( is_shutdown ) { if( verbose ) { std::cerr << "io-cat: received signal" << std::endl; }; break; }
             bool connected_all_we_could = try_connect( streams, select );
-            if( !ready( streams, select, connected_all_we_could, ordered ) ) { continue; }
+            if( !ready( streams, select, connected_all_we_could, blocking ) ) { continue; }
             done = true;
             for( unsigned int i = 0; i < streams.size(); ++i )
             {
@@ -396,7 +424,7 @@ int main( int argc, char** argv )
                 unsigned int countdown = round_robin_count;
                 while( !streams[i].eof() ) // todo? check is_shutdown here as well?
                 {
-                    unsigned int bytes_read = streams[i].read_available( buffer, countdown ? countdown : max_count, ordered );
+                    unsigned int bytes_read = streams[i].read_available( buffer, countdown ? countdown : max_count, blocking );
                     if( bytes_read == 0 ) { break; }
                     done = false;
                     if( size && bytes_read % size != 0 ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): expected " << size << " byte(s), got only " << ( bytes_read % size ) << std::endl; return 1; }

From 910cda894d2d8348f45f86ef6c2db138d3bf9a72 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 12 Jan 2024 17:12:55 +1100
Subject: [PATCH 0710/1056] csv-repeat: --at-least-from, --at-least-to: typo
 bug fixed: aliases handled correctly

---
 csv/applications/csv-repeat.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index 6cef51af5..5401c1173 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -224,9 +224,9 @@ int main( int ac, char** av )
             if( options.exists( "--timeout,-t" ) ) { std::cerr << "csv-repeat: for --timestamped: --timeout not supported" << std::endl; return 1; }
             comma::csv::input_stream< input_t > istream( std::cin, csv );
             boost::posix_time::ptime last;
-            if( options.exists( "--from" ) ) { last = boost::posix_time::from_iso_string( options.value< std::string >( "--at-least-from,--from" ) ); }
+            if( options.exists( "--at-least-from,--from" ) ) { last = boost::posix_time::from_iso_string( options.value< std::string >( "--at-least-from,--from" ) ); }
             boost::posix_time::ptime to;
-            if( options.exists( "--to" ) ) { to = boost::posix_time::from_iso_string( options.value< std::string >( "--at-least-to,--to" ) ); }
+            if( options.exists( "--at-least-to,--to" ) ) { to = boost::posix_time::from_iso_string( options.value< std::string >( "--at-least-to,--to" ) ); }
             std::string last_record;
             if( csv.binary() ) { last_record = std::string( csv.format().size(), 0 ); }
             auto pass = [&]( const output_t& )

From 82ee9798211817d681625d3e4c0a139117e82021 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 15 Jan 2024 16:04:42 +1100
Subject: [PATCH 0711/1056] application::command_line_options: verbosity
 levels: first cut implemented

---
 application/command_line_options.cpp | 56 ++++++++++++++++++++--------
 application/command_line_options.h   | 18 ++++++---
 2 files changed, 53 insertions(+), 21 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 9df064ad1..a2c2f6a75 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -4,6 +4,7 @@
 /// @author vsevolod vlaskine
 
 #include <algorithm>
+#include <array>
 #include <sstream>
 #include <set>
 #include <unordered_map>
@@ -24,20 +25,46 @@ namespace comma {
 namespace application { namespace detail {
 
 static std::string name;
-static bool verbose = false;
+static unsigned int verbosity_level{0};
 static boost::iostreams::stream< boost::iostreams::null_sink > null_ostream( ( boost::iostreams::null_sink() ) );
 
 } } // namespace application { namespace detail {
 
+unsigned int verbosity::level() { return comma::application::detail::verbosity_level; }
+
+unsigned int verbosity::from_string( const std::string& s )
+{
+    return   s == "none"   ? verbosity::none
+           : s == "low"    ? verbosity::low
+           : s == "medium" ? verbosity::medium
+           : s == "high"   ? verbosity::high
+           : boost::lexical_cast< unsigned int >( s );
+}
+
+std::string verbosity::usage()
+{
+    const char* s = R"verbosity(verbosity options
+    --verbose,-v; more output on stderr, same as --verbosity=1
+    --verbosity=<n>; default=0; verbosity level from 0 to 5 or 'none'(0), 'low'(1), 'medium'(2), 'high'(3)
+    --v,--vv,--vvv,--vvvv,--vvvvv; same as --verbosity from 1 to 5
+)verbosity";
+    return s;
+}
+
 std::ostream& say( std::ostream& os ) { os << comma::application::detail::name << ": "; return os; }
 
-std::ostream& saymore() { return say( comma::application::detail::verbose ? std::cerr : comma::application::detail::null_ostream ); }
+std::ostream& saymore( unsigned int verbosity ) { return say( verbosity < comma::application::detail::verbosity_level ? comma::application::detail::null_ostream : std::cerr ); }
 
-void command_line_options::_init_verbose( bool v, const std::string& path )
+void command_line_options::_init_verbose( const std::string& path )
 {
-    comma::verbose.init( v, path ); // todo: deprecate, use comma::say() and comma::saymore() instead
+    comma::application::detail::verbosity_level = verbosity::from_string( value< std::string >( "--verbosity", exists( "--verbose,-v" ) ? "1" : "0" ) );
+    static const std::array< std::string, 5 > v{{ "--vvvvv", "--vvvv", "--vvv", "--vv", "--v" }}; // add more verbosity levels if some strange people need them
+    for( unsigned int i = 0; i < v.size() && comma::application::detail::verbosity_level + i < v.size(); ++i )
+    {
+        if( exists( v[i] ) ) { comma::application::detail::verbosity_level = v.size() - i; break; }
+    }
+    comma::verbose.init( comma::application::detail::verbosity_level > 0, path ); // todo: deprecate, use comma::say() and comma::saymore() instead
     comma::application::detail::name = comma::split( path, '/' ).back(); // boost::filesystem::basename( path );
-    comma::application::detail::verbose = v;
 }
 
 command_line_options::command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage, boost::function< void( int, char** ) > bash_completion )
@@ -45,19 +72,17 @@ command_line_options::command_line_options( int argc, char ** argv, boost::funct
     argv_.resize( argc );
     for( int i = 0; i < argc; ++i ) { argv_[i] = argv[i]; }
     _fill_map( argv_ );
-    bool v = exists("--verbose,-v");
-    _init_verbose( v, argv[0] );
+    _init_verbose( argv[0] );
     if( bash_completion && exists( "--bash-completion" ) ) { bash_completion( argc, argv ); exit( 0 ); }
-    if( usage && exists( "--help,-h" ) ) { usage( v ); exit( 0 ); }
+    if( usage && exists( "--help,-h" ) ) { usage( comma::application::detail::verbosity_level > 0 ); exit( 0 ); }
 }
 
 command_line_options::command_line_options( const std::vector< std::string >& argv, boost::function< void( bool ) > usage )
     : argv_( argv )
 {
     _fill_map( argv_ );
-    bool v = exists( "--verbose,-v" );
-    _init_verbose( v, argv[0] );
-    if( usage && exists( "--help,-h" ) ) { usage( v ); exit( 1 ); }
+    _init_verbose( argv[0] );
+    if( usage && exists( "--help,-h" ) ) { usage( comma::application::detail::verbosity_level > 0 ); exit( 1 ); }
 }
 
 std::string command_line_options::escaped( const std::string& s ) // quick and dirty
@@ -86,16 +111,15 @@ const std::vector< std::string >& command_line_options::argv() const { return ar
 bool command_line_options::exists( const std::string& name ) const
 {
     std::vector< std::string > names = comma::split( name, ',' );
-    for( std::size_t i = 0; i < names.size(); ++i )
-    {
-        if( map_.find( names[i] ) != map_.end() ) { return true; }
-    }
+    for( const std::string& n: names ) { if( map_.find( n ) != map_.end() ) { return true; } }
     return false;
 }
 
 std::vector< std::string > command_line_options::unnamed( const std::string& valueless_options, const std::string& options_with_values ) const
 {
-    std::vector< std::string > valueless = split( valueless_options, ',' );
+
+    std::vector< std::string > valueless{ "--verbose", "-v", "--v", "--vv", "--vvv", "--vvvv", "--vvvvv" };
+    if( !valueless_options.empty() ) { valueless = split( valueless_options + ",--verbose,-v,--v,--vv,--vvv,--vvvv,--vvvvv", ',' ); }
     std::vector< std::string > valued = split( options_with_values, ',' );
     std::vector< std::string > w;
     for( unsigned int i = 1; i < argv_.size(); ++i )
diff --git a/application/command_line_options.h b/application/command_line_options.h
index a7613c3e8..8bc885418 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -18,6 +18,14 @@
 
 namespace comma {
 
+struct verbosity
+{
+    enum levels { none=0, low=1, medium=2, high=3 }; // todo: more levels and or aliases like warning, info, debug - but when choosing names, remember: verbosity is not the same as logging!
+    static unsigned int level();
+    static unsigned int from_string( const std::string& s );
+    static std::string usage();
+};
+
 /// @example
 ///      in my-application:
 ///          say() << "some message";
@@ -30,7 +38,8 @@ std::ostream& say( std::ostream& os = std::cerr );
 ///          saymore() << "some debug message";
 ///      if run as: my-application --verbose, will print on stderr:
 ///          my-application: some debug message
-std::ostream& saymore();
+///      define verbosity level on command line as --verbosity-level=3 or equivalently --vvv
+std::ostream& saymore( unsigned int verbosity = verbosity::low );
     
 /// a simple command line options class
 class command_line_options
@@ -154,7 +163,7 @@ class command_line_options
         map_type_ map_;
         std::vector< std::string > names_;
         void _fill_map( const std::vector< std::string >& v );
-        void _init_verbose( bool v, const std::string& path );
+        void _init_verbose( const std::string& path );
         template < typename T > static T lexical_cast_( const std::string& s );
         
 };
@@ -166,9 +175,8 @@ template< typename Iterator > inline command_line_options::command_line_options(
     _fill_map( argv_ );
     if( usage && exists( "--help,-h" ) )
     {
-        bool v = exists( "--verbose,-v" );
-        _init_verbose( v, *begin );
-        usage( v );
+        _init_verbose( *begin );
+        usage( verbosity::level() > 0 );
         exit( 0 );
     }
 }

From 77a3a501bc59f344f6838555f04893996509cb2c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 15 Jan 2024 16:49:48 +1100
Subject: [PATCH 0712/1056] application::command_line_options: verbosity
 levels: bug fixed; say(verbosity) implemented

---
 application/command_line_options.cpp | 8 +++++---
 application/command_line_options.h   | 8 ++++++--
 packed/test/CMakeLists.txt           | 2 +-
 3 files changed, 12 insertions(+), 6 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index a2c2f6a75..49c709f15 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -51,9 +51,11 @@ std::string verbosity::usage()
     return s;
 }
 
-std::ostream& say( std::ostream& os ) { os << comma::application::detail::name << ": "; return os; }
-
-std::ostream& saymore( unsigned int verbosity ) { return say( verbosity < comma::application::detail::verbosity_level ? comma::application::detail::null_ostream : std::cerr ); }
+std::ostream& say( std::ostream& os, unsigned int verbosity )
+{ 
+    ( verbosity > comma::application::detail::verbosity_level ? comma::application::detail::null_ostream : os ) << comma::application::detail::name << ": ";
+    return os;
+}
 
 void command_line_options::_init_verbose( const std::string& path )
 {
diff --git a/application/command_line_options.h b/application/command_line_options.h
index 8bc885418..76c5e94b5 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -31,15 +31,19 @@ struct verbosity
 ///          say() << "some message";
 ///      will print on stderr:
 ///          my-application: some message
-std::ostream& say( std::ostream& os = std::cerr );
+std::ostream& say( std::ostream& os, unsigned int verbosity=0 );
+inline std::ostream& say( unsigned int verbosity=0 ) { return say( std::cerr, verbosity ); }
 
+/// convenience alias of say( verbosity )
 /// @example
 ///      in my-application
 ///          saymore() << "some debug message";
+///          saymore( 2 ) << "some debug message at medium verbosity";
+///          saymore( comma::verbosity::medium ) << "some debug message at medium verbosity";
 ///      if run as: my-application --verbose, will print on stderr:
 ///          my-application: some debug message
 ///      define verbosity level on command line as --verbosity-level=3 or equivalently --vvv
-std::ostream& saymore( unsigned int verbosity = verbosity::low );
+inline std::ostream& saymore( unsigned int verbosity=comma::verbosity::low ) { return say( verbosity ); }
     
 /// a simple command line options class
 class command_line_options
diff --git a/packed/test/CMakeLists.txt b/packed/test/CMakeLists.txt
index ab1f5d597..c503d81e2 100644
--- a/packed/test/CMakeLists.txt
+++ b/packed/test/CMakeLists.txt
@@ -2,7 +2,7 @@ set( KIT packed )
 file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
 set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
 add_executable( ${test_name} ${source} )
-target_link_libraries( ${test_name} comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread )
+target_link_libraries( ${test_name} comma_application comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread )
 add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
 if( INSTALL_TESTS )
     install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )

From 660c2eff721ad14ca0e29caaf6719a9286b2731b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 15 Jan 2024 17:08:35 +1100
Subject: [PATCH 0713/1056] application::command_line_options: verbosity
 levels: bug fixed

---
 application/command_line_options.cpp | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 49c709f15..a10cddeb7 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -52,9 +52,8 @@ std::string verbosity::usage()
 }
 
 std::ostream& say( std::ostream& os, unsigned int verbosity )
-{ 
-    ( verbosity > comma::application::detail::verbosity_level ? comma::application::detail::null_ostream : os ) << comma::application::detail::name << ": ";
-    return os;
+{
+    return ( verbosity > comma::application::detail::verbosity_level ? comma::application::detail::null_ostream : os ) << comma::application::detail::name << ": ";
 }
 
 void command_line_options::_init_verbose( const std::string& path )

From c3a4e7b96221a8bebc19286c97c8301e45d3fc70 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 15 Jan 2024 17:16:09 +1100
Subject: [PATCH 0714/1056] application::command_line_options: verbosity
 levels: --vvvvv, etc replaced with -vvvvv

---
 application/command_line_options.cpp | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index a10cddeb7..ab97c2e86 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -46,7 +46,7 @@ std::string verbosity::usage()
     const char* s = R"verbosity(verbosity options
     --verbose,-v; more output on stderr, same as --verbosity=1
     --verbosity=<n>; default=0; verbosity level from 0 to 5 or 'none'(0), 'low'(1), 'medium'(2), 'high'(3)
-    --v,--vv,--vvv,--vvvv,--vvvvv; same as --verbosity from 1 to 5
+    -v,-vv,-vvv,-vvvv,-vvvvv; same as --verbosity from 1 to 5
 )verbosity";
     return s;
 }
@@ -59,7 +59,7 @@ std::ostream& say( std::ostream& os, unsigned int verbosity )
 void command_line_options::_init_verbose( const std::string& path )
 {
     comma::application::detail::verbosity_level = verbosity::from_string( value< std::string >( "--verbosity", exists( "--verbose,-v" ) ? "1" : "0" ) );
-    static const std::array< std::string, 5 > v{{ "--vvvvv", "--vvvv", "--vvv", "--vv", "--v" }}; // add more verbosity levels if some strange people need them
+    static const std::array< std::string, 5 > v{{ "-vvvvv", "-vvvv", "-vvv", "-vv", "-v" }}; // add more verbosity levels if some strange people need them
     for( unsigned int i = 0; i < v.size() && comma::application::detail::verbosity_level + i < v.size(); ++i )
     {
         if( exists( v[i] ) ) { comma::application::detail::verbosity_level = v.size() - i; break; }
@@ -119,8 +119,8 @@ bool command_line_options::exists( const std::string& name ) const
 std::vector< std::string > command_line_options::unnamed( const std::string& valueless_options, const std::string& options_with_values ) const
 {
 
-    std::vector< std::string > valueless{ "--verbose", "-v", "--v", "--vv", "--vvv", "--vvvv", "--vvvvv" };
-    if( !valueless_options.empty() ) { valueless = split( valueless_options + ",--verbose,-v,--v,--vv,--vvv,--vvvv,--vvvvv", ',' ); }
+    std::vector< std::string > valueless{ "--verbose", "-v", "-vv", "-vvv", "-vvvv", "-vvvvv" };
+    if( !valueless_options.empty() ) { valueless = split( valueless_options + ",--verbose,-v,-vv,-vvv,-vvvv,-vvvvv", ',' ); }
     std::vector< std::string > valued = split( options_with_values, ',' );
     std::vector< std::string > w;
     for( unsigned int i = 1; i < argv_.size(); ++i )

From dc6a02bc6c707fc00595120898006369d883ebc8 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 16 Jan 2024 12:31:27 +1100
Subject: [PATCH 0715/1056] comma-build: auto-completion: sudo-install added

---
 util/applications/comma-build | 1 +
 1 file changed, 1 insertion(+)

diff --git a/util/applications/comma-build b/util/applications/comma-build
index 487624c58..e1f4ed709 100755
--- a/util/applications/comma-build
+++ b/util/applications/comma-build
@@ -170,6 +170,7 @@ list-commits
 pack
 pull
 push
+sudo-install
 eof
 }
 

From 6b2ec88128926d864ca27b8753b24550861b60f0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 17 Jan 2024 16:23:59 +1100
Subject: [PATCH 0716/1056] comma-name-value-util: comma_path_value_mangle
 [<delimiter>] [<default_value>] semantics implemented

---
 bash/comma-name-value-util | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/bash/comma-name-value-util b/bash/comma-name-value-util
index 4405ad058..1774a7478 100644
--- a/bash/comma-name-value-util
+++ b/bash/comma-name-value-util
@@ -39,6 +39,9 @@ readonly comma_name_value_util_include_guard_=1
     || source $( type -p comma-log-util ) \
     || { echo "$name: cannot source 'comma-log-util' from '$BASH_SOURCE'" >&2; exit 1; }
 
+# usage: echo <path-value pairs> | comma_path_value_mangle [<delimiter>] [<default_value>]
+#        <delimiter>: default='_'
+#
 # take path-value pairs, mangle path to turn them into bash
 # expressions, e.g:
 # echo hello/world=5 | comma_path_value_mangle
@@ -53,7 +56,7 @@ readonly comma_name_value_util_include_guard_=1
 # local hello_world="5"
 function comma_path_value_mangle()
 {
-    local delimiter="$1"
+    local delimiter="$1" default_value="$2"
     [[ -n "$delimiter" ]] || delimiter="_"
     local path name value
     while IFS='=' read -r path value || [[ -n "$path" ]]; do
@@ -64,6 +67,7 @@ function comma_path_value_mangle()
         name=${name//]/}        # just remove trailing ] since it's always followed by / or the end of the line
         value="${value#\"}"
         value="${value%\"}"
+        [[ -n "$value" || -z "$default_value" ]] || value="$default_value"
         echo "$name='$value'"
     done
 }

From e990525f655ea2927658f0009e6483d44d95fc98 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 17 Jan 2024 16:31:42 +1100
Subject: [PATCH 0717/1056] comma_path_value_mangle: unit test added

---
 .../comma_name_value_util/comma_path_value_mangle/expected     | 3 +++
 bash/test/comma_name_value_util/comma_path_value_mangle/test   | 1 +
 2 files changed, 4 insertions(+)

diff --git a/bash/test/comma_name_value_util/comma_path_value_mangle/expected b/bash/test/comma_name_value_util/comma_path_value_mangle/expected
index 2df059ba9..54da3e682 100644
--- a/bash/test/comma_name_value_util/comma_path_value_mangle/expected
+++ b/bash/test/comma_name_value_util/comma_path_value_mangle/expected
@@ -9,3 +9,6 @@ dashes/a_b_c='1'
 path_with_dashes/a_b_c='1'
 subscript/a_b_0='1'
 subscript_followed_by_path/a_b_0_c='1'
+a="123"
+b="123"
+c="123"
\ No newline at end of file
diff --git a/bash/test/comma_name_value_util/comma_path_value_mangle/test b/bash/test/comma_name_value_util/comma_path_value_mangle/test
index 06dabc782..78f608eff 100755
--- a/bash/test/comma_name_value_util/comma_path_value_mangle/test
+++ b/bash/test/comma_name_value_util/comma_path_value_mangle/test
@@ -15,3 +15,4 @@ echo "a-b-c=1" | comma_path_value_mangle | sed 's|^|dashes/|'
 echo "a/b-c=1" | comma_path_value_mangle | sed 's|^|path_with_dashes/|'
 echo "a/b[0]=1" | comma_path_value_mangle | sed 's|^|subscript/|'
 echo "a/b[0]/c=1" | comma_path_value_mangle | sed 's|^|subscript_followed_by_path/|'
+( echo a; echo b; echo c ) | comma_path_value_mangle '_' 123
\ No newline at end of file

From b7d7d7911432e7b58018f00b6952775a675fcd3c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 22 Jan 2024 11:06:58 +1100
Subject: [PATCH 0718/1056] 
 application/applications/test/comma_options_to_name_value: a (seeming)
 misnomer in tests fixed

---
 .../comma_options_to_name_value/basic/test     |  4 ++--
 .../double_quotes/test                         | 18 +++++++++---------
 .../comma_options_to_name_value/no_quotes/test |  8 ++++----
 .../single_quotes/test                         | 16 ++++++++--------
 util/applications/comma-test-run               | 12 ++++++------
 5 files changed, 29 insertions(+), 29 deletions(-)

diff --git a/application/applications/test/comma_options_to_name_value/basic/test b/application/applications/test/comma_options_to_name_value/basic/test
index f59d8cb29..5fb476ae6 100755
--- a/application/applications/test/comma_options_to_name_value/basic/test
+++ b/application/applications/test/comma_options_to_name_value/basic/test
@@ -2,6 +2,6 @@
 
 set -e
 
-echo '--var=[<var>]; default=10; help text' | comma-options-to-name-value "--var=1" | sed 's|"||g; s|^|given_value/|'
-echo '--var=[<var>]; default=10; help text' | comma-options-to-name-value "" | sed 's|"||g; s|^|default_value/|'
+echo '--var=<var>; default=10; help text' | comma-options-to-name-value "--var=1" | sed 's|"||g; s|^|given_value/|'
+echo '--var=<var>; default=10; help text' | comma-options-to-name-value  | sed 's|"||g; s|^|default_value/|'
 
diff --git a/application/applications/test/comma_options_to_name_value/double_quotes/test b/application/applications/test/comma_options_to_name_value/double_quotes/test
index eedda9e75..58da3a61c 100755
--- a/application/applications/test/comma_options_to_name_value/double_quotes/test
+++ b/application/applications/test/comma_options_to_name_value/double_quotes/test
@@ -2,18 +2,18 @@
 
 set -e
 
-echo '--var=[<var>]; default="blah"; help text' | comma-options-to-name-value "" | sed 's|^|basic/|'
-echo '--var=[<var>]; default="blah blah"; help text' | comma-options-to-name-value "" | sed 's|^|space_inside/|'
-echo '--var=[<var>]; default="blah" ; help text' | comma-options-to-name-value "" | sed 's|^|space_outside/|'
-echo '--var=[<var>]; default="blah;blah" ; help text' | comma-options-to-name-value "" | sed 's|^|semicolon_inside/|'
-echo '--var=[<var>]; default="blah"' | comma-options-to-name-value "" | sed 's|^|no_help/basic/|'
-echo '--var=[<var>]; default="blah" ' | comma-options-to-name-value "" | sed 's|^|no_help/space_outside/|'
-echo '--var=[<var>]; default="blah";' | comma-options-to-name-value "" | sed 's|^|no_help/semicolon/|'
+echo '--var=[<var>]; default="blah"; help text' | comma-options-to-name-value | sed 's|^|basic/|'
+echo '--var=[<var>]; default="blah blah"; help text' | comma-options-to-name-value | sed 's|^|space_inside/|'
+echo '--var=[<var>]; default="blah" ; help text' | comma-options-to-name-value | sed 's|^|space_outside/|'
+echo '--var=[<var>]; default="blah;blah" ; help text' | comma-options-to-name-value | sed 's|^|semicolon_inside/|'
+echo '--var=[<var>]; default="blah"' | comma-options-to-name-value | sed 's|^|no_help/basic/|'
+echo '--var=[<var>]; default="blah" ' | comma-options-to-name-value | sed 's|^|no_help/space_outside/|'
+echo '--var=[<var>]; default="blah";' | comma-options-to-name-value | sed 's|^|no_help/semicolon/|'
 
-cat <<END | comma-options-to-name-value "" | sed 's|^|escaped_quotes/|'
+cat <<END | comma-options-to-name-value | sed 's|^|escaped_quotes/|'
 --var=[<var>]; default="blah=\"\$value\""
 END
 
-cat <<END | comma-options-to-name-value "" | sed 's|^|single_quotes/|'
+cat <<END | comma-options-to-name-value | sed 's|^|single_quotes/|'
 --var=[<var>]; default="blah='\$value'"
 END
diff --git a/application/applications/test/comma_options_to_name_value/no_quotes/test b/application/applications/test/comma_options_to_name_value/no_quotes/test
index 759223f7a..5f836cfec 100755
--- a/application/applications/test/comma_options_to_name_value/no_quotes/test
+++ b/application/applications/test/comma_options_to_name_value/no_quotes/test
@@ -2,8 +2,8 @@
 
 set -e
 
-echo '--var=[<var>]; default=10 ; help text' | comma-options-to-name-value "" | sed 's|"||g; s|^|space_with_help/|'
-echo '--var=[<var>]; default=10;' | comma-options-to-name-value "" | sed 's|"||g; s|^|semicolon_no_help/|'
-echo '--var=[<var>]; default=10' | comma-options-to-name-value "" | sed 's|"||g; s|^|no_help/|'
-echo '--var=[<var>]; default=10 ' | comma-options-to-name-value "" | sed 's|"||g; s|^|space_no_help/|'
+echo '--var=[<var>]; default=10 ; help text' | comma-options-to-name-value | sed 's|"||g; s|^|space_with_help/|'
+echo '--var=[<var>]; default=10;' | comma-options-to-name-value | sed 's|"||g; s|^|semicolon_no_help/|'
+echo '--var=[<var>]; default=10' | comma-options-to-name-value | sed 's|"||g; s|^|no_help/|'
+echo '--var=[<var>]; default=10 ' | comma-options-to-name-value | sed 's|"||g; s|^|space_no_help/|'
 
diff --git a/application/applications/test/comma_options_to_name_value/single_quotes/test b/application/applications/test/comma_options_to_name_value/single_quotes/test
index 0aa4c480c..0c8b0a558 100755
--- a/application/applications/test/comma_options_to_name_value/single_quotes/test
+++ b/application/applications/test/comma_options_to_name_value/single_quotes/test
@@ -2,14 +2,14 @@
 
 set -e
 
-echo "--var=[<var>]; default='blah'; help text" | comma-options-to-name-value "" | sed 's|^|basic/|'
-echo "--var=[<var>]; default='blah blah'; help text" | comma-options-to-name-value "" | sed 's|^|space_inside/|'
-echo "--var=[<var>]; default='blah;blah' ; help text" | comma-options-to-name-value "" | sed 's|^|semicolon_inside/|'
-echo "--var=[<var>]; default='blah' ; help text" | comma-options-to-name-value "" | sed 's|^|space_outside/|'
-echo "--var=[<var>]; default='blah'" | comma-options-to-name-value "" | sed 's|^|no_help/basic/|'
-echo "--var=[<var>]; default='blah' " | comma-options-to-name-value "" | sed 's|^|no_help/space_outside/|'
-echo "--var=[<var>]; default='blah';" | comma-options-to-name-value "" | sed 's|^|no_help/semicolon/|'
+echo "--var=[<var>]; default='blah'; help text" | comma-options-to-name-value | sed 's|^|basic/|'
+echo "--var=[<var>]; default='blah blah'; help text" | comma-options-to-name-value | sed 's|^|space_inside/|'
+echo "--var=[<var>]; default='blah;blah' ; help text" | comma-options-to-name-value | sed 's|^|semicolon_inside/|'
+echo "--var=[<var>]; default='blah' ; help text" | comma-options-to-name-value | sed 's|^|space_outside/|'
+echo "--var=[<var>]; default='blah'" | comma-options-to-name-value | sed 's|^|no_help/basic/|'
+echo "--var=[<var>]; default='blah' " | comma-options-to-name-value | sed 's|^|no_help/space_outside/|'
+echo "--var=[<var>]; default='blah';" | comma-options-to-name-value | sed 's|^|no_help/semicolon/|'
 
-cat <<END | comma-options-to-name-value "" | sed 's|^|escaped_quotes/|'
+cat <<END | comma-options-to-name-value | sed 's|^|escaped_quotes/|'
 --var=[<var>]; default='blah="\$value"'
 END
diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 708099572..e3a933c1a 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -278,7 +278,7 @@ function error_()
         local bold=$( tput bold )
         local red=$( tput setaf 1 )
         local normal=$( tput sgr0 )
-        echo -e "$bold$red$*$normal" >&2
+        echo -e "${bold}${red}$*${normal}" >&2
     fi
 }
 export -f error_
@@ -286,7 +286,7 @@ export -f error_
 function error_and_junit_()
 {
     local -r error_and_junit_formatted=$( echo -e "$1" )
-    error_ $( head -1 <<< "$error_and_junit_formatted" )
+    error_ "$( head -1 <<< "comma-test-run: $error_and_junit_formatted" )" # quoted: pass the first line verbatim, no word splitting or glob expansion
     local -r error_and_junit_formatted_tail="$( tail -n +2 <<< "$error_and_junit_formatted" )"
     [[ -z "$error_and_junit_formatted_tail" ]] || cat >&2 <<< "$error_and_junit_formatted_tail"
     if [[ -n "$options_output_junit" && -d 'output' ]] ; then cat >> 'output/junit.failure.log' <<< "$error_and_junit_formatted" ; fi
@@ -595,8 +595,8 @@ function run_and_match_test()
 
     local env_variables="PYTHONPATH,XDG_RUNTIME_DIR,DISPLAY"
     
-    rm -rf output || { error_and_junit_ "Unable to remove 'output' directory" ; return 1 ; }
-    mkdir -p output || { error_and_junit_ "Unable to make 'output' directory" ; return 1 ; }
+    rm -rf output || { error_and_junit_ "unable to remove 'output' directory" ; return 1 ; }
+    mkdir -p output || { error_and_junit_ "unable to make 'output' directory" ; return 1 ; }
 
     {
         if [[ -f ./input ]] ; then cat ./input ; fi | comma_env --import "$env_variables" "$test_exec" "$path" $verbose $options_test_option
@@ -648,9 +648,9 @@ function run_and_match_test()
         if [[ -n "$options_always_expected" ]] ; then
             for global_expected in $options_always_expected ; do match_expected "$global_expected" "is_global" ; done
         fi
-        echo -e '\n# After comma-test-match in comma-test-run' >> 'output/stdout.log'
+        echo -e '\n# after comma-test-match in comma-test-run' >> 'output/stdout.log'
         if [[ -n "$match_output" ]]; then
-            error_and_junit_ "Test output does not match expected:\nexpected output:\n$match_output"
+            error_and_junit_ "test output does not match expected:\nexpected output:\n$match_output"
             return 1
         fi
     }

From 3a22e708e7780aef1d7c0a38f1d0a76d4be012cb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 22 Jan 2024 15:11:06 +1100
Subject: [PATCH 0719/1056] comma::say(): adding convenience macros

---
 application/command_line_options.cpp | 21 ++++++++++++++-------
 application/command_line_options.h   | 13 ++++++++++---
 2 files changed, 24 insertions(+), 10 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index ab97c2e86..d303d5604 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -34,26 +34,33 @@ unsigned int verbosity::level() { return comma::application::detail::verbosity_l
 
 unsigned int verbosity::from_string( const std::string& s )
 {
-    return   s == "none"   ? verbosity::none
-           : s == "low"    ? verbosity::low
-           : s == "medium" ? verbosity::medium
-           : s == "high"   ? verbosity::high
+    return   s == "none"                     ? verbosity::none
+           : s == "low"    || s == "error"   ? verbosity::low
+           : s == "medium" || s == "warning" ? verbosity::medium
+           : s == "high"   || s == "info"    ? verbosity::high
+           : s == "debug"  || s == "extreme" ? verbosity::extreme
            : boost::lexical_cast< unsigned int >( s );
 }
 
+const std::string verbosity::to_string( unsigned int v ) // name of verbosity level v; inverse of from_string() for named levels 1 to 4 only
+{
+    static const std::array< std::string, 5 > s{{ "", "low", "medium", "high", "extreme" }}; // indexed by level; note: level 0 maps to an empty string, not to "none"
+    return v < s.size() ? s[v] : ""; // levels above 4 have no name: empty string returned; todo? output lexical cast of v instead
+}
+
 std::string verbosity::usage()
 {
     const char* s = R"verbosity(verbosity options
     --verbose,-v; more output on stderr, same as --verbosity=1
-    --verbosity=<n>; default=0; verbosity level from 0 to 5 or 'none'(0), 'low'(1), 'medium'(2), 'high'(3)
+    --verbosity=<n>; default=0; verbosity level from 0 to 5 or 'none'(0), 'low'|'error'(1), 'medium'|'warning'(2), 'high'|'info'(3), 'extreme'|'debug'(4)
     -v,-vv,-vvv,-vvvv,-vvvvv; same as --verbosity from 1 to 5
 )verbosity";
     return s;
 }
 
-std::ostream& say( std::ostream& os, unsigned int verbosity )
+std::ostream& say( std::ostream& os, unsigned int verbosity, const std::string& prefix )
 {
-    return ( verbosity > comma::application::detail::verbosity_level ? comma::application::detail::null_ostream : os ) << comma::application::detail::name << ": ";
+    return ( verbosity > comma::application::detail::verbosity_level ? comma::application::detail::null_ostream : os ) << comma::application::detail::name << ": " << ( prefix.empty() ? std::string() : ( prefix + ": " ) );
 }
 
 void command_line_options::_init_verbose( const std::string& path )
diff --git a/application/command_line_options.h b/application/command_line_options.h
index 76c5e94b5..b75d490d6 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -20,9 +20,10 @@ namespace comma {
 
 struct verbosity
 {
-    enum levels { none=0, low=1, medium=2, high=3 }; // todo: more levels and or aliases like warning, info, debug - but when choosing names, remember: verbosity is not the same as logging!
+    enum levels { none=0, low=1, medium=2, high=3, extreme=4 }; // todo: more levels and or aliases like warning, info, debug - but when choosing names, remember: verbosity is not the same as logging!
     static unsigned int level();
     static unsigned int from_string( const std::string& s );
+    static const std::string to_string( unsigned int v );
     static std::string usage();
 };
 
@@ -31,8 +32,14 @@ struct verbosity
 ///          say() << "some message";
 ///      will print on stderr:
 ///          my-application: some message
-std::ostream& say( std::ostream& os, unsigned int verbosity=0 );
-inline std::ostream& say( unsigned int verbosity=0 ) { return say( std::cerr, verbosity ); }
+std::ostream& say( std::ostream& os, unsigned int verbosity=0, const std::string& prefix="" );
+inline std::ostream& say( unsigned int verbosity=0, const std::string& prefix="" ) { return say( std::cerr, verbosity, prefix ); }
+#define COMMA_SAY ( say( verbosity::none ) << __FILE__ << ": " << __FUNCTION__ << ": " << __LINE__ << ": " )
+#define COMMA_SAY_ERROR ( say( verbosity::low ) << "error: " )
+#define COMMA_SAY_WARN ( say( verbosity::medium ) << "warning: " )
+#define COMMA_SAY_INFO ( say( verbosity::high ) << "info: " )
+#define COMMA_SAY_DEBUG ( say( verbosity::extreme ) << "debug: " )
+#define COMMA_SAY_TRACE ( say( 5 ) << "trace: " << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " )
 
 /// convenience alias of say( verbosity )
 /// @example

From 5501aa14a8552cdd554ac5d022f80f206e0e529b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 22 Jan 2024 16:26:55 +1100
Subject: [PATCH 0720/1056] COMMA_SAY_* macros implemented

---
 application/command_line_options.h | 15 +++++++++------
 1 file changed, 9 insertions(+), 6 deletions(-)

diff --git a/application/command_line_options.h b/application/command_line_options.h
index b75d490d6..b76efb5d0 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -34,12 +34,15 @@ struct verbosity
 ///          my-application: some message
 std::ostream& say( std::ostream& os, unsigned int verbosity=0, const std::string& prefix="" );
 inline std::ostream& say( unsigned int verbosity=0, const std::string& prefix="" ) { return say( std::cerr, verbosity, prefix ); }
-#define COMMA_SAY ( say( verbosity::none ) << __FILE__ << ": " << __FUNCTION__ << ": " << __LINE__ << ": " )
-#define COMMA_SAY_ERROR ( say( verbosity::low ) << "error: " )
-#define COMMA_SAY_WARN ( say( verbosity::medium ) << "warning: " )
-#define COMMA_SAY_INFO ( say( verbosity::high ) << "info: " )
-#define COMMA_SAY_DEBUG ( say( verbosity::extreme ) << "debug: " )
-#define COMMA_SAY_TRACE ( say( 5 ) << "trace: " << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " )
+
+/// convenience macros: message is a stream expression, e.g. COMMA_SAY_INFO( "read " << n << " records" ); it is evaluated only if the macro's level does not exceed the current verbosity level; each macro appends std::endl
+#define _COMMA_SAY( _level, _message ) { if( _level <= ::comma::verbosity::level() ) { ::comma::say( _level ) << _message; } } // expands to a braced block, not to a single statement: use braces when calling it in if/else
+#define COMMA_SAY( message )       _COMMA_SAY( 0,                message << std::endl )
+#define COMMA_SAY_ERROR( message ) _COMMA_SAY( 1, "error: "   << message << std::endl )
+#define COMMA_SAY_WARN( message )  _COMMA_SAY( 2, "warning: " << message << std::endl )
+#define COMMA_SAY_INFO( message )  _COMMA_SAY( 3, "info: "    << message << std::endl )
+#define COMMA_SAY_DEBUG( message ) _COMMA_SAY( 4, "debug: "   << message << std::endl )
+#define COMMA_SAY_TRACE( message ) _COMMA_SAY( 5, "trace: "   << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " << message << std::endl )
 
 /// convenience alias of say( verbosity )
 /// @example

From 2d00ba1abdd0020611769c33087d730480ba3b7f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 23 Jan 2024 16:46:14 +1100
Subject: [PATCH 0721/1056] csv-join: --block-less: first cut (with a clumsy
 option name) implemented; basic unit test added

---
 csv/applications/csv-join.cpp         | 108 ++++++++++++++++----------
 csv/test/csv-join/block_less/expected |  58 ++++++++++++++
 csv/test/csv-join/block_less/input    |   8 ++
 3 files changed, 133 insertions(+), 41 deletions(-)
 create mode 100644 csv/test/csv-join/block_less/expected
 create mode 100644 csv/test/csv-join/block_less/input

diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index ae615b280..04bb6d338 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -41,6 +41,8 @@ static void usage( bool more )
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
+    std::cerr << "    --block-less; todo! better option name! input and filter block ids expected sorted" << std::endl;
+    std::cerr << "                  " << std::endl;
     std::cerr << "    --drop-id-fields,--drop-id; remove id and block fields from filter output (same as if you did csv-join|csv-shuffle)" << std::endl;
     std::cerr << "    --first-matching: output only the first matching record (a bit of hack for now, but we needed it)" << std::endl;
     std::cerr << "    --flag-matching: output all records, with 1 appended to matching records and 0 appended to not-matching records" << std::endl;
@@ -79,48 +81,59 @@ static void usage( bool more )
         std::cerr << "        any other field name: key" << std::endl;
         std::cerr << std::endl;
         std::cerr << "        block acts as a key but stream processing occurs at the end of each" << std::endl;
-        std::cerr << "        block. If no block field is given the entire input is considered to be" << std::endl;
-        std::cerr << "        one block. Blocks are required to be contiguous in the input stream." << std::endl;
+        std::cerr << "        block; if no block field is given the entire input is considered to be" << std::endl;
+        std::cerr << "        one block; blocks are required to be contiguous in the input stream" << std::endl;
     }
     else
     {
         std::cerr << "    run csv-join --help --verbose for more..." << std::endl;
     }
     std::cerr << std::endl;
-    std::cerr << "examples (try them)" << std::endl;
-    std::cerr << "    on the following data file:" << std::endl;
-    std::cerr << "        echo 1,1,2,hello > data.csv" << std::endl;
-    std::cerr << "        echo 1,2,3,hello >> data.csv" << std::endl;
-    std::cerr << "        echo 3,3,4,world >> data.csv" << std::endl;
-    std::cerr << "        echo 3,4,3,world >> data.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    join with a matching record" << std::endl;
-    std::cerr << "        echo 1,blah | csv-join --fields=id \"data.csv;fields=id\"" << std::endl;
-    std::cerr << "        echo 3,blah | csv-join --fields=id \"data.csv;fields=,,id\"" << std::endl;
-    std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\"" << std::endl;
-    std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\" --not-matching" << std::endl;
-    std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\" --strict" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    join by key which is a string" << std::endl;
-    std::cerr << "        echo 1,hello | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
-    std::cerr << "        echo 1,world | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
-    std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
-    std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string --not-matching" << std::endl;
-    std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string --strict" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    finite state machine" << std::endl;
-    std::cerr << "        csv-join --fields=event \"data.csv;fields=event,state,next_state\" --initial-state 1" << std::endl;
-    std::cerr << "        <input:1>" << std::endl;
-    std::cerr << "        <input:1>" << std::endl;
-    std::cerr << "        <input:3>" << std::endl;
-    std::cerr << "        <input:3>" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    --drop-id (same would work in binary as well)" << std::endl;
-    std::cerr << "        > echo 0,1,2,3 | csv-join --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y'" << std::endl;
-    std::cerr << "        0,1,2,3,1,A,B,3" << std::endl;
-    std::cerr << "        > echo 0,1,2,3 | csv-join --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y' --drop-id" << std::endl;
-    std::cerr << "        0,1,2,3,A,B" << std::endl;
-    std::cerr << std::endl;
+    if( more )
+    {
+        std::cerr << "examples (try them)" << std::endl;
+        std::cerr << "    on the following data file:" << std::endl;
+        std::cerr << "        echo 1,1,2,hello > data.csv" << std::endl;
+        std::cerr << "        echo 1,2,3,hello >> data.csv" << std::endl;
+        std::cerr << "        echo 3,3,4,world >> data.csv" << std::endl;
+        std::cerr << "        echo 3,4,3,world >> data.csv" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    join with a matching record" << std::endl;
+        std::cerr << "        echo 1,blah | csv-join --fields=id \"data.csv;fields=id\"" << std::endl;
+        std::cerr << "        echo 3,blah | csv-join --fields=id \"data.csv;fields=,,id\"" << std::endl;
+        std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\"" << std::endl;
+        std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\" --not-matching" << std::endl;
+        std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\" --strict" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    join by key which is a string" << std::endl;
+        std::cerr << "        echo 1,hello | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
+        std::cerr << "        echo 1,world | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
+        std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
+        std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string --not-matching" << std::endl;
+        std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string --strict" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    block id ordered, gaps in filter blocks allowed" << std::endl;
+        std::cerr << "        csv-paste line-number value=0 | head \\" << std::endl;
+        std::cerr << "            | csv-join --fields block,id <( echo 3,0; echo 6,0 )';fields=block,id' --block-less" << std::endl;
+        std::cerr << "    finite state machine" << std::endl;
+        std::cerr << "        csv-join --fields=event \"data.csv;fields=event,state,next_state\" --initial-state 1" << std::endl;
+        std::cerr << "        <input:1>" << std::endl;
+        std::cerr << "        <input:1>" << std::endl;
+        std::cerr << "        <input:3>" << std::endl;
+        std::cerr << "        <input:3>" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    --drop-id (same would work in binary as well)" << std::endl;
+        std::cerr << "        > echo 0,1,2,3 | csv-join --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y'" << std::endl;
+        std::cerr << "        0,1,2,3,1,A,B,3" << std::endl;
+        std::cerr << "        > echo 0,1,2,3 | csv-join --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y' --drop-id" << std::endl;
+        std::cerr << "        0,1,2,3,A,B" << std::endl;
+        std::cerr << std::endl;
+    }
+    else
+    {
+        std::cerr << "examples" << std::endl;
+        std::cerr << "    run csv-join --help --verbose for more..." << std::endl;
+    }
     exit( 0 );
 }
 
@@ -330,12 +343,12 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         return s;
     }
 
-    static void read_filter_block()
+    static const input< K >* read_filter_block()
     {
         static comma::csv::input_stream< input< K > > filter_stream( **filter_transport, filter_csv, default_input );
         static const input< K >* last = filter_stream.read();
         filter_map.clear();
-        if( !last ) { return; }
+        if( !last ) { return last; }
         block = last->block;
         comma::uint64 count = 0;
         static comma::signal_flag is_shutdown( comma::signal_flag::hard );
@@ -348,10 +361,12 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
             if( !last ) { break; }
         }
         if( verbose ) { std::cerr << "csv-join: read block " << block << " of " << count << " point" << ( count == 1 ? "" : "s" ) << "; hash map size: " << filter_map.size() << std::endl; }
+        return last;
     }
 
     static int run( const comma::command_line_options& options )
     {
+        bool block_less = options.exists( "--block-less" );
         std::vector< std::string > v = comma::split( stdin_csv.fields, ',' );
         std::vector< std::string > w = comma::split( filter_csv.fields, ',' );
         if( filter_id_fields_discard ) { filter_id_fields_flags.resize( w.size(), 0 ); }
@@ -419,7 +434,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         filter_transport.reset( new comma::io::istream( filter_csv.filename, filter_csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii ) );
         if( filter_transport->fd() == comma::io::invalid_file_descriptor ) { std::cerr << "csv-join: failed to open \"" << filter_csv.filename << "\"" << std::endl; return 1; }
         std::size_t discarded = 0;
-        read_filter_block();
+        auto last = read_filter_block();
         #ifdef WIN32
         if( stdin_stream.is_binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
@@ -427,7 +442,18 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         {
             const input< K >* p = stdin_stream.read();
             if( !p ) { break; }
-            if( block != p->block ) { read_filter_block(); }
+            if( block_less ) // --block-less: blocks are matched by order rather than by equality; input and filter block ids are expected sorted
+            {
+                if( p->block < block ) { continue; } // input block id is less than the id of the currently loaded filter block: skip the record
+                while( last && p->block >= last->block ) // keep loading filter blocks while the pending filter record is not beyond the input block; presumably last is the first record of the next filter block - todo: confirm in read_filter_block()
+                {
+                    last = read_filter_block();
+                }
+            }
+            else
+            {
+                if( p->block != block ) { last = read_filter_block(); } // input block id differs from the loaded filter block id: load the next filter block
+            }
             typename traits< K, Strict >::pair pair;
             if( is_state_machine )
             {
@@ -537,7 +563,7 @@ int main( int ac, char** av )
         options.assert_mutually_exclusive( "--radius,--epsilon,--string,-s,--double,--time" );
         options.assert_mutually_exclusive( "--matching,--not-matching", "--drop-id-fields,--drop-id" );
         stdin_csv = comma::csv::options( options );
-        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap,--output-swap,--nearest,--drop-id-fields,--drop-id", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--block-less,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap,--output-swap,--nearest,--drop-id-fields,--drop-id", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-join: please specify the second source" << std::endl; return 1; }
         if( unnamed.size() > 1 ) { std::cerr << "csv-join: expected one file or stream to join, got " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
         comma::name_value::parser parser( "filename", ';', '=', false );
diff --git a/csv/test/csv-join/block_less/expected b/csv/test/csv-join/block_less/expected
new file mode 100644
index 000000000..784085d5d
--- /dev/null
+++ b/csv/test/csv-join/block_less/expected
@@ -0,0 +1,58 @@
+block_less/basics[0]/output/line[0]="0,0,0,0"
+block_less/basics[0]/output/line[1]="1,0,0,0"
+block_less/basics[0]/output/line[2]="2,0,0,0"
+block_less/basics[0]/output/line[3]="3,0,0,0"
+block_less/basics[0]/output/line[4]="4,0,0,0"
+block_less/basics[0]/output/line[5]="5,0,0,0"
+block_less/basics[0]/output/line[6]="6,0,0,0"
+block_less/basics[0]/output/line[7]="7,0,0,0"
+block_less/basics[0]/output/line[8]="8,0,0,0"
+block_less/basics[0]/output/line[9]="9,0,0,0"
+block_less/basics[0]/status=0
+block_less/basics[1]/output/line[0]="3,0,3,0"
+block_less/basics[1]/output/line[1]="4,0,3,0"
+block_less/basics[1]/output/line[2]="5,0,3,0"
+block_less/basics[1]/output/line[3]="6,0,3,0"
+block_less/basics[1]/output/line[4]="7,0,3,0"
+block_less/basics[1]/output/line[5]="8,0,3,0"
+block_less/basics[1]/output/line[6]="9,0,3,0"
+block_less/basics[1]/status=0
+block_less/basics[2]/output="9,0,9,0"
+block_less/basics[2]/status=0
+block_less/basics[3]/output=""
+block_less/basics[3]/status=0
+block_less/basics[4]/output/line[0]="0,0,0,0"
+block_less/basics[4]/output/line[1]="1,0,0,0"
+block_less/basics[4]/output/line[2]="2,0,0,0"
+block_less/basics[4]/output/line[3]="3,0,0,0"
+block_less/basics[4]/output/line[4]="4,0,0,0"
+block_less/basics[4]/output/line[5]="5,0,0,0"
+block_less/basics[4]/output/line[6]="6,0,6,0"
+block_less/basics[4]/output/line[7]="7,0,6,0"
+block_less/basics[4]/output/line[8]="8,0,6,0"
+block_less/basics[4]/output/line[9]="9,0,6,0"
+block_less/basics[4]/status=0
+block_less/basics[5]/output/line[0]="3,0,3,0"
+block_less/basics[5]/output/line[1]="4,0,3,0"
+block_less/basics[5]/output/line[2]="5,0,3,0"
+block_less/basics[5]/output/line[3]="6,0,6,0"
+block_less/basics[5]/output/line[4]="7,0,6,0"
+block_less/basics[5]/output/line[5]="8,0,6,0"
+block_less/basics[5]/output/line[6]="9,0,6,0"
+block_less/basics[5]/status=0
+block_less/basics[6]/output/line[0]="3,0,3,0"
+block_less/basics[6]/output/line[1]="4,0,3,0"
+block_less/basics[6]/output/line[2]="5,0,3,0"
+block_less/basics[6]/output/line[3]="6,0,3,0"
+block_less/basics[6]/output/line[4]="7,0,3,0"
+block_less/basics[6]/output/line[5]="8,0,3,0"
+block_less/basics[6]/output/line[6]="9,0,9,0"
+block_less/basics[6]/status=0
+block_less/basics[7]/output/line[0]="3,0,3,0"
+block_less/basics[7]/output/line[1]="4,0,3,0"
+block_less/basics[7]/output/line[2]="5,0,3,0"
+block_less/basics[7]/output/line[3]="6,0,3,0"
+block_less/basics[7]/output/line[4]="7,0,3,0"
+block_less/basics[7]/output/line[5]="8,0,3,0"
+block_less/basics[7]/output/line[6]="9,0,3,0"
+block_less/basics[7]/status=0
diff --git a/csv/test/csv-join/block_less/input b/csv/test/csv-join/block_less/input
new file mode 100644
index 000000000..1cdbff01b
--- /dev/null
+++ b/csv/test/csv-join/block_less/input
@@ -0,0 +1,8 @@
+block_less/basics[0]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 0,0 )';fields=block,id' --block-less"
+block_less/basics[1]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 3,0 )';fields=block,id' --block-less"
+block_less/basics[2]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 9,0 )';fields=block,id' --block-less"
+block_less/basics[3]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 10,0 )';fields=block,id' --block-less"
+block_less/basics[4]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 0,0; echo 6,0 )';fields=block,id' --block-less"
+block_less/basics[5]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 3,0; echo 6,0 )';fields=block,id' --block-less"
+block_less/basics[6]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 3,0; echo 9,0 )';fields=block,id' --block-less"
+block_less/basics[7]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 3,0; echo 10,0 )';fields=block,id' --block-less"
\ No newline at end of file

From a99add3b5e0ebcfc0cf9b905b09ace0565ab3fc3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 23 Jan 2024 18:01:31 +1100
Subject: [PATCH 0722/1056] csv-join: negligible change

---
 csv/applications/csv-join.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index 04bb6d338..9bad81d5b 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -42,7 +42,7 @@ static void usage( bool more )
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
     std::cerr << "    --block-less; todo! better option name! input and filter block ids expected sorted" << std::endl;
-    std::cerr << "                  " << std::endl;
+    std::cerr << "                  todo! document" << std::endl;
     std::cerr << "    --drop-id-fields,--drop-id; remove id and block fields from filter output (same as if you did csv-join|csv-shuffle)" << std::endl;
     std::cerr << "    --first-matching: output only the first matching record (a bit of hack for now, but we needed it)" << std::endl;
     std::cerr << "    --flag-matching: output all records, with 1 appended to matching records and 0 appended to not-matching records" << std::endl;

From 170e47079b48545459e8a0e5de6c41bcdfd37913 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 25 Jan 2024 11:50:57 +1100
Subject: [PATCH 0723/1056] name_value: comma::json_to_string() implemented

---
 name_value/serialize.h | 48 ++++++++++++++++++++++++++----------------
 1 file changed, 30 insertions(+), 18 deletions(-)

diff --git a/name_value/serialize.h b/name_value/serialize.h
index 270ee46d2..07441b16a 100644
--- a/name_value/serialize.h
+++ b/name_value/serialize.h
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2023 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -29,11 +30,11 @@
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_NAME_VALUE_SERIALIZE_H_
-#define COMMA_NAME_VALUE_SERIALIZE_H_
+#pragma once
 
 #include <fstream>
 #include <iostream>
+#include <sstream>
 #include <string>
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/property_tree/xml_parser.hpp>
@@ -184,12 +185,15 @@ template < typename T > void read_ini( T& t, std::istream& stream );
 
 /// write json object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
-template < typename T > void write_json( const T& t, const std::string& filename, const xpath& root );
-template < typename T > void write_json( const T& t, const std::string& filename, const char* root );
-template < typename T > void write_json( const T& t, const std::string& filename );
-template < typename T > void write_json( const T& t, std::ostream& stream, const xpath& root );
-template < typename T > void write_json( const T& t, std::ostream& stream, const char* root );
-template < typename T > void write_json( const T& t, std::ostream& stream );
+template < typename T > void write_json( const T& t, const std::string& filename, const xpath& root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > void write_json( const T& t, const std::string& filename, const char* root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > void write_json( const T& t, const std::string& filename, bool pretty = true, bool unquote_numbers = true );
+template < typename T > void write_json( const T& t, std::ostream& stream, const xpath& root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > void write_json( const T& t, std::ostream& stream, const char* root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > void write_json( const T& t, std::ostream& stream, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::string json_to_string( const T& t, const xpath& root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::string json_to_string( const T& t, const char* root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::string json_to_string( const T& t, bool pretty = true, bool unquote_numbers = true );
 
 /// write xml object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
@@ -376,27 +380,37 @@ template < typename T > inline void read_ini( T& t, std::istream& stream, const
 template < typename T > inline void read_ini( T& t, std::istream& stream, bool permissive ) { read_ini< T >( t, stream, xpath(), permissive ); }
 template < typename T > inline void read_ini( T& t, std::istream& stream ) { read_ini< T >( t, stream, xpath(), true ); }
 
-template < typename T > inline void write_json( const T& t, const std::string& filename, const xpath& root )
+template < typename T > inline void write_json( const T& t, const std::string& filename, const xpath& root, bool pretty, bool unquote_numbers )
 {
     std::ofstream ofs( &filename[0] );
     if( !ofs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << filename << "\"" ); }
-    write_json< T >( t, ofs, root );
+    write_json< T >( t, ofs, root, pretty, unquote_numbers );
     ofs.close();
 }
 
-template < typename T > inline void write_json( const T& t, std::ostream& stream, const xpath& root )
+template < typename T > inline void write_json( const T& t, std::ostream& stream, const xpath& root, bool pretty, bool unquote_numbers )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
-    comma::name_value::impl::write_json( stream, p );
+    comma::name_value::impl::write_json( stream, p, pretty, unquote_numbers );
 }
 
-template < typename T > inline void write_json( const T& t, const std::string& filename, const char* root ) { write_json( t, filename, xpath( root ) ); }
-template < typename T > inline void write_json( const T& t, const std::string& filename ) { write_json( t, filename, xpath() ); }
-template < typename T > inline void write_json( const T& t, std::ostream& stream, const char* root ) { write_json( t, stream, xpath( root ) ); }
-template < typename T > inline void write_json( const T& t, std::ostream& stream ) { write_json( t, stream, xpath() ); }
+template < typename T > inline void write_json( const T& t, const std::string& filename, const char* root, bool pretty, bool unquote_numbers ) { write_json( t, filename, xpath( root ), pretty, unquote_numbers ); }
+template < typename T > inline void write_json( const T& t, const std::string& filename, bool pretty, bool unquote_numbers ) { write_json( t, filename, xpath(), pretty, unquote_numbers ); }
+template < typename T > inline void write_json( const T& t, std::ostream& stream, const char* root, bool pretty, bool unquote_numbers ) { write_json( t, stream, xpath( root ), pretty, unquote_numbers ); }
+template < typename T > inline void write_json( const T& t, std::ostream& stream, bool pretty, bool unquote_numbers ) { write_json( t, stream, xpath(), pretty, unquote_numbers ); }
+
+template < typename T > inline std::string json_to_string( const T& t, const char* root, bool pretty, bool unquote_numbers ) { return json_to_string( t, xpath( root ), pretty, unquote_numbers ); }
+template < typename T > inline std::string json_to_string( const T& t, bool pretty, bool unquote_numbers ) { return json_to_string( t, xpath(), pretty, unquote_numbers ); }
+
+template < typename T > inline std::string json_to_string( const T& t, const xpath& root, bool pretty, bool unquote_numbers )
+{
+    std::ostringstream os;
+    write_json( t, os, root, pretty, unquote_numbers );
+    return os.str();
+}
 
 template < typename T > inline void write_xml( const T& t, const std::string& filename, const xpath& root )
 {
@@ -505,5 +519,3 @@ template < typename T > inline void read( T& t, std::istream& stream, bool permi
 template < typename T > inline void read( T& t, std::istream& stream ) { read< T >( t, stream, xpath(), true ); }
 
 } // namespace comma {
-
-#endif // COMMA_NAME_VALUE_SERIALIZE_H_

From d4adb388871a8a3c9b1781a1a67a5a544efefa15 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 25 Jan 2024 12:53:42 +1100
Subject: [PATCH 0724/1056] name_value: comma::write_json(): minified mode:
 trailing end of line removed

---
 name_value/impl/json_writer.h | 23 +++++++++++-----
 name_value/serialize.h        | 52 +++++++++++++++++++----------------
 2 files changed, 44 insertions(+), 31 deletions(-)

diff --git a/name_value/impl/json_writer.h b/name_value/impl/json_writer.h
index eefce886c..857acc87d 100644
--- a/name_value/impl/json_writer.h
+++ b/name_value/impl/json_writer.h
@@ -16,7 +16,7 @@
 
 namespace comma { namespace name_value { namespace impl {
 
-template< typename C > inline void json_remove_quotes( std::basic_string< C >& json_text ) // assuming valid json
+template< typename C > inline void json_remove_quotes( std::basic_string< C >& json_text, bool pretty = true ) // assuming valid json
 {
     using string_type = std::basic_string< C >;
     static string_type const true_str( std::initializer_list< C >{ 't', 'r', 'u', 'e' } );
@@ -53,16 +53,25 @@ template< typename C > inline void json_remove_quotes( std::basic_string< C >& j
         *source++ = *next_token++;
         target = next_token;
     }
-    json_text.erase( source, json_text.cend() );
+    json_text.erase( pretty ? source : ( source - 1 ), json_text.cend() );
 }
 
 template< class PTree > void write_json( std::basic_ostream< typename PTree::key_type::value_type > &stream, const PTree &ptree, bool const pretty = true, bool unquote_numbers = true )
 {
-    std::basic_ostringstream< typename PTree::key_type::value_type > string_stream;
-    boost::property_tree::write_json( string_stream, ptree, pretty );
-    auto json_text = string_stream.str();
-    if( unquote_numbers ) { json_remove_quotes( json_text ); }
-    stream << json_text << std::flush;
+    std::basic_ostringstream< typename PTree::key_type::value_type > oss; // serialise into memory first, so that the text can be post-processed before it reaches stream
+    boost::property_tree::write_json( oss, ptree, pretty );
+    if( unquote_numbers )
+    {
+        auto s = oss.str(); // auto rather than std::string: character type is PTree::key_type::value_type, not necessarily char
+        json_remove_quotes( s, pretty );
+        stream << s;
+    }
+    else
+    {
+        if( pretty ) { stream << oss.str(); }
+        else { auto s = oss.str(); if( !s.empty() && s.back() == '\n' ) { s.pop_back(); } stream << s; } // unfortunately, boost adds trailing end of line, which we don't want in minified mode
+    }
+    stream << std::flush;
 }
  
 } } }
diff --git a/name_value/serialize.h b/name_value/serialize.h
index 07441b16a..8716a4c09 100644
--- a/name_value/serialize.h
+++ b/name_value/serialize.h
@@ -188,9 +188,9 @@ template < typename T > void read_ini( T& t, std::istream& stream );
 template < typename T > void write_json( const T& t, const std::string& filename, const xpath& root, bool pretty = true, bool unquote_numbers = true );
 template < typename T > void write_json( const T& t, const std::string& filename, const char* root, bool pretty = true, bool unquote_numbers = true );
 template < typename T > void write_json( const T& t, const std::string& filename, bool pretty = true, bool unquote_numbers = true );
-template < typename T > void write_json( const T& t, std::ostream& stream, const xpath& root, bool pretty = true, bool unquote_numbers = true );
-template < typename T > void write_json( const T& t, std::ostream& stream, const char* root, bool pretty = true, bool unquote_numbers = true );
-template < typename T > void write_json( const T& t, std::ostream& stream, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::ostream& write_json( const T& t, std::ostream& stream, const xpath& root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::ostream& write_json( const T& t, std::ostream& stream, const char* root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::ostream& write_json( const T& t, std::ostream& stream, bool pretty = true, bool unquote_numbers = true );
 template < typename T > std::string json_to_string( const T& t, const xpath& root, bool pretty = true, bool unquote_numbers = true );
 template < typename T > std::string json_to_string( const T& t, const char* root, bool pretty = true, bool unquote_numbers = true );
 template < typename T > std::string json_to_string( const T& t, bool pretty = true, bool unquote_numbers = true );
@@ -200,9 +200,9 @@ template < typename T > std::string json_to_string( const T& t, bool pretty = tr
 template < typename T > void write_xml( const T& t, const std::string& filename, const xpath& root );
 template < typename T > void write_xml( const T& t, const std::string& filename, const char* root );
 template < typename T > void write_xml( const T& t, const std::string& filename );
-template < typename T > void write_xml( const T& t, std::ostream& stream, const xpath& root );
-template < typename T > void write_xml( const T& t, std::ostream& stream, const char* root );
-template < typename T > void write_xml( const T& t, std::ostream& stream );
+template < typename T > std::ostream& write_xml( const T& t, std::ostream& stream, const xpath& root );
+template < typename T > std::ostream& write_xml( const T& t, std::ostream& stream, const char* root );
+template < typename T > std::ostream& write_xml( const T& t, std::ostream& stream );
 
 /// write path-value object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
@@ -210,18 +210,18 @@ template < typename T > void write_xml( const T& t, std::ostream& stream );
 template < typename T > void write_path_value( const T& t, const std::string& filename, const xpath& root );
 template < typename T > void write_path_value( const T& t, const std::string& filename, const char* root );
 template < typename T > void write_path_value( const T& t, const std::string& filename );
-template < typename T > void write_path_value( const T& t, std::ostream& stream, const xpath& root, bool const unquote_numbers = false );
-template < typename T > void write_path_value( const T& t, std::ostream& stream, const char* root );
-template < typename T > void write_path_value( const T& t, std::ostream& stream );
+template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream, const xpath& root, bool const unquote_numbers = false );
+template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream, const char* root );
+template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream );
 
 /// write ini object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
 template < typename T > void write_ini( const T& t, const std::string& filename, const xpath& root );
 template < typename T > void write_ini( const T& t, const std::string& filename, const char* root );
 template < typename T > void write_ini( const T& t, const std::string& filename );
-template < typename T > void write_ini( const T& t, std::ostream& stream, const xpath& root );
-template < typename T > void write_ini( const T& t, std::ostream& stream, const char* root );
-template < typename T > void write_ini( const T& t, std::ostream& stream );
+template < typename T > std::ostream& write_ini( const T& t, std::ostream& stream, const xpath& root );
+template < typename T > std::ostream& write_ini( const T& t, std::ostream& stream, const char* root );
+template < typename T > std::ostream& write_ini( const T& t, std::ostream& stream );
 
 
 template < typename T > inline void read_json( T& t, const std::string& filename, const xpath& root, bool permissive )
@@ -388,19 +388,20 @@ template < typename T > inline void write_json( const T& t, const std::string& f
     ofs.close();
 }
 
-template < typename T > inline void write_json( const T& t, std::ostream& stream, const xpath& root, bool pretty, bool unquote_numbers )
+template < typename T > inline std::ostream& write_json( const T& t, std::ostream& stream, const xpath& root, bool pretty, bool unquote_numbers )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
     comma::name_value::impl::write_json( stream, p, pretty, unquote_numbers );
+    return stream;
 }
 
 template < typename T > inline void write_json( const T& t, const std::string& filename, const char* root, bool pretty, bool unquote_numbers ) { write_json( t, filename, xpath( root ), pretty, unquote_numbers ); }
 template < typename T > inline void write_json( const T& t, const std::string& filename, bool pretty, bool unquote_numbers ) { write_json( t, filename, xpath(), pretty, unquote_numbers ); }
-template < typename T > inline void write_json( const T& t, std::ostream& stream, const char* root, bool pretty, bool unquote_numbers ) { write_json( t, stream, xpath( root ), pretty, unquote_numbers ); }
-template < typename T > inline void write_json( const T& t, std::ostream& stream, bool pretty, bool unquote_numbers ) { write_json( t, stream, xpath(), pretty, unquote_numbers ); }
+template < typename T > inline std::ostream& write_json( const T& t, std::ostream& stream, const char* root, bool pretty, bool unquote_numbers ) { return write_json( t, stream, xpath( root ), pretty, unquote_numbers ); }
+template < typename T > inline std::ostream& write_json( const T& t, std::ostream& stream, bool pretty, bool unquote_numbers ) { return write_json( t, stream, xpath(), pretty, unquote_numbers ); }
 
 template < typename T > inline std::string json_to_string( const T& t, const char* root, bool pretty, bool unquote_numbers ) { return json_to_string( t, xpath( root ), pretty, unquote_numbers ); }
 template < typename T > inline std::string json_to_string( const T& t, bool pretty, bool unquote_numbers ) { return json_to_string( t, xpath(), pretty, unquote_numbers ); }
@@ -420,27 +421,29 @@ template < typename T > inline void write_xml( const T& t, const std::string& fi
     ofs.close();
 }
 
-template < typename T > inline void write_xml( const T& t, std::ostream& stream, const xpath& root )
+template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream, const xpath& root )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
     boost::property_tree::write_xml( stream, p );
+    return stream;
 }
 
 template < typename T > inline void write_xml( const T& t, const std::string& filename, const char* root ) { write_xml( t, filename, xpath( root ) ); }
 template < typename T > inline void write_xml( const T& t, const std::string& filename ) { write_xml( t, filename, xpath() ); }
-template < typename T > inline void write_xml( const T& t, std::ostream& stream, const char* root ) { write_xml( t, stream, xpath( root ) ); }
-template < typename T > inline void write_xml( const T& t, std::ostream& stream ) { write_xml( t, stream, xpath() ); }
+template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream, const char* root ) { return write_xml( t, stream, xpath( root ) ); }
+template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream ) { return write_xml( t, stream, xpath() ); }
 
-template < typename T > inline void write_path_value( const T& t, std::ostream& stream, const xpath& root, bool const unquote_numbers )
+template < typename T > inline std::ostream& write_path_value( const T& t, std::ostream& stream, const xpath& root, bool const unquote_numbers )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
     comma::property_tree::to_path_value( stream, p, comma::property_tree::disabled, '=', '\n', xpath(), unquote_numbers );
+    return stream;
 }
 
 template < typename T > inline void write_path_value( const T& t, const std::string& filename, const xpath& root )
@@ -453,16 +456,17 @@ template < typename T > inline void write_path_value( const T& t, const std::str
 
 template < typename T > inline void write_path_value( const T& t, const std::string& filename, const char* root ) { write_path_value( t, filename, xpath( root ) ); }
 template < typename T > inline void write_path_value( const T& t, const std::string& filename ) { write_path_value( t, filename, xpath() ); }
-template < typename T > inline void write_path_value( const T& t, std::ostream& stream, const char* root ) { write_path_value( t, stream, xpath( root ) ); }
-template < typename T > inline void write_path_value( const T& t, std::ostream& stream ) { write_path_value( t, stream, xpath() ); }
+template < typename T > inline std::ostream& write_path_value( const T& t, std::ostream& stream, const char* root ) { return write_path_value( t, stream, xpath( root ) ); }
+template < typename T > inline std::ostream& write_path_value( const T& t, std::ostream& stream ) { return write_path_value( t, stream, xpath() ); }
 
-template < typename T > inline void write_ini( const T& t, std::ostream& stream, const xpath& root )
+template < typename T > inline std::ostream& write_ini( const T& t, std::ostream& stream, const xpath& root )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
     boost::property_tree::write_ini( stream, p );
+    return stream;
 }
 
 template < typename T > inline void write_ini( const T& t, const std::string& filename, const xpath& root )
@@ -475,8 +479,8 @@ template < typename T > inline void write_ini( const T& t, const std::string& fi
 
 template < typename T > inline void write_ini( const T& t, const std::string& filename, const char* root ) { write_ini( t, filename, xpath( root ) ); }
 template < typename T > inline void write_ini( const T& t, const std::string& filename ) { write_ini( t, filename, xpath() ); }
-template < typename T > inline void write_ini( const T& t, std::ostream& stream, const char* root ) { write_ini( t, stream, xpath( root ) ); }
-template < typename T > inline void write_ini( const T& t, std::ostream& stream ) { write_ini( t, stream, xpath() ); }
+template < typename T > inline std::ostream& write_ini( const T& t, std::ostream& stream, const char* root ) { return write_ini( t, stream, xpath( root ) ); }
+template < typename T > inline std::ostream& write_ini( const T& t, std::ostream& stream ) { return write_ini( t, stream, xpath() ); }
 
 
 template < typename T > inline void read( T& t, std::istream& stream, const xpath& root, bool permissive )

From c260044d82af3d4ac31d24c1e1bc9780dfc52382 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 25 Jan 2024 13:42:07 +1100
Subject: [PATCH 0725/1056] csv::options::indices() method implemented

---
 csv/options.cpp | 12 ++++++++++--
 csv/options.h   |  4 ++++
 2 files changed, 14 insertions(+), 2 deletions(-)

diff --git a/csv/options.cpp b/csv/options.cpp
index 16733f020..21718bd83 100644
--- a/csv/options.cpp
+++ b/csv/options.cpp
@@ -121,12 +121,20 @@ std::string options::usage( const std::string& default_fields, bool verbose )
 bool options::has_field( const std::string& field ) const
 {
     if( field.empty() ) { return false; }
-    const std::vector< std::string >& v = split( fields, ',' );
-    const std::vector< std::string >& f = split( field, ',' );
+    const auto& v = split( fields, ',' );
+    const auto& f = split( field, ',' );
     for( unsigned int i = 0; i < f.size(); ++i ) { if( std::find( v.begin(), v.end(), f[i] ) == v.end() ) { return false; } }
     return true;
 }
 
+std::map< std::string, unsigned int > options::indices() const
+{
+    std::map< std::string, unsigned int > index_by_name; // empty field names are skipped; if a name is repeated, its last position wins
+    const std::vector< std::string >& names = split( fields, ',' );
+    for( unsigned int k = 0; k < names.size(); ++k ) { if( names[k].empty() ) { continue; } index_by_name[ names[k] ] = k; }
+    return index_by_name;
+}
+
 bool options::has_some_of_fields( const std::string& field ) const
 {
     if( field.empty() ) { return false; }
diff --git a/csv/options.h b/csv/options.h
index bb4e79154..2996b6c4f 100644
--- a/csv/options.h
+++ b/csv/options.h
@@ -4,6 +4,7 @@
 
 #pragma once
 
+#include <map>
 #include <unordered_map>
 #include <boost/optional.hpp>
 #include "../application/command_line_options.h"
@@ -93,6 +94,9 @@ class options
         ///              have paths 'centre/position', 'centre', 'centre/position/x', etc
         bool has_some_of_paths( const std::string& paths ) const;
 
+        /// return field indices
+        std::map< std::string, unsigned int > indices() const;
+
         /// returns comma separated list of valueless csv options that can be passed to command_line_options.unnamed
         static std::string valueless_options();
 

From 5cdd61ebb09017c0ba308852844990955adfc95e Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 Jan 2024 01:29:03 +0000
Subject: [PATCH 0726/1056] Update README.md

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index b988105ad..7bd91579b 100644
--- a/README.md
+++ b/README.md
@@ -66,6 +66,6 @@ Albeit more tedious, it is safe since **comma** master branch is thoroughly test
 
 Read install.yml, if interested in tweaking build configuration.
 
-#documentation
+# documentation
 
 [https://gitlab.com/orthographic/comma/-/wikis/home](https://gitlab.com/orthographic/comma/-/wikis/home)

From a84a2892bde7dc4f55d3c942e1ffb250eb963782 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 Jan 2024 01:30:32 +0000
Subject: [PATCH 0727/1056] Update README.md

---
 README.md | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/README.md b/README.md
index 7bd91579b..fcea07986 100644
--- a/README.md
+++ b/README.md
@@ -4,6 +4,8 @@
 
 **comma** is a generic library for fixed-width (comma-separated or binary) and structured (e.g. json) data processing primarily on Linux. MacOS is supported, but less tested.
 
+Documentation: [https://gitlab.com/orthographic/comma/-/wikis/home](https://gitlab.com/orthographic/comma/-/wikis/home)
+
 **comma** consists of a collection of command line utilities, as well as underlying C++ and python libraries.
 
 **comma** design considerations:
@@ -19,7 +21,7 @@ This documentation will have not more than a brief description of each command l
 
 Instead, this documentation is intended to provide more and more step-by-step tutorials and recipes for **comma** command line applications.
 
-The library code is self-documented. You can generate it with **doxigen**. Use **git grep** or explore code of respective applications for usage examples.
+The library code is self-documented. You can generate it with **doxygen**. Use **git grep** or explore code of respective applications for usage examples.
 
 # installation
 

From 5bd6c308ddf1068d4e5d2afb1aadd7330c755a83 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 Jan 2024 01:32:01 +0000
Subject: [PATCH 0728/1056] Update README.md

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index fcea07986..d0b522007 100644
--- a/README.md
+++ b/README.md
@@ -17,7 +17,7 @@ Documentation: [https://gitlab.com/orthographic/comma/-/wikis/home](https://gitl
 
 You can limit yourself to using the **comma** command line utilities. Further, **comma** provides libraries for serialization, binary protocol packet layouts, etc.
 
-This documentation will have not more than a brief description of each command line utility. For details, each utility has elaborate help, e.g. run: **csv-eval --help**.
+This documentation will have not more than a brief description of each command line utility. For details, each utility has elaborate help with examples, e.g. run: **csv-eval --help**.
 
 Instead, this documentation is intended to provide more and more step-by-step tutorials and recipes for **comma** command line applications.
 

From 3c8eb41dc8c24a58b85040d279cbef5b95586e5b Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 Jan 2024 01:34:14 +0000
Subject: [PATCH 0729/1056] Update README.md

---
 README.md | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/README.md b/README.md
index d0b522007..ea74a44bb 100644
--- a/README.md
+++ b/README.md
@@ -36,6 +36,9 @@ pip3 install comma-py==1.0.0
 ```
 
 ## build from source
+
+Building from source gives you the latest features and thus may be a good choice. The code is continuously tested and backward compatible.
+
 ### building with ansible
 
 ```

From 137888ba39d1c834177d8d338e419701c693848f Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 26 Jan 2024 01:35:39 +0000
Subject: [PATCH 0730/1056] Update README.md

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index ea74a44bb..9b68d5788 100644
--- a/README.md
+++ b/README.md
@@ -35,7 +35,7 @@ sudo apt-get install comma
 pip3 install comma-py==1.0.0
 ```
 
-## build from source
+## building from source
 
 Building from source gives you the latest features and thus may be a good choice. The code is continuously tested and backward compatible.
 

From acd4eada6012b182d5c817aafbf2e0cda4b6a020 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 29 Jan 2024 15:35:09 +1100
Subject: [PATCH 0731/1056] csv::options::make_same_kind(): typo bug fixed

---
 csv/options.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/options.h b/csv/options.h
index 2996b6c4f..a3489e9c0 100644
--- a/csv/options.h
+++ b/csv/options.h
@@ -110,7 +110,7 @@ inline options options::make_same_kind( const options& rhs )
     options o;
     o.flush = rhs.flush;
     o.delimiter = rhs.delimiter;
-    o.flush = rhs.flush;
+    o.full_xpath = rhs.full_xpath;
     o.precision = rhs.precision;
     o.quote = rhs.quote;
     if( rhs.binary() ) { o.format( format::value< T >() ); }

From 2ae34acab103a44abcfae9d21bdcf2aa26a8083c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 30 Jan 2024 10:46:26 +1100
Subject: [PATCH 0732/1056] COMMA_SAY_ERROR, COMMA_SAY_WARN, etc: respective
 verbosity levels made more intuitive

---
 application/command_line_options.h | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/application/command_line_options.h b/application/command_line_options.h
index b76efb5d0..f33b082c4 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -38,11 +38,11 @@ inline std::ostream& say( unsigned int verbosity=0, const std::string& prefix=""
 /// convenience macros
 #define _COMMA_SAY( _level, _message ) { if( _level <= ::comma::verbosity::level() ) { ::comma::say( _level ) << _message; } }
 #define COMMA_SAY( message )       _COMMA_SAY( 0,                message << std::endl )
-#define COMMA_SAY_ERROR( message ) _COMMA_SAY( 1, "error: "   << message << std::endl )
-#define COMMA_SAY_WARN( message )  _COMMA_SAY( 2, "warning: " << message << std::endl )
-#define COMMA_SAY_INFO( message )  _COMMA_SAY( 3, "info: "    << message << std::endl )
-#define COMMA_SAY_DEBUG( message ) _COMMA_SAY( 4, "debug: "   << message << std::endl )
-#define COMMA_SAY_TRACE( message ) _COMMA_SAY( 5, "trace: "   << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " << message << std::endl; )
+#define COMMA_SAY_ERROR( message ) _COMMA_SAY( 0, "error: "   << message << std::endl )
+#define COMMA_SAY_WARN( message )  _COMMA_SAY( 1, "warning: " << message << std::endl )
+#define COMMA_SAY_INFO( message )  _COMMA_SAY( 2, "info: "    << message << std::endl )
+#define COMMA_SAY_DEBUG( message ) _COMMA_SAY( 3, "debug: "   << message << std::endl )
+#define COMMA_SAY_TRACE( message ) _COMMA_SAY( 4, "trace: "   << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " << message << std::endl ) // as the macros above, plus file, function, and line of the call site
 
 /// convenience alias of say( verbosity )
 /// @example

From f7fe9683cfc9d812b67815561298953e4adc9dfa Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 31 Jan 2024 20:45:04 +1100
Subject: [PATCH 0733/1056] io-cat: --repeat, --repeat-forever: in progress...

---
 io/applications/io-cat.cpp | 11 ++++++++++-
 1 file changed, 10 insertions(+), 1 deletion(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 9a4cdd941..b6eecdeec 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -100,6 +100,10 @@ void usage( bool verbose = false )
     std::cerr << "                  a workaround for sparse input fed into: io-cat ... | head -n10, which" << std::endl;
     std::cerr << "                  not exit until io-cat receives record 11" << std::endl;
     std::cerr << "                  instead run: io-cat ... --head=10 (use --flush if you don't want buffering" << std::endl;
+    std::cerr << "    --repeat=[<n>]; read each stream, output <n> times" << std::endl;
+    std::cerr << "                  e.g: run: io-cat my-file-1 my-file-2 --repeat=3" << std::endl;
+    std::cerr << "                       instead of: cat my-file-1 my-file-2 my-file-1 my-file-2 my-file-1 my-file-2" << std::endl;
+    std::cerr << "    --repeat-forever,--forever; same as --repeat, but forever" << std::endl;
     std::cerr << "    --round-robin=[<number of packets>]: only for multiple inputs: read not more" << std::endl;
     std::cerr << "                                         than <number of packets> from an input at once," << std::endl;
     std::cerr << "                                         before checking other inputs" << std::endl;
@@ -387,7 +391,12 @@ int main( int argc, char** argv )
         connect_period = boost::posix_time::milliseconds( static_cast<unsigned int>(std::floor( connect_period_seconds * 1000 ) ));
         permissive = options.exists( "--permissive" );
         bool has_head = options.exists( "--head" );
-        const std::vector< std::string >& unnamed = options.unnamed( "--blocking,--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
+        unsigned int repeat = options.value( "--repeat", 0 );
+        bool forever = options.exists( "--repeat-forever,--forever" );
+        std::uint64_t count{0};
+        ( void )repeat; ( void )forever; ( void )count;
+        const std::vector< std::string >& unnamed = options.unnamed( "--repeat-forever,--forever,--blocking,--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
+        options.assert_mutually_exclusive( "--round-robin", "--repeat,--repeat-forever,--forever" );
         #ifdef WIN32
         if( size || ( unnamed.size() == 1 && !has_head ) ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         //if( size ) { _setmode( _fileno( stdout ), _O_BINARY ); }

From 14c63b2edde7037455269670c294b184b5fdda85 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 31 Jan 2024 22:04:01 +1100
Subject: [PATCH 0734/1056] io-cat: --repeat, --repeat-forever: implemented,
 basic regression test added

---
 io/applications/io-cat.cpp     | 56 ++++++++++++++++++++++++++++------
 io/test/io-cat/repeat/expected | 29 ++++++++++++++++++
 io/test/io-cat/repeat/input    |  4 +++
 io/test/test                   |  6 ++++
 4 files changed, 85 insertions(+), 10 deletions(-)
 create mode 100644 io/test/io-cat/repeat/expected
 create mode 100644 io/test/io-cat/repeat/input
 create mode 100755 io/test/test

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index b6eecdeec..fb55c6531 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -103,6 +103,7 @@ void usage( bool verbose = false )
     std::cerr << "    --repeat=[<n>]; read each stream, output <n> times" << std::endl;
     std::cerr << "                  e.g: run: io-cat my-file-1 my-file-2 --repeat=3" << std::endl;
     std::cerr << "                       instead of: cat my-file-1 my-file-2 my-file-1 my-file-2 my-file-1 my-file-2" << std::endl;
+    std::cerr << "                  when using for large source, be aware that the sources get stored in memory first" << std::endl;
     std::cerr << "    --repeat-forever,--forever; same as --repeat, but forever" << std::endl;
     std::cerr << "    --round-robin=[<number of packets>]: only for multiple inputs: read not more" << std::endl;
     std::cerr << "                                         than <number of packets> from an input at once," << std::endl;
@@ -347,21 +348,58 @@ static bool try_connect( boost::ptr_vector< stream >& streams, comma::io::select
     exit( 1 );
 }
 
-static bool _write( const comma::command_line_options& options, const std::vector< char >& buffer, unsigned int bytes_read )
+struct output_t // output sink: writes straight to stdout or, if repeating is requested, stores input per source and replays it in finalise()
+{
+    unsigned int size{0}; // value of --repeat: how many times finalise() replays the stored input
+    bool forever{false}; // true, if --repeat-forever or --forever is present
+    std::vector< std::vector< char > > buffers; // one buffer per source, empty if not repeating; todo: quick and dirty, watch performance on push back of large inputs
+    operator bool() const { return !buffers.empty(); } // true, if output is stored for repeating rather than written directly
+    output_t() = default;
+    // options: command line options, read for --repeat and --repeat-forever,--forever; n: number of buffers to allocate, if repeating is requested
+    output_t( const comma::command_line_options& options, unsigned int n )
+        : size( options.value( "--repeat", 0 ) )
+        , forever( options.exists( "--repeat-forever,--forever" ) )
+        , buffers( size > 0 || forever ? n : 0 )
+    {
+    }
+    // append the first bytes_read bytes of buffer to the i-th stored buffer or, if not repeating, write them directly to stdout
+    void write( unsigned int i, const std::vector< char >& buffer, unsigned int bytes_read )
+    {
+        if( buffers.empty() ) { std::cout.write( buffer.data(), bytes_read ); return; }
+        if( bytes_read == 0 ) { return; }
+        auto& stored = buffers[i];
+        stored.insert( stored.end(), buffer.begin(), buffer.begin() + bytes_read ); // insert() rather than resize() + memcpy: no 32-bit truncation of the stored size, no indexing past the end
+    }
+    // replay stored buffers to stdout in source order: size times or, if forever, until shutdown or stdout failure; does nothing, if not repeating
+    void finalise( const comma::signal_flag& is_shutdown ) const
+    {
+        for( unsigned int i = 0; !is_shutdown && std::cout.good() && ( i < size || forever ); ++i ) // stdout check here stops a forever-loop from spinning once stdout has failed
+        {
+            for( unsigned int j = 0; !is_shutdown && j < buffers.size() && std::cout.good(); ++j )
+            {
+                std::cout.write( buffers[j].data(), buffers[j].size() ); // data() rather than &buffers[j][0]: buffers[j] is empty, if source j produced no input
+            }
+        }
+    }
+};
+
+output_t output;
+
+static bool _write( unsigned int i, const comma::command_line_options& options, const std::vector< char >& buffer, unsigned int bytes_read )
 {
     static unsigned int head = options.value( "--head", 0 );
     static unsigned int size = options.value( "--size,-s", 0 );
     static unsigned int count = 0;
-    if( head == 0 ) { std::cout.write( &buffer[0], bytes_read ); return true; }
+    if( head == 0 ) { output.write( i, buffer, bytes_read ); return true; }
     if( size == 0 )
     {
-        std::cout.write( &buffer[0], bytes_read );
+        output.write( i, buffer, bytes_read );
         ++count;
     }
     else
     {
         unsigned int n = std::min( bytes_read / size, head - count );
-        std::cout.write( &buffer[0], n * size );
+        output.write( i, buffer, n * size );
         count += n;
     }
     return count < head;
@@ -391,10 +429,6 @@ int main( int argc, char** argv )
         connect_period = boost::posix_time::milliseconds( static_cast<unsigned int>(std::floor( connect_period_seconds * 1000 ) ));
         permissive = options.exists( "--permissive" );
         bool has_head = options.exists( "--head" );
-        unsigned int repeat = options.value( "--repeat", 0 );
-        bool forever = options.exists( "--repeat-forever,--forever" );
-        std::uint64_t count{0};
-        ( void )repeat; ( void )forever; ( void )count;
         const std::vector< std::string >& unnamed = options.unnamed( "--repeat-forever,--forever,--blocking,--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
         options.assert_mutually_exclusive( "--round-robin", "--repeat,--repeat-forever,--forever" );
         #ifdef WIN32
@@ -402,6 +436,7 @@ int main( int argc, char** argv )
         //if( size ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
         if( unnamed.empty() ) { std::cerr << "io-cat: please specify at least one source" << std::endl; return 1; }
+        output = output_t( options, unnamed.size() );
         boost::ptr_vector< stream > streams;
         comma::io::select select;
         for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 || ( unnamed.size() == 1 && !has_head ) ) ); }
@@ -426,7 +461,7 @@ int main( int argc, char** argv )
                     if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << unnamed[i] << "): closed" << std::endl; }
                     select.read().remove( streams[i].fd() );
                     streams[i].close();
-                    if( exit_on_first_closed || ( connected_all_we_could && select.read()().empty() ) ) { return 0; }
+                    if( exit_on_first_closed || ( connected_all_we_could && select.read()().empty() ) ) { done = true; break; }
                     continue;
                 }
                 if( !ready && empty ) { done = false; continue; }
@@ -437,7 +472,7 @@ int main( int argc, char** argv )
                     if( bytes_read == 0 ) { break; }
                     done = false;
                     if( size && bytes_read % size != 0 ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): expected " << size << " byte(s), got only " << ( bytes_read % size ) << std::endl; return 1; }
-                    if( !_write( options, buffer, bytes_read ) ) { done = true; break; }
+                    if( !_write( i, options, buffer, bytes_read ) ) { done = true; break; }
                     if( !std::cout.good() ) { done = true; break; }
                     if( unbuffered ) { std::cout.flush(); }
                     if( round_robin_count )
@@ -448,6 +483,7 @@ int main( int argc, char** argv )
                 }
             }
         }
+        output.finalise( is_shutdown );
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << "io-cat: " << ex.what() << std::endl; }
diff --git a/io/test/io-cat/repeat/expected b/io/test/io-cat/repeat/expected
new file mode 100644
index 000000000..fa9664e7c
--- /dev/null
+++ b/io/test/io-cat/repeat/expected
@@ -0,0 +1,29 @@
+repeat[0]/output/line[0]="1,2,3"
+repeat[0]/output/line[1]="4,5,6"
+repeat[0]/output/line[2]="1,2,3"
+repeat[0]/output/line[3]="4,5,6"
+repeat[0]/output/line[4]="1,2,3"
+repeat[0]/output/line[5]="4,5,6"
+repeat[0]/status=0
+repeat[1]/output/line[0]="1,2,3"
+repeat[1]/output/line[1]="4,5,6"
+repeat[1]/output/line[2]="1,2,3"
+repeat[1]/output/line[3]="4,5,6"
+repeat[1]/output/line[4]="1,2,3"
+repeat[1]/output/line[5]="4,5,6"
+repeat[1]/status=0
+repeat[2]/output/line[0]="1,2,3"
+repeat[2]/output/line[1]="4,5,6"
+repeat[2]/output/line[2]="1,2,3"
+repeat[2]/output/line[3]="4,5,6"
+repeat[2]/status=0
+repeat[3]/output/line[0]="0,0,0"
+repeat[3]/output/line[1]="1,1,1"
+repeat[3]/output/line[2]="2,2,2"
+repeat[3]/output/line[3]="0,0,0"
+repeat[3]/output/line[4]="1,1,1"
+repeat[3]/output/line[5]="2,2,2"
+repeat[3]/output/line[6]="0,0,0"
+repeat[3]/output/line[7]="1,1,1"
+repeat[3]/output/line[8]="2,2,2"
+repeat[3]/status=0
diff --git a/io/test/io-cat/repeat/input b/io/test/io-cat/repeat/input
new file mode 100644
index 000000000..850130f89
--- /dev/null
+++ b/io/test/io-cat/repeat/input
@@ -0,0 +1,4 @@
+repeat[0]="( echo 1,2,3; echo 4,5,6 ) | io-cat - --repeat=3"
+repeat[1]="( echo 1,2,3; echo 4,5,6 ) | csv-to-bin 3ui | io-cat - --repeat=3 | csv-from-bin 3ui"
+repeat[2]="( echo 1,2,3; echo 4,5,6 ) | io-cat - --repeat-forever | head -n4"
+repeat[3]="( echo 0,0,0; echo 1,1,1 ) | io-cat - <( echo 2,2,2 ) --repeat=3"
diff --git a/io/test/test b/io/test/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/io/test/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands

From b3082f8e77e515c0f2e14ead883506dc3f9b19d6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 5 Feb 2024 12:28:35 +1100
Subject: [PATCH 0735/1056] python: version and upload notes updated

---
 python/README.md        | 4 +++-
 python/comma/version.py | 2 +-
 system/launchpad/readme | 9 +++++++++
 3 files changed, 13 insertions(+), 2 deletions(-)

diff --git a/python/README.md b/python/README.md
index 9d61ceb42..57478d578 100644
--- a/python/README.md
+++ b/python/README.md
@@ -4,7 +4,9 @@
 **comma-py** is the part of **comma** written in python; the main part of
 it is **csv-eval** command line utility for efficient **numpy**-style
 conversions on an input stream of comma-separated or fixed-width binary
-data
+data.
+
+**comma-py** also has useful modules for dictionary and signal manipulations.
 
 for more details, run:
 ```
diff --git a/python/comma/version.py b/python/comma/version.py
index bda5995cb..3d27eb5f0 100644
--- a/python/comma/version.py
+++ b/python/comma/version.py
@@ -1,4 +1,4 @@
 # Copyright (c) 2011 The University of Sydney
 
 # if you change this file, check that it still works with ../setup.py, which gets the comma version by reading this file
-__version__ = "1.1.0"
+__version__ = "1.2.1"
diff --git a/system/launchpad/readme b/system/launchpad/readme
index e4f748c65..7c4af6652 100644
--- a/system/launchpad/readme
+++ b/system/launchpad/readme
@@ -26,6 +26,15 @@ python3 setup.py sdist bdist_wheel
 twine upload --repository-url https://pypi.org/legacy/ dist/* # test
 twine upload dist/*
 
+update of 20240205
+- pypi requires 2FA now (set e.g. with google authenticator on a mobile)
+- legacy twine upload dist/* does not work: 
+    HTTPError: 403 Forbidden from https://upload.pypi.org/legacy/
+    Username/Password authentication is no longer supported. Migrate to API Tokens or Trusted Publishers instead. See https://pypi.org/help/#apitoken and https://pypi.org/help/#trusted-publishers
+- follow the instructions in the link above to set up an api token and rc file (the instructions are really vague: e.g. it seems that PROJECT_NAME should be left as is, NOT replaced with comma-py)
+- then run: twine upload --repository PROJECT_NAME dist/* or twine upload dist/*
+- it may exit with a very obscure HTTP error 403 or 400, but it seems to upload the repo nevertheless...
+
 todo
   - document
     - uploading to launchpad

From ad57befde8a9a6cf85e1ce260e3f7d3d4bcf695c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 5 Feb 2024 12:32:08 +1100
Subject: [PATCH 0736/1056] system/launchpad/readme updated

---
 system/launchpad/readme | 1 +
 1 file changed, 1 insertion(+)

diff --git a/system/launchpad/readme b/system/launchpad/readme
index 7c4af6652..0347dbf59 100644
--- a/system/launchpad/readme
+++ b/system/launchpad/readme
@@ -22,6 +22,7 @@ uploading to pypi (i know, wrong place; todo: script)
 cd comma/python
 # version.py: bump up version
 # setup.py: uncomment install_requires (commented since it messes installation for those who use apt to install python3 packages (e.g. numpy)
+rm -rf dist
 python3 setup.py sdist bdist_wheel
 twine upload --repository-url https://pypi.org/legacy/ dist/* # test
 twine upload dist/*

From 627091366716a9f832725ea35994934f9f5df420 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 5 Feb 2024 13:06:25 +1100
Subject: [PATCH 0737/1056] version bumped up to 1.1.0

---
 CMakeLists.txt                          | 2 +-
 debian/changelog                        | 6 +++---
 system/launchpad/comma-launchpad-upload | 1 +
 system/launchpad/readme                 | 2 +-
 4 files changed, 6 insertions(+), 5 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 06d2e2c66..cf8379b41 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -10,7 +10,7 @@ endif( USE_ARM_TOOLCHAIN )
 
 cmake_minimum_required( VERSION 3.1 )
 cmake_policy( SET CMP0048 NEW )
-project( comma VERSION 1.0.12 LANGUAGES CXX )
+project( comma VERSION 1.1.0 LANGUAGES CXX )
 if( NOT DEFINED CMAKE_PROJECT_VERSION )
     set( CMAKE_PROJECT_VERSION ${PROJECT_VERSION} )
     set( CMAKE_PROJECT_VERSION_MAJOR ${PROJECT_VERSION_MAJOR} )
diff --git a/debian/changelog b/debian/changelog
index d54a10c6e..012c9b8de 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,5 +1,5 @@
-comma (1.0.12-0ppa0) jammy; urgency=low
+comma (1.1.0-0ppa0) jammy; urgency=low
 
-  * launchpad stopped installing so files; trying to fix...
+  * substantially more functionality and bug fixes in utilities like csv-paste, io-cat, etc
 
- -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Sat, 14 May 2022 22:23:49 +1000
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Mon, 5 Feb 2024 12:44:00 +1000
diff --git a/system/launchpad/comma-launchpad-upload b/system/launchpad/comma-launchpad-upload
index 342d40d99..f6a472b6d 100755
--- a/system/launchpad/comma-launchpad-upload
+++ b/system/launchpad/comma-launchpad-upload
@@ -11,6 +11,7 @@
 #     - tag repo with version
 #     - push
 
+type -p debuild >/dev/null || sudo apt install devscripts
 function say() { echo "usage: $0: $@" >&2; }; function die() { say "$@"; exit 1; }
 [[ -n "$2" ]] || { echo "usage: $0 <what> <ubuntu-name> <comma-version>" >&2; exit 1; }
 what=$1
diff --git a/system/launchpad/readme b/system/launchpad/readme
index 0347dbf59..4f7b5d09c 100644
--- a/system/launchpad/readme
+++ b/system/launchpad/readme
@@ -12,7 +12,7 @@ uploading to launchpad
       cd ..
       comma/system/launchpad/comma-launchpad-upload update 1.2.3
 - once build in launchpad succeeds, commit and push
-- if there were changes in comma/python, release them into pypi (todo)
+- if there were changes in comma/python, release them into pypi
 - notify interested parties
 
 verifying ppa in docker

From a0abc3d196026618e0dcc9d2adb730af850c8927 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 5 Feb 2024 20:22:05 +1100
Subject: [PATCH 0738/1056] system/launchpad/comma-launchpad-upload: minor fix

---
 system/launchpad/comma-launchpad-upload | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/launchpad/comma-launchpad-upload b/system/launchpad/comma-launchpad-upload
index f6a472b6d..6c6d5301c 100755
--- a/system/launchpad/comma-launchpad-upload
+++ b/system/launchpad/comma-launchpad-upload
@@ -12,7 +12,7 @@
 #     - push
 
 type -p debuild >/dev/null || sudo apt install devscripts
-function say() { echo "usage: $0: $@" >&2; }; function die() { say "$@"; exit 1; }
+function say() { echo "usage: $0: $@" >&2; }; function die() { echo "$0: error: $@" >&2; exit 1; } # die: print error to stderr, exit with status 1
 [[ -n "$2" ]] || { echo "usage: $0 <what> <ubuntu-name> <comma-version>" >&2; exit 1; }
 what=$1
 comma_version=$2

From 5df4ab63b0b613b48d5073293a20048d072b3dde Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 Feb 2024 00:08:34 +1100
Subject: [PATCH 0739/1056] system/launchpad/readme: comment added

---
 system/launchpad/readme | 1 +
 1 file changed, 1 insertion(+)

diff --git a/system/launchpad/readme b/system/launchpad/readme
index 4f7b5d09c..7f469bb8a 100644
--- a/system/launchpad/readme
+++ b/system/launchpad/readme
@@ -11,6 +11,7 @@ uploading to launchpad
       git tag -a 1.2.3 -m 'your comments for version 1.2.3'
       cd ..
       comma/system/launchpad/comma-launchpad-upload update 1.2.3
+- sign gpg as snaky gpg (as opposed to dromedary)
 - once build in launchpad succeeds, commit and push
 - if there were changes in comma/python, release them into pypi
 - notify interested parties

From 6aa8e3695e57feebfdb79a62b4c3e154ae97bcc7 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 Feb 2024 19:45:37 +1100
Subject: [PATCH 0740/1056] comma-launchpad-upload: todo comment added

---
 system/launchpad/comma-launchpad-upload | 1 +
 1 file changed, 1 insertion(+)

diff --git a/system/launchpad/comma-launchpad-upload b/system/launchpad/comma-launchpad-upload
index 6c6d5301c..e5db5a449 100755
--- a/system/launchpad/comma-launchpad-upload
+++ b/system/launchpad/comma-launchpad-upload
@@ -1,6 +1,7 @@
 #!/bin/bash
 
 # todo
+#   - !!! script to build in docker (how to manage signature and dput in docker?)
 #   - manual steps (automate if possible)
 #     - update changelog
 #       - version

From 8073b17cc34a953a8e311083b2583b7e938609ec Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 9 Feb 2024 11:39:43 +1100
Subject: [PATCH 0741/1056] name-value-form: first cut implemented

---
 name_value/applications/CMakeLists.txt  | 15 ++++--
 name_value/applications/name-value-form | 62 +++++++++++++++++++++++++
 2 files changed, 72 insertions(+), 5 deletions(-)
 create mode 100755 name_value/applications/name-value-form

diff --git a/name_value/applications/CMakeLists.txt b/name_value/applications/CMakeLists.txt
index c1b94c309..50f29d37e 100644
--- a/name_value/applications/CMakeLists.txt
+++ b/name_value/applications/CMakeLists.txt
@@ -17,11 +17,11 @@ set_target_properties( name-value-get PROPERTIES LINK_FLAGS_RELEASE -s )
 set_target_properties( name-value-eval-preparse PROPERTIES LINK_FLAGS_RELEASE -s )
 set_target_properties( name-value-permute PROPERTIES LINK_FLAGS_RELEASE -s )
 
-INSTALL( TARGETS name-value-convert name-value-get name-value-eval-preparse name-value-permute
-         RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR}
-         COMPONENT Runtime )
-
-install( PROGRAMS name-value-eval name-value-calc name-value-apply DESTINATION ${comma_INSTALL_BIN_DIR} )
+INSTALL( TARGETS name-value-convert
+                 name-value-get
+                 name-value-eval-preparse
+                 name-value-permute
+                 RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
          
 add_executable( name-value-from-csv ${dir}/name-value-from-csv.cpp )
 target_link_libraries( name-value-from-csv comma_application comma_string )
@@ -32,3 +32,8 @@ add_executable( name-value-to-csv ${dir}/name-value-to-csv.cpp )
 target_link_libraries( name-value-to-csv comma_application comma_string )
 set_target_properties( name-value-to-csv PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS name-value-to-csv RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
+install( PROGRAMS name-value-apply DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS name-value-calc DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS name-value-eval DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS name-value-form DESTINATION ${comma_INSTALL_BIN_DIR} )
\ No newline at end of file
diff --git a/name_value/applications/name-value-form b/name_value/applications/name-value-form
new file mode 100755
index 000000000..2f17ea5ea
--- /dev/null
+++ b/name_value/applications/name-value-form
@@ -0,0 +1,62 @@
+#!/bin/bash
+
+# Copyright (c) 2024 Vsevolod Vlaskine
+
+type -p zenity >/dev/null || { echo "$0: please install zenity (zenity is great!): sudo apt install zenity" >&2; exit 1; }
+source $( type -p comma-application-util ) || { echo "$0: you need to install comma and snark to run this utility" >&2; exit 1; }
+source $( type -p comma-name-value-util )
+
+function prologue()
+{
+    cat <<eof
+usage: todo
+eof
+}
+
+function epilogue()
+{
+    cat <<eof
+examples (try them)
+    todo
+eof
+}
+
+function options-description()
+{
+    cat <<eof
+--delimiter=<character>; default=,
+--dry-run,--dry; print zenity command and exit
+--height=[<pixels>]
+--title=[<title>]
+--verbose,-v
+--width=[<pixels>]
+eof
+}
+
+function _run()
+{
+    local command="zenity --forms"
+    [[ -z "$options_width" ]] || command+=" --width='$options_width'" # todo? adaptive width
+    [[ -z "$options_height" ]] || command+=" --height='$options_height'" # todo? adaptive height
+    [[ -z "$options_title" ]] || command+=" --text='$options_title'"
+    local input=$( cat | grep -v '^#' )
+    local label name value default_value combo_list names=() defaults=() values=()
+    while IFS== read name value; do
+        IFS="$options_delimiter" read default_value combo_list <<< "$value"
+        label="$name"
+        names+=( "$name" )
+        defaults+=( "$default_value" )
+        [[ -z "$default_value" ]] || label+=" ($default_value)"
+        if [[ -n "$combo_list" ]]; then command+=" --add-combo='$label' --combo-values='$( sed 's#,#|#g' <<< "$combo_list" )'"
+        else command+=" --add-entry='$label'"; fi
+    done <<< "$input"
+    (( ! options_dry_run )) || { echo "$command"; exit; }
+    while read value; do values+=( "$value" ); done < <( eval "$command" 2> >( if (( options_verbose )); then cat; else cat >/dev/null; fi ) | tr '|' '\n' )
+    for (( i = 0; i < ${#names[@]}; ++i )); do # keeping it plain vanilla; todo? use comma utilities
+        if [[ -n "${values[$i]}" ]]; then echo "${names[$i]}=\"${values[$i]}\""; else echo "${names[$i]}=\"${defaults[$i]}\""; fi
+    done
+    comma_status_ok || die "failed"
+}
+
+comma-application-init "$@" < <( options-description )
+_run
\ No newline at end of file

From 827644cc4087db1b2f2284f7abbeff42e4079324 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 9 Feb 2024 12:23:14 +1100
Subject: [PATCH 0742/1056] name-value-form: --help: done for now

---
 name_value/applications/name-value-form | 24 +++++++++++++++++++++---
 1 file changed, 21 insertions(+), 3 deletions(-)

diff --git a/name_value/applications/name-value-form b/name_value/applications/name-value-form
index 2f17ea5ea..629f4fb26 100755
--- a/name_value/applications/name-value-form
+++ b/name_value/applications/name-value-form
@@ -9,7 +9,14 @@ source $( type -p comma-name-value-util )
 function prologue()
 {
     cat <<eof
-usage: todo
+read name-value pairs on stdin, display form, output initialised
+name-value pairs to stdout
+
+usage: cat <input> | name-value-form
+
+<input>     : <name>[=<value>]
+<value>     : [<default>][<delimiter><combo list values>]
+<delimiter> : value of --delimiter option (default: ',')
 eof
 }
 
@@ -17,14 +24,25 @@ function epilogue()
 {
     cat <<eof
 examples (try them)
-    todo
+    plain vanilla
+        { echo "hello"; echo "world"; } | name-value-form
+    form title
+        { echo "hello"; echo "world"; } | name-value-form --title "HELLO"
+    default values
+        { echo "hello"; echo "world=XXX"; } | name-value-form
+    combo lists
+        { echo "hello"; echo "world=,a,b,c"; } | name-value-form
+    combo lists with defaults
+        { echo "hello"; echo "world=b,a,b,c"; } | name-value-form
+    dry run
+        { echo "hello"; echo "world"; } | name-value-form --dry
 eof
 }
 
 function options-description()
 {
     cat <<eof
---delimiter=<character>; default=,
+--delimiter=<character>; default=,; value delimiter
 --dry-run,--dry; print zenity command and exit
 --height=[<pixels>]
 --title=[<title>]

From 5e835a93342e19e649af7af3546ff079fffd6f38 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Feb 2024 17:00:08 +1100
Subject: [PATCH 0743/1056] name-value-form: some bugs fixed; example added

---
 name_value/applications/name-value-form       | 16 +++++++++++----
 name_value/examples/name-value-form/menu.json | 20 +++++++++++++++++++
 name_value/examples/name-value-form/run       |  8 ++++++++
 3 files changed, 40 insertions(+), 4 deletions(-)
 create mode 100644 name_value/examples/name-value-form/menu.json
 create mode 100755 name_value/examples/name-value-form/run

diff --git a/name_value/applications/name-value-form b/name_value/applications/name-value-form
index 629f4fb26..2542e6148 100755
--- a/name_value/applications/name-value-form
+++ b/name_value/applications/name-value-form
@@ -59,14 +59,22 @@ function _run()
     [[ -z "$options_title" ]] || command+=" --text='$options_title'"
     local input=$( cat | grep -v '^#' )
     local label name value default_value combo_list names=() defaults=() values=()
+    function _strip() { sed -e 's#^"##' -e "s#^'##" -e 's#"$##' -e "s#'\$##"; } # todo: handle trailing whitespaces and alike
+    #local max_len=$( while IFS== read name value; do echo "${#name}"; done <<< "$input" | sort | tail -n1 )
     while IFS== read name value; do
-        IFS="$options_delimiter" read default_value combo_list <<< "$value"
+        stripped="$( _strip <<< "$value" )"
+        IFS="$options_delimiter" read default_value combo_list <<< "$stripped"
         label="$name"
         names+=( "$name" )
         defaults+=( "$default_value" )
-        [[ -z "$default_value" ]] || label+=" ($default_value)"
-        if [[ -n "$combo_list" ]]; then command+=" --add-combo='$label' --combo-values='$( sed 's#,#|#g' <<< "$combo_list" )'"
-        else command+=" --add-entry='$label'"; fi
+        #[[ -z "$default_value" ]] || { n=$(( max_len - ${#name} + 2 )) label+="$( printf ".%.0s" $( seq 1 $n ) )default: $default_value"; }
+        [[ -z "$default_value" ]] || { label+=" (default: $default_value)"; } # todo? zenity does not support markup for items
+        if [[ -n "$combo_list" ]]; then
+            [[ -z "$default_value" ]] || combo_list="${default_value}${options_delimiter}${combo_list}"
+            command+=" --add-combo='$label' --combo-values='${combo_list//"$options_delimiter"/|}'" # split on --delimiter, not on hard-coded comma
+        else
+            command+=" --add-entry='$label'"
+        fi
     done <<< "$input"
     (( ! options_dry_run )) || { echo "$command"; exit; }
     while read value; do values+=( "$value" ); done < <( eval "$command" 2> >( if (( options_verbose )); then cat; else cat >/dev/null; fi ) | tr '|' '\n' )
diff --git a/name_value/examples/name-value-form/menu.json b/name_value/examples/name-value-form/menu.json
new file mode 100644
index 000000000..5263bcc7b
--- /dev/null
+++ b/name_value/examples/name-value-form/menu.json
@@ -0,0 +1,20 @@
+{
+    "breakfast":
+    {
+        "number_of_people": 1,
+        "food": "toast,egg,poached egg,poached rhino",
+        "drink": "coffee,tea"
+    },
+    "lunch":
+    {
+        "number_of_people": 20,
+        "food": "",
+        "drink": "water,beer"
+    },
+    "dinner":
+    {
+        "number_of_people": 2,
+        "food": "spam,spam,spam,lovely spam",
+        "drink": "wine"
+    }
+}
diff --git a/name_value/examples/name-value-form/run b/name_value/examples/name-value-form/run
new file mode 100755
index 000000000..2c11d75a1
--- /dev/null
+++ b/name_value/examples/name-value-form/run
@@ -0,0 +1,8 @@
+#!/bin/bash
+
+echo "======== example 1: hello world =========================="
+( echo hello; echo world; echo star=sun,antares,betelgeuse ) | ../../applications/name-value-form --title menu
+
+echo "======== example 2: json ================================="
+cat menu.json | name-value-convert | ../../applications/name-value-form --title menu | name-value-convert --to json
+

From 2bb7b5c11e33a89c693bbd34bceec485deb0e5b1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Feb 2024 17:14:25 +1100
Subject: [PATCH 0744/1056] name-value-form renamed to name-value-forms for
 consistency with zenity

---
 name_value/applications/CMakeLists.txt             |  2 +-
 .../{name-value-form => name-value-forms}          | 14 +++++++-------
 .../menu.json                                      |  0
 .../{name-value-form => name-value-forms}/run      |  4 ++--
 4 files changed, 10 insertions(+), 10 deletions(-)
 rename name_value/applications/{name-value-form => name-value-forms} (91%)
 rename name_value/examples/{name-value-form => name-value-forms}/menu.json (100%)
 rename name_value/examples/{name-value-form => name-value-forms}/run (73%)

diff --git a/name_value/applications/CMakeLists.txt b/name_value/applications/CMakeLists.txt
index 50f29d37e..76611190c 100644
--- a/name_value/applications/CMakeLists.txt
+++ b/name_value/applications/CMakeLists.txt
@@ -36,4 +36,4 @@ install( TARGETS name-value-to-csv RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR}
 install( PROGRAMS name-value-apply DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS name-value-calc DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS name-value-eval DESTINATION ${comma_INSTALL_BIN_DIR} )
-install( PROGRAMS name-value-form DESTINATION ${comma_INSTALL_BIN_DIR} )
\ No newline at end of file
+install( PROGRAMS name-value-forms DESTINATION ${comma_INSTALL_BIN_DIR} )
diff --git a/name_value/applications/name-value-form b/name_value/applications/name-value-forms
similarity index 91%
rename from name_value/applications/name-value-form
rename to name_value/applications/name-value-forms
index 2542e6148..cb7b645c4 100755
--- a/name_value/applications/name-value-form
+++ b/name_value/applications/name-value-forms
@@ -12,7 +12,7 @@ function prologue()
 read name-value pairs on stdin, display form, output initialised
 name-value pairs to stdout
 
-usage: cat <input> | name-value-form
+usage: cat <input> | name-value-forms
 
 <input>     : <name>[=<value>]
 <value>     : [<default>][<delimiter><combo list values>]
@@ -25,17 +25,17 @@ function epilogue()
     cat <<eof
 examples (try them)
     plain vanilla
-        { echo "hello"; echo "world"; } | name-value-form
+        { echo "hello"; echo "world"; } | name-value-forms
     form title
-        { echo "hello"; echo "world"; } | name-value-form --title "HELLO"
+        { echo "hello"; echo "world"; } | name-value-forms --title "HELLO"
     default values
-        { echo "hello"; echo "world=XXX"; } | name-value-form
+        { echo "hello"; echo "world=XXX"; } | name-value-forms
     combo lists
-        { echo "hello"; echo "world=,a,b,c"; } | name-value-form
+        { echo "hello"; echo "world=,a,b,c"; } | name-value-forms
     combo lists with defaults
-        { echo "hello"; echo "world=b,a,b,c"; } | name-value-form
+        { echo "hello"; echo "world=b,a,b,c"; } | name-value-forms
     dry run
-        { echo "hello"; echo "world"; } | name-value-form --dry
+        { echo "hello"; echo "world"; } | name-value-forms --dry
 eof
 }
 
diff --git a/name_value/examples/name-value-form/menu.json b/name_value/examples/name-value-forms/menu.json
similarity index 100%
rename from name_value/examples/name-value-form/menu.json
rename to name_value/examples/name-value-forms/menu.json
diff --git a/name_value/examples/name-value-form/run b/name_value/examples/name-value-forms/run
similarity index 73%
rename from name_value/examples/name-value-form/run
rename to name_value/examples/name-value-forms/run
index 2c11d75a1..ef88e86da 100755
--- a/name_value/examples/name-value-form/run
+++ b/name_value/examples/name-value-forms/run
@@ -1,8 +1,8 @@
 #!/bin/bash
 
 echo "======== example 1: hello world =========================="
-( echo hello; echo world; echo star=sun,antares,betelgeuse ) | ../../applications/name-value-form --title menu
+( echo hello; echo world; echo star=sun,antares,betelgeuse ) | ../../applications/name-value-forms --title menu
 
 echo "======== example 2: json ================================="
-cat menu.json | name-value-convert | ../../applications/name-value-form --title menu | name-value-convert --to json
+cat menu.json | name-value-convert | ../../applications/name-value-forms --title menu | name-value-convert --to json
 

From 0c757aadf4837f7c58d540848c31c7461152b1cf Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Feb 2024 17:25:29 +1100
Subject: [PATCH 0745/1056] name_value/examples/name-value-form: examples
 brushed up

---
 name_value/examples/name-value-forms/run | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/name_value/examples/name-value-forms/run b/name_value/examples/name-value-forms/run
index ef88e86da..399f8bba0 100755
--- a/name_value/examples/name-value-forms/run
+++ b/name_value/examples/name-value-forms/run
@@ -1,8 +1,8 @@
 #!/bin/bash
 
 echo "======== example 1: hello world =========================="
-( echo hello; echo world; echo star=sun,antares,betelgeuse ) | ../../applications/name-value-forms --title menu
+( echo hello; echo world; echo star=sun,antares,betelgeuse ) | name-value-forms --title menu
 
 echo "======== example 2: json ================================="
-cat menu.json | name-value-convert | ../../applications/name-value-forms --title menu | name-value-convert --to json
+cat menu.json | name-value-convert | name-value-forms --title menu | name-value-convert --to json
 

From c2a8cf984fe02a9215c72ecfd9f3c1a232112e64 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 13 Feb 2024 17:26:13 +1100
Subject: [PATCH 0746/1056] name_value/examples/name-value-form: examples
 brushed up

---
 name_value/examples/name-value-forms/run | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/name_value/examples/name-value-forms/run b/name_value/examples/name-value-forms/run
index 399f8bba0..97531d8cd 100755
--- a/name_value/examples/name-value-forms/run
+++ b/name_value/examples/name-value-forms/run
@@ -1,7 +1,7 @@
 #!/bin/bash
 
 echo "======== example 1: hello world =========================="
-( echo hello; echo world; echo star=sun,antares,betelgeuse ) | name-value-forms --title menu
+( echo hello; echo world; echo star=sun,antares,betelgeuse ) | name-value-forms --title "hello world"
 
 echo "======== example 2: json ================================="
 cat menu.json | name-value-convert | name-value-forms --title menu | name-value-convert --to json

From c7dd038fe0171f954a1fa32a4a3c9f5a3871f045 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 14 Feb 2024 11:17:45 +1100
Subject: [PATCH 0747/1056] comma_say macros: whitespaces added for visual
 alignment

---
 application/command_line_options.h | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/application/command_line_options.h b/application/command_line_options.h
index f33b082c4..bc2b50930 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -38,11 +38,11 @@ inline std::ostream& say( unsigned int verbosity=0, const std::string& prefix=""
 /// convenience macros
 #define _COMMA_SAY( _level, _message ) { if( _level <= ::comma::verbosity::level() ) { ::comma::say( _level ) << _message; } }
 #define COMMA_SAY( message )       _COMMA_SAY( 0,                message << std::endl )
-#define COMMA_SAY_ERROR( message ) _COMMA_SAY( 0, "error: "   << message << std::endl )
+#define COMMA_SAY_ERROR( message ) _COMMA_SAY( 0, "error:   "   << message << std::endl )
 #define COMMA_SAY_WARN( message )  _COMMA_SAY( 1, "warning: " << message << std::endl )
-#define COMMA_SAY_INFO( message )  _COMMA_SAY( 2, "info: "    << message << std::endl )
-#define COMMA_SAY_DEBUG( message ) _COMMA_SAY( 3, "debug: "   << message << std::endl )
-#define COMMA_SAY_TRACE( message ) _COMMA_SAY( 4, "trace: "   << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " << message << std::endl; )
+#define COMMA_SAY_INFO( message )  _COMMA_SAY( 2, "info:    "    << message << std::endl )
+#define COMMA_SAY_DEBUG( message ) _COMMA_SAY( 3, "debug:   "   << message << std::endl )
+#define COMMA_SAY_TRACE( message ) _COMMA_SAY( 4, "trace:   "   << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " << message << std::endl; )
 
 /// convenience alias of say( verbosity )
 /// @example

From f50032f9296bcac9445fee5cf702e9656e0b2926 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 14 Feb 2024 16:44:37 +1100
Subject: [PATCH 0748/1056] string: split_as(): convenience methods with
 vector-like defaults added

---
 string/split.h              | 61 +++++++++++++++++++++++++++++++------
 string/test/string_test.cpp | 24 +++++++++++++++
 2 files changed, 75 insertions(+), 10 deletions(-)

diff --git a/string/split.h b/string/split.h
index 47203f748..3257fd234 100644
--- a/string/split.h
+++ b/string/split.h
@@ -4,8 +4,10 @@
 
 #pragma once
 
+#include <array>
 #include <string>
 #include <vector>
+#include <boost/array.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
 
@@ -23,13 +25,17 @@ std::vector< std::string > split( const std::string& s, const char* separators =
 /// split string into tokens (a quick implementation); always contains at least one element unless empty_if_empty_input is true
 std::vector< std::string > split( const std::string& s, char separator, bool empty_if_empty_input = false );
 
-/// split string into tokens (a quick implementation) and cast to a given type
-template < typename T >
-std::vector< T > split_as( const std::string& s, const char* separators, const boost::optional< T >& default_value = boost::none );
-
-/// split string into tokens (a quick implementation) and cast to a given type
-template < typename T >
-std::vector< T > split_as( const std::string& s, char separator, const boost::optional< T >& default_value = boost::none );
+/// split string into tokens and cast to a vector of given types
+template < typename T > std::vector< T > split_as( const std::string& s, const char* separators );
+template < typename T > std::vector< T > split_as( const std::string& s, const char* separators, const T& default_value );
+template < typename T > std::vector< T > split_as( const std::string& s, char separator );
+template < typename T > std::vector< T > split_as( const std::string& s, char separator, const T& default_value );
+template < typename T > std::vector< T > split_as( const std::string& s, const char* separators, const std::vector< T >& defaults ); // todo: re-implement using traits
+template < typename T > std::vector< T > split_as( const std::string& s, char separator, const std::vector< T >& defaults );
+template < typename T, std::size_t N > std::vector< T > split_as( const std::string& s, const char* separators, const std::array< T, N >& defaults );
+template < typename T, std::size_t N > std::vector< T > split_as( const std::string& s, char separator, const std::array< T, N >& defaults );
+template < typename T, std::size_t N > std::vector< T > split_as( const std::string& s, const char* separators, const boost::array< T, N >& defaults );
+template < typename T, std::size_t N > std::vector< T > split_as( const std::string& s, char separator, const boost::array< T, N >& defaults );
 
 /// Split string into tokens; always contains at least one element;
 /// skips backslash escaped separator, handle non-nested quotes;
@@ -55,8 +61,10 @@ std::vector< std::string > split_bracketed( const std::string& s, const char * s
 /// skips bracketed separators
 std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket = '(', char rbracket = ')', bool strip_brackets = true );
 
+namespace impl {
+
 template < typename T >
-inline std::vector< T > split_as( const std::string& s, const char* separators, const boost::optional< T >& default_value )
+inline std::vector< T > split_with_scalar_default( const std::string& s, const char* separators, const boost::optional< T >& default_value )
 {
     const auto& v = split( s, separators, true );
     std::vector< T > t( v.size() );
@@ -64,10 +72,43 @@ inline std::vector< T > split_as( const std::string& s, const char* separators,
     return t;
 }
 
-template < typename T > inline std::vector< T > split_as( const std::string& s, char separator, const boost::optional< T >& default_value )
+template < typename T, typename V > inline std::vector< T > split_as( const std::string& s, const char* separators, const V& defaults )
+{
+    const auto& v = split( s, separators, true );
+    std::vector< T > t( v.size() );
+    for( unsigned int i = 0; i < v.size(); ++i ) { t[i] = v[i].empty() && defaults.size() > i ? defaults[i] : boost::lexical_cast< T >( v[i] ); }
+    return t;
+}
+
+template < typename T, typename V > inline std::vector< T > split_as( const std::string& s, char separator, const V& defaults )
 {
     const char separators[] = { separator, 0 };
-    return split_as< T >( s, separators, default_value );
+    return split_as< T >( s, &separators[0], defaults );
 }
 
+} // namespace impl {
+
+template < typename T > inline std::vector< T > split_as( const std::string& s, const char* separators ) { return impl::split_with_scalar_default( s, separators, boost::optional< T >() ); }
+
+template < typename T > inline std::vector< T > split_as( const std::string& s, const char* separators, const T& default_value ) { return impl::split_with_scalar_default( s, separators, boost::optional< T >( default_value ) ); } // wrap explicitly: T cannot be deduced for boost::optional< T > from a plain T argument
+
+template < typename T > inline std::vector< T > split_as( const std::string& s, char separator )
+{ 
+    const char separators[] = { separator, 0 };
+    return impl::split_with_scalar_default( s, &separators[0], boost::optional< T >() );
+}
+
+template < typename T > inline std::vector< T > split_as( const std::string& s, char separator, const T& default_value )
+{ 
+    const char separators[] = { separator, 0 };
+    return impl::split_with_scalar_default( s, &separators[0], boost::optional< T >( default_value ) );
+}
+
+template < typename T > inline std::vector< T > split_as( const std::string& s, const char* separators, const std::vector< T >& defaults ) { return impl::split_as< T >( s, separators, defaults ); }
+template < typename T > inline std::vector< T > split_as( const std::string& s, char separator, const std::vector< T >& defaults ) { return impl::split_as< T >( s, separator, defaults ); }
+template < typename T, std::size_t N > inline std::vector< T > split_as( const std::string& s, const char* separators, const std::array< T, N >& defaults ) { return impl::split_as< T >( s, separators, defaults ); }
+template < typename T, std::size_t N > inline std::vector< T > split_as( const std::string& s, char separator, const std::array< T, N >& defaults ) { return impl::split_as< T >( s, separator, defaults ); }
+template < typename T, std::size_t N > inline std::vector< T > split_as( const std::string& s, const char* separators, const boost::array< T, N >& defaults ) { return impl::split_as< T >( s, separators, defaults ); }
+template < typename T, std::size_t N > inline std::vector< T > split_as( const std::string& s, char separator, const boost::array< T, N >& defaults ) { return impl::split_as< T >( s, separator, defaults ); }
+
 } // namespace comma {
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index 438c25a14..1636e182e 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -99,6 +99,30 @@ TEST( string, split )
     }
 }
 
+TEST( string, split_as )
+{
+    {
+        std::vector< int > expected{ 1, 2, 3 };
+        EXPECT_EQ( split_as< int >( "1,2,3", ',' ), expected );
+        EXPECT_EQ( split_as< int >( "1,2;3", ",;" ), expected );
+        EXPECT_EQ( split_as< int >( "1,2;3", ",;_" ), expected );
+    }
+    {
+        std::vector< int > expected{ 5, 5, 3, 5 };
+        EXPECT_EQ( split_as< int >( ",,3,", ',', 5 ), expected );
+    }
+    {
+        std::vector< int > expected{ 1, 5, 3 };
+        std::vector< int > defaults_vector{ 1, 5 };
+        std::array< int, 4 > defaults_std_array{ 1, 5, 1, 1 };
+        boost::array< int, 4 > defaults_boost_array{ 1, 5, 1, 1 };        
+        EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_vector ), expected );
+        split_as< int >( std::string( ",,3" ), ',', defaults_boost_array );
+        EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_boost_array ), expected );
+        EXPECT_EQ( split_as< int >( ",,3", ',', defaults_std_array ), expected );
+    }
+}
+
 TEST( string, escape )
 {
     EXPECT_EQ( "ab", escape( "ab" ) );

From bf7ac59a68bc359245467fe73379d9cbc7675b97 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 14 Feb 2024 16:54:30 +1100
Subject: [PATCH 0749/1056] string: split_as(): usage semantics for vector-like
 defaults made more consistent

---
 string/split.h              |  3 ++-
 string/test/string_test.cpp | 17 ++++++++++++++---
 2 files changed, 16 insertions(+), 4 deletions(-)

diff --git a/string/split.h b/string/split.h
index 3257fd234..ea578625e 100644
--- a/string/split.h
+++ b/string/split.h
@@ -75,8 +75,9 @@ inline std::vector< T > split_with_scalar_default( const std::string& s, const c
 template < typename T, typename V > inline std::vector< T > split_as( const std::string& s, const char* separators, const V& defaults )
 {
     const auto& v = split( s, separators, true );
-    std::vector< T > t( v.size() );
+    std::vector< T > t( v.size() < defaults.size() ? defaults.size() : v.size() );
     for( unsigned int i = 0; i < v.size(); ++i ) { t[i] = v[i].empty() && defaults.size() > i ? defaults[i] : boost::lexical_cast< T >( v[i] ); }
+    for( unsigned int i = v.size(); i < defaults.size(); ++i ) { t[i] = defaults[i]; }
     return t;
 }
 
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index 1636e182e..ce987b63c 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -114,13 +114,24 @@ TEST( string, split_as )
     {
         std::vector< int > expected{ 1, 5, 3 };
         std::vector< int > defaults_vector{ 1, 5 };
-        std::array< int, 4 > defaults_std_array{ 1, 5, 1, 1 };
-        boost::array< int, 4 > defaults_boost_array{ 1, 5, 1, 1 };        
+        std::array< int, 2 > defaults_std_array{ 1, 5 };
+        boost::array< int, 2 > defaults_boost_array{ 1, 5 };
         EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_vector ), expected );
-        split_as< int >( std::string( ",,3" ), ',', defaults_boost_array );
         EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_boost_array ), expected );
         EXPECT_EQ( split_as< int >( ",,3", ',', defaults_std_array ), expected );
     }
+    {
+        std::vector< int > expected{ 1, 5, 3, 7 };
+        std::vector< int > defaults_vector{ 1, 5, 1, 7 };
+        std::array< int, 4 > defaults_std_array{ 1, 5, 1, 7 };
+        boost::array< int, 4 > defaults_boost_array{ 1, 5, 1, 7 };
+        EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_vector ), expected );
+        EXPECT_EQ( split_as< int >( std::string( ",,3," ), ',', defaults_vector ), expected );
+        EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_boost_array ), expected );
+        EXPECT_EQ( split_as< int >( std::string( ",,3," ), ',', defaults_boost_array ), expected );
+        EXPECT_EQ( split_as< int >( ",,3", ',', defaults_std_array ), expected );
+        EXPECT_EQ( split_as< int >( ",,3,", ',', defaults_std_array ), expected );
+    }
 }
 
 TEST( string, escape )

From 846d6cdfb6249ba480c4ec9c21b70c0464170732 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 21 Feb 2024 15:15:59 +1100
Subject: [PATCH 0750/1056] packed::struct::clear() implemented

---
 packed/struct.h | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

diff --git a/packed/struct.h b/packed/struct.h
index ba559e7ee..3ac27ecc7 100644
--- a/packed/struct.h
+++ b/packed/struct.h
@@ -12,20 +12,21 @@ namespace comma { namespace packed {
 
 /// packed structure
 template < class Derived, size_t S >
-class packed_struct
+struct packed_struct
 {
-    public:
-        enum { size = S };
+    enum { size = S };
 
-        packed_struct() throw() { static_assert( sizeof( Derived ) == size, "expected derived of provided size" ); }
+    packed_struct() throw() { static_assert( sizeof( Derived ) == size, "expected derived of provided size" ); }
 
-        const char* data() const throw() { return reinterpret_cast< const char* >( this ); }
+    const char* data() const throw() { return reinterpret_cast< const char* >( this ); }
 
-        char* data() throw() { return reinterpret_cast< char* >( this ); }
+    char* data() throw() { return reinterpret_cast< char* >( this ); }
 
-        bool operator==( const packed_struct& rhs ) const { return ::memcmp( this, &rhs, size ) == 0; }
+    bool operator==( const packed_struct& rhs ) const { return std::memcmp( this, &rhs, size ) == 0; }
 
-        bool operator!=( const packed_struct& rhs ) const { return !operator==( rhs ); }
+    bool operator!=( const packed_struct& rhs ) const { return !operator==( rhs ); }
+
+    void clear() { std::memset( ( char* )( this ), 0, size ); }
 };
 
 } } // namespace comma { namespace packed {

From 897adaca744f846a0e97a343752aed80c50e625d Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 27 Feb 2024 12:04:40 +1100
Subject: [PATCH 0751/1056] csv::names( aliases ) implemented

---
 csv/names.h | 23 ++++++++++++++++++-----
 1 file changed, 18 insertions(+), 5 deletions(-)

diff --git a/csv/names.h b/csv/names.h
index 4d379f48c..1fe53f86d 100644
--- a/csv/names.h
+++ b/csv/names.h
@@ -16,13 +16,18 @@ namespace comma { namespace csv {
 
 /// the most generic way: return default column names for
 /// a given sample and given subtree in comma-separated xpaths
-template < typename S > std::vector< std::string > names( const std::string& paths, bool useFullxpath = true, const S& sample = S() );
+template < typename S > std::vector< std::string > names( const std::string& paths, bool use_full_xpath = true, const S& sample = S() );
 
 /// return default column names for a given sample and given subtree in comma-separated xpaths
-template < typename S > std::vector< std::string > names( const char* paths, bool useFullxpath = true, const S& sample = S() ) { return names( std::string( paths ), useFullxpath, sample ); }
+template < typename S > std::vector< std::string > names( const char* paths, bool use_full_xpath = true, const S& sample = S() ) { return names( std::string( paths ), use_full_xpath, sample ); }
 
 /// return default column names for a given sample
-template < typename S > std::vector< std::string > names( bool useFullxpath, const S& sample = S() ) { return names( "", useFullxpath, sample ); }
+template < typename S > std::vector< std::string > names( bool use_full_xpath, const S& sample = S() ) { return names( "", use_full_xpath, sample ); }
+
+/// return default column names for a given sample replacing full field names with given aliases
+/// also see csv::options constructor with aliases
+/// attention! aliases: name-value pairs as passed to csv::options: key: alias; value: name
+template < typename S > std::vector< std::string > names( const std::unordered_map< std::string, std::string >& aliases, bool use_full_xpath = true, const S& sample = S() );
 
 /// return default column names for a given sample, use full xpath
 template < typename S > std::vector< std::string > names( const S& sample = S() ) { return names( true, sample ); }
@@ -37,7 +42,7 @@ bool fields_exist( const std::vector< std::string >& fields, const std::vector<
 bool fields_exist( const std::string& fields, const std::string& subset, char delimiter = ',', bool allow_empty = false );
 
 template < typename S >
-inline std::vector< std::string > names( const std::string& paths, bool useFullxpath, const S& sample )
+inline std::vector< std::string > names( const std::string& paths, bool use_full_xpath, const S& sample )
 {
     std::vector< std::string > p = split( paths, ',' );
     std::vector< std::string > r;
@@ -49,7 +54,7 @@ inline std::vector< std::string > names( const std::string& paths, bool useFullx
         }
         else
         {
-            impl::to_names v( p[i], useFullxpath );
+            impl::to_names v( p[i], use_full_xpath );
             visiting::apply( v, sample );
             if( v().empty() ) { r.push_back( p[i] ); } // unknown name, don't replace
             else { r.insert( r.end(), v().begin(), v().end() ); }
@@ -68,4 +73,12 @@ inline std::unordered_map< std::string, std::string > leaves( const std::string&
     return m;
 }
 
+template < typename S > // S: sample type whose fields define the default column names
+inline std::vector< std::string > names( const std::unordered_map< std::string, std::string >& aliases, bool use_full_xpath, const S& sample )
+{
+    auto n = names( use_full_xpath, sample ); // start from the default (unaliased) column names of the sample
+    for( auto& m: n ) { for( const auto& i: aliases ) { if( i.second == m ) { m = i.first; break; } } } // quick and dirty: linear scan; key: alias, value: field name; bind by reference to avoid copying a string pair per iteration
+    return n;
+}
+
 } } // namespace comma { namespace csv {

From 6b2734445efc3f75fabbbb4458ef1cb95ac9fc20 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 8 Mar 2024 18:22:53 +1100
Subject: [PATCH 0752/1056] application/command_line_options.cpp: includes
 fixed

---
 application/command_line_options.cpp | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index d303d5604..e8cfab9f8 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -10,9 +10,9 @@
 #include <unordered_map>
 #include <boost/bind/bind.hpp>
 #include <boost/config/warning_disable.hpp>
-//#include "boost/filesystem.hpp"
-#include "boost/iostreams/stream.hpp"
-#include "boost/iostreams/device/null.hpp"
+//#include <boost/filesystem.hpp>
+#include <boost/iostreams/stream.hpp>
+#include <boost/iostreams/device/null.hpp>
 #include <boost/optional.hpp>
 #include <boost/regex.hpp>
 #include <boost/spirit/include/qi.hpp>

From 08f801c62eb867d54511eec2014102abd45aa8fd Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 8 Mar 2024 18:36:07 +1100
Subject: [PATCH 0753/1056] io::terminal::ostream: first cut implemented

---
 io/terminal.h | 74 +++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 74 insertions(+)
 create mode 100644 io/terminal.h

diff --git a/io/terminal.h b/io/terminal.h
new file mode 100644
index 000000000..b947d7038
--- /dev/null
+++ b/io/terminal.h
@@ -0,0 +1,74 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <iostream>
+
+namespace comma { namespace io { namespace terminal {
+
+namespace controls {
+
+struct end { static constexpr char value[] = { 0x07, 0 }; };
+
+struct stderr { static constexpr char* start = ""; static constexpr char* end = "\n"; }; // quick and dirty
+
+struct titlebar { static constexpr char start[] = { 0x1b, ']', '0', ';', 0 }; static constexpr char end[] = { 0x07, 0 }; };
+
+template < unsigned int Colour >
+struct coloured; // todo
+
+// todo! combining multiple controls
+
+} // namespace controls {
+
+template < typename T >
+void write_to( const std::string& s ) { std::cerr << T::start << s << T::end; }
+
+namespace impl {
+
+template < typename S > struct traits
+{
+    template < typename T > static bool output_if_end( bool started ) { return false; }
+    static void output( const S& s ) { std::cerr << s; }
+};
+
+template <> struct traits< terminal::controls::end >
+{
+    template < typename T > static bool output_if_end( bool started ) { if( started ) { std::cerr << T::end; } return true; }
+    static void output( const terminal::controls::end& s ) {}
+};
+
+} // namespace impl {
+
+template < typename T >
+class ostream
+{
+    public:
+        ~ostream() { if( _started ) { std::cerr << T::end; _started = false; } }
+
+        static terminal::controls::end end() { return terminal::controls::end(); } // convenience method
+
+        template < typename S >
+        ostream& operator<<( const S& s )
+        {
+            if( impl::traits< S >::template output_if_end< T >( _started ) )
+            {
+                _started = false;
+            }
+            else
+            {
+                if( !_started ) { std::cerr << T::start; _started = true; }
+                impl::traits< S >::output( s );
+            }
+            return *this;
+        }
+
+    protected:
+        bool _started{false};
+};
+
+typedef ostream< controls::titlebar > titlebar_ostream;
+
+} } } // namespace comma { namespace io { namespace terminal {

From 7f7e6bed256ac09e2704f383f316e27002b02c0f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 8 Mar 2024 20:09:33 +1100
Subject: [PATCH 0754/1056] io/terminal, application/command_line_options:
 --titlebar-application-name implemented

---
 application/command_line_options.cpp | 10 ++++++++--
 application/command_line_options.h   |  1 +
 io/terminal.h                        |  2 +-
 3 files changed, 10 insertions(+), 3 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index e8cfab9f8..09dc9f3b1 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -16,6 +16,7 @@
 #include <boost/optional.hpp>
 #include <boost/regex.hpp>
 #include <boost/spirit/include/qi.hpp>
+#include "../io/terminal.h"
 #include "../string/split.h"
 #include "../base/exception.h"
 #include "command_line_options.h"
@@ -26,6 +27,7 @@ namespace application { namespace detail {
 
 static std::string name;
 static unsigned int verbosity_level{0};
+static bool titlebar{false};
 static boost::iostreams::stream< boost::iostreams::null_sink > null_ostream( ( boost::iostreams::null_sink() ) );
 
 } } // namespace application { namespace detail {
@@ -51,6 +53,8 @@ const std::string verbosity::to_string( unsigned int v )
 std::string verbosity::usage()
 {
     const char* s = R"verbosity(verbosity options
+    --titlebar,--tb; output terminal-destined messages to terminal title bar, default: stderr
+    --titlebar-application-name,--tbn; on application start, set terminal title bar to application name
     --verbose,-v; more output on stderr, same as --verbosity=1
     --verbosity=<n>; default=0; verbosity level from 0 to 5 or 'none'(0), 'low'|'error'(1), 'medium'|'warning'(2), 'high'|'info'(3), 'extreme'|'debug'(4)
     -v,-vv,-vvv,-vvvv,-vvvvv; same as --verbosity from 1 to 5
@@ -73,6 +77,8 @@ void command_line_options::_init_verbose( const std::string& path )
     }
     comma::verbose.init( comma::application::detail::verbosity_level > 0, path ); // todo: deprecate, use comma::say() and comma::saymore() instead
     comma::application::detail::name = comma::split( path, '/' ).back(); // boost::filesystem::basename( path );
+    comma::application::detail::titlebar = exists( "--titlebar,--tb" );
+    if( exists( "--titlebar-application-name,--tbn" ) ) { comma::io::terminal::titlebar_ostream s; s << comma::application::detail::name; }
 }
 
 command_line_options::command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage, boost::function< void( int, char** ) > bash_completion )
@@ -126,8 +132,8 @@ bool command_line_options::exists( const std::string& name ) const
 std::vector< std::string > command_line_options::unnamed( const std::string& valueless_options, const std::string& options_with_values ) const
 {
 
-    std::vector< std::string > valueless{ "--verbose", "-v", "-vv", "-vvv", "-vvvv", "-vvvvv" };
-    if( !valueless_options.empty() ) { valueless = split( valueless_options + ",--verbose,-v,-vv,-vvv,-vvvv,-vvvvv", ',' ); }
+    std::vector< std::string > valueless{ "--verbose", "-v", "-vv", "-vvv", "-vvvv", "-vvvvv", "--titlebar", "--tb", "--titlebar-application-name", "--tbn", "" };
+    if( !valueless_options.empty() ) { valueless = split( valueless_options + ",--verbose,-v,-vv,-vvv,-vvvv,-vvvvv,--titlebar,--tb,--titlebar-application-name,--tbn", ',' ); }
     std::vector< std::string > valued = split( options_with_values, ',' );
     std::vector< std::string > w;
     for( unsigned int i = 1; i < argv_.size(); ++i )
diff --git a/application/command_line_options.h b/application/command_line_options.h
index bc2b50930..59a4bb5bc 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -21,6 +21,7 @@ namespace comma {
 struct verbosity
 {
     enum levels { none=0, low=1, medium=2, high=3, extreme=4 }; // todo: more levels and or aliases like warning, info, debug - but when choosing names, remember: verbosity is not the same as logging!
+    enum target { stderr=0, terminal=1 };
     static unsigned int level();
     static unsigned int from_string( const std::string& s );
     static const std::string to_string( unsigned int v );
diff --git a/io/terminal.h b/io/terminal.h
index b947d7038..10d26beab 100644
--- a/io/terminal.h
+++ b/io/terminal.h
@@ -12,7 +12,7 @@ namespace controls {
 
 struct end { static constexpr char value[] = { 0x07, 0 }; };
 
-struct stderr { static constexpr char* start = ""; static constexpr char* end = "\n"; }; // quick and dirty
+struct stderr { static constexpr char start[] = { 0 }; static constexpr char end[] = { '\n', 0 }; }; // quick and dirty
 
 struct titlebar { static constexpr char start[] = { 0x1b, ']', '0', ';', 0 }; static constexpr char end[] = { 0x07, 0 }; };
 

From a89c4f718a0fbc78bd8dd57bf70e628ed65310d6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 8 Mar 2024 22:13:53 +1100
Subject: [PATCH 0755/1056] application/command_line_options: COMMA_TITLE()
 implemented

---
 application/command_line_options.cpp | 14 +++++++++-----
 application/command_line_options.h   | 22 +++++++++++++++-------
 2 files changed, 24 insertions(+), 12 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 09dc9f3b1..a613259ec 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -5,8 +5,8 @@
 
 #include <algorithm>
 #include <array>
-#include <sstream>
 #include <set>
+#include <sstream>
 #include <unordered_map>
 #include <boost/bind/bind.hpp>
 #include <boost/config/warning_disable.hpp>
@@ -16,9 +16,8 @@
 #include <boost/optional.hpp>
 #include <boost/regex.hpp>
 #include <boost/spirit/include/qi.hpp>
-#include "../io/terminal.h"
-#include "../string/split.h"
 #include "../base/exception.h"
+#include "../string/split.h"
 #include "command_line_options.h"
 
 namespace comma {
@@ -27,13 +26,16 @@ namespace application { namespace detail {
 
 static std::string name;
 static unsigned int verbosity_level{0};
-static bool titlebar{false};
+static bool titlebar_enabled{false};
+static comma::io::terminal::titlebar_ostream titlebar_ostream;
 static boost::iostreams::stream< boost::iostreams::null_sink > null_ostream( ( boost::iostreams::null_sink() ) );
 
 } } // namespace application { namespace detail {
 
 unsigned int verbosity::level() { return comma::application::detail::verbosity_level; }
 
+bool verbosity::titlebar_enabled() { return comma::application::detail::titlebar_enabled; }
+
 unsigned int verbosity::from_string( const std::string& s )
 {
     return   s == "none"                     ? verbosity::none
@@ -67,6 +69,8 @@ std::ostream& say( std::ostream& os, unsigned int verbosity, const std::string&
     return ( verbosity > comma::application::detail::verbosity_level ? comma::application::detail::null_ostream : os ) << comma::application::detail::name << ": " << ( prefix.empty() ? std::string() : ( prefix + ": " ) );
 }
 
+comma::io::terminal::titlebar_ostream titlebar() { return comma::application::detail::titlebar_ostream << comma::application::detail::name; }
+
 void command_line_options::_init_verbose( const std::string& path )
 {
     comma::application::detail::verbosity_level = verbosity::from_string( value< std::string >( "--verbosity", exists( "--verbose,-v" ) ? "1" : "0" ) );
@@ -77,7 +81,7 @@ void command_line_options::_init_verbose( const std::string& path )
     }
     comma::verbose.init( comma::application::detail::verbosity_level > 0, path ); // todo: deprecate, use comma::say() and comma::saymore() instead
     comma::application::detail::name = comma::split( path, '/' ).back(); // boost::filesystem::basename( path );
-    comma::application::detail::titlebar = exists( "--titlebar,--tb" );
+    comma::application::detail::titlebar_enabled = exists( "--titlebar,--tb" );
     if( exists( "--titlebar-application-name,--tbn" ) ) { comma::io::terminal::titlebar_ostream s; s << comma::application::detail::name; }
 }
 
diff --git a/application/command_line_options.h b/application/command_line_options.h
index 59a4bb5bc..b5efa142f 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -5,14 +5,15 @@
 
 #pragma once
 
+#include <iostream>
 #include <map>
 #include <string>
 #include <vector>
-#include <iostream>
 #include <boost/function.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
 #include "../base/exception.h"
+#include "../io/terminal.h"
 #include "../string/string.h"
 #include "verbose.h" // todo: deprecate
 
@@ -23,6 +24,7 @@ struct verbosity
     enum levels { none=0, low=1, medium=2, high=3, extreme=4 }; // todo: more levels and or aliases like warning, info, debug - but when choosing names, remember: verbosity is not the same as logging!
     enum target { stderr=0, terminal=1 };
     static unsigned int level();
+    static bool titlebar_enabled();
     static unsigned int from_string( const std::string& s );
     static const std::string to_string( unsigned int v );
     static std::string usage();
@@ -35,15 +37,21 @@ struct verbosity
 ///          my-application: some message
 std::ostream& say( std::ostream& os, unsigned int verbosity=0, const std::string& prefix="" );
 inline std::ostream& say( unsigned int verbosity=0, const std::string& prefix="" ) { return say( std::cerr, verbosity, prefix ); }
+/// set terminal title bar if --tb option present or force set to true
+/// @example
+///     todo
+comma::io::terminal::titlebar_ostream titlebar();
 
 /// convenience macros
 #define _COMMA_SAY( _level, _message ) { if( _level <= ::comma::verbosity::level() ) { ::comma::say( _level ) << _message; } }
-#define COMMA_SAY( message )       _COMMA_SAY( 0,                message << std::endl )
-#define COMMA_SAY_ERROR( message ) _COMMA_SAY( 0, "error:   "   << message << std::endl )
-#define COMMA_SAY_WARN( message )  _COMMA_SAY( 1, "warning: " << message << std::endl )
-#define COMMA_SAY_INFO( message )  _COMMA_SAY( 2, "info:    "    << message << std::endl )
-#define COMMA_SAY_DEBUG( message ) _COMMA_SAY( 3, "debug:   "   << message << std::endl )
-#define COMMA_SAY_TRACE( message ) _COMMA_SAY( 4, "trace:   "   << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " << message << std::endl; )
+#define COMMA_SAY( message )         _COMMA_SAY( 0,                message << std::endl )
+#define COMMA_SAY_ERROR( message )   _COMMA_SAY( 0, "error:   "   << message << std::endl )
+#define COMMA_SAY_WARN( message )    _COMMA_SAY( 1, "warning: " << message << std::endl )
+#define COMMA_SAY_INFO( message )    _COMMA_SAY( 2, "info:    "    << message << std::endl )
+#define COMMA_SAY_DEBUG( message )   _COMMA_SAY( 3, "debug:   "   << message << std::endl )
+#define COMMA_SAY_TRACE( message )   _COMMA_SAY( 4, "trace:   "   << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " << message << std::endl; )
+#define COMMA_TITLE( message )       { if( ::comma::verbosity::titlebar_enabled() ) { auto t = ::comma::titlebar(); t << message; } else { COMMA_SAY( message ); } } // message goes to the terminal title bar if enabled, otherwise via COMMA_SAY
+#define COMMA_TITLE_BARE( message )  { if( ::comma::verbosity::titlebar_enabled() ) { ::comma::io::terminal::titlebar_ostream t; t << message; } else { std::cerr << message << std::endl; } }
 
 /// convenience alias of say( verbosity )
 /// @example

From 9181f646299e303a6d0c694dcb9b817b3a2017ec Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 8 Mar 2024 22:14:19 +1100
Subject: [PATCH 0756/1056] io-bandwidth: --porcelain mode and output to title
 bar implemented

---
 io/applications/io-bandwidth.cpp | 84 +++++++++++++++++++-------------
 1 file changed, 50 insertions(+), 34 deletions(-)

diff --git a/io/applications/io-bandwidth.cpp b/io/applications/io-bandwidth.cpp
index f774f9ec3..e82420912 100644
--- a/io/applications/io-bandwidth.cpp
+++ b/io/applications/io-bandwidth.cpp
@@ -31,11 +31,13 @@
 
 #include <iostream>
 #include <numeric>
+#include <sstream>
 #include <boost/algorithm/string/replace.hpp>
 #include <boost/array.hpp>
 #include <boost/circular_buffer.hpp>
 #include <boost/thread.hpp>
 #include "../../application/command_line_options.h"
+#include "../../base/none.h"
 #include "../../io/select.h"
 #include "../../io/stream.h"
 
@@ -44,7 +46,7 @@ static const double default_window_resolution = 0.1f;
 static const double default_update_interval = 1.0f;
 static const char default_delimiter = ',';
 static const std::string standard_output_fields="timestamp,received_bytes,bytes_per_second/all_time,bytes_per_second/window";
-static const std::string extended_output_fields="timestamp,received_bytes,bytes_per_second/all_time,bytes_per_second/window,records_per_second/all_time,records_per_second/window";
+static const std::string extended_output_fields="timestamp,received_bytes,bytes_per_second/all_time,bytes_per_second/window,records_per_second/all_time,records_per_second/window,progress";
 
 static void bash_completion( unsigned const ac, char const * const * av )
 {
@@ -65,12 +67,17 @@ void usage( bool verbose = false )
     std::cerr << "usage: io-bandwidth [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
+    std::cerr << "    --delimiter,-d <delimiter>: default ','" << std::endl;
+    std::cerr << "    --output-fields: list output fields and exit" << std::endl;
+    std::cerr << "    --output-progress,--progress: output only progress indicator; todo: --fields=<output-fields>" << std::endl;
+    std::cerr << "    --porcelain: human-readable output" << std::endl;
+    std::cerr << "    --porcelain-title,--title=<title>; default=io-bandwidth: output will be prefixed with <title>" << std::endl;
+    std::cerr << "    --resolution,-r=[<n>]: sliding window resolution; default=" << default_window_resolution << "s" << std::endl;
     std::cerr << "    --size,-s=[<bytes>]: specify size of one record of input data" << std::endl;
-    std::cerr << "    --window,-w=[<n>]: sliding window; default=" << default_window << "s" << std::endl;
+    std::cerr << "    --total-count=[<n>]: total expected record count, if present, output progress in percent" << std::endl;
+    std::cerr << "    --total-size=[<bytes>]: total expected size in bytes, if present, output progress in percent" << std::endl;
     std::cerr << "    --update,-u=[<n>]: update interval; default=" << default_update_interval << "s" << std::endl;
-    std::cerr << "    --resolution,-r=[<n>]: sliding window resolution; default=" << default_window_resolution << "s" << std::endl;
-    std::cerr << "    --output-fields: list output fields and exit" << std::endl;
-    std::cerr << "    --delimiter,-d <delimiter>: default ','" << std::endl;
+    std::cerr << "    --window,-w=[<n>]: sliding window; default=" << default_window << "s" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    The sliding window consists of a number of buckets. The width of each" << std::endl;
     std::cerr << "    bucket is given by --resolution, and there are sufficient buckets to" << std::endl;
@@ -104,6 +111,15 @@ void usage( bool verbose = false )
     std::cerr << "            dd if=/dev/urandom bs=100 count=1 2> /dev/null; sleep 0.1" << std::endl;
     std::cerr << "        done | io-bandwidth 2> >( io-publish tcp:8888 ) | hexdump" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "    show values in terminal title bar" << std::endl;
+    std::cerr << "        yes | csv-repeat --pace --period 0.001 | head -n10000 \\" << std::endl;
+    std::cerr << "            | io-bandwidth --total-size 10000 --size 2 \\" << std::endl;
+    std::cerr << "                           --porcelain --titlebar >/dev/null" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    show progress indicator in terminal title bar" << std::endl;
+    std::cerr << "        yes | csv-repeat --pace --period 0.001 | head -n50000 \\" << std::endl;
+    std::cerr << "            | io-bandwidth --total-count 10000 --size 2 \\" << std::endl;
+    std::cerr << "                           --porcelain --titlebar --progress --title='counting yes' >/dev/null" << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
@@ -118,42 +134,43 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
-
         if( options.exists( "--output-fields" ))
         {
             if( options.exists( "--size,-s" )) { std::cout << extended_output_fields << std::endl; }
             else { std::cout << standard_output_fields << std::endl; }
             return 0;
         }
-
+        options.assert_mutually_exclusive( "--total-size", "--total-count" );
         // Functionally equivalent to boost::optional< std::size_t > record_size
         // but eliminates the gcc "maybe-uninitialized" warning
-        boost::optional< std::size_t > record_size = boost::make_optional< std::size_t >( false, 0 );
+        boost::optional< std::size_t > record_size = comma::silent_none< std::size_t >();
         if( options.exists( "--size,-s" )) { record_size = options.value< std::size_t >( "--size,-s" ); }
-
+        auto total_count = options.optional< std::uint64_t >( "--total-count" );
+        auto total_size = options.optional< std::uint64_t >( "--total-size" );
+        bool output_progress = options.exists( "--output-progress,--progress" ); // todo! --fields <output fields>
+        COMMA_ASSERT_BRIEF( !total_count || record_size, "--total-count given, please specify --size" );
+        COMMA_ASSERT_BRIEF( !output_progress || total_count || total_size, "--output-progress given; please specify --total-count or --total-size" );
         boost::posix_time::time_duration update_interval = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--update,-u", default_update_interval ) * 1000000) );
         double window = options.value< double >( "--window,-w", default_window );
         double bucket_width = options.value< double >( "--resolution,-r", default_window_resolution );
         boost::posix_time::time_duration bucket_duration = boost::posix_time::microseconds( static_cast<unsigned int> (bucket_width * 1000000) );
         char delimiter = options.value( "--delimiter,-d", default_delimiter );
-
+        bool porcelain = options.exists( "--porcelain" );
+        std::string porcelain_title = options.value< std::string >( "--porceilain-title,--title", "io-bandwidth" );
+        if( porcelain ) { delimiter = ' '; }
         comma::io::select select;
         select.read().add( comma::io::stdin_fd );
         comma::io::istream is( "-", comma::io::mode::binary );
-
         unsigned long long total_bytes = 0;
         unsigned int bucket_bytes = 0;
         boost::circular_buffer< unsigned int > window_buckets( std::ceil( window / bucket_width ));
-
         boost::posix_time::ptime start_time = boost::posix_time::microsec_clock::universal_time();
         boost::posix_time::ptime next_update = start_time + update_interval;
         boost::posix_time::ptime next_bucket = start_time + bucket_duration;
-
         bool end_of_stream = false;
         boost::array< char, 65536 > buffer;
         std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
         std::cin.tie( NULL ); // std::cin is tied to std::cout by default
-        
         while( !end_of_stream )
         {
             select.wait( wait_interval );
@@ -168,9 +185,7 @@ int main( int ac, char** av )
                 std::cout.write( &buffer[0], size );
                 std::cout.flush();
             }
-
             boost::posix_time::ptime now = boost::posix_time::microsec_clock::universal_time();
-
             if( now >= next_bucket )
             {
                 window_buckets.push_back( bucket_bytes );
@@ -183,29 +198,30 @@ int main( int ac, char** av )
                     next_bucket = now + bucket_duration;
                 }
             }
-
             if( now >= next_update && !window_buckets.empty() )
             {
                 double elapsed_time = double( ( now - start_time ).total_milliseconds() ) / 1000.0f;
-                double bandwidth = (double)total_bytes / elapsed_time;
-                double window_bandwidth = (double)std::accumulate( window_buckets.begin()
-                                                                 , window_buckets.end()
-                                                                 , 0.0f )
-                                                  / window_buckets.size() / bucket_width;
-
-                std::cerr << boost::posix_time::to_iso_string( now )
-                          << std::fixed
-                          << delimiter << total_bytes
-                          << delimiter << bandwidth
-                          << delimiter << window_bandwidth;
-                std::cerr.unsetf( std::ios_base::floatfield );
-                if( record_size )
+                double bandwidth = double( total_bytes ) / elapsed_time;
+                double window_bandwidth = static_cast< double >( std::accumulate( window_buckets.begin(), window_buckets.end(), 0.0f ) ) / window_buckets.size() / bucket_width;
+                std::ostringstream oss;
+                if( porcelain ) { oss << porcelain_title << ": "; }
+                if( !output_progress )
                 {
-                    std::cerr << delimiter << bandwidth / *record_size
-                              << delimiter << window_bandwidth / *record_size;
+                    oss << ( porcelain ? "time: " : "" ) << boost::posix_time::to_iso_string( now )
+                        << std::fixed
+                        << delimiter << ( porcelain ? "bytes: " : "" ) << total_bytes
+                        << delimiter << ( porcelain ? "bandwidth: " : "" ) << bandwidth
+                        << delimiter << ( porcelain ? "window-bandwidth: " : "" ) << window_bandwidth;
+                    oss.unsetf( std::ios_base::floatfield );
+                    if( record_size )
+                    {
+                        oss << delimiter << ( porcelain ? "record-rate: " : "" ) << bandwidth / *record_size
+                            << delimiter << ( porcelain ? "window-rate: " : "" ) << window_bandwidth / *record_size;
+                    }
                 }
-                std::cerr << std::endl;
-
+                if( total_count ) { oss << delimiter << ( porcelain ? "complete: " : "" ) << ( total_bytes / *record_size * 100 / *total_count ) << ( porcelain ? "%" : "" ); }
+                if( total_size ) { oss << delimiter << ( porcelain ? "complete: " : "" ) << ( total_bytes * 100 / *total_size ) << ( porcelain ? "%" : "" ); }
+                COMMA_TITLE_BARE( oss.str() );
                 next_update += update_interval;
                 // If there's been a large pause (for some reason), catch up
                 if( now > next_update ) { next_update = now + update_interval; }

From da7e773bcf9f5d31654aaf4e0e51cc8a84da3b2a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 8 Mar 2024 22:20:09 +1100
Subject: [PATCH 0757/1056] io-bandwidth: --help: typo fixed

---
 io/applications/io-bandwidth.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/applications/io-bandwidth.cpp b/io/applications/io-bandwidth.cpp
index e82420912..9a87bfb32 100644
--- a/io/applications/io-bandwidth.cpp
+++ b/io/applications/io-bandwidth.cpp
@@ -113,7 +113,7 @@ void usage( bool verbose = false )
     std::cerr << std::endl;
     std::cerr << "    show values in terminal title bar" << std::endl;
     std::cerr << "        yes | csv-repeat --pace --period 0.001 | head -n10000 \\" << std::endl;
-    std::cerr << "            | io-bandwidth --total-size 10000 --size 2 \\" << std::endl;
+    std::cerr << "            | io-bandwidth --total-count 10000 --size 2 \\" << std::endl;
     std::cerr << "                           --porcelain --titlebar >/dev/null" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    show progress indicator in terminal title bar" << std::endl;

From 27466bd72cacd80ba3f20ab13bd441444fb23164 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 9 Mar 2024 12:54:22 +1100
Subject: [PATCH 0758/1056] io-bandwidth: --spinner: a hidden option for now,
 first lousy cut implemented

---
 io/applications/io-bandwidth.cpp | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/io/applications/io-bandwidth.cpp b/io/applications/io-bandwidth.cpp
index 9a87bfb32..16ecb5664 100644
--- a/io/applications/io-bandwidth.cpp
+++ b/io/applications/io-bandwidth.cpp
@@ -156,6 +156,8 @@ int main( int ac, char** av )
         boost::posix_time::time_duration bucket_duration = boost::posix_time::microseconds( static_cast<unsigned int> (bucket_width * 1000000) );
         char delimiter = options.value( "--delimiter,-d", default_delimiter );
         bool porcelain = options.exists( "--porcelain" );
+        //std::pair< unsigned int, std::string > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? "-\\|/" : "" };
+        std::pair< unsigned int, std::vector< std::string > > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? std::vector< std::string >{ "<>     ", " <>    ", "  <>   ", "   <>  ", "  <> ", "     <>", "    <> ", "   <>  ", "  <>   ", " <>    " } : std::vector< std::string >{} };
         std::string porcelain_title = options.value< std::string >( "--porceilain-title,--title", "io-bandwidth" );
         if( porcelain ) { delimiter = ' '; }
         comma::io::select select;
@@ -221,6 +223,11 @@ int main( int ac, char** av )
                 }
                 if( total_count ) { oss << delimiter << ( porcelain ? "complete: " : "" ) << ( total_bytes / *record_size * 100 / *total_count ) << ( porcelain ? "%" : "" ); }
                 if( total_size ) { oss << delimiter << ( porcelain ? "complete: " : "" ) << ( total_bytes * 100 / *total_size ) << ( porcelain ? "%" : "" ); }
+                if( output_progress )
+                {
+                    if( !porcelain_spinner.second.empty() ) { oss << " " << porcelain_spinner.second[porcelain_spinner.first++]; }
+                    if( porcelain_spinner.first == porcelain_spinner.second.size() ) { porcelain_spinner.first = 0; }
+                }
                 COMMA_TITLE_BARE( oss.str() );
                 next_update += update_interval;
                 // If there's been a large pause (for some reason), catch up

From a6ff47539cfee6baa661ba758ac60c8e59c4e295 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 10 Mar 2024 11:14:17 +1100
Subject: [PATCH 0759/1056] io-bandwidth: --spinner: a hidden option for now,
 second lousy cut implemented

---
 io/applications/io-bandwidth.cpp | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/io/applications/io-bandwidth.cpp b/io/applications/io-bandwidth.cpp
index 16ecb5664..6db3e413e 100644
--- a/io/applications/io-bandwidth.cpp
+++ b/io/applications/io-bandwidth.cpp
@@ -157,7 +157,9 @@ int main( int ac, char** av )
         char delimiter = options.value( "--delimiter,-d", default_delimiter );
         bool porcelain = options.exists( "--porcelain" );
         //std::pair< unsigned int, std::string > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? "-\\|/" : "" };
-        std::pair< unsigned int, std::vector< std::string > > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? std::vector< std::string >{ "<>     ", " <>    ", "  <>   ", "   <>  ", "  <> ", "     <>", "    <> ", "   <>  ", "  <>   ", " <>    " } : std::vector< std::string >{} };
+        //std::pair< unsigned int, std::vector< std::string > > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? std::vector< std::string >{ "|<>       |", "| <>      |", "|  <>     |", "|   <>    |", "|    <>   |", "|     <>  |", "|      <> |", "|       <>|", "|      <> |", "|     <>  |", "|    <>   |", "|   <>    |", "|  <>     |", "| <>      |" } : std::vector< std::string >{} };
+        std::pair< unsigned int, std::vector< std::string > > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? std::vector< std::string >{ "[>________]", "[_>_______]", "[__>______]", "[___>_____]", "[____>____]", "[_____>___]", "[______>__]", "[_______>_]", "[________>]", "[________<]", "[_______<_]", "[______<__]", "[_____<___]", "[____<____]", "[___<_____]", "[__<______]", "[_<_______]", "[<________]" } : std::vector< std::string >{} };
+        //std::pair< unsigned int, std::vector< std::string > > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? std::vector< std::string >{ "\\/\\/\\/       ", " /\\/\\/\\      ", "  \\/\\/\\/     ", "   /\\/\\/\\    ", "  \\/\\/\\/   ", "     /\\/\\/\\  ", "    \\/\\/\\/   ", "   /\\/\\/\\    ", "  \\/\\/\\/     ", " /\\/\\/\\      " } : std::vector< std::string >{} };
         std::string porcelain_title = options.value< std::string >( "--porceilain-title,--title", "io-bandwidth" );
         if( porcelain ) { delimiter = ' '; }
         comma::io::select select;

From 1c710277003d1f1cc100a3494c28859b73f0d0e8 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 11 Mar 2024 18:15:44 +1100
Subject: [PATCH 0760/1056] CMakeFiles/check.c++.standard.cmake: compiler
 default set to c++17

---
 CMakeFiles/check.c++.standard.cmake | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CMakeFiles/check.c++.standard.cmake b/CMakeFiles/check.c++.standard.cmake
index 1f4b01b82..c8ae95f44 100644
--- a/CMakeFiles/check.c++.standard.cmake
+++ b/CMakeFiles/check.c++.standard.cmake
@@ -1,7 +1,7 @@
     SET( CXX_STANDARDS "0x;11;14;17" CACHE STRING "list of known c++ standards" )
     MARK_AS_ADVANCED( FORCE CXX_STANDARDS )
     STRING( REGEX REPLACE ";" "," CXX_STANDARDS_READABLE "${CXX_STANDARDS}" )
-    SET( CXX_STANDARD_DEFAULT "14" CACHE STRING "default c++ standard to use" )
+    SET( CXX_STANDARD_DEFAULT "17" CACHE STRING "default c++ standard to use" )
     MARK_AS_ADVANCED( FORCE CXX_STANDARD_DEFAULT )
     SET( CXX_STANDARD_TO_USE "${CXX_STANDARD_DEFAULT}" CACHE STRING "c++ standard to use (one of ${CXX_STANDARDS_READABLE})" )
     SET_PROPERTY( CACHE CXX_STANDARD_TO_USE PROPERTY STRINGS ${CXX_STANDARDS} )

From 24589a2cf48e7e174cf82640185e5f625f73d674 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 10:39:19 +1100
Subject: [PATCH 0761/1056] io::terminal::controls: constants moved to cpp file
 for compatibility with c++14

---
 application/CMakeLists.txt |  2 +-
 io/terminal.cpp            | 19 +++++++++++++++++++
 io/terminal.h              |  6 +++---
 3 files changed, 23 insertions(+), 4 deletions(-)
 create mode 100644 io/terminal.cpp

diff --git a/application/CMakeLists.txt b/application/CMakeLists.txt
index 60b4211da..e622f07c2 100644
--- a/application/CMakeLists.txt
+++ b/application/CMakeLists.txt
@@ -10,7 +10,7 @@ ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 #set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
 #set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION "${comma_version}" ) #set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${comma_ALL_EXTERNAL_LIBRARIES} comma_base comma_string )
+TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${comma_ALL_EXTERNAL_LIBRARIES} comma_base comma_io comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL( TARGETS ${TARGET_NAME}
diff --git a/io/terminal.cpp b/io/terminal.cpp
new file mode 100644
index 000000000..ff1a63139
--- /dev/null
+++ b/io/terminal.cpp
@@ -0,0 +1,19 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#include "terminal.h"
+
+namespace comma { namespace io { namespace terminal { namespace controls {
+
+char end::value[] = { 0x07, 0 };
+
+char stderr::start[] = { 0 };
+
+char stderr::end[] = { '\n', 0 }; // quick and dirty
+
+char titlebar::start[] = { 0x1b, ']', '0', ';', 0 };
+
+char titlebar::end[] = { 0x07, 0 };
+
+} } } } // namespace comma { namespace io { namespace terminal { namespace controls {
diff --git a/io/terminal.h b/io/terminal.h
index 10d26beab..bd38d6f5f 100644
--- a/io/terminal.h
+++ b/io/terminal.h
@@ -10,11 +10,11 @@ namespace comma { namespace io { namespace terminal {
 
 namespace controls {
 
-struct end { static constexpr char value[] = { 0x07, 0 }; };
+struct end { static char value[]; };
 
-struct stderr { static constexpr char start[] = { 0 }; static constexpr char end[] = { '\n', 0 }; }; // quick and dirty
+struct stderr { static char start[]; static char end[]; }; // quick and dirty
 
-struct titlebar { static constexpr char start[] = { 0x1b, ']', '0', ';', 0 }; static constexpr char end[] = { 0x07, 0 }; };
+struct titlebar { static char start[]; static char end[]; };
 
 template < unsigned int Colour >
 struct coloured; // todo

From 81201911dd457428aaba75dd6d39e007070ebd22 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 13:17:16 +1100
Subject: [PATCH 0762/1056] comma-test-query: application placeholder added

---
 util/applications/CMakeLists.txt   |  1 +
 util/applications/comma-test-query | 22 ++++++++++++++++++++++
 2 files changed, 23 insertions(+)
 create mode 100755 util/applications/comma-test-query

diff --git a/util/applications/CMakeLists.txt b/util/applications/CMakeLists.txt
index 263cb70f9..7486763b7 100644
--- a/util/applications/CMakeLists.txt
+++ b/util/applications/CMakeLists.txt
@@ -38,6 +38,7 @@ install( PROGRAMS comma-profile-graph DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-repeat DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-enforce DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-match DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-test-query DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-run DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-util DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-resources DESTINATION ${comma_INSTALL_BIN_DIR} )
diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
new file mode 100755
index 000000000..9b9e6d3c9
--- /dev/null
+++ b/util/applications/comma-test-query
@@ -0,0 +1,22 @@
+#!/usr/bin/env python3
+
+# Copyright (c) 2024 Vsevolod Vlaskine
+
+import argparse, comma, json, sys
+
+def make_args():
+    description = 'usage: todo'
+    epilog = 'examples: todo'
+    parser = argparse.ArgumentParser( description=description, epilog=epilog, formatter_class=argparse.RawDescriptionHelpFormatter )
+    parser.add_argument( '--dir', default='.', type=str, help='directory to traverse, "-": read paths from stdin (todo)' )
+    parser.add_argument( '--verbose', '-v', help='more human-readable output', action='store_true' )
+    subparsers = parser.add_subparsers( help='sub-command help' )
+    traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find readme.json, output combined json' )
+    transpose_parser = subparsers.add_parser( 'transpose', help='transpose into the given primary key' )
+    transpose_parser.add_argument( 'what', type=str, help='field name vs which to transpose' )
+    return parser.parse_args()
+
+def main():
+    args = make_args()
+
+if __name__ == '__main__': main()

From a2e94c5f30f23d42a46bc2ad194eced475d2f486 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 14:34:03 +1100
Subject: [PATCH 0763/1056] comma-test-query: list: first cut implemented

---
 util/applications/comma-test-query | 39 +++++++++++++++++++++++++++---
 1 file changed, 36 insertions(+), 3 deletions(-)

diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
index 9b9e6d3c9..047b6b9d9 100755
--- a/util/applications/comma-test-query
+++ b/util/applications/comma-test-query
@@ -2,21 +2,54 @@
 
 # Copyright (c) 2024 Vsevolod Vlaskine
 
-import argparse, comma, json, sys
+import argparse, comma, json, os, sys
+
+def _find( args ):
+    if args.dir == '-': raise Exception( 'comma-test-query: --dir="-": reading directories from stdin: todo, just ask' )
+    dir = os.path.realpath( args.dir )
+    def _valid( path ): # quick and dirty, inefficient for now
+        # print(functools.reduce(lambda a, b: a if a > b else b, lis)) 
+        p = path
+        while os.path.realpath( p ) != dir:
+            if os.path.isfile( f'{p}/readme.json' ) or os.path.isfile( f'{p}/test' ): return True
+            p = os.path.dirname( p )
+        return False
+    d = [ i[0] for i in os.walk( args.dir, followlinks=True ) ]
+    r = sorted( filter( _valid, d ) )
+    if not args.absolute: r = [ p[ ( len( d[0] ) + 1 ) : ] for p in r ]
+    return r
+
+def _list( args ):
+    w = _find( args )
+    for e in w: print( f'{e}' )
+    #print( list( _find( args ) ) )
+
+def _transpose( args ):
+    _find( args )
+
+def _traverse( args ):
+    _find( args )
 
 def make_args():
     description = 'usage: todo'
     epilog = 'examples: todo'
     parser = argparse.ArgumentParser( description=description, epilog=epilog, formatter_class=argparse.RawDescriptionHelpFormatter )
-    parser.add_argument( '--dir', default='.', type=str, help='directory to traverse, "-": read paths from stdin (todo)' )
+    parser.add_argument( '--dir', default='.', type=str, help='directory to traverse; default: current directory, "-": read paths from stdin (todo)' )
+    parser.add_argument( '--permissive', help='do not complain about directories that have test, but not readme.json', action='store_true' )
     parser.add_argument( '--verbose', '-v', help='more human-readable output', action='store_true' )
     subparsers = parser.add_subparsers( help='sub-command help' )
-    traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find readme.json, output combined json' )
+    list_parser = subparsers.add_parser( 'list', help='print subdirectories containing test or readme.json, following symlinks' )
+    list_parser.add_argument( '--absolute', help='output absolute path', action='store_true' )
+    list_parser.set_defaults( func=_list )
     transpose_parser = subparsers.add_parser( 'transpose', help='transpose into the given primary key' )
     transpose_parser.add_argument( 'what', type=str, help='field name vs which to transpose' )
+    transpose_parser.set_defaults( func=_transpose )
+    traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find readme.json, output combined json' )
+    traverse_parser.set_defaults( func=_traverse )
     return parser.parse_args()
 
 def main():
     args = make_args()
+    args.func( args )
 
 if __name__ == '__main__': main()

From 02bc25193c78af784f09e9e2ad600ec95147efe9 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 15:00:43 +1100
Subject: [PATCH 0764/1056] comma-test-query: list: filter out mounted
 directories

---
 util/applications/comma-test-query | 13 +++++++++----
 1 file changed, 9 insertions(+), 4 deletions(-)

diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
index 047b6b9d9..34fd232b3 100755
--- a/util/applications/comma-test-query
+++ b/util/applications/comma-test-query
@@ -7,9 +7,14 @@ import argparse, comma, json, os, sys
 def _find( args ):
     if args.dir == '-': raise Exception( 'comma-test-query: --dir="-": reading directories from stdin: todo, just ask' )
     dir = os.path.realpath( args.dir )
-    def _valid( path ): # quick and dirty, inefficient for now
-        # print(functools.reduce(lambda a, b: a if a > b else b, lis)) 
-        p = path
+    def _is_mount( p ): # quick and dirty, excessive and inefficient for now
+        p = os.path.realpath( p )
+        while not p in ['', '/']:
+            if os.path.ismount( p ): return True
+            p = os.path.dirname( p )
+        return False
+    def _valid( p ): # quick and dirty, inefficient for now
+        if _is_mount( p ): return False
         while os.path.realpath( p ) != dir:
             if os.path.isfile( f'{p}/readme.json' ) or os.path.isfile( f'{p}/test' ): return True
             p = os.path.dirname( p )
@@ -38,7 +43,7 @@ def make_args():
     parser.add_argument( '--permissive', help='do not complain about directories that have test, but not readme.json', action='store_true' )
     parser.add_argument( '--verbose', '-v', help='more human-readable output', action='store_true' )
     subparsers = parser.add_subparsers( help='sub-command help' )
-    list_parser = subparsers.add_parser( 'list', help='print subdirectories containing test or readme.json, following symlinks' )
+    list_parser = subparsers.add_parser( 'list', help='print subdirectories containing test or readme.json, following symlinks, but skipping mounted drives (for now)' )
     list_parser.add_argument( '--absolute', help='output absolute path', action='store_true' )
     list_parser.set_defaults( func=_list )
     transpose_parser = subparsers.add_parser( 'transpose', help='transpose into the given primary key' )

From a41e4580e6bdf445697860db5e3b4e9882db87b6 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 15:16:48 +1100
Subject: [PATCH 0765/1056] comma-test-query: traverse: first cut implemented

---
 util/applications/comma-test-query | 32 +++++++++++++++++++-----------
 1 file changed, 20 insertions(+), 12 deletions(-)

diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
index 34fd232b3..3810301b5 100755
--- a/util/applications/comma-test-query
+++ b/util/applications/comma-test-query
@@ -4,9 +4,9 @@
 
 import argparse, comma, json, os, sys
 
-def _find( args ):
-    if args.dir == '-': raise Exception( 'comma-test-query: --dir="-": reading directories from stdin: todo, just ask' )
-    dir = os.path.realpath( args.dir )
+def _find( dir, absolute=False ):
+    if dir == '-': raise Exception( 'comma-test-query: --dir="-": reading directories from stdin: todo, just ask' )
+    real_root = os.path.realpath( dir )
     def _is_mount( p ): # quick and dirty, excessive and inefficient for now
         p = os.path.realpath( p )
         while not p in ['', '/']:
@@ -15,25 +15,32 @@ def _find( args ):
         return False
     def _valid( p ): # quick and dirty, inefficient for now
         if _is_mount( p ): return False
-        while os.path.realpath( p ) != dir:
+        while os.path.realpath( p ) != real_root:
             if os.path.isfile( f'{p}/readme.json' ) or os.path.isfile( f'{p}/test' ): return True
             p = os.path.dirname( p )
         return False
-    d = [ i[0] for i in os.walk( args.dir, followlinks=True ) ]
+    d = [ i[0] for i in os.walk( dir, followlinks=True ) ]
+    root = d[0]
     r = sorted( filter( _valid, d ) )
-    if not args.absolute: r = [ p[ ( len( d[0] ) + 1 ) : ] for p in r ]
-    return r
+    if not absolute: r = [ p[ ( len( root ) + 1 ) : ] for p in r ]
+    return root, r
 
 def _list( args ):
-    w = _find( args )
-    for e in w: print( f'{e}' )
-    #print( list( _find( args ) ) )
+    _, paths = _find( args.dir, args.absolute )
+    for p in paths: print( f'{p}' )
 
 def _transpose( args ):
-    _find( args )
+    _, paths = _find( args.dir )
 
 def _traverse( args ):
-    _find( args )
+    d = {}
+    base, paths = _find( args.dir )
+    for path in paths:
+        readme = f'{base}/{path}/readme.json'
+        status = 'todo'
+        if os.path.isfile( readme ):
+            with open( readme ) as f: comma.dictionary.set( d, path, json.load( f ) )
+    json.dump( d, sys.stdout, indent = None if args.minify else 4 )
 
 def make_args():
     description = 'usage: todo'
@@ -50,6 +57,7 @@ def make_args():
     transpose_parser.add_argument( 'what', type=str, help='field name vs which to transpose' )
     transpose_parser.set_defaults( func=_transpose )
     traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find readme.json, output combined json' )
+    traverse_parser.add_argument( '--minify', help='output one-line json', action='store_true' )
     traverse_parser.set_defaults( func=_traverse )
     return parser.parse_args()
 

From 6e0150f0a329eb995e63fbcff7493b210cd28ebc Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 15:24:40 +1100
Subject: [PATCH 0766/1056] comma-test-query: parametrised on <what>

---
 util/applications/comma-test-query | 26 ++++++++++++++------------
 1 file changed, 14 insertions(+), 12 deletions(-)

diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
index 3810301b5..b942319c6 100755
--- a/util/applications/comma-test-query
+++ b/util/applications/comma-test-query
@@ -4,7 +4,7 @@
 
 import argparse, comma, json, os, sys
 
-def _find( dir, absolute=False ):
+def _find( what, dir, absolute=False ):
     if dir == '-': raise Exception( 'comma-test-query: --dir="-": reading directories from stdin: todo, just ask' )
     real_root = os.path.realpath( dir )
     def _is_mount( p ): # quick and dirty, excessive and inefficient for now
@@ -16,7 +16,7 @@ def _find( dir, absolute=False ):
     def _valid( p ): # quick and dirty, inefficient for now
         if _is_mount( p ): return False
         while os.path.realpath( p ) != real_root:
-            if os.path.isfile( f'{p}/readme.json' ) or os.path.isfile( f'{p}/test' ): return True
+            if os.path.isfile( f'{p}/{what}' ) or os.path.isfile( f'{p}/test' ): return True
             p = os.path.dirname( p )
         return False
     d = [ i[0] for i in os.walk( dir, followlinks=True ) ]
@@ -26,20 +26,20 @@ def _find( dir, absolute=False ):
     return root, r
 
 def _list( args ):
-    _, paths = _find( args.dir, args.absolute )
+    _, paths = _find( args.what, args.dir, args.absolute )
     for p in paths: print( f'{p}' )
 
 def _transpose( args ):
-    _, paths = _find( args.dir )
+    _, paths = _find( args.what, args.dir )
 
 def _traverse( args ):
     d = {}
-    base, paths = _find( args.dir )
+    base, paths = _find( args.what, args.dir )
     for path in paths:
-        readme = f'{base}/{path}/readme.json'
+        what = f'{base}/{path}/{args.what}'
         status = 'todo'
-        if os.path.isfile( readme ):
-            with open( readme ) as f: comma.dictionary.set( d, path, json.load( f ) )
+        if os.path.isfile( what ):
+            with open( what ) as f: comma.dictionary.set( d, path, json.load( f ) ) # todo: fix overfitting on loading files of various types
     json.dump( d, sys.stdout, indent = None if args.minify else 4 )
 
 def make_args():
@@ -47,16 +47,18 @@ def make_args():
     epilog = 'examples: todo'
     parser = argparse.ArgumentParser( description=description, epilog=epilog, formatter_class=argparse.RawDescriptionHelpFormatter )
     parser.add_argument( '--dir', default='.', type=str, help='directory to traverse; default: current directory, "-": read paths from stdin (todo)' )
-    parser.add_argument( '--permissive', help='do not complain about directories that have test, but not readme.json', action='store_true' )
     parser.add_argument( '--verbose', '-v', help='more human-readable output', action='store_true' )
     subparsers = parser.add_subparsers( help='sub-command help' )
-    list_parser = subparsers.add_parser( 'list', help='print subdirectories containing test or readme.json, following symlinks, but skipping mounted drives (for now)' )
+    list_parser = subparsers.add_parser( 'list', help='print subdirectories containing test or <what>, following symlinks, but skipping mounted drives (for now)' )
+    list_parser.add_argument( 'what', type=str, choices=['readme.json'], help='output absolute path' )
     list_parser.add_argument( '--absolute', help='output absolute path', action='store_true' )
     list_parser.set_defaults( func=_list )
     transpose_parser = subparsers.add_parser( 'transpose', help='transpose into the given primary key' )
-    transpose_parser.add_argument( 'what', type=str, help='field name vs which to transpose' )
+    transpose_parser.add_argument( 'what', type=str, choices=['readme.json'], help='output absolute path' )
+    transpose_parser.add_argument( 'key', type=str, help='field name vs which to transpose' )
     transpose_parser.set_defaults( func=_transpose )
-    traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find readme.json, output combined json' )
+    traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find <what>, output combined json' )
+    traverse_parser.add_argument( 'what', type=str, choices=['readme.json'], help='output absolute path' )
     traverse_parser.add_argument( '--minify', help='output one-line json', action='store_true' )
     traverse_parser.set_defaults( func=_traverse )
     return parser.parse_args()

From e2f1b0910a3edbece64f0c85d1d48e9008bcf214 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 15:40:57 +1100
Subject: [PATCH 0767/1056] comma-test-query: transpose: first cut implemented;
 in progress...

---
 util/applications/comma-test-query | 20 +++++++++++++++++---
 1 file changed, 17 insertions(+), 3 deletions(-)

diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
index b942319c6..7b984bcaa 100755
--- a/util/applications/comma-test-query
+++ b/util/applications/comma-test-query
@@ -30,13 +30,25 @@ def _list( args ):
     for p in paths: print( f'{p}' )
 
 def _transpose( args ):
-    _, paths = _find( args.what, args.dir )
+    root, paths = _find( args.what, args.dir )
+    d = {}
+    for path in paths:
+        what = f'{root}/{path}/{args.what}'
+        status = 'todo'
+        if os.path.isfile( what ):
+            with open( what ) as f: r = json.load( f )
+            if not args.key in r:
+                if args.strict: raise KeyError( f'{args.key} not found in {what}' )
+                else: continue
+            for k in r[args.key]:
+                comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, f'{args.key}/{k}/paths' ) + [ path ] if comma.dictionary.has( d, f'{args.key}/{k}/paths' ) else [ path ] } ) # todo! quick and dirty, super-overfit!
+    json.dump( d, sys.stdout, indent = None if args.minify else 4 )    
 
 def _traverse( args ):
     d = {}
-    base, paths = _find( args.what, args.dir )
+    root, paths = _find( args.what, args.dir )
     for path in paths:
-        what = f'{base}/{path}/{args.what}'
+        what = f'{root}/{path}/{args.what}'
         status = 'todo'
         if os.path.isfile( what ):
             with open( what ) as f: comma.dictionary.set( d, path, json.load( f ) ) # todo: fix overfitting on loading files of various types
@@ -56,6 +68,8 @@ def make_args():
     transpose_parser = subparsers.add_parser( 'transpose', help='transpose into the given primary key' )
     transpose_parser.add_argument( 'what', type=str, choices=['readme.json'], help='output absolute path' )
     transpose_parser.add_argument( 'key', type=str, help='field name vs which to transpose' )
+    transpose_parser.add_argument( '--minify', help='output one-line json', action='store_true' )
+    transpose_parser.add_argument( '--strict', help='fail if one of files does not have desired <key>', action='store_true' )
     transpose_parser.set_defaults( func=_transpose )
     traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find <what>, output combined json' )
     traverse_parser.add_argument( 'what', type=str, choices=['readme.json'], help='output absolute path' )

From 7c22f3c387db287a7af8397f284b920706ef5f3d Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 15:46:58 +1100
Subject: [PATCH 0768/1056] comma-test-query: transpose: --output=<what>
 implemented; in progress...

---
 util/applications/comma-test-query | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
index 7b984bcaa..de71ab2fd 100755
--- a/util/applications/comma-test-query
+++ b/util/applications/comma-test-query
@@ -40,8 +40,12 @@ def _transpose( args ):
             if not args.key in r:
                 if args.strict: raise KeyError( f'{args.key} not found in {what}' )
                 else: continue
-            for k in r[args.key]:
-                comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, f'{args.key}/{k}/paths' ) + [ path ] if comma.dictionary.has( d, f'{args.key}/{k}/paths' ) else [ path ] } ) # todo! quick and dirty, super-overfit!
+            if args.output == 'all':
+                for k in r[args.key]:
+                    comma.dictionary.set( d, f'{args.key}/{k}/{path}', r ) # todo! quick and dirty, super-overfit!
+            elif args.output == 'paths':
+                for k in r[args.key]:
+                    comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, f'{args.key}/{k}/paths' ) + [ path ] if comma.dictionary.has( d, f'{args.key}/{k}/paths' ) else [ path ] } ) # todo! quick and dirty, super-overfit!
     json.dump( d, sys.stdout, indent = None if args.minify else 4 )    
 
 def _traverse( args ):
@@ -69,6 +73,7 @@ def make_args():
     transpose_parser.add_argument( 'what', type=str, choices=['readme.json'], help='output absolute path' )
     transpose_parser.add_argument( 'key', type=str, help='field name vs which to transpose' )
     transpose_parser.add_argument( '--minify', help='output one-line json', action='store_true' )
+    transpose_parser.add_argument( '--output', default='all', type=str, choices=['all', 'paths'], help='what to output' )
     transpose_parser.add_argument( '--strict', help='fail if one of files does not have desired <key>', action='store_true' )
     transpose_parser.set_defaults( func=_transpose )
     traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find <what>, output combined json' )

From fac379f44667ee5b9f522c8718a3c45445561ab1 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 17:35:03 +1100
Subject: [PATCH 0769/1056] comma-test-query: fixed top level directory check;
 in progress...

---
 util/applications/comma-test-query | 36 +++++++++++++++++-------------
 1 file changed, 21 insertions(+), 15 deletions(-)

diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
index de71ab2fd..c567aaef9 100755
--- a/util/applications/comma-test-query
+++ b/util/applications/comma-test-query
@@ -2,23 +2,24 @@
 
 # Copyright (c) 2024 Vsevolod Vlaskine
 
-import argparse, comma, json, os, sys
+import argparse, collections.abc, comma, json, os, sys
 
 def _find( what, dir, absolute=False ):
     if dir == '-': raise Exception( 'comma-test-query: --dir="-": reading directories from stdin: todo, just ask' )
     real_root = os.path.realpath( dir )
     def _is_mount( p ): # quick and dirty, excessive and inefficient for now
         p = os.path.realpath( p )
-        while not p in ['', '/']:
+        while True:
+            if p == '/': return False
             if os.path.ismount( p ): return True
+            if p == '': return False
             p = os.path.dirname( p )
-        return False
     def _valid( p ): # quick and dirty, inefficient for now
         if _is_mount( p ): return False
-        while os.path.realpath( p ) != real_root:
-            if os.path.isfile( f'{p}/{what}' ) or os.path.isfile( f'{p}/test' ): return True
+        while True:
+            if os.path.isfile( f'{p}/{what}' ): return True # if os.path.isfile( f'{p}/{what}' ) or os.path.isfile( f'{p}/test' ): return True
+            if os.path.realpath( p ) == real_root: return False
             p = os.path.dirname( p )
-        return False
     d = [ i[0] for i in os.walk( dir, followlinks=True ) ]
     root = d[0]
     r = sorted( filter( _valid, d ) )
@@ -26,7 +27,7 @@ def _find( what, dir, absolute=False ):
     return root, r
 
 def _list( args ):
-    _, paths = _find( args.what, args.dir, args.absolute )
+    _, paths = _find( args.what, args.dir )
     for p in paths: print( f'{p}' )
 
 def _transpose( args ):
@@ -41,12 +42,19 @@ def _transpose( args ):
                 if args.strict: raise KeyError( f'{args.key} not found in {what}' )
                 else: continue
             if args.output == 'all':
-                for k in r[args.key]:
-                    comma.dictionary.set( d, f'{args.key}/{k}/{path}', r ) # todo! quick and dirty, super-overfit!
+                if isinstance( r[args.key], list ):
+                    for k in r[args.key]:
+                        comma.dictionary.set( d, f'{args.key}/{k}/{path}', r ) # todo! quick and dirty, super-overfit!
+                else:
+                    comma.dictionary.set( d, f'{args.key}/{r[args.key]}/{path}', r ) # todo! quick and dirty, super-overfit!
             elif args.output == 'paths':
-                for k in r[args.key]:
+                if isinstance( r[args.key], list ):
+                    for k in r[args.key]: comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, f'{args.key}/{k}/paths' ) + [ path ] if comma.dictionary.has( d, f'{args.key}/{k}/paths' ) else [ path ] } ) # todo! quick and dirty, super-overfit!
+                else:
+                    k = r[args.key]
                     comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, f'{args.key}/{k}/paths' ) + [ path ] if comma.dictionary.has( d, f'{args.key}/{k}/paths' ) else [ path ] } ) # todo! quick and dirty, super-overfit!
-    json.dump( d, sys.stdout, indent = None if args.minify else 4 )    
+    #json.dump( sorted( d, key=lambda i: i[0] ), sys.stdout, indent = None if args.minify else 4 )    
+    json.dump( d, sys.stdout, sort_keys=True, indent = None if args.minify else 4 )
 
 def _traverse( args ):
     d = {}
@@ -62,22 +70,20 @@ def make_args():
     description = 'usage: todo'
     epilog = 'examples: todo'
     parser = argparse.ArgumentParser( description=description, epilog=epilog, formatter_class=argparse.RawDescriptionHelpFormatter )
+    parser.add_argument( 'what', type=str, help='what to look for, e.g. readme.json' )
     parser.add_argument( '--dir', default='.', type=str, help='directory to traverse; default: current directory, "-": read paths from stdin (todo)' )
     parser.add_argument( '--verbose', '-v', help='more human-readable output', action='store_true' )
     subparsers = parser.add_subparsers( help='sub-command help' )
     list_parser = subparsers.add_parser( 'list', help='print subdirectories containing test or <what>, following symlinks, but skipping mounted drives (for now)' )
-    list_parser.add_argument( 'what', type=str, choices=['readme.json'], help='output absolute path' )
-    list_parser.add_argument( '--absolute', help='output absolute path', action='store_true' )
+    #list_parser.add_argument( '--absolute', help='output absolute path', action='store_true' )
     list_parser.set_defaults( func=_list )
     transpose_parser = subparsers.add_parser( 'transpose', help='transpose into the given primary key' )
-    transpose_parser.add_argument( 'what', type=str, choices=['readme.json'], help='output absolute path' )
     transpose_parser.add_argument( 'key', type=str, help='field name vs which to transpose' )
     transpose_parser.add_argument( '--minify', help='output one-line json', action='store_true' )
     transpose_parser.add_argument( '--output', default='all', type=str, choices=['all', 'paths'], help='what to output' )
     transpose_parser.add_argument( '--strict', help='fail if one of files does not have desired <key>', action='store_true' )
     transpose_parser.set_defaults( func=_transpose )
     traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find <what>, output combined json' )
-    traverse_parser.add_argument( 'what', type=str, choices=['readme.json'], help='output absolute path' )
     traverse_parser.add_argument( '--minify', help='output one-line json', action='store_true' )
     traverse_parser.set_defaults( func=_traverse )
     return parser.parse_args()

From 5353ec0e4cbc1026501c7c9860bc03aec7711066 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 12 Mar 2024 18:28:58 +1100
Subject: [PATCH 0770/1056] python: comma.filesystem: walk() and find(): first
 cut implemented

---
 python/comma/__init__.py            |  1 +
 python/comma/filesystem/__init__.py |  1 +
 python/comma/filesystem/impl.py     | 35 +++++++++++++++++++++++++++++
 python/setup.py                     |  2 +-
 util/applications/comma-test-query  | 27 ++++++----------------
 5 files changed, 45 insertions(+), 21 deletions(-)
 create mode 100644 python/comma/filesystem/__init__.py
 create mode 100644 python/comma/filesystem/impl.py

diff --git a/python/comma/__init__.py b/python/comma/__init__.py
index f62e8a2e0..a06fdb611 100644
--- a/python/comma/__init__.py
+++ b/python/comma/__init__.py
@@ -3,6 +3,7 @@
 
 from . import csv
 from . import dictionary
+from . import filesystem
 from . import io
 from . import numpy
 from . import signal
diff --git a/python/comma/filesystem/__init__.py b/python/comma/filesystem/__init__.py
new file mode 100644
index 000000000..ecf88f4d4
--- /dev/null
+++ b/python/comma/filesystem/__init__.py
@@ -0,0 +1 @@
+from .impl import find, walk
\ No newline at end of file
diff --git a/python/comma/filesystem/impl.py b/python/comma/filesystem/impl.py
new file mode 100644
index 000000000..cd731e23f
--- /dev/null
+++ b/python/comma/filesystem/impl.py
@@ -0,0 +1,35 @@
+# Copyright (c) 2024 Vsevolod Vlaskine
+
+import os
+
+# same as os.walk, but with followmounts flag
+def walk( dir, followlinks=False, followmounts=False, excluded=None ):
+    if excluded is None: excluded = []
+    real_root = os.path.realpath( dir )
+    def _valid( i ): # quick and dirty, excessive and inefficient for now
+        p = i[0]
+        if os.path.basename( p ) in excluded: return False
+        if followmounts: return True
+        p = os.path.realpath( i[0] )
+        while True:
+            if p == '/': return True
+            if os.path.ismount( p ): return False
+            if p == '': return True
+            p = os.path.dirname( p )
+    return filter( _valid, os.walk( dir, followlinks=followlinks ) )
+
+def find( what, dirs, find_children=False ):
+    if not isinstance( what, list ): what = [ what ]
+    def _valid( i ): # quick and dirty, inefficient for now
+        p = i[0]
+        if find_children:
+            while True:
+                for q in what:
+                    if os.path.exists( f'{p}/{q}' ): return True # if os.path.isfile( f'{p}/{what}' ) or os.path.isfile( f'{p}/test' ): return True
+                if p in ['', '/']: return False
+                p = os.path.dirname( p )
+        for q in what:
+            if os.path.exists( f'{p}/{q}' ): return True
+        return False
+    return filter( _valid, dirs )
+
diff --git a/python/setup.py b/python/setup.py
index 4b947fbf4..950ebe376 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -30,7 +30,7 @@
         maintainer_email    = 'vsevolod.vlaskine@gmail.com',
         python_requires     = '>=3.6',
         #install_requires    = [ 'numpy' ], # todo? does it need to be uncommented for packaging
-        packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.dictionary', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
+        packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.dictionary', 'comma.filesystem', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma': 'comma', 'comma.cpp_bindings': 'comma/cpp_bindings' },
         package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] },
         entry_points        = { 'console_scripts': ['csv-eval=comma.csv.applications.csv_eval:main'] } #scripts             = [ "comma/csv/applications/csv-eval" ]
diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
index c567aaef9..488722c8a 100755
--- a/util/applications/comma-test-query
+++ b/util/applications/comma-test-query
@@ -6,28 +6,14 @@ import argparse, collections.abc, comma, json, os, sys
 
 def _find( what, dir, absolute=False ):
     if dir == '-': raise Exception( 'comma-test-query: --dir="-": reading directories from stdin: todo, just ask' )
-    real_root = os.path.realpath( dir )
-    def _is_mount( p ): # quick and dirty, excessive and inefficient for now
-        p = os.path.realpath( p )
-        while True:
-            if p == '/': return False
-            if os.path.ismount( p ): return True
-            if p == '': return False
-            p = os.path.dirname( p )
-    def _valid( p ): # quick and dirty, inefficient for now
-        if _is_mount( p ): return False
-        while True:
-            if os.path.isfile( f'{p}/{what}' ): return True # if os.path.isfile( f'{p}/{what}' ) or os.path.isfile( f'{p}/test' ): return True
-            if os.path.realpath( p ) == real_root: return False
-            p = os.path.dirname( p )
-    d = [ i[0] for i in os.walk( dir, followlinks=True ) ]
-    root = d[0]
-    r = sorted( filter( _valid, d ) )
-    if not absolute: r = [ p[ ( len( root ) + 1 ) : ] for p in r ]
-    return root, r
+    w = comma.filesystem.walk( dir, followlinks=True, followmounts=False )
+    f = comma.filesystem.find( what, w, find_children=True )
+    r = sorted( [ i[0] for i in f ] )
+    if not absolute: offset = len( dir ) + 1; r = [ p[offset:] for p in r ]
+    return dir, r
 
 def _list( args ):
-    _, paths = _find( args.what, args.dir )
+    _, paths = _find( args.what if isinstance( args.what, list ) else [ args.what ], args.dir )
     for p in paths: print( f'{p}' )
 
 def _transpose( args ):
@@ -90,6 +76,7 @@ def make_args():
 
 def main():
     args = make_args()
+    args.what = args.what.split( ',' )
     args.func( args )
 
 if __name__ == '__main__': main()

From 93325098d09895dbd1b3cb37110e7ce21f9c01eb Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 13 Mar 2024 13:19:07 +1100
Subject: [PATCH 0771/1056] comma-test-run: --followsymlinks and --followmounts
 implemented

---
 util/applications/comma-test-run | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index e3a933c1a..2017f1ab9 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -58,6 +58,8 @@ function description_test_selection()
 --black-list=[<file>]; do not run these tests mentioned in <file>, e.g. a lists of sub-directories in white list
   to be excluded; see '--white-list' below for file format.
 --end=[<dir>]; run tests up to a given test, the latter excluded, where test directories are ordered lexicographically
+--followsymlinks,-L; follow symlinks when looking for test directories, same as find -L
+--followmounts; search mounted filesystems when looking for test directories, same as find without -mount
 --from,--begin=[<dir>]; run tests starting from a given test, where test directories are ordered lexicographically
 --run-disabled; run disabled tests
 --run-optional,--optional; run tests having file called "optional" (same logic as for --run-disabled)
@@ -1081,7 +1083,10 @@ function test_directories()
         options_black_list="^(\./)?($( sed 's#\./##' <$options_black_list | grep -v ^# | grep -v ^$ | tr \\n '|' | sed 's/|$//' ))";
     fi
 
-    test_script_dirs_all=( $( exclude_generic_tests $( get_dirnames $( find . -name "test" -or -name "input" -or -name "expected" | grep -v "/\." ) 2>/dev/null | sort -u ) | apply_white_black_list ) )
+    local followsymlinks followmounts="-mount"
+    (( ! options_followsymlinks )) || followsymlinks="-L"
+    (( ! options_followmounts )) || followmounts=
+    test_script_dirs_all=( $( exclude_generic_tests $( get_dirnames $( find $followsymlinks . $followmounts -name "test" -or -name "input" -or -name "expected" | grep -v "/\." ) 2>/dev/null | sort -u ) | apply_white_black_list ) )
     [[ -n "$options_from" || -n "$options_to" || -n "$options_end" ]] || { echo ${test_script_dirs_all[@]} ; return ; }
     [[ -z "$options_from" ]] || { local from="${options_from#\.\/}" ; }
     [[ -z "$options_to" ]] || { local to="${options_to#\.\/}" ; }

From 112b45840b9d0a24a15622bd5b57d9d0d3de3019 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 13 Mar 2024 13:26:21 +1100
Subject: [PATCH 0772/1056] comma-test-query: bug fixed; what handled as a list

---
 util/applications/comma-test-query | 50 ++++++++++++++++--------------
 1 file changed, 27 insertions(+), 23 deletions(-)

diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
index 488722c8a..41ce0aef2 100755
--- a/util/applications/comma-test-query
+++ b/util/applications/comma-test-query
@@ -20,36 +20,40 @@ def _transpose( args ):
     root, paths = _find( args.what, args.dir )
     d = {}
     for path in paths:
-        what = f'{root}/{path}/{args.what}'
-        status = 'todo'
-        if os.path.isfile( what ):
-            with open( what ) as f: r = json.load( f )
-            if not args.key in r:
-                if args.strict: raise KeyError( f'{args.key} not found in {what}' )
-                else: continue
-            if args.output == 'all':
-                if isinstance( r[args.key], list ):
-                    for k in r[args.key]:
-                        comma.dictionary.set( d, f'{args.key}/{k}/{path}', r ) # todo! quick and dirty, super-overfit!
-                else:
-                    comma.dictionary.set( d, f'{args.key}/{r[args.key]}/{path}', r ) # todo! quick and dirty, super-overfit!
-            elif args.output == 'paths':
-                if isinstance( r[args.key], list ):
-                    for k in r[args.key]: comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, f'{args.key}/{k}/paths' ) + [ path ] if comma.dictionary.has( d, f'{args.key}/{k}/paths' ) else [ path ] } ) # todo! quick and dirty, super-overfit!
-                else:
-                    k = r[args.key]
-                    comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, f'{args.key}/{k}/paths' ) + [ path ] if comma.dictionary.has( d, f'{args.key}/{k}/paths' ) else [ path ] } ) # todo! quick and dirty, super-overfit!
+        for w in args.what:
+            what = f'{root}/{path}/{w}'
+            status = 'todo'
+            if os.path.isfile( what ):
+                with open( what ) as f: r = json.load( f )
+                if not args.key in r:
+                    if args.strict: raise KeyError( f'{args.key} not found in {what}' )
+                    else: continue
+                if args.output == 'all':
+                    if isinstance( r[args.key], list ):
+                        for k in r[args.key]:
+                            comma.dictionary.set( d, f'{args.key}/{k}/{path}', r ) # todo! quick and dirty, super-overfit!
+                    else:
+                        comma.dictionary.set( d, f'{args.key}/{r[args.key]}/{path}', r ) # todo! quick and dirty, super-overfit!
+                elif args.output == 'paths':
+                    if isinstance( r[args.key], list ):
+                        for k in r[args.key]: comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, f'{args.key}/{k}/paths' ) + [ path ] if comma.dictionary.has( d, f'{args.key}/{k}/paths' ) else [ path ] } ) # todo! quick and dirty, super-overfit!
+                    else:
+                        k = r[args.key]
+                        comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, f'{args.key}/{k}/paths' ) + [ path ] if comma.dictionary.has( d, f'{args.key}/{k}/paths' ) else [ path ] } ) # todo! quick and dirty, super-overfit!
     #json.dump( sorted( d, key=lambda i: i[0] ), sys.stdout, indent = None if args.minify else 4 )    
     json.dump( d, sys.stdout, sort_keys=True, indent = None if args.minify else 4 )
 
 def _traverse( args ):
     d = {}
     root, paths = _find( args.what, args.dir )
+    print( f'a: {root=}', file=sys.stderr )
+    print( f'b: {paths=}', file=sys.stderr )
     for path in paths:
-        what = f'{root}/{path}/{args.what}'
-        status = 'todo'
-        if os.path.isfile( what ):
-            with open( what ) as f: comma.dictionary.set( d, path, json.load( f ) ) # todo: fix overfitting on loading files of various types
+        for w in args.what:
+            what = f'{root}/{path}/{w}'
+            print( f'c: {what=}', file=sys.stderr )
+            if os.path.isfile( what ):
+                with open( what ) as f: comma.dictionary.set( d, path, json.load( f ) ) # todo: fix overfitting on loading files of various types
     json.dump( d, sys.stdout, indent = None if args.minify else 4 )
 
 def make_args():

From e22012c15451599e7e52b93efba109b2eabba656 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 20 Mar 2024 11:33:27 +1100
Subject: [PATCH 0773/1056] csv-paste: --repeat implemented and tests

---
 csv/applications/csv-paste.cpp | 41 ++++++++++++++++++-----------
 csv/test/csv-paste/expected    | 48 ++++++++++++++++++++++++++++++++++
 csv/test/csv-paste/input       |  8 ++++++
 3 files changed, 82 insertions(+), 15 deletions(-)

diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index 8eacc7c71..ec660a6ea 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -61,6 +61,10 @@ static void usage( bool verbose )
     std::cerr << "            --block-size,--size=<size>: number of records with the same line number; default: 1" << std::endl;
     std::cerr << "                 WARNING: --size: deprecated, since it is confusing for files" << std::endl;
     std::cerr << "            --index; instead of block number output record index in the block" << std::endl;
+    std::cerr << "            --repeat=[<n>]; repeat a given pattern <n> times" << std::endl;
+    std::cerr << "                no --size: same as --head" << std::endl;
+    std::cerr << "                --size: repeat block of a given size <n> times" << std::endl;
+    std::cerr << "                --shape: repeat a given shape <n> times, e.g. 'line-number;shape=4,3,5;repeat=2'" << std::endl;
     std::cerr << "            --reverse; if --index, output index in descending order" << std::endl;
     std::cerr << "            --shape=<shape>; iterate through indices of a given shape; <shape>: same meaning as in numpy, e.g. 'line-number;shape=10,5,4'" << std::endl;
     std::cerr << "            --step=<value>; default=1; line number increment/decrement step" << std::endl;        
@@ -173,27 +177,29 @@ class line_number : public source
         class options
         {
             public:
-                comma::uint32 size;
-                bool index;
-                bool reverse;
-                comma::int32 step;
-                comma::int32 begin;
+                comma::uint32 size{0};
+                bool index{false};
+                bool reverse{false};
+                comma::int32 step{0};
+                comma::int32 begin{0};
                 std::vector< comma::uint32 > shape;
                 std::string format;
+                comma::uint32 repeat{0};
                 
-                options( const boost::optional< comma::int32 >& b = boost::optional< comma::int32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false, int s = 1 )
+                options( const boost::optional< comma::int32 >& b = boost::optional< comma::int32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false, int s = 1, unsigned int repeat = 0 )
                     : size( size )
                     , index( index )
                     , reverse( reverse )
                     , step( s )
                     , begin( begin_( b ) )
+                    , repeat( repeat )
                 {
                 }
                 
                 options( const std::string& properties, const comma::command_line_options& o ) // quick and dirty: use visiting instead
                 {
                     o.assert_mutually_exclusive( "--shape", "--block-size,--size,--reverse,--begin" );
-                    options defaults( boost::optional< comma::int32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ), o.value< comma::int32 >( "--step", 1 ) );
+                    options defaults( boost::optional< comma::int32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ), o.value< comma::int32 >( "--step", 1 ), o.value< comma::uint32 >( "--repeat", 0 ) );
                     comma::name_value::map map( properties, ';', '=' );
                     map.assert_mutually_exclusive( "shape", "block-size,size,reverse,begin,step" );
                     std::string s = map.value< std::string >( "shape", o.value< std::string >( "--shape", "" ) );
@@ -215,6 +221,7 @@ class line_number : public source
                         shape.resize( v.size() );
                         for( unsigned int i = 0; i < v.size(); ++i ) { shape[i] = boost::lexical_cast< unsigned int >( v[i] ); }
                     }
+                    repeat = map.value< comma::int32 >( "repeat", defaults.repeat );
                 }
                 
             private:
@@ -237,27 +244,28 @@ class line_number : public source
         const std::string* read()
         { 
             serialized_ = values_.empty() ? boost::lexical_cast< std::string >( value_ ) : comma::join( values_, ',' );
-            update_();
-            return &serialized_;
+            return update_() ? &serialized_ : nullptr;
         }
         
         const char* read( char* buf ) // quick and dirty
         {
             if( values_.empty() ) { comma::csv::format::traits< comma::int32 >::to_bin( value_, buf ); }
             else { for( unsigned int i = 0; i < values_.size(); ++i, buf += sizeof( comma::int32 ) ) { comma::csv::format::traits< comma::int32 >::to_bin( values_[i], buf ); } }
-            update_();
-            return buf;
+            return update_() ? buf : nullptr;
         }
         
     private:
         options options_;
-        comma::uint32 count_;
-        comma::int32 value_;
+        comma::uint32 count_{0};
+        comma::int32 value_{0};
+        comma::uint32 _repeats{0};
         std::vector< comma::uint32 > values_;
         std::string serialized_;
+        bool _done{false};
         
-        void update_()
+        bool update_()
         {
+            if( _done ) { return false; }
             if( values_.empty() )
             {
                 ++count_; //count_ += options_.step;
@@ -269,6 +277,7 @@ class line_number : public source
                 {
                     value_ = options_.index ? options_.begin : ( value_ + options_.step );
                     count_ = 0;
+                    if( options_.repeat > 0 ) { ++_repeats; if( _repeats == options_.repeat ) { _done = true; } }
                 }
             }
             else
@@ -277,9 +286,11 @@ class line_number : public source
                 {
                     ++values_[i];
                     if( values_[i] < options_.shape[i] ) { break; }
+                    if( i == 0 && options_.repeat > 0 ) { ++_repeats; if( _repeats == options_.repeat ) { _done = true; } }
                     values_[i] = 0;
                 }
             }
+            return true;
         }
 };
 
@@ -289,7 +300,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         char delimiter = options.value( "--delimiter,-d", ',' );
-        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--step,--block-size,--head" );
+        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--step,--block-size,--head,--repeat" );
         bool flush = options.exists( "--flush" );
         boost::ptr_vector< source > sources;
         bool is_binary = false;
diff --git a/csv/test/csv-paste/expected b/csv/test/csv-paste/expected
index ff6857aae..dce417c7f 100644
--- a/csv/test/csv-paste/expected
+++ b/csv/test/csv-paste/expected
@@ -170,3 +170,51 @@ line_number/shape[1]/output/line[9]="1,0"
 line_number/shape[1]/output/line[10]="1,1"
 line_number/shape[1]/output/line[11]="1,2"
 line_number/shape[1]/status=0
+
+line_number/repeat[0]/output/line[0]="0"
+line_number/repeat[0]/output/line[1]="1"
+line_number/repeat[0]/output/line[2]="2"
+line_number/repeat[0]/status=0
+line_number/repeat[1]/output/line[0]="0"
+line_number/repeat[1]/output/line[1]="1"
+line_number/repeat[1]/output/line[2]="2"
+line_number/repeat[1]/status=0
+line_number/repeat[3]/output/line[0]="0"
+line_number/repeat[3]/output/line[1]="0"
+line_number/repeat[3]/output/line[2]="1"
+line_number/repeat[3]/output/line[3]="1"
+line_number/repeat[3]/status=0
+line_number/repeat[4]/output/line[0]="0"
+line_number/repeat[4]/output/line[1]="0"
+line_number/repeat[4]/output/line[2]="1"
+line_number/repeat[4]/output/line[3]="1"
+line_number/repeat[4]/output/line[4]="2"
+line_number/repeat[4]/output/line[5]="2"
+line_number/repeat[4]/status=0
+line_number/repeat[5]/output/line[0]="0"
+line_number/repeat[5]/output/line[1]="1"
+line_number/repeat[5]/output/line[2]="0"
+line_number/repeat[5]/output/line[3]="1"
+line_number/repeat[5]/output/line[4]="0"
+line_number/repeat[5]/output/line[5]="1"
+line_number/repeat[5]/status=0
+line_number/repeat[6]/output/line[0]="1"
+line_number/repeat[6]/output/line[1]="0"
+line_number/repeat[6]/output/line[2]="1"
+line_number/repeat[6]/output/line[3]="0"
+line_number/repeat[6]/output/line[4]="1"
+line_number/repeat[6]/output/line[5]="0"
+line_number/repeat[6]/status=0
+line_number/repeat[7]/output/line[0]="0,0"
+line_number/repeat[7]/output/line[1]="0,1"
+line_number/repeat[7]/output/line[2]="0,2"
+line_number/repeat[7]/output/line[3]="1,0"
+line_number/repeat[7]/output/line[4]="1,1"
+line_number/repeat[7]/output/line[5]="1,2"
+line_number/repeat[7]/output/line[6]="0,0"
+line_number/repeat[7]/output/line[7]="0,1"
+line_number/repeat[7]/output/line[8]="0,2"
+line_number/repeat[7]/output/line[9]="1,0"
+line_number/repeat[7]/output/line[10]="1,1"
+line_number/repeat[7]/output/line[11]="1,2"
+line_number/repeat[7]/status=0
diff --git a/csv/test/csv-paste/input b/csv/test/csv-paste/input
index 7976dbbaf..fa3d03564 100644
--- a/csv/test/csv-paste/input
+++ b/csv/test/csv-paste/input
@@ -45,3 +45,11 @@ head[2]="csv-paste 'line-number;size=10;index' --head=2"
 
 line_number/shape[0]="csv-paste 'line-number;shape=2,3' --head=12"
 line_number/shape[1]="csv-paste 'line-number;shape=2,3;binary=2ui' --head=12 | csv-from-bin 2ui"
+
+line_number/repeat[0]="csv-paste 'line-number' --repeat=3"
+line_number/repeat[1]="csv-paste 'line-number;repeat=3'"
+line_number/repeat[3]="csv-paste 'line-number;size=2' --repeat=2"
+line_number/repeat[4]="csv-paste 'line-number;size=2;repeat=3'"
+line_number/repeat[5]="csv-paste 'line-number;size=2;index;repeat=3'"
+line_number/repeat[6]="csv-paste 'line-number;size=2;index;reverse;repeat=3'"
+line_number/repeat[7]="csv-paste 'line-number;shape=2,3;repeat=2'"

From 6a1b635ec5ce5ba61e9465a59865971773cdbbff Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 20 Mar 2024 14:10:47 +1100
Subject: [PATCH 0774/1056] name_value/ptree: from/to: std::optional support
 added

---
 name_value/ptree.h | 19 ++++++++++++++++---
 1 file changed, 16 insertions(+), 3 deletions(-)

diff --git a/name_value/ptree.h b/name_value/ptree.h
index c49d5feaa..49471ab34 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -7,6 +7,7 @@
 
 #include <array>
 #include <iostream>
+#include <optional>
 #include <sstream>
 #include <boost/array.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
@@ -133,6 +134,13 @@ struct property_tree // quick and dirty
                 apply( name, *value );
             }
 
+            template < typename K, typename T > void apply_next( const K& name, std::optional< T >& value )
+            {
+                if( !cur_ || cur_->find( name ) == cur_->not_found() ) { return; }
+                if( !value ) { value = T(); }
+                apply( name, *value );
+            }
+
             template < typename K, typename T, typename A > void apply_next( const K& key, std::vector< T, A >& value ) { _apply_to_arraylike( key, value ); }
 
             template < typename K, typename T, std::size_t Size > void apply_next( const K& key, boost::array< T, Size >& value ) { _apply_to_arraylike( key, value ); }
@@ -259,10 +267,8 @@ class to_ptree
         /// @param branch: path to the subtree to visit (i.e. other branches will be pruned)
         to_ptree( boost::property_tree::ptree& ptree, const xpath& root = xpath(), const xpath& branch = xpath() ) : ptree_( ptree ), path_( root ), branch_( branch ) {}
 
-        /// constructor
         to_ptree( boost::property_tree::ptree& ptree, const char* root ) : ptree_( ptree ), path_( root ) {}
 
-        /// apply_next on boost optional
         template < typename K, typename T > void apply_next( const K& name, const boost::optional< T >& value )
         {
             if( !value ) { return; }
@@ -271,7 +277,14 @@ class to_ptree
                                 && !boost::is_same< T, std::string >::value >::visit( name, *value, *this );
         }
 
-        /// apply to vector
+        template < typename K, typename T > void apply_next( const K& name, const std::optional< T >& value )
+        {
+            if( !value ) { return; }
+            visiting::do_while<    !boost::is_fundamental< T >::value
+                                && !boost::is_same< T, boost::posix_time::ptime >::value
+                                && !boost::is_same< T, std::string >::value >::visit( name, *value, *this );
+        }
+
         template < typename K, typename T, typename A > void apply( const K& name, const std::vector< T, A >& value ) // do we even need it?
         {
             if( !( path_ <= branch_ ) ) { return; } // visit, only if on the branch

From fdd37a1fab443e05ee0bfc3b6d5240b8253b698a Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 20 Mar 2024 14:58:13 +1100
Subject: [PATCH 0775/1056] visiting::optional implemented and tested

---
 visiting/optional.h             | 32 +++++++++++++++++++
 visiting/test/visiting_test.cpp | 55 ++++++++++++++++++++++++++++++---
 visiting/traits.h               | 17 ++++++++++
 3 files changed, 100 insertions(+), 4 deletions(-)
 create mode 100644 visiting/optional.h

diff --git a/visiting/optional.h b/visiting/optional.h
new file mode 100644
index 000000000..fd22afbb4
--- /dev/null
+++ b/visiting/optional.h
@@ -0,0 +1,32 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+namespace comma { namespace visiting {
+
+/// convenience class when std::optional or boost::optional is not enough
+/// e.g. if in visiting we would like to have an explicit is-set flag field 
+/// in csv, json, or alike, where it may be essential in fixed-width data
+/// (e.g. csv) where the optional value may or may not be present
+template < typename T >
+struct optional
+{
+    T value{}; // value-initialised: an unset optional never exposes an indeterminate value (visiting reads it even if !is_set)
+    bool is_set{false}; // explicit presence flag; visited as a field alongside value
+
+    optional() = default; // unset, with a value-initialised payload
+    optional( const T& t ): value( t ), is_set( true ) {} // set from an existing value
+    template < class... Args > optional( Args... args ): value( args... ), is_set( true ) {} // set, constructing value from args
+    template < class... Args > void emplace( Args... args ); // todo
+    optional& operator=( const T& rhs ) { value = rhs; is_set = true; return *this; } // assigning a value marks the optional as set
+    void reset() { is_set = false; } // clears the flag only; value keeps its last contents
+    operator bool() const { return is_set; } // true if set
+    T* operator->() { return &value; } // accessors do not check is_set
+    const T* operator->() const { return &value; }
+    T& operator*() { return value; }
+    const T& operator*() const { return value; }
+};
+
+} } // namespace comma { namespace visiting {
diff --git a/visiting/test/visiting_test.cpp b/visiting/test/visiting_test.cpp
index a0e062d9f..cfc909e84 100644
--- a/visiting/test/visiting_test.cpp
+++ b/visiting/test/visiting_test.cpp
@@ -83,13 +83,18 @@ struct old_plain
     nested world;
 };
 
+struct optionals
+{
+    comma::visiting::optional< int > a;
+    comma::visiting::optional< std::pair< int, int > > b;
+};
+
 } } } // namespace comma { namespace visiting { namespace test {
 
 namespace comma { namespace visiting {
 
 /// traits specialization for old_plain
-template <>
-struct traits< test::old_plain >
+template <> struct traits< test::old_plain >
 {
     template < typename Key, typename visitor >
     static void visit( const Key&, const test::old_plain& p, visitor& v )
@@ -101,8 +106,7 @@ struct traits< test::old_plain >
 };
 
 /// traits specialization for old_plain::nested
-template <>
-struct traits< test::old_plain::nested >
+template <> struct traits< test::old_plain::nested >
 {
     template < typename Key, typename visitor >
     static void visit( const Key&, const test::old_plain::nested& p, visitor& v )
@@ -113,6 +117,16 @@ struct traits< test::old_plain::nested >
     }
 };
 
+template <> struct traits< test::optionals >
+{
+    template < typename Key, typename visitor >
+    static void visit( const Key&, const test::optionals& p, visitor& v )
+    {
+        v.apply( "a", p.a );
+        v.apply( "b", p.b );
+    }
+};
+
 } } // namespace comma { namespace visiting {
 
 namespace comma { namespace visiting { namespace test {
@@ -207,6 +221,39 @@ TEST( visiting, tuple )
     EXPECT_EQ( oss.str(), "{ int:0=5 double:1=10 string:2=\"hello\" }" ); // EXPECT_EQ( oss.str(), "{ int:elem_0=5 double:elem_1=10 string:elem_2=\"hello\" }" );
 }
 
+TEST( visiting, optional )
+{
+    {
+        test::optionals t;
+        t.a.value = 0; // quick and dirty
+        t.b.value = {0, 0}; // quick and dirty
+        std::ostringstream oss;
+        o_stream_visitor v( oss );
+        visiting::apply( v, t );
+        EXPECT_EQ( oss.str(), "{ object:a={ int:value=0 bool:is_set=false } object:b={ object:value={ int:first=0 int:second=0 } bool:is_set=false } }" );
+    }
+    {
+        test::optionals t;
+        t.a.value = 0; // quick and dirty
+        t.b.value = {0, 0}; // quick and dirty
+        t.a = 5;
+        std::ostringstream oss;
+        o_stream_visitor v( oss );
+        visiting::apply( v, t );
+        EXPECT_EQ( oss.str(), "{ object:a={ int:value=5 bool:is_set=true } object:b={ object:value={ int:first=0 int:second=0 } bool:is_set=false } }" );
+    }
+    {
+        test::optionals t;
+        t.a.value = 0; // quick and dirty
+        t.b.value = {0, 0}; // quick and dirty
+        t.b = std::make_pair( 3, 4 );
+        std::ostringstream oss;
+        o_stream_visitor v( oss );
+        visiting::apply( v, t );
+        EXPECT_EQ( oss.str(), "{ object:a={ int:value=0 bool:is_set=false } object:b={ object:value={ int:first=3 int:second=4 } bool:is_set=true } }" );
+    }
+}
+
 } } } /// namespace comma { namespace visiting { namespace test {
 
 int main( int argc, char* argv[] )
diff --git a/visiting/traits.h b/visiting/traits.h
index 5887f2855..b5c8d5af5 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -19,6 +19,7 @@
 #include <vector>
 #include <boost/array.hpp>
 #include "../base/none.h"
+#include "optional.h"
 
 namespace comma { namespace visiting {
 
@@ -53,6 +54,22 @@ struct traits< std::pair< T, S > >
     }    
 };
 
+template < typename T >
+struct traits< comma::visiting::optional< T > >
+{
+    template < typename K, typename V > static void visit( const K& key, comma::visiting::optional< T >& t, V& v )
+    {
+        v.apply( "value", t.value );
+        v.apply( "is_set", t.is_set );
+    }
+    
+    template < typename K, typename V > static void visit( const K&, const comma::visiting::optional< T >& t, V& v )
+    {
+        v.apply( "value", t.value );
+        v.apply( "is_set", t.is_set );
+    }    
+};
+
 template < typename T >
 struct traits< std::complex< T > >
 {

From 86698334626c7b371260ea6271f311243f397adf Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 20 Mar 2024 16:26:35 +1100
Subject: [PATCH 0776/1056] optional moved from visiting to base

---
 {visiting => base}/optional.h   | 4 ++--
 visiting/test/visiting_test.cpp | 5 +++--
 visiting/traits.h               | 8 ++++----
 3 files changed, 9 insertions(+), 8 deletions(-)
 rename {visiting => base}/optional.h (92%)

diff --git a/visiting/optional.h b/base/optional.h
similarity index 92%
rename from visiting/optional.h
rename to base/optional.h
index fd22afbb4..475dc3619 100644
--- a/visiting/optional.h
+++ b/base/optional.h
@@ -4,7 +4,7 @@
 
 #pragma once
 
-namespace comma { namespace visiting {
+namespace comma {
 
 /// convenience class when std::optional or boost::optional is not enough
 /// e.g. if in visiting we would like to have an explicit is-set flag field 
@@ -29,4 +29,4 @@ struct optional
     const T& operator*() const { return value; }
 };
 
-} } // namespace comma { namespace visiting {
+} // namespace comma {
diff --git a/visiting/test/visiting_test.cpp b/visiting/test/visiting_test.cpp
index cfc909e84..0dd98d8b7 100644
--- a/visiting/test/visiting_test.cpp
+++ b/visiting/test/visiting_test.cpp
@@ -10,6 +10,7 @@
 #include <vector>
 #include <boost/array.hpp>
 #include <boost/noncopyable.hpp>
+#include "../../base/optional.h"
 #include "../../base/types.h"
 #include "../apply.h"
 #include "../visit.h"
@@ -85,8 +86,8 @@ struct old_plain
 
 struct optionals
 {
-    comma::visiting::optional< int > a;
-    comma::visiting::optional< std::pair< int, int > > b;
+    comma::optional< int > a;
+    comma::optional< std::pair< int, int > > b;
 };
 
 } } } // namespace comma { namespace visiting { namespace test {
diff --git a/visiting/traits.h b/visiting/traits.h
index b5c8d5af5..d8ecdcaac 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -19,7 +19,7 @@
 #include <vector>
 #include <boost/array.hpp>
 #include "../base/none.h"
-#include "optional.h"
+#include "../base/optional.h"
 
 namespace comma { namespace visiting {
 
@@ -55,15 +55,15 @@ struct traits< std::pair< T, S > >
 };
 
 template < typename T >
-struct traits< comma::visiting::optional< T > >
+struct traits< comma::optional< T > >
 {
-    template < typename K, typename V > static void visit( const K& key, comma::visiting::optional< T >& t, V& v )
+    template < typename K, typename V > static void visit( const K& key, comma::optional< T >& t, V& v )
     {
         v.apply( "value", t.value );
         v.apply( "is_set", t.is_set );
     }
     
-    template < typename K, typename V > static void visit( const K&, const comma::visiting::optional< T >& t, V& v )
+    template < typename K, typename V > static void visit( const K&, const comma::optional< T >& t, V& v )
     {
         v.apply( "value", t.value );
         v.apply( "is_set", t.is_set );

From f7a3652c0aa67140731ce30d68f6815dc81191d2 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 21 Mar 2024 20:21:58 +1100
Subject: [PATCH 0777/1056] name_value/ptree.h: only include std::optional code
 in C++17 and beyond

---
 name_value/ptree.h | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/name_value/ptree.h b/name_value/ptree.h
index 49471ab34..b2f28bac3 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -7,7 +7,9 @@
 
 #include <array>
 #include <iostream>
+#if __cplusplus >= 201703L
 #include <optional>
+#endif
 #include <sstream>
 #include <boost/array.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
@@ -134,12 +136,14 @@ struct property_tree // quick and dirty
                 apply( name, *value );
             }
 
+            #if __cplusplus >= 201703L
             template < typename K, typename T > void apply_next( const K& name, std::optional< T >& value )
             {
                 if( !cur_ || cur_->find( name ) == cur_->not_found() ) { return; }
                 if( !value ) { value = T(); }
                 apply( name, *value );
             }
+            #endif
 
             template < typename K, typename T, typename A > void apply_next( const K& key, std::vector< T, A >& value ) { _apply_to_arraylike( key, value ); }
 
@@ -277,6 +281,7 @@ class to_ptree
                                 && !boost::is_same< T, std::string >::value >::visit( name, *value, *this );
         }
 
+        #if __cplusplus >= 201703L
         template < typename K, typename T > void apply_next( const K& name, const std::optional< T >& value )
         {
             if( !value ) { return; }
@@ -284,6 +289,7 @@ class to_ptree
                                 && !boost::is_same< T, boost::posix_time::ptime >::value
                                 && !boost::is_same< T, std::string >::value >::visit( name, *value, *this );
         }
+        #endif
 
         template < typename K, typename T, typename A > void apply( const K& name, const std::vector< T, A >& value ) // do we even need it?
         {

From 683af03e37f1b6658f6a19a72277a7bc4b779985 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Fri, 5 Apr 2024 15:27:59 +1100
Subject: [PATCH 0778/1056] added TAI support to csv-time and timing library

---
 csv/applications/CMakeLists.txt |  2 +-
 csv/applications/csv-time.cpp   | 21 ++++++--
 csv/test/csv-time/expected      | 51 ++++++++++++++++++
 csv/test/csv-time/input         | 28 +++++++++-
 timing/tai.cpp                  | 95 +++++++++++++++++++++++++++++++++
 timing/tai.h                    | 26 +++++++++
 6 files changed, 217 insertions(+), 6 deletions(-)
 create mode 100644 timing/tai.cpp
 create mode 100644 timing/tai.h

diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index 98d7f5ed1..1583dfff2 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -49,7 +49,7 @@ target_link_libraries ( csv-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_applicati
 target_link_libraries ( csv-sort ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
 target_link_libraries ( csv-select ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_xpath comma_string comma_name_value )
 target_link_libraries ( csv-paste ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv comma_io comma_name_value )
-target_link_libraries ( csv-time ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
+target_link_libraries ( csv-time ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string comma_timing )
 target_link_libraries ( csv-time-delay ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_string comma_xpath )
 target_link_libraries ( csv-time-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_string comma_xpath comma_name_value )
 target_link_libraries ( csv-time-stamp ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_string )
diff --git a/csv/applications/csv-time.cpp b/csv/applications/csv-time.cpp
index 8a73940f8..273cc24e6 100644
--- a/csv/applications/csv-time.cpp
+++ b/csv/applications/csv-time.cpp
@@ -47,6 +47,7 @@
 #include "../../csv/stream.h"
 #include "../../csv/impl/epoch.h"
 #include "../../string/string.h"
+#include "../../timing/tai.h"
 #include "../../visiting/traits.h"
 
 static void usage( bool )
@@ -58,8 +59,8 @@ static void usage( bool )
                  "\n    cat log.csv | csv-time <options> > converted.csv"
                  "\n"
                  "\nOptions"
-                 "\n    --from <what>: input format: any, iso, seconds, sql, xsd, local; default iso"
-                 "\n    --to <what>: output format: iso, seconds, sql, xsd, local; default iso"
+                 "\n    --from <what>: input format: any, iso, seconds, sql, xsd, local, tai; default iso"
+                 "\n    --to <what>: output format: iso, seconds, sql, xsd, local, tai; default iso"
                  "\n    --delimiter,-d <delimiter> : default: ','"
                  "\n    --fields <fields> : time field names or field numbers as in \"cut\""
                  "\n                        e.g. \"1,5,7\" or \"a,b,,d\""
@@ -88,6 +89,8 @@ static void usage( bool )
                  "\n            seconds since UNIX epoch as double"
                  "\n    - sql, posix, ieee-std-1003.1"
                  "\n            e.g. 2014-01-01 00:11:22"
+                 "\n    - tai"
+                 "\n            same as iso but converts from/to the TAI time standard"
                  "\n    - xsd, iso-8601-extended"
                  "\n            used in xsd:dateTime, xs:dateTime, gml and derivatives"
                  "\n            e.g. 2014-12-25T00:00:00.000Z"
@@ -103,7 +106,7 @@ static void usage( bool )
     exit( 0 );
 }
 
-enum what_t { guess, iso, seconds, microseconds, sql, xsd, local, format, iso_always_with_fractions };
+enum what_t { guess, iso, seconds, microseconds, sql, xsd, local, format, iso_always_with_fractions, tai };
 static what_t from = guess;
 static what_t to = iso;
 static std::string from_format;
@@ -174,8 +177,12 @@ static what_t what( const std::string& option, const comma::command_line_options
         {
             return local;
         }
+        else if( s == "tai" )
+        {
+            return tai;
+        }
     }
-    std::cerr << "csv-time: expected seconds, sql, or iso; got: \"" << s << "\"" << std::endl;
+    std::cerr << "csv-time: expected seconds, sql, tai, or iso; got: \"" << s << "\"" << std::endl;
     exit( 1 );
 }
 
@@ -257,6 +264,9 @@ static boost::posix_time::ptime from_string( const std::string& s, const what_t
         case sql:
             return s == "NULL" || s == "null" ? boost::posix_time::not_a_date_time : boost::posix_time::time_from_string( s );
 
+        case tai:
+            return comma::timing::tai::to_utc( boost::posix_time::from_iso_string( s ));
+
         case xsd: // 2014-03-05T23:00:00.000Z
             return from_string_xsd( s );
 
@@ -356,6 +366,9 @@ std::string to_string( const boost::posix_time::ptime& t, what_t w )
         case sql:
             return t.is_not_a_date_time() ? std::string( "NULL" ) : comma::split( boost::replace_all_copy( boost::posix_time::to_iso_extended_string( t ), "T", " " ), '.' )[0];
 
+        case tai:
+            return boost::posix_time::to_iso_string( comma::timing::tai::from_utc( t ));
+
         case xsd: // 2014-03-05T23:00:00.000Z
             return boost::posix_time::to_iso_extended_string( t );
 
diff --git a/csv/test/csv-time/expected b/csv/test/csv-time/expected
index 2b4551879..036aaea01 100644
--- a/csv/test/csv-time/expected
+++ b/csv/test/csv-time/expected
@@ -47,6 +47,57 @@ sql[1]/status=0
 sql[2]/output="1394060400"
 sql[2]/status=0
 
+tai_to_tai[0]/output="19700101T000000"
+tai_to_tai[0]/status=0
+tai_to_tai[1]/output="19711231T235959"
+tai_to_tai[1]/status=0
+tai_to_tai[2]/output="19720101T000010"
+tai_to_tai[2]/status=0
+tai_to_tai[3]/output="19720101T000011"
+tai_to_tai[3]/status=0
+tai_to_tai[4]/output="19720701T000009"
+tai_to_tai[4]/status=0
+tai_to_tai[5]/output="19720701T000011"
+tai_to_tai[5]/status=0
+tai_to_tai[6]/output="19720701T000012"
+tai_to_tai[6]/status=0
+tai_to_tai[7]/output="20170101T000035"
+tai_to_tai[7]/status=0
+tai_to_tai[8]/output="20170101T000037"
+tai_to_tai[8]/status=0
+tai_to_tai[9]/output="20170101T000038"
+tai_to_tai[9]/status=0
+tai_to_tai[10]/output="20240101T000037"
+tai_to_tai[10]/status=0
+
+tai_stream[0]/output/line[0]="20170101T000035"
+tai_stream[0]/output/line[1]="20170101T000037"
+tai_stream[0]/output/line[2]="20170101T000038"
+tai_stream[0]/status=0
+tai_stream[1]/output/line[0]="20240101T000037"
+tai_stream[1]/output/line[1]="20240101T000038"
+tai_stream[1]/output/line[2]="20240101T000039"
+tai_stream[1]/status=0
+
+tai_from_tai[0]/output="19720101T000000"
+tai_from_tai[0]/status=0
+tai_from_tai[1]/output="19720630T235959"
+tai_from_tai[1]/status=0
+tai_from_tai[2]/output="19720701T000000"
+tai_from_tai[2]/status=0
+tai_from_tai[3]/output="19720701T000000"
+tai_from_tai[3]/status=0
+tai_from_tai[4]/output="19720701T000001"
+tai_from_tai[4]/status=0
+tai_from_tai[5]/output="20170101T000000"
+tai_from_tai[5]/status=0
+tai_from_tai[6]/output="20170101T000000"
+tai_from_tai[6]/status=0
+tai_from_tai[7]/output="20170101T000001"
+tai_from_tai[7]/status=0
+tai_from_tai[8]/output="20240101T000000"
+tai_from_tai[8]/status=0
+
 xsd[0]/output="1394060400"
 xsd[0]/status=0
 xsd[1]/output="1394060400"
diff --git a/csv/test/csv-time/input b/csv/test/csv-time/input
index e5983b608..04a419ddc 100644
--- a/csv/test/csv-time/input
+++ b/csv/test/csv-time/input
@@ -28,6 +28,33 @@ sql[0]="echo '2014-03-05 23:00:00' | csv-time --from sql --to seconds"
 sql[1]="echo '2014-03-05 23:00:00' | csv-time --from posix --to seconds"
 sql[2]="echo '2014-03-05 23:00:00' | csv-time --from 'ieee-std-1003.1' --to seconds"
 
+# I'd like to test datetimes like 19720630T235960 (that was a leap-second) but
+# boost doesn't understand them. It treats them as identical to 19720701T000000
+tai_to_tai[0]="echo 19700101T000000 | csv-time --to tai"
+tai_to_tai[1]="echo 19711231T235959 | csv-time --to tai"
+tai_to_tai[2]="echo 19720101T000000 | csv-time --to tai"
+tai_to_tai[3]="echo 19720101T000001 | csv-time --to tai"
+tai_to_tai[4]="echo 19720630T235959 | csv-time --to tai"
+tai_to_tai[5]="echo 19720701T000000 | csv-time --to tai"
+tai_to_tai[6]="echo 19720701T000001 | csv-time --to tai"
+tai_to_tai[7]="echo 20161231T235959 | csv-time --to tai"
+tai_to_tai[8]="echo 20170101T000000 | csv-time --to tai"
+tai_to_tai[9]="echo 20170101T000001 | csv-time --to tai"
+tai_to_tai[10]="echo 20240101T000000 | csv-time --to tai"
+
+tai_stream[0]="echo -e '20161231T235959\\n20170101T000000\\n20170101T000001' | csv-time --to tai"
+tai_stream[1]="echo -e '20240101T000000\\n20240101T000001\\n20240101T000002' | csv-time --to tai"
+
+tai_from_tai[0]="echo 19720101T000010 | csv-time --from tai"
+tai_from_tai[1]="echo 19720701T000009 | csv-time --from tai"
+tai_from_tai[2]="echo 19720701T000010 | csv-time --from tai"
+tai_from_tai[3]="echo 19720701T000011 | csv-time --from tai"
+tai_from_tai[4]="echo 19720701T000012 | csv-time --from tai"
+tai_from_tai[5]="echo 20170101T000036 | csv-time --from tai"
+tai_from_tai[6]="echo 20170101T000037 | csv-time --from tai"
+tai_from_tai[7]="echo 20170101T000038 | csv-time --from tai"
+tai_from_tai[8]="echo 20240101T000037 | csv-time --from tai"
+
 xsd[0]="echo '2014-03-05T23:00:00.000Z' | csv-time --from xsd --to seconds"
 xsd[1]="echo '2014-03-05T23:00:00.000Z' | csv-time --from 'iso-8601-extended' --to seconds"
 
@@ -85,4 +112,3 @@ precision[6]="echo 19700101T000000.000001 | csv-time --from=iso --to=seconds | c
 
 format[0]="echo 20180102T123456 | csv-time --from 'format;%Y%m%dT%H%M%S'"
 format[1]="echo 10m23s | csv-time --from 'format;%Mm%S' --to seconds"
-
diff --git a/timing/tai.cpp b/timing/tai.cpp
new file mode 100644
index 000000000..4be717c4f
--- /dev/null
+++ b/timing/tai.cpp
@@ -0,0 +1,95 @@
+// Copyright (c) 2024 Mission Systems Pty Ltd
+//
+// Data extracted from https://hpiers.obspm.fr/eoppc/bul/bulc/UTC-TAI.history
+// which is linked to from https://www.iers.org/IERS/EN/Publications/Bulletins/bulletins.html
+//
+// For an overview see https://en.wikipedia.org/wiki/Leap_second
+//
+// Note that boost::posix_time doesn't really support leap seconds. It treats
+// 19720630T235960 as identical to 19720701T000000. You can see this with:
+//   $ echo 19720630T235959 | csv-time --to seconds
+//   78796799
+//   $ echo 19720630T235960 | csv-time --to seconds
+//   78796800
+//   $ echo 19720701T000000 | csv-time --to seconds
+//   78796800
+//
+// There should be an extra second there
+//
+// Note that C++20 introduces std::chrono::tai_clock
+// https://en.cppreference.com/w/cpp/chrono/tai_clock
+
+/// @author dave jennings
+
+#include "tai.h"
+#include <utility>
+#include <vector>
+
+namespace comma { namespace timing { namespace tai {
+
+typedef std::pair< boost::posix_time::ptime, int > leap_seconds_entry;
+
+using boost::posix_time::ptime;
+using boost::gregorian::date;
+using boost::date_time::Jan;
+using boost::date_time::Jul;
+
+static std::vector< leap_seconds_entry > leap_seconds_table = {
+    leap_seconds_entry(  boost::date_time::neg_infin, 0 ),
+    leap_seconds_entry( ptime( date( 1972, Jan, 1 )), 10 ),
+    leap_seconds_entry( ptime( date( 1972, Jul, 1 )), 11 ),
+    leap_seconds_entry( ptime( date( 1973, Jan, 1 )), 12 ),
+    leap_seconds_entry( ptime( date( 1974, Jan, 1 )), 13 ),
+    leap_seconds_entry( ptime( date( 1975, Jan, 1 )), 14 ),
+    leap_seconds_entry( ptime( date( 1976, Jan, 1 )), 15 ),
+    leap_seconds_entry( ptime( date( 1977, Jan, 1 )), 16 ),
+    leap_seconds_entry( ptime( date( 1978, Jan, 1 )), 17 ),
+    leap_seconds_entry( ptime( date( 1979, Jan, 1 )), 18 ),
+    leap_seconds_entry( ptime( date( 1980, Jan, 1 )), 19 ),
+    leap_seconds_entry( ptime( date( 1981, Jul, 1 )), 20 ),
+    leap_seconds_entry( ptime( date( 1982, Jul, 1 )), 21 ),
+    leap_seconds_entry( ptime( date( 1983, Jul, 1 )), 22 ),
+    leap_seconds_entry( ptime( date( 1985, Jul, 1 )), 23 ),
+    leap_seconds_entry( ptime( date( 1988, Jan, 1 )), 24 ),
+    leap_seconds_entry( ptime( date( 1990, Jan, 1 )), 25 ),
+    leap_seconds_entry( ptime( date( 1991, Jan, 1 )), 26 ),
+    leap_seconds_entry( ptime( date( 1992, Jul, 1 )), 27 ),
+    leap_seconds_entry( ptime( date( 1993, Jul, 1 )), 28 ),
+    leap_seconds_entry( ptime( date( 1994, Jul, 1 )), 29 ),
+    leap_seconds_entry( ptime( date( 1996, Jan, 1 )), 30 ),
+    leap_seconds_entry( ptime( date( 1997, Jul, 1 )), 31 ),
+    leap_seconds_entry( ptime( date( 1999, Jan, 1 )), 32 ),
+    leap_seconds_entry( ptime( date( 2006, Jan, 1 )), 33 ),
+    leap_seconds_entry( ptime( date( 2009, Jan, 1 )), 34 ),
+    leap_seconds_entry( ptime( date( 2012, Jul, 1 )), 35 ),
+    leap_seconds_entry( ptime( date( 2015, Jul, 1 )), 36 ),
+    leap_seconds_entry( ptime( date( 2017, Jan, 1 )), 37 )
+};
+
+// The switch over times are in UTC. That's how we get a time of 23:59:60.
+// So when working out the leap_second offset we need the UTC timestamp.
+// See https://en.wikipedia.org/wiki/Leap_second#Process
+int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc )
+{
+    // Timestamps are likely to be recent so look backwards through the table to
+    // find the right entry
+    std::vector< leap_seconds_entry >::reverse_iterator riter;
+    for( riter = leap_seconds_table.rbegin(); riter != leap_seconds_table.rend(); ++riter )
+    {
+        boost::posix_time::ptime utc = ( time_is_utc ? time : time - boost::posix_time::seconds( riter->second ));
+        if( utc >= riter->first ) { break; }
+    }
+    return riter->second;
+}
+
+boost::posix_time::ptime from_utc( const boost::posix_time::ptime& utc )
+{
+    return utc + boost::posix_time::seconds( leap_seconds( utc, true ));
+}
+
+boost::posix_time::ptime to_utc( const boost::posix_time::ptime& tai )
+{
+    return tai - boost::posix_time::seconds( leap_seconds( tai, false ));
+}
+
+} } } // namespace comma { namespace timing { namespace tai {
diff --git a/timing/tai.h b/timing/tai.h
new file mode 100644
index 000000000..56fe6bade
--- /dev/null
+++ b/timing/tai.h
@@ -0,0 +1,26 @@
+// Copyright (c) 2024 Mission Systems Pty Ltd
+
+#pragma once
+
+#include <boost/date_time/posix_time/posix_time_types.hpp>
+
+namespace comma { namespace timing {
+
+namespace tai {
+
+// For conversion of fast streaming data you probably want to just get the leap
+// seconds once then apply that offset to all the data (utc = tai - leap_seconds).
+// This will not be accurate if the data crosses a leap-second boundary but is much faster.
+int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc = true );
+
+// Otherwise use the from/to functions which are accurate across boundaries.
+// Although note that boost doesn't understand UTC times of 23:59:60.
+// It thinks it's the same as 00:00:00 even if it aligns with a leap-second.
+boost::posix_time::ptime from_utc( const boost::posix_time::ptime& utc );
+boost::posix_time::ptime to_utc( const boost::posix_time::ptime& tai );
+
+} // namespace tai {
+
+inline int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc = true ) { return tai::leap_seconds( time, time_is_utc ); }
+
+} } // namespace comma { namespace timing {

From 6c5355ecb169f4b0d63469ff0c6b8cb856ad00a9 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 9 Apr 2024 17:48:12 +1000
Subject: [PATCH 0779/1056] timing/tai.cpp,h: added
 leap_seconds_with_valid_time

---
 timing/tai.cpp | 20 ++++++++++++++++----
 timing/tai.h   |  5 +++++
 2 files changed, 21 insertions(+), 4 deletions(-)

diff --git a/timing/tai.cpp b/timing/tai.cpp
index 4be717c4f..49fd26648 100644
--- a/timing/tai.cpp
+++ b/timing/tai.cpp
@@ -63,13 +63,14 @@ static std::vector< leap_seconds_entry > leap_seconds_table = {
     leap_seconds_entry( ptime( date( 2009, Jan, 1 )), 34 ),
     leap_seconds_entry( ptime( date( 2012, Jul, 1 )), 35 ),
     leap_seconds_entry( ptime( date( 2015, Jul, 1 )), 36 ),
-    leap_seconds_entry( ptime( date( 2017, Jan, 1 )), 37 )
+    leap_seconds_entry( ptime( date( 2017, Jan, 1 )), 37 ),
+    leap_seconds_entry(  boost::date_time::pos_infin, 37 )
 };
 
-// The switch over times are in UTC. That's how we get a time of 23:59:60.
+// The switch-over times are in UTC. That's how we get a time of 23:59:60.
 // So when working out the leap_second offset we need the UTC timestamp.
 // See https://en.wikipedia.org/wiki/Leap_second#Process
-int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc )
+static std::vector< leap_seconds_entry >::reverse_iterator lookup_table( const boost::posix_time::ptime& time, bool time_is_utc )
 {
     // Timestamps are likely to be recent so look backwards through the table to
     // find the right entry
@@ -79,7 +80,18 @@ int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc )
         boost::posix_time::ptime utc = ( time_is_utc ? time : time - boost::posix_time::seconds( riter->second ));
         if( utc >= riter->first ) { break; }
     }
-    return riter->second;
+    return riter;
+}
+
+int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc )
+{
+    return lookup_table( time, time_is_utc )->second;
+}
+
+std::pair< int, boost::posix_time::ptime > leap_seconds_with_valid_time( const boost::posix_time::ptime& time, bool time_is_utc )
+{
+    std::vector< leap_seconds_entry >::reverse_iterator riter = lookup_table( time, time_is_utc );
+    return std::pair< int, boost::posix_time::ptime >( riter->second, ( riter - 1 )->first );
 }
 
 boost::posix_time::ptime from_utc( const boost::posix_time::ptime& utc )
diff --git a/timing/tai.h b/timing/tai.h
index 56fe6bade..9650eee9c 100644
--- a/timing/tai.h
+++ b/timing/tai.h
@@ -13,6 +13,11 @@ namespace tai {
 // This will not be accurate if the data crosses a leap-second boundary but is much faster.
 int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc = true );
 
+// If you want accurate time across a boundary, use this call, check your
+// timestamps and update the leap seconds when you go past the valid time.
+// Valid time is in UTC.
+std::pair< int, boost::posix_time::ptime > leap_seconds_with_valid_time( const boost::posix_time::ptime& time, bool time_is_utc );
+
 // Otherwise use the from/to functions which are accurate across boundaries.
 // Although note that boost doesn't understand UTC times of 23:59:60.
 // It thinks it's the same as 00:00:00 even if it aligns with a leap-second.

From 08b514239ed8b1265f9d3e3d657d9f5555a11ce2 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 17 Apr 2024 12:48:55 +1000
Subject: [PATCH 0780/1056] csv, name-value visitors: std::optional and
 std::unique_ptr support added

---
 csv/impl/to_names.h               | 83 +++++++++++----------------
 name_value/impl/from_name_value.h | 95 +++++++++++++------------------
 name_value/impl/to_name_value.h   | 45 +++++----------
 3 files changed, 84 insertions(+), 139 deletions(-)

diff --git a/csv/impl/to_names.h b/csv/impl/to_names.h
index 6be9c5f12..80a8c7e59 100644
--- a/csv/impl/to_names.h
+++ b/csv/impl/to_names.h
@@ -30,9 +30,10 @@
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_IMPL_TONAMES_H_
-#define COMMA_CSV_IMPL_TONAMES_H_
+#pragma once
 
+#include <memory>
+#include <optional>
 #include <sstream>
 #include <boost/optional.hpp>
 #include <boost/scoped_ptr.hpp>
@@ -51,74 +52,58 @@ namespace comma { namespace csv { namespace impl {
 class to_names
 {
     public:
-        /// constructor
-        to_names( bool full_path_as_name = true );
+        to_names( bool full_path_as_name = true ): _full_path_as_name( full_path_as_name ) {}
         
-        /// constructor
-        to_names( const xpath& root, bool full_path_as_name );
+        to_names( const xpath& root, bool full_path_as_name ): _full_path_as_name( full_path_as_name ), _root( root ) {}
         
-        /// traverse
         template < typename K, typename T >
-        void apply( const K& name, const boost::optional< T >& value );
+        void apply( const K& name, const boost::optional< T >& value ) { apply( name, value ? *value : T() ); }
+
+        template < typename K, typename T >
+        void apply( const K& name, const std::optional< T >& value ) { apply( name, value ? *value : T() ); }
         
-        /// traverse
         template < typename K, typename T >
         void apply( const K& name, const boost::scoped_ptr< T >& value );
         
-        /// traverse
         template < typename K, typename T >
         void apply( const K& name, const boost::shared_ptr< T >& value );
+
+        template < typename K, typename T >
+        void apply( const K& name, const std::unique_ptr< T >& value );
         
-        /// traverse
         template < typename K, typename T >
         void apply( const K& name, const T& value );
         
-        /// traverse
         template < typename K, typename T >
         void apply_next( const K& name, const T& value );
         
-        /// output a non-string type
         template < typename K, typename T >
         void apply_final( const K& name, const T& value );
         
-        /// return string
-        const std::vector< std::string >& operator()() const;
+        const std::vector< std::string >& operator()() const { return _names; }
         
     private:
-        bool full_path_as_name_;
-        xpath xpath_;
-        xpath root_;
-        boost::optional< std::size_t > index_;
-        std::vector< std::string > names_;
-        const xpath& append( std::size_t index ) { xpath_.elements.back().index = index; return xpath_; }
-        const xpath& append( const char* name ) { xpath_ /= xpath::element( name ); return xpath_; }
-        const xpath& append( const std::string& name ) { xpath_ /= xpath::element( name ); return xpath_; }
-        const xpath& trim( std::size_t ) { xpath_.elements.back().index = boost::optional< std::size_t >(); return xpath_; }
-        const xpath& trim( const char* ) { xpath_ = xpath_.head(); return xpath_; }
-        const xpath& trim( const std::string& ) { xpath_ = xpath_.head(); return xpath_; }
+        bool _full_path_as_name;
+        xpath _xpath;
+        xpath _root;
+        std::optional< std::size_t > _index;
+        std::vector< std::string > _names;
+        const xpath& _append( std::size_t index ) { _xpath.elements.back().index = index; return _xpath; }
+        const xpath& _append( const char* name ) { _xpath /= xpath::element( name ); return _xpath; }
+        const xpath& _append( const std::string& name ) { _xpath /= xpath::element( name ); return _xpath; }
+        const xpath& _trim( std::size_t ) { _xpath.elements.back().index = boost::optional< std::size_t >(); return _xpath; }
+        const xpath& _trim( const char* ) { _xpath = _xpath.head(); return _xpath; }
+        const xpath& _trim( const std::string& ) { _xpath = _xpath.head(); return _xpath; }
 };
 
-inline to_names::to_names( bool full_path_as_name ) : full_path_as_name_( full_path_as_name ) {}
-
-inline to_names::to_names( const xpath& root, bool full_path_as_name ) : full_path_as_name_( full_path_as_name ), root_( root ) {}
-
 template < typename K, typename T >
-inline void to_names::apply( const K& name, const boost::optional< T >& value )
-{
-    apply( name, value ? *value : T() );
-}
+inline void to_names::apply( const K& name, const boost::scoped_ptr< T >& value ) { if( value ) { apply( name, *value ); } else { T v; apply( name, v ); } }
 
 template < typename K, typename T >
-inline void to_names::apply( const K& name, const boost::scoped_ptr< T >& value )
-{
-    if( value ) { apply( name, *value ); } else { T v; apply( name, v ); }
-}
+inline void to_names::apply( const K& name, const boost::shared_ptr< T >& value ) { if( value ) { apply( name, *value ); } else { T v; apply( name, v ); } }
 
 template < typename K, typename T >
-inline void to_names::apply( const K& name, const boost::shared_ptr< T >& value )
-{
-    if( value ) { apply( name, *value ); } else { T v; apply( name, v ); }
-}
+inline void to_names::apply( const K& name, const std::unique_ptr< T >& value ) { if( value ) { apply( name, *value ); } else { T v; apply( name, v ); } }
 
 template < typename K, typename T >
 inline void to_names::apply( const K& name, const T& value )
@@ -131,21 +116,17 @@ inline void to_names::apply( const K& name, const T& value )
 template < typename K, typename T >
 inline void to_names::apply_next( const K& name, const T& value )
 {
-    append( name );
+    _append( name );
     comma::visiting::visit( name, value, *this );
-    trim( name );
+    _trim( name );
 }
 
 template < typename K, typename T >
 inline void to_names::apply_final( const K& name, const T& )
 {
-    append( name );
-    if( xpath_ <= root_ ) { names_.push_back( full_path_as_name_ ? xpath_.to_string() : xpath_.elements.back().to_string() ); }
-    trim( name );
+    _append( name );
+    if( _xpath <= _root ) { _names.push_back( _full_path_as_name ? _xpath.to_string() : _xpath.elements.back().to_string() ); }
+    _trim( name );
 }
 
-inline const std::vector< std::string >& to_names::operator()() const { return names_; }
-
 } } } // namespace comma { namespace csv { namespace impl {
-
-#endif // COMMA_CSV_IMPL_TONAMES_H_
diff --git a/name_value/impl/from_name_value.h b/name_value/impl/from_name_value.h
index 2da37b876..47dae9da8 100644
--- a/name_value/impl/from_name_value.h
+++ b/name_value/impl/from_name_value.h
@@ -27,14 +27,14 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
-#ifndef COMMA_APPLICATION_FROM_NAME_VALUE_H
-#define COMMA_APPLICATION_FROM_NAME_VALUE_H
+#pragma once
 
 #include <deque>
 #include <map>
+#include <memory>
+#include <optional>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
@@ -59,35 +59,32 @@ class from_name_value
     /// constructor
     /// @param values values to read from
     /// @param full_path_as_name use full path as name
-    from_name_value( const map_type& values, bool full_path_as_name = true ):
-        m_values( values ), m_full_path_as_name(full_path_as_name){};
+    from_name_value( const map_type& values, bool full_path_as_name = true ): _values( values ), _full_path_as_name( full_path_as_name ) {};
+
+    template < typename K, typename T > void apply( const K& name, boost::optional< T >& value ) { _apply_optional< K, T >( name, value ); }
 
-    /// apply
-    template < typename K, typename T > void apply( const K& name, boost::optional< T >& value );
+    template < typename K, typename T > void apply( const K& name, std::optional< T >& value ) { _apply_optional< K, T >( name, value ); }
     
-    /// apply
-    template < typename K, typename T > void apply( const K& name, boost::scoped_ptr< T >& value );
+    template < typename K, typename T > void apply( const K& name, boost::scoped_ptr< T >& value ) { _apply_ptr< K, T >( name, value ); }
     
-    /// apply
-    template < typename K, typename T > void apply( const K& name, boost::shared_ptr< T >& value );
+    template < typename K, typename T > void apply( const K& name, boost::shared_ptr< T >& value ) { _apply_ptr< K, T >( name, value ); }
+
+    template < typename K, typename T > void apply( const K& name, std::unique_ptr< T >& value ) { _apply_ptr< K, T >( name, value ); }
         
-    /// apply
     template < typename K, typename T > void apply( const K& name, T& value );
 
-    /// apply to non-leaf elements
     template < typename K, typename T > void apply_next( const K& name, T& value );
 
-    /// apply to leaf elements
     template < typename K, typename T > void apply_final( const K& name, T& value );
 
 private:
-    const map_type& m_values;
-    bool m_full_path_as_name;
-    xpath m_xpath;
-    std::deque< bool > m_empty;
-    static void lexical_cast( bool& v, const std::string& s ) { v = s == "" || boost::lexical_cast< bool >( s ); }
-    static void lexical_cast( boost::posix_time::ptime& v, const std::string& s ) { v = boost::posix_time::from_iso_string( s ); }
-    static void lexical_cast( boost::posix_time::time_duration& v, const std::string& s )
+    const map_type& _values;
+    bool _full_path_as_name;
+    xpath _xpath;
+    std::deque< bool > _empty;
+    static void _lexical_cast( bool& v, const std::string& s ) { v = s == "" || boost::lexical_cast< bool >( s ); }
+    static void _lexical_cast( boost::posix_time::ptime& v, const std::string& s ) { v = boost::posix_time::from_iso_string( s ); }
+    static void _lexical_cast( boost::posix_time::time_duration& v, const std::string& s )
     {
         std::vector< std::string > t = comma::split( s, '.' );
         if( t.size() > 2 ) { COMMA_THROW_STREAM( comma::exception, "expected duration in seconds, got " << s ); }
@@ -98,65 +95,49 @@ class from_name_value
         if( seconds < 0 ) { microseconds = -microseconds; }
         v = boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( microseconds );
     }
-    template < typename T > static void lexical_cast( T& v, const std::string& s ) { v = boost::lexical_cast< T >( s ); }
+    template < typename T > static void _lexical_cast( T& v, const std::string& s ) { v = boost::lexical_cast< T >( s ); }
+    template < typename K, typename T, template < typename > class Optional > void _apply_optional( const K& name, Optional< T >& value );
+    template < typename K, typename T, template < typename > class Ptr > void _apply_ptr( const K& name, Ptr< T >& value );
 };
 
-template < typename K, typename T >
-inline void from_name_value::apply( const K& name, boost::optional< T >& value )
-{
-    if( value ) { apply( name, *value ); return; }
-    T t;
-    m_empty.push_back( true );
-    apply( name, t );
-    if( !m_empty.back() ) { value = t; }
-    m_empty.pop_back();
-}
-
-template < typename K, typename T >
-inline void from_name_value::apply( const K& name, boost::scoped_ptr< T >& value )
+template < typename K, typename T, template < typename > class Optional > inline void from_name_value::_apply_optional( const K& name, Optional< T >& value )
 {
     if( value ) { apply( name, *value ); return; }
     T t;
-    m_empty.push_back( true );
+    _empty.push_back( true );
     apply( name, t );
-    if( !m_empty.back() ) { value.reset( new T( t ) ); }
-    m_empty.pop_back();
+    if( !_empty.back() ) { value = t; }
+    _empty.pop_back();    
 }
 
-template < typename K, typename T >
-inline void from_name_value::apply( const K& name, boost::shared_ptr< T >& value )
+template < typename K, typename T, template < typename > class Ptr > inline void from_name_value::_apply_ptr( const K& name, Ptr< T >& value )
 {
     if( value ) { apply( name, *value ); return; }
     T t;
-    m_empty.push_back( true );
+    _empty.push_back( true );
     apply( name, t );
-    if( !m_empty.back() ) { value.reset( new T( t ) ); }
-    m_empty.pop_back();
+    if( !_empty.back() ) { value.reset(); value.reset( new T( t ) ); } // todo? emplace? 
+    _empty.pop_back();
 }
 
-template < typename K, typename T >
-inline void from_name_value::apply( const K& name, T& value )
+template < typename K, typename T > inline void from_name_value::apply( const K& name, T& value )
 {
-    m_xpath /= xpath::element( name );
+    _xpath /= xpath::element( name );
     visiting::do_while<    !boost::is_fundamental< T >::value
                         && !boost::is_same< T, boost::posix_time::ptime >::value
                         && !boost::is_same< T, boost::posix_time::time_duration >::value
                         && !boost::is_same< T, std::string >::value >::visit( name, value, *this );
-    m_xpath = m_xpath.head();
+    _xpath = _xpath.head();
 }
 
-template < typename K, typename T >
-inline void from_name_value::apply_next( const K& name, T& value ) { comma::visiting::visit( name, value, *this ); }
+template < typename K, typename T > inline void from_name_value::apply_next( const K& name, T& value ) { comma::visiting::visit( name, value, *this ); }
 
-template < typename K, typename T >
-inline void from_name_value::apply_final( const K& key, T& value )
+template < typename K, typename T > inline void from_name_value::apply_final( const K& key, T& value )
 {
-    map_type::const_iterator iter = m_values.find( m_full_path_as_name ? m_xpath.to_string() : m_xpath.elements.back().to_string() );
-    if( iter == m_values.end() ) { return; }
-    lexical_cast( value, iter->second );
-    for( std::size_t i = 0; i < m_empty.size(); ++i ) { m_empty[i] = false; }
+    map_type::const_iterator iter = _values.find( _full_path_as_name ? _xpath.to_string() : _xpath.elements.back().to_string() );
+    if( iter == _values.end() ) { return; }
+    _lexical_cast( value, iter->second );
+    for( std::size_t i = 0; i < _empty.size(); ++i ) { _empty[i] = false; }
 }
 
 } } } // namespace comma { namespace name_value { namespace impl {
-
-#endif // COMMA_APPLICATION_FROM_NAME_VALUE_H
diff --git a/name_value/impl/to_name_value.h b/name_value/impl/to_name_value.h
index 653a2a42c..192ac46bd 100644
--- a/name_value/impl/to_name_value.h
+++ b/name_value/impl/to_name_value.h
@@ -6,6 +6,7 @@
 #pragma once
 
 #include <map>
+#include <memory>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
 #include <boost/scoped_ptr.hpp>
@@ -25,54 +26,36 @@ class to_name_value
     /// constructor
     /// @param delimiter delimiter between name and value
     /// @param full_path_as_name use full path as name
-    to_name_value( char delimiter = '=', bool full_path_as_name = true ): m_delimiter(delimiter), m_full_path_as_name( full_path_as_name ) {};
-
-    /// apply
+    to_name_value( char delimiter = '=', bool full_path_as_name = true ): _delimiter(delimiter), _full_path_as_name( full_path_as_name ) {};
     template < typename K, typename T > void apply( const K& name, const boost::optional< T >& value ) { if( value ) { apply( name, *value ); } }
-    
-    /// apply
+    template < typename K, typename T > void apply( const K& name, const std::optional< T >& value ) { if( value ) { apply( name, *value ); } }
     template < typename K, typename T > void apply( const K& name, const boost::scoped_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
-    
-    /// apply
     template < typename K, typename T > void apply( const K& name, const boost::shared_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
-        
-    /// apply
+    template < typename K, typename T > void apply( const K& name, const std::unique_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
     template < typename K, typename T > void apply( const K& name, const T& value );
-
-    /// apply to non-leaf elements
     template < typename K, typename T > void apply_next( const K& name, const T& value ) { comma::visiting::visit( name, value, *this ); }
-
-    /// apply to leaf elements
     template < typename K, typename T > void apply_final( const K& name, const T& value );
-
-    /// return named values as strings
-    const std::vector< std::string >& strings() const { return m_strings; }
+    const std::vector< std::string >& strings() const { return _strings; }
 
 private:
-    template < typename T > std::string as_string( T v )
-    {
-        std::ostringstream oss;
-        oss << v;
-        return oss.str();
-    }
-        
-    char m_delimiter;
-    bool m_full_path_as_name;
-    std::vector< std::string > m_strings;
-    xpath m_xpath;
-     
+    char _delimiter;
+    bool _full_path_as_name;
+    std::vector< std::string > _strings;
+    xpath _xpath;
+
+    template < typename T > std::string _as_string( T v ) { std::ostringstream oss; oss << v; return oss.str(); } 
 };
 
 template < typename K, typename T >
 inline void to_name_value::apply( const K& name, const T& value )
 {
-    m_xpath /= xpath::element( name );
+    _xpath /= xpath::element( name );
     visiting::do_while<    !boost::is_fundamental< T >::value
                         && !boost::is_same< T, std::string >::value >::visit( name, value, *this );
-    m_xpath = m_xpath.head();
+    _xpath = _xpath.head();
 }
 
 template < typename K, typename T >
-inline void to_name_value::apply_final( const K&, const T& value ) { m_strings.push_back( std::string( m_full_path_as_name ? m_xpath.to_string() : m_xpath.elements.back().to_string() ) + m_delimiter + as_string( value ) ); }
+inline void to_name_value::apply_final( const K&, const T& value ) { _strings.push_back( std::string( _full_path_as_name ? _xpath.to_string() : _xpath.elements.back().to_string() ) + _delimiter + _as_string( value ) ); }
 
 } } } // namespace comma { namespace name_value { namespace impl {

From 212fbc0c9f9e7d9be79f68f0898fc662a4a6fd72 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 17 Apr 2024 17:47:19 +1000
Subject: [PATCH 0781/1056] csv, name_value: visitors: std::optional
 conditioned by #ifdef on compiler version (it is not available with c++14,
 while some higher versions have problems with boost::intervals, which are
 happily fixed in the latest apt installs)

---
 csv/impl/to_names.h               | 6 +++++-
 name_value/impl/from_name_value.h | 4 ++++
 name_value/impl/to_name_value.h   | 5 +++++
 3 files changed, 14 insertions(+), 1 deletion(-)

diff --git a/csv/impl/to_names.h b/csv/impl/to_names.h
index 80a8c7e59..fe877901e 100644
--- a/csv/impl/to_names.h
+++ b/csv/impl/to_names.h
@@ -33,7 +33,9 @@
 #pragma once
 
 #include <memory>
+#if __cplusplus >= 201703L
 #include <optional>
+#endif // #if __cplusplus >= 201703L
 #include <sstream>
 #include <boost/optional.hpp>
 #include <boost/scoped_ptr.hpp>
@@ -59,8 +61,10 @@ class to_names
         template < typename K, typename T >
         void apply( const K& name, const boost::optional< T >& value ) { apply( name, value ? *value : T() ); }
 
+        #if __cplusplus >= 201703L
         template < typename K, typename T >
         void apply( const K& name, const std::optional< T >& value ) { apply( name, value ? *value : T() ); }
+        #endif // #if __cplusplus >= 201703L
         
         template < typename K, typename T >
         void apply( const K& name, const boost::scoped_ptr< T >& value );
@@ -86,7 +90,7 @@ class to_names
         bool _full_path_as_name;
         xpath _xpath;
         xpath _root;
-        std::optional< std::size_t > _index;
+        boost::optional< std::size_t > _index;
         std::vector< std::string > _names;
         const xpath& _append( std::size_t index ) { _xpath.elements.back().index = index; return _xpath; }
         const xpath& _append( const char* name ) { _xpath /= xpath::element( name ); return _xpath; }
diff --git a/name_value/impl/from_name_value.h b/name_value/impl/from_name_value.h
index 47dae9da8..a88b18117 100644
--- a/name_value/impl/from_name_value.h
+++ b/name_value/impl/from_name_value.h
@@ -34,7 +34,9 @@
 #include <deque>
 #include <map>
 #include <memory>
+#if __cplusplus >= 201703L
 #include <optional>
+#endif // #if __cplusplus >= 201703L
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
@@ -63,7 +65,9 @@ class from_name_value
 
     template < typename K, typename T > void apply( const K& name, boost::optional< T >& value ) { _apply_optional< K, T >( name, value ); }
 
+    #if __cplusplus >= 201703L
     template < typename K, typename T > void apply( const K& name, std::optional< T >& value ) { _apply_optional< K, T >( name, value ); }
+    #endif // #if __cplusplus >= 201703L
     
     template < typename K, typename T > void apply( const K& name, boost::scoped_ptr< T >& value ) { _apply_ptr< K, T >( name, value ); }
     
diff --git a/name_value/impl/to_name_value.h b/name_value/impl/to_name_value.h
index 192ac46bd..de6fa961f 100644
--- a/name_value/impl/to_name_value.h
+++ b/name_value/impl/to_name_value.h
@@ -7,6 +7,9 @@
 
 #include <map>
 #include <memory>
+#if __cplusplus >= 201703L
+#include <optional>
+#endif // #if __cplusplus >= 201703L
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
 #include <boost/scoped_ptr.hpp>
@@ -28,7 +31,9 @@ class to_name_value
     /// @param full_path_as_name use full path as name
     to_name_value( char delimiter = '=', bool full_path_as_name = true ): _delimiter(delimiter), _full_path_as_name( full_path_as_name ) {};
     template < typename K, typename T > void apply( const K& name, const boost::optional< T >& value ) { if( value ) { apply( name, *value ); } }
+    #if __cplusplus >= 201703L
     template < typename K, typename T > void apply( const K& name, const std::optional< T >& value ) { if( value ) { apply( name, *value ); } }
+    #endif // #if __cplusplus >= 201703L
     template < typename K, typename T > void apply( const K& name, const boost::scoped_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
     template < typename K, typename T > void apply( const K& name, const boost::shared_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
     template < typename K, typename T > void apply( const K& name, const std::unique_ptr< T >& value ) { if( value ) { apply( name, *value ); } }

From 0aba9101b8bf99a0050b3d18436045eb80285a90 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 29 Apr 2024 16:19:21 +1000
Subject: [PATCH 0782/1056] io-cat: --help: --size documented

---
 io/applications/io-cat.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index fb55c6531..f12534c88 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -112,6 +112,7 @@ void usage( bool verbose = false )
     std::cerr << "                                         all available data" << std::endl;
     std::cerr << "                                         ignored for udp streams, where one full udp" << std::endl;
     std::cerr << "                                         packet at a time is always read" << std::endl;
+    std::cerr << "    --size=[<bytes>]; on fixed-width binary records, size of the record in bytes, for --round-robin or --head" << std::endl;
     std::cerr << std::endl;
     std::cerr << "connect options" << std::endl;
     std::cerr << "    --connect-max-attempts,--connect-attempts,--attempts,--max-attempts=<n>; default=1; number of attempts to reconnect or 'unlimited'" << std::endl;

From 1d79d9b9ac7b6893be07b4901cd640ee438615d1 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 30 Apr 2024 18:02:32 +1000
Subject: [PATCH 0783/1056] name_value: write_path_value: optional prefix added

---
 name_value/ptree.cpp               | 21 +++++++++++----------
 name_value/ptree.h                 |  6 +++---
 name_value/serialize.h             | 12 ++++++------
 name_value/test/serialise_test.cpp |  7 +++++++
 4 files changed, 27 insertions(+), 19 deletions(-)

diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index 15ac3a896..2c9d2c4dd 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -135,7 +135,8 @@ static void ptree_to_path_value_string_impl( std::ostream* os
                                            , char equal_sign
                                            , char delimiter
                                            , const std::string& root
-                                           , bool const unquote_numbers )
+                                           , bool const unquote_numbers
+                                           , const std::string& prefix )
 {
     if( i->second.begin() == i->second.end() )
     {
@@ -162,7 +163,7 @@ static void ptree_to_path_value_string_impl( std::ostream* os
             // Test if it is json array data, if so all keys are empty. If so display indices in path if requested
             if( mode == property_tree::without_brackets && j->first.empty()  ) { display_path /= boost::lexical_cast< std::string >( index++ ); }
             else if( mode == property_tree::with_brackets && j->first.empty() ) { display_path.elements.back().index = index++; }
-            ptree_to_path_value_string_impl( os, pv, j, is_begin, path, display_path, mode, equal_sign, delimiter, root, unquote_numbers );
+            ptree_to_path_value_string_impl( os, pv, j, is_begin, path, display_path, mode, equal_sign, delimiter, root, unquote_numbers, prefix );
             if( mode == property_tree::without_brackets && j->first.empty() ) { display_path = display_path.head(); }
             is_begin = false;
         }
@@ -175,7 +176,7 @@ static void ptree_to_path_value_string_impl( std::ostream* os
 
 namespace comma {
 
-void property_tree::to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode mode, char equal_sign, char delimiter, const xpath& root, bool const unquote_numbers )
+void property_tree::to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode mode, char equal_sign, char delimiter, const xpath& root, bool unquote_numbers, const std::string& prefix )
 {
     std::vector< std::pair< xpath, std::string > > dummy; // quick and dirty
     for( boost::property_tree::ptree::const_iterator i = ptree.begin(); i != ptree.end(); ++i )
@@ -186,12 +187,12 @@ void property_tree::to_path_value( std::ostream& os, const boost::property_tree:
         //         If a node has both named and unnamed child nodes, it cannot be mapped to a JSON representation."
         // http://www.boost.org/doc/libs/1_41_0/doc/html/boost_propertytree/parsers.html#boost_propertytree.parsers.json_parser
         xpath path;
-        xpath display_path;
-        impl::ptree_to_path_value_string_impl( &os, dummy, i, i == ptree.begin(), path, display_path, mode, equal_sign, delimiter, root.to_string(), unquote_numbers ); // quick and dirty
+        xpath display_path( prefix );
+        impl::ptree_to_path_value_string_impl( &os, dummy, i, i == ptree.begin(), path, display_path, mode, equal_sign, delimiter, root.to_string(), unquote_numbers, prefix ); // quick and dirty
     }
 }
 
-std::vector< std::pair< xpath, std::string > > property_tree::to_path_value( const boost::property_tree::ptree& ptree, const xpath& root, path_mode mode )
+std::vector< std::pair< xpath, std::string > > property_tree::to_path_value( const boost::property_tree::ptree& ptree, const xpath& root, path_mode mode, const std::string& prefix )
 {
     std::vector< std::pair< xpath, std::string > > pv; // quick and dirty
     for( boost::property_tree::ptree::const_iterator i = ptree.begin(); i != ptree.end(); ++i )
@@ -202,8 +203,8 @@ std::vector< std::pair< xpath, std::string > > property_tree::to_path_value( con
         //         If a node has both named and unnamed child nodes, it cannot be mapped to a JSON representation."
         // http://www.boost.org/doc/libs/1_41_0/doc/html/boost_propertytree/parsers.html#boost_propertytree.parsers.json_parser
         xpath path;
-        xpath display_path;
-        impl::ptree_to_path_value_string_impl( nullptr, pv, i, i == ptree.begin(), path, display_path, mode, '=', ',', root.to_string(), true ); // quick and dirty
+        xpath display_path( prefix );
+        impl::ptree_to_path_value_string_impl( nullptr, pv, i, i == ptree.begin(), path, display_path, mode, '=', ',', root.to_string(), true, prefix ); // quick and dirty
     }
     return pv;
 }
@@ -222,10 +223,10 @@ void property_tree::from_path_value( std::istream& is, boost::property_tree::ptr
     ptree = comma::property_tree::from_path_value_string( s, equal_sign, delimiter, check_type, use_index );
 }
 
-std::string property_tree::to_path_value_string( const boost::property_tree::ptree& ptree, property_tree::path_mode mode, char equal_sign, char delimiter, bool const unquote_numbers )
+std::string property_tree::to_path_value_string( const boost::property_tree::ptree& ptree, property_tree::path_mode mode, char equal_sign, char delimiter, bool unquote_numbers, const std::string& prefix )
 {
     std::ostringstream oss;
-    to_path_value( oss, ptree, mode, equal_sign, delimiter, xpath(), unquote_numbers );
+    to_path_value( oss, ptree, mode, equal_sign, delimiter, xpath(), unquote_numbers, prefix );
     return oss.str();
 }
 
diff --git a/name_value/ptree.h b/name_value/ptree.h
index b2f28bac3..d80996b99 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -44,13 +44,13 @@ struct property_tree // quick and dirty
     enum path_mode { disabled, with_brackets, without_brackets  };
 
     /// write as path-value to output stream
-    static void to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode indices_mode = disabled, char equal_sign = '=', char delimiter = ',', const xpath& root = xpath(), bool const unquote_numbers = false );
+    static void to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode indices_mode = disabled, char equal_sign = '=', char delimiter = ',', const xpath& root = xpath(), bool unquote_numbers = false, const std::string& prefix = "" );
 
     /// return path-value pairs
-    static std::vector< std::pair< xpath, std::string > > to_path_value( const boost::property_tree::ptree& ptree, const xpath& root = xpath(), path_mode indices_mode = with_brackets );
+    static std::vector< std::pair< xpath, std::string > > to_path_value( const boost::property_tree::ptree& ptree, const xpath& root = xpath(), path_mode indices_mode = with_brackets, const std::string& prefix = "" );
 
     /// convert boost parameter tree into path=value-style string (equal sign and delimiter have to be escaped)
-    static std::string to_path_value_string( const boost::property_tree::ptree& ptree, path_mode mode=disabled, char equal_sign = '=', char delimiter = ',', bool const unquote_numbers = false );
+    static std::string to_path_value_string( const boost::property_tree::ptree& ptree, path_mode mode=disabled, char equal_sign = '=', char delimiter = ',', bool unquote_numbers = false, const std::string& prefix = "" );
     
     /// put an xpath like a/b[5]/c/d[3]=4 into ptree
     static void put( boost::property_tree::ptree& ptree, const xpath& path, const std::string& value, bool use_index = true );
diff --git a/name_value/serialize.h b/name_value/serialize.h
index 8716a4c09..de99a9c26 100644
--- a/name_value/serialize.h
+++ b/name_value/serialize.h
@@ -207,10 +207,10 @@ template < typename T > std::ostream& write_xml( const T& t, std::ostream& strea
 /// write path-value object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
 /// @todo parametrize on equality sign and delimiter?
-template < typename T > void write_path_value( const T& t, const std::string& filename, const xpath& root );
+template < typename T > void write_path_value( const T& t, const std::string& filename, const xpath& root, const std::string& prefix = "" );
 template < typename T > void write_path_value( const T& t, const std::string& filename, const char* root );
 template < typename T > void write_path_value( const T& t, const std::string& filename );
-template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream, const xpath& root, bool const unquote_numbers = false );
+template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream, const xpath& root, bool unquote_numbers = false, const std::string& prefix = "" );
 template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream, const char* root );
 template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream );
 
@@ -436,21 +436,21 @@ template < typename T > inline void write_xml( const T& t, const std::string& fi
 template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream, const char* root ) { return write_xml( t, stream, xpath( root ) ); }
 template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream ) { return write_xml( t, stream, xpath() ); }
 
-template < typename T > inline std::ostream& write_path_value( const T& t, std::ostream& stream, const xpath& root, bool const unquote_numbers )
+template < typename T > inline std::ostream& write_path_value( const T& t, std::ostream& stream, const xpath& root, bool unquote_numbers, const std::string& prefix )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
-    comma::property_tree::to_path_value( stream, p, comma::property_tree::disabled, '=', '\n', xpath(), unquote_numbers );
+    comma::property_tree::to_path_value( stream, p, comma::property_tree::disabled, '=', '\n', xpath(), unquote_numbers, prefix );
     return stream;
 }
 
-template < typename T > inline void write_path_value( const T& t, const std::string& filename, const xpath& root )
+template < typename T > inline void write_path_value( const T& t, const std::string& filename, const xpath& root, const std::string& prefix )
 {
     std::ofstream ofs( &filename[0] );
     if( !ofs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << filename << "\"" ); }
-    write_path_value< T >( t, ofs, root );
+    write_path_value< T >( t, ofs, root, false, prefix ); // 4th parameter of the stream overload is bool unquote_numbers: pass its default (false) explicitly so that prefix binds to the prefix parameter
     ofs.close();
 }
 
diff --git a/name_value/test/serialise_test.cpp b/name_value/test/serialise_test.cpp
index 706cc9910..a2f5c2276 100644
--- a/name_value/test/serialise_test.cpp
+++ b/name_value/test/serialise_test.cpp
@@ -356,6 +356,13 @@ TEST( serialise, path_value )
         comma::read_path_value< config >( c, ss, comma::xpath( "root/item" ), true );
         test_config( c );
     }
+    {
+        std::stringstream ss;
+        comma::write_path_value< config >( d, ss, "root/item", true, "hello/world" );
+        config c;
+        comma::read_path_value< config >( c, ss, "hello/world/root/item", true );
+        test_config( c );
+    }
 }
 
 } } } // namespace comma { namespace test { namespace serialise {

From 1fe09a8d441d836366f94b8c587d9da549e701b6 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 1 May 2024 14:32:14 +1000
Subject: [PATCH 0784/1056] CMakeLists.txt: minor whitespace and capitalisation
 tweak

---
 CMakeLists.txt | 9 +++------
 1 file changed, 3 insertions(+), 6 deletions(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index cf8379b41..958e63de6 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -152,13 +152,10 @@ CMAKE_DEPENDENT_OPTION( BUILD_CPP_PYTHON_BINDINGS "build C++/Python bindings" OF
 OPTION( BUILD_APPLICATIONS "build applications" ON )
 SET( comma_BUILD_APPLICATIONS ${BUILD_APPLICATIONS} )
 
-OPTION( comma_BUILD_ZEROMQ "build io with zeromq support" OFF )
-
 option( BUILD_SHARED_LIBS "build with shared libraries" ON )
-
-OPTION( comma_BUILD_PYTHON "build python" ON )
-
-OPTION( comma_BUILD_XML "build xml" OFF )
+option( comma_BUILD_PYTHON "build python" ON )
+option( comma_BUILD_XML "build xml" OFF )
+option( comma_BUILD_ZEROMQ "build io with zeromq support" OFF )
 
 SET(comma_BUILD_SHARED_LIBS ${BUILD_SHARED_LIBS})
 

From 9aa03138ee28782605639beefa36118038705580 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Thu, 2 May 2024 17:32:47 +1000
Subject: [PATCH 0785/1056] optionally use std::filesystem rather than
 boost::filesystem

default to std::filesystem, use comma_USE_BOOST_FILESYSTEM=ON to use boost
---
 CMakeLists.txt                       | 21 +++++++++++++---
 application/command_line_options.cpp |  4 +--
 application/verbose.cpp              |  5 ++--
 csv/applications/csv-strings.cpp     | 10 ++++----
 csv/applications/split/split.cpp     | 10 ++++----
 io/applications/io-buffer.cpp        |  1 -
 io/impl/filesystem.h                 | 37 ++++++++++++++++++++++++++++
 io/impl/publisher.cpp                |  1 -
 io/load.h                            |  4 +--
 io/stream.cpp                        |  7 +++---
 io/test/stream_test.cpp              | 22 ++++++++---------
 xml/applications/xml-split.cpp       |  9 +++----
 12 files changed, 88 insertions(+), 43 deletions(-)
 create mode 100644 io/impl/filesystem.h

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 958e63de6..4d69ec426 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -156,6 +156,16 @@ option( BUILD_SHARED_LIBS "build with shared libraries" ON )
 option( comma_BUILD_PYTHON "build python" ON )
 option( comma_BUILD_XML "build xml" OFF )
 option( comma_BUILD_ZEROMQ "build io with zeromq support" OFF )
+option( comma_USE_BOOST_FILESYSTEM "use boost::filesystem rather than std::filesystem" OFF )
+
+if( comma_USE_BOOST_FILESYSTEM )
+    set( CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DCOMMA_USE_BOOST_FILESYSTEM -DBOOST_FILESYSTEM_NO_DEPRECATED" )
+else()
+    # see https://gcc.gnu.org/onlinedocs/libstdc++/manual/status.html#status.iso.2017
+    if( CMAKE_CXX_COMPILER_ID STREQUAL "GNU" AND CMAKE_CXX_COMPILER_VERSION VERSION_LESS 9 )
+        link_libraries( "-lstdc++fs" )
+    endif()
+endif()
 
 SET(comma_BUILD_SHARED_LIBS ${BUILD_SHARED_LIBS})
 
@@ -163,6 +173,11 @@ IF( NOT BUILD_SHARED_LIBS )
     SET( Boost_USE_STATIC_LIBS ON )
 ENDIF( NOT BUILD_SHARED_LIBS )
 
+set( comma_boost_components thread system date_time iostreams program_options regex )
+if( comma_USE_BOOST_FILESYSTEM )
+    set( comma_boost_components ${comma_boost_components} filesystem )
+endif()
+
 IF( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
     IF( NOT BUILD_SHARED_LIBS )
         MESSAGE( WARNING "Linking C++/Python bindings with static libraries is requested. If linking fails, recompile required libraries with -fPIC or use shared libraries. Note that this feature has only been tested with shared libraries." )
@@ -170,10 +185,10 @@ IF( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
     SET( Python_ADDITIONAL_VERSIONS 2.7 )
     FIND_PACKAGE( PythonLibs REQUIRED )
     INCLUDE_DIRECTORIES( ${PYTHON_INCLUDE_DIRS} )
-    FIND_PACKAGE( Boost COMPONENTS thread filesystem system date_time iostreams program_options regex python )
-ELSE( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
-    FIND_PACKAGE( Boost COMPONENTS thread filesystem system date_time iostreams program_options regex )
+    set( comma_boost_components ${comma_boost_components} python )
 ENDIF( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
+
+FIND_PACKAGE( Boost COMPONENTS ${comma_boost_components} )
 INCLUDE_DIRECTORIES( ${Boost_INCLUDE_DIRS} )
 LINK_DIRECTORIES( ${Boost_LIBRARY_DIRS} )
 
diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index a613259ec..b63331704 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -10,13 +10,13 @@
 #include <unordered_map>
 #include <boost/bind/bind.hpp>
 #include <boost/config/warning_disable.hpp>
-//#include <boost/filesystem.hpp>
 #include <boost/iostreams/stream.hpp>
 #include <boost/iostreams/device/null.hpp>
 #include <boost/optional.hpp>
 #include <boost/regex.hpp>
 #include <boost/spirit/include/qi.hpp>
 #include "../base/exception.h"
+#include "../io/impl/filesystem.h"
 #include "../string/split.h"
 #include "command_line_options.h"
 
@@ -80,7 +80,7 @@ void command_line_options::_init_verbose( const std::string& path )
         if( exists( v[i] ) ) { comma::application::detail::verbosity_level = v.size() - i; break; }
     }
     comma::verbose.init( comma::application::detail::verbosity_level > 0, path ); // todo: deprecate, use comma::say() and comma::saymore() instead
-    comma::application::detail::name = comma::split( path, '/' ).back(); // boost::filesystem::basename( path );
+    comma::application::detail::name = comma::filesystem::path( path ).filename().string(); // comma::split( path, '/' ).back()
     comma::application::detail::titlebar_enabled = exists( "--titlebar,--tb" );
     if( exists( "--titlebar-application-name,--tbn" ) ) { comma::io::terminal::titlebar_ostream s; s << comma::application::detail::name; }
 }
diff --git a/application/verbose.cpp b/application/verbose.cpp
index b620ae127..0e6c12257 100644
--- a/application/verbose.cpp
+++ b/application/verbose.cpp
@@ -1,6 +1,6 @@
 // Copyright (c) 2015 The University of Sydney
 
-//#include <boost/filesystem.hpp>
+#include "../io/impl/filesystem.h"
 #include "../string/string.h"
 #include "verbose.h"
 
@@ -13,7 +13,7 @@ verbose_t::operator bool () const {return enabled_;}
 const std::string& verbose_t::app_name() const {return app_name_;}
 void verbose_t::init(bool enabled, const std::string& argv0)
 {
-    if(!argv0.empty()) { app_name_ = comma::split( argv0, '/' ).back(); } // app_name_=boost::filesystem::basename(argv0);
+    if(!argv0.empty()) { app_name_ = comma::filesystem::path(argv0).filename().string(); } // comma::split( argv0, '/' ).back();
     enabled_=enabled;
     start_of_line=true;
 }
@@ -29,4 +29,3 @@ verbose_t& verbose_t::operator<<(std::basic_ostream<char>& (*pf)(std::basic_ostr
 }
 
 }//namespace comma {
-
diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
index 78e0e0258..be7510b40 100644
--- a/csv/applications/csv-strings.cpp
+++ b/csv/applications/csv-strings.cpp
@@ -6,13 +6,13 @@
 #include <functional>
 #include <iostream>
 
-#include <boost/filesystem.hpp>
 #include <boost/lexical_cast.hpp>
 
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
 #include "../../csv/traits.h"
+#include "../../io/impl/filesystem.h"
 #include "../../string/string.h"
 
 static void usage( bool verbose )
@@ -232,21 +232,21 @@ struct canonical
 {
     typedef input output_t;
     
-    boost::filesystem::path base;
+    comma::filesystem::path base;
 
     static constexpr char const* name() { return "canonical"; }
     
     canonical( const comma::command_line_options& options )
         : base( options.exists( "--base" )
-        ? boost::filesystem::path( options.value< std::string >( "--base" ) )
-        : boost::filesystem::current_path() )
+        ? comma::filesystem::path( options.value< std::string >( "--base" ) )
+        : comma::filesystem::current_path() )
     {
         if( ( options.value( "--path-delimiter,-p", '/' ) ) != '/' ) { COMMA_THROW( comma::exception, "path-canonical: expected path delimiter '/'; got: '" << options.value( "--path-delimiter,-p", '/' ) << "'" ); }
     }
 
     std::string convert( const std::string& s ) const
     {
-        try { return boost::filesystem::canonical( boost::filesystem::path( s ), base ).string(); } catch( ... ) { if( strict ) { throw; } }
+        try { return comma::filesystem::canonical( base / comma::filesystem::path( s )).string(); } catch( ... ) { if( strict ) { throw; } }
         return s;
     }
 };
diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 7a8034eed..69acfdb43 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -39,12 +39,12 @@
 #endif
 
 #include <unordered_map>
-#include <boost/filesystem.hpp>
 #include <boost/lexical_cast.hpp>
 #include "../../../base/exception.h"
 #include "../../../csv/stream.h"
 #include "../../../csv/traits.h"
 #include "../../../io/file_descriptor.h"
+#include "../../../io/impl/filesystem.h"
 #include "../../../name_value/parser.h"
 #include "../../../visiting/traits.h"
 #include "split.h"
@@ -321,8 +321,8 @@ std::ofstream* split< T >::ofstream_by_block_()
             auto it = filenames_.find( filenames_have_id_ ? current_.block : id );
             if( it == filenames_.end() ) { return nullptr; }
             filename = it->second;
-            const auto& dirname = boost::filesystem::path( filename ).parent_path();
-            if( !( dirname.empty() || boost::filesystem::is_directory( dirname ) || boost::filesystem::create_directories( dirname ) ) ) { COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << filename << "'" ); }
+            const auto& dirname = comma::filesystem::path( filename ).parent_path();
+            if( !( dirname.empty() || comma::filesystem::is_directory( dirname ) || comma::filesystem::create_directories( dirname ) ) ) { COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << filename << "'" ); }
         }
         if( filename.empty() ) { filename = boost::lexical_cast< std::string >( current_.block ) + suffix_; }
         file_.open( &filename[0], mode_ );
@@ -368,8 +368,8 @@ std::ofstream* split< T >::ofstream_by_id_()
         else { mode |= std::ofstream::app; }
         std::string name = filename_from_id_( current_.id );
         if( name.empty() ) { return nullptr; }
-        const auto& dirname = boost::filesystem::path( name ).parent_path();
-        if( !( dirname.empty() || boost::filesystem::is_directory( dirname ) || boost::filesystem::create_directories( dirname ) ) )
+        const auto& dirname = comma::filesystem::path( name ).parent_path();
+        if( !( dirname.empty() || comma::filesystem::is_directory( dirname ) || comma::filesystem::create_directories( dirname ) ) )
         {
             COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << name << "'" );
         }
diff --git a/io/applications/io-buffer.cpp b/io/applications/io-buffer.cpp
index 23cbf7d78..4463bbd04 100644
--- a/io/applications/io-buffer.cpp
+++ b/io/applications/io-buffer.cpp
@@ -43,7 +43,6 @@
 #include <cctype>
 #include <vector>
 #include <fstream>
-#include <boost/filesystem/operations.hpp>
 #include <boost/interprocess/sync/file_lock.hpp>
 #include <boost/interprocess/sync/scoped_lock.hpp>
 #include <boost/algorithm/string.hpp>
diff --git a/io/impl/filesystem.h b/io/impl/filesystem.h
new file mode 100644
index 000000000..9a8d93804
--- /dev/null
+++ b/io/impl/filesystem.h
@@ -0,0 +1,37 @@
+// Copyright (c) 2024 Mission Systems Pty Ltd
+//
+// Allow selection of filesystem library from either boost or C++ standard library
+//
+// Can assist with interoperation with other libraries that require or conflict
+// with one or the other
+//
+// Usage:
+// #include "io/impl/filesystem.h"
+// ...
+// comma::filesystem::<some-op>
+//
+// Configuration:
+//   in CMake set comma_USE_BOOST_FILESYSTEM
+//     "ON" will use boost::filesystem
+//     "OFF" will use std::filesystem, or std::experimental::filesystem when a
+//           __GNUC__ compiler has no <filesystem> header (e.g. gcc older than 8.1)
+
+#pragma once
+
+#ifdef COMMA_USE_BOOST_FILESYSTEM
+  #include <boost/filesystem.hpp>
+  namespace comma { namespace filesystem = boost::filesystem; }
+#else
+  #if defined(__GNUC__)
+    #if __has_include (<filesystem>)
+      #include <filesystem>
+      namespace comma { namespace filesystem = std::filesystem; }
+    #else
+      #include <experimental/filesystem>
+      namespace comma { namespace filesystem = std::experimental::filesystem; }
+    #endif
+  #else
+    #include <filesystem>
+    namespace comma { namespace filesystem = std::filesystem; }
+  #endif
+#endif
diff --git a/io/impl/publisher.cpp b/io/impl/publisher.cpp
index b8d0e0c50..66d14d531 100644
--- a/io/impl/publisher.cpp
+++ b/io/impl/publisher.cpp
@@ -13,7 +13,6 @@
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
 #include <boost/bind/bind.hpp>
-#include <boost/filesystem/operations.hpp>
 #include <boost/lexical_cast.hpp>
 #include "../../base/exception.h"
 #include "../../io/file_descriptor.h"
diff --git a/io/load.h b/io/load.h
index 35ee617fc..44fc8f598 100644
--- a/io/load.h
+++ b/io/load.h
@@ -7,7 +7,7 @@
 #include <fstream>
 #include <string>
 #include <vector>
-#include <boost/filesystem.hpp>
+#include "impl/filesystem.h"
 #include "../base/exception.h"
 
 namespace comma { namespace io {
@@ -27,7 +27,7 @@ inline C< T, A >& load_array( C< T, A >& a, const std::string& path )
 {
     std::ifstream ifs( path );
     if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << path << "\"" ); }
-    a.resize( boost::filesystem::file_size( path ) / sizeof( T ) ); // todo? will file_size work on symlinks?
+    a.resize( comma::filesystem::file_size( path ) / sizeof( T ) ); // todo? will file_size work on symlinks?
     ifs.read( reinterpret_cast< char * >( &a[0] ), a.size() * sizeof( T ) );
     if( ifs.gcount() != int( a.size() * sizeof( T ) ) ) { COMMA_THROW( comma::exception, "expected to read " << a.size() * sizeof( T ) << " bytes (" << a.size() << " elements " << sizeof( T ) << " byte(s) each) from \"" << path << "\"; got: " << ifs.gcount() << " byte(s)" ); }
     return a;
diff --git a/io/stream.cpp b/io/stream.cpp
index a17208b53..604b14763 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -22,10 +22,9 @@
 #include <boost/asio/ip/udp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
 #include <boost/bind/bind.hpp>
-#include <boost/filesystem.hpp>
-#include <boost/filesystem/operations.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
+#include "impl/filesystem.h"
 #include "../base/exception.h"
 #include "../string/string.h"
 #include "file_descriptor.h"
@@ -146,7 +145,7 @@ S* stream< S >::lazily_make_stream_()
     #ifndef WIN32
     if( stream_ == NULL ) // quick and dirty: if fstream, cannot open on construction, as pipe might block
     {
-        if( !boost::filesystem::is_regular_file( name_ ) && !blocking_ ) // quick and dirty
+        if( !comma::filesystem::is_regular_file( name_ ) && !blocking_ ) // quick and dirty
         {
             io::select select;
             select.read().add( fd_ ); // todo: express via traits
@@ -356,7 +355,7 @@ stream< S >::stream( const std::string& name, mode::value m, mode::blocking_valu
 
         fd_ = impl::traits< S >::open( name );
         if( fd_ != io::invalid_file_descriptor ) { set_non_blocking_flags_( fd_ ); return; }
-        if( boost::filesystem::is_regular_file( name ) ) { COMMA_THROW( comma::exception, "failed to open \"" << name << "\"" ); }
+        if( comma::filesystem::is_regular_file( name ) ) { COMMA_THROW( comma::exception, "failed to open \"" << name << "\"" ); }
         #endif // #ifdef WIN32
     }
 }
diff --git a/io/test/stream_test.cpp b/io/test/stream_test.cpp
index 4fdab8db1..1b8cc0b98 100644
--- a/io/test/stream_test.cpp
+++ b/io/test/stream_test.cpp
@@ -6,7 +6,7 @@
 #include <boost/asio/io_service.hpp>
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
-#include <boost/filesystem/operations.hpp>
+#include "../impl/filesystem.h"
 #include "../load.h" // just to make sure it compiles
 #include "../select.h"
 #include "../stream.h"
@@ -14,8 +14,8 @@
 TEST( io, file_stream )
 {
     {
-        boost::filesystem::remove( "./test.pipe" );
-        boost::filesystem::remove( "./test.file" );
+        comma::filesystem::remove( "./test.pipe" );
+        comma::filesystem::remove( "./test.file" );
         comma::io::ostream ostream( "./test.file" );
         comma::io::istream istream( "./test.file" );
         std::string line;
@@ -25,12 +25,12 @@ TEST( io, file_stream )
         EXPECT_EQ( line, "hello, world" );
         ostream.close();
         istream.close();
-        boost::filesystem::remove( "./test.file" );
+        comma::filesystem::remove( "./test.file" );
     }
     // todo: more testing?
     EXPECT_EQ( system( "mkfifo test.pipe" ), 0 );
-    EXPECT_TRUE( boost::filesystem::exists( "./test.pipe" ) );
-    EXPECT_TRUE( !boost::filesystem::is_regular_file( "./test.pipe" ) );
+    EXPECT_TRUE( comma::filesystem::exists( "./test.pipe" ) );
+    EXPECT_TRUE( !comma::filesystem::is_regular_file( "./test.pipe" ) );
     EXPECT_TRUE( ::open( "./test.pipe", O_RDONLY | O_NONBLOCK ) > 0 );
     comma::io::ostream os( "./test.pipe" );
     EXPECT_TRUE( os() != NULL );
@@ -90,7 +90,7 @@ TEST( io, local_stream )
 {
     #ifndef WIN32
     {
-        boost::filesystem::remove( "./test.localsocket" );
+        comma::filesystem::remove( "./test.localsocket" );
         boost::asio::local::stream_protocol::endpoint endpoint( "test.localsocket" );
         EXPECT_TRUE( !boost::asio::local::stream_protocol::iostream( endpoint ) );
         boost::asio::io_service service;
@@ -102,17 +102,17 @@ TEST( io, local_stream )
         ostream.close();
         acceptor.close();
         EXPECT_TRUE( !boost::asio::local::stream_protocol::iostream( endpoint ) );
-        EXPECT_TRUE( !boost::filesystem::is_regular_file( "./test.localsocket" ) );
-        boost::filesystem::remove( "./test.localsocket" );
+        EXPECT_TRUE( !comma::filesystem::is_regular_file( "./test.localsocket" ) );
+        comma::filesystem::remove( "./test.localsocket" );
     }
     {
-        boost::filesystem::remove( "./test.file" );
+        comma::filesystem::remove( "./test.file" );
         comma::io::ostream ostream( "./test.file" );
         ostream.close();
         boost::asio::io_service service;
         boost::asio::local::stream_protocol::endpoint endpoint( "test.file" );
         try { boost::asio::local::stream_protocol::acceptor acceptor( service, endpoint ); EXPECT_TRUE( false ); } catch( ... ) {}
-        boost::filesystem::remove( "./test.file" );
+        comma::filesystem::remove( "./test.file" );
     }
     #endif
 }
diff --git a/xml/applications/xml-split.cpp b/xml/applications/xml-split.cpp
index 0f5fbd4fb..1d215c7ce 100644
--- a/xml/applications/xml-split.cpp
+++ b/xml/applications/xml-split.cpp
@@ -40,14 +40,11 @@
 
 #include <expat.h>
 
-#include <boost/filesystem.hpp>
-
 #include "../../application/command_line_options.h"
+#include "../../io/impl/filesystem.h"
 #include "../../xpath/xpath.h"
 #include "expat_util.h"
 
-namespace FS = boost::filesystem;
-
 #define CMDNAME "xml-split"
 
 static unsigned TOTAL_MAX = std::numeric_limits<unsigned>::max() - 1;
@@ -190,14 +187,14 @@ output_wrapper::start()
     
     if (0 == _total_count)
     {
-        if (FS::exists(oss.str()))
+        if (comma::filesystem::exists(oss.str()))
         {
             std::cerr << CMDNAME ": Error: Output Directory Name '" << oss.str() << "' Already Exists on Filesystem. Abort!" << std::endl;
             exit(1);
         }
         else
         {
-            if (! FS::create_directory(oss.str()))
+            if (! comma::filesystem::create_directory(oss.str()))
             {
                 std::cerr << CMDNAME ": Error: Could not Create Output Directory '" << oss.str() << "'. Abort!" << std::endl;
                 return _destination;

From 0415bd4cb4f2a05e5ea356a3726bc5d249da0267 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 7 May 2024 12:59:37 +1000
Subject: [PATCH 0786/1056] string: split_head() and split_tail(): first cut
 implemented; basic unit test added

---
 string/split.cpp            | 59 +++++++++++++++++++++++++++++++++----
 string/split.h              |  8 +++--
 string/test/string_test.cpp | 42 ++++++++++++++++++++++++++
 3 files changed, 102 insertions(+), 7 deletions(-)

diff --git a/string/split.cpp b/string/split.cpp
index 579c98cfa..a2a6c420c 100644
--- a/string/split.cpp
+++ b/string/split.cpp
@@ -4,11 +4,11 @@
 /// @author mathew hounsell
 
 #include <boost/optional.hpp>
-
-// Don't use <> foc comma as that requires the code to be installed first.
 #include "../base/exception.h"
 #include "split.h"
 
+#include <iostream>
+
 namespace comma {
 
 bool string::is_one_of( char c, const char * characters )
@@ -17,7 +17,7 @@ bool string::is_one_of( char c, const char * characters )
     return false;
 }
 
-std::vector< std::string > split( const std::string & s, const char * separators, bool empty_if_empty_input )
+static std::vector< std::string > split_impl( const std::string & s, const char * separators, bool empty_if_empty_input, unsigned int size, bool head )
 {
     std::vector< std::string > v;
     if( empty_if_empty_input && s.empty() ) { return v; }
@@ -26,9 +26,36 @@ std::vector< std::string > split( const std::string & s, const char * separators
     v.push_back( std::string() );
     for( const char* p = begin; p < end; ++p )
     {
-        if( string::is_one_of( *p, separators ) ) { v.push_back( std::string() ); } else { v.back() += *p; }
+        if( string::is_one_of( *p, separators ) )
+        {
+            v.push_back( std::string() );
+        }
+        else
+        {
+            v.back() += *p;
+        }
     }
-    return v;
+    if( size == 0 || v.size() <= size ) { return v; }
+    std::vector< std::string > r( size );
+    if( head ) // quick and dirty for now
+    {
+        unsigned int sum{0};
+        for( unsigned int i = 0; i < size; ++i ) { r[i] = v[i]; sum += v[i].size() + 1; }
+        r.back() += std::string( s.substr( sum - 1 ) );
+    }
+    else
+    {
+        unsigned int sum{0}, k{0};
+        for( unsigned int i = 0; i < v.size() - size + 1; ++i ) { sum += v[i].size() + 1; ++k; }
+        r[0] = s.substr( 0, sum - 1 );
+        for( unsigned int i = 1; i < size; ++i ) { r[i] = v[k + i - 1]; }
+    }
+    return r;
+}
+
+std::vector< std::string > split( const std::string & s, const char * separators, bool empty_if_empty_input )
+{
+    return split_impl( s, separators, empty_if_empty_input, 0, true ); 
 }
 
 std::vector< std::string > split( const std::string & s, char separator, bool empty_if_empty_input )
@@ -37,6 +64,28 @@ std::vector< std::string > split( const std::string & s, char separator, bool em
     return split( s, separators, empty_if_empty_input );
 }
 
+std::vector< std::string > split_head( const std::string& s, unsigned int size, const char* separators, bool empty_if_empty_input )
+{
+    return split_impl( s, separators, empty_if_empty_input, size, true ); 
+}
+
+std::vector< std::string > split_head( const std::string& s, unsigned int size, char separator, bool empty_if_empty_input )
+{
+    const char separators[] = { separator, 0 };
+    return split_head( s, size, separators, empty_if_empty_input );
+}
+
+std::vector< std::string > split_tail( const std::string& s, unsigned int size, const char* separators, bool empty_if_empty_input )
+{
+    return split_impl( s, separators, empty_if_empty_input, size, false ); 
+}
+
+std::vector< std::string > split_tail( const std::string& s, unsigned int size, char separator, bool empty_if_empty_input )
+{
+    const char separators[] = { separator, 0 };
+    return split_tail( s, size, separators, empty_if_empty_input );
+}
+
 std::vector< std::string > split_escaped( const std::string & s, const char * separators, const char * quotes, char escape )
 {
     std::vector< std::string > v;
diff --git a/string/split.h b/string/split.h
index ea578625e..629e5645e 100644
--- a/string/split.h
+++ b/string/split.h
@@ -21,9 +21,13 @@ bool is_one_of( char c, const char* characters );
 
 /// split string into tokens (a quick implementation); always contains at least one element unless empty_if_empty_input is true
 std::vector< std::string > split( const std::string& s, const char* separators = " ", bool empty_if_empty_input = false );
-
-/// split string into tokens (a quick implementation); always contains at least one element unless empty_if_empty_input is true
 std::vector< std::string > split( const std::string& s, char separator, bool empty_if_empty_input = false );
+/// split to up to <size> elements starting from the start of the string
+std::vector< std::string > split_head( const std::string& s, unsigned int size, const char* separators = " ", bool empty_if_empty_input = false );
+std::vector< std::string > split_head( const std::string& s, unsigned int size, char separator, bool empty_if_empty_input = false );
+/// split to up to <size> elements starting from the end of the string
+std::vector< std::string > split_tail( const std::string& s, unsigned int size, const char* separators = " ", bool empty_if_empty_input = false );
+std::vector< std::string > split_tail( const std::string& s, unsigned int size, char separator, bool empty_if_empty_input = false );
 
 /// split string into tokens and cast to a vector of given types
 template < typename T > std::vector< T > split_as( const std::string& s, const char* separators );
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index ce987b63c..b37dd6603 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -56,6 +56,23 @@ TEST( string, join )
     }
 }
 
+static inline void make_vector_impl( std::vector< std::string >& v ) {}
+
+template < typename T, typename... Args >
+static inline void make_vector_impl( std::vector< std::string >& v, T arg, Args... args )
+{
+    v.push_back( arg );
+    make_vector_impl( v, args... );
+}
+
+template < typename... Args >
+static inline std::vector< std::string > make_vector( Args... args )
+{
+    std::vector< std::string > v;
+    make_vector_impl( v, args... );
+    return v;
+}
+
 TEST( string, split )
 {
     {
@@ -97,6 +114,31 @@ TEST( string, split )
         EXPECT_TRUE( v.size() == 4 );
         for( unsigned int i = 0; i < 4; ++i ) { EXPECT_TRUE( v.at(i) == "" ); }
     }
+    {
+        EXPECT_EQ( split_head( "",              1, ',', true ), std::vector< std::string >() );
+        EXPECT_EQ( split_head( "",              5, ',', true ), std::vector< std::string >() );
+        EXPECT_EQ( split_head( "a",             1, ',', true ), make_vector( "a" ) );
+        EXPECT_EQ( split_head( "abc",           1, ',', true ), make_vector( "abc" ) );
+        EXPECT_EQ( split_head( "a,b",           1, ',', true ), make_vector( "a,b" ) );
+        EXPECT_EQ( split_head( "ab,cd",         1, ',', true ), make_vector( "ab,cd" ) );
+        EXPECT_EQ( split_head( "a,b",           2, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_head( "a,b",           2, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_head( "a,b",           3, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_head( "a,b,c,d,e,f,g", 5, ',', true ), make_vector( "a", "b", "c", "d", "e,f,g" ) );
+    }
+    {
+        EXPECT_EQ( split_tail( "",              1, ',', true ), std::vector< std::string >() );
+        EXPECT_EQ( split_tail( "",              5, ',', true ), std::vector< std::string >() );
+        EXPECT_EQ( split_tail( "a",             1, ',', true ), make_vector( "a" ) );
+        EXPECT_EQ( split_tail( "abc",           1, ',', true ), make_vector( "abc" ) );
+        EXPECT_EQ( split_tail( "a,b",           1, ',', true ), make_vector( "a,b" ) );
+        EXPECT_EQ( split_tail( "ab,cd",         1, ',', true ), make_vector( "ab,cd" ) );
+        EXPECT_EQ( split_tail( "a,b",           2, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_tail( "a,b",           2, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_tail( "a,b",           3, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_tail( "a,b,c,d,e,f",   5, ',', true ), make_vector( "a,b", "c", "d", "e", "f" ) );
+        EXPECT_EQ( split_tail( "a,b,c,d,e,f,g", 5, ',', true ), make_vector( "a,b,c", "d", "e", "f", "g" ) );
+    }
 }
 
 TEST( string, split_as )

From 2e4b8d6c34d3a83ee17f8f219832261509b83929 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 7 May 2024 13:20:06 +1000
Subject: [PATCH 0787/1056] string: split: unnecessary include removed

---
 string/split.cpp | 2 --
 1 file changed, 2 deletions(-)

diff --git a/string/split.cpp b/string/split.cpp
index a2a6c420c..71ca2d7af 100644
--- a/string/split.cpp
+++ b/string/split.cpp
@@ -7,8 +7,6 @@
 #include "../base/exception.h"
 #include "split.h"
 
-#include <iostream>
-
 namespace comma {
 
 bool string::is_one_of( char c, const char * characters )

From 9343aeaaf85b3d729dd044b6c0406bfc1df8acd1 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 13 May 2024 12:59:49 +1000
Subject: [PATCH 0788/1056] cyclic_buffer::data() implemented

---
 containers/cyclic_buffer.h | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/containers/cyclic_buffer.h b/containers/cyclic_buffer.h
index 5490ff320..4b1d7128c 100644
--- a/containers/cyclic_buffer.h
+++ b/containers/cyclic_buffer.h
@@ -64,6 +64,12 @@ class cyclic_buffer
         
         /// clear
         void clear();
+
+        /// accessor to underlying data
+        const std::vector< T >& data() const { return vector_; }
+
+        /// accessor to underlying data
+        std::vector< T >& data() { return vector_; }
         
     protected:
         std::vector< T > vector_;

From 14a929fcf4f25a002f5b18920bcace7919acd86a Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 13 May 2024 14:53:17 +1000
Subject: [PATCH 0789/1056] containers: cyclic_buffer::push( ..., force )
 implemented

---
 containers/cyclic_buffer.h             | 43 ++++++++++++--------------
 containers/test/cyclic_buffer_test.cpp | 26 ++++++++++++++--
 2 files changed, 43 insertions(+), 26 deletions(-)

diff --git a/containers/cyclic_buffer.h b/containers/cyclic_buffer.h
index 4b1d7128c..bfdbc45a9 100644
--- a/containers/cyclic_buffer.h
+++ b/containers/cyclic_buffer.h
@@ -21,54 +21,41 @@ template < typename T >
 class cyclic_buffer
 {
     public:
-        /// constructor
         cyclic_buffer( std::size_t size, const T& t = T() );
         
-        /// copy constructor
         cyclic_buffer( const cyclic_buffer& rhs ) { operator=( rhs ); }
         
-        /// assignment
         const cyclic_buffer& operator=( const cyclic_buffer& rhs );
         
-        /// return front
         T& front();
         
-        /// return front
         const T& front() const;
         
-        /// return back
         T& back();
         
-        /// return back
-        
         const T& back() const;
+
+        std::size_t front_index() const { return begin_(); }
+
+        std::size_t end_index() const { return end_(); }
         
-        /// push a new element at the end of the list
-        void push( const T& t );
+        void push( const T& t, bool force = false );
         
-        /// push a new element at the end of the list
         template < typename Iterator >
-        void push( Iterator begin, Iterator end );
+        void push( Iterator begin, Iterator end, bool force = false );
         
-        /// pop the new element at the front of the list
         void pop( std::size_t n = 1 );
         
-        /// return current size
         std::size_t size() const;
         
-        /// return capacity
         std::size_t capacity() const;
         
-        /// return true, if empty
         bool empty() const;
         
-        /// clear
         void clear();
 
-        /// accessor to underlying data
         const std::vector< T >& data() const { return vector_; }
 
-        /// accessor to underlying data
         std::vector< T >& data() { return vector_; }
         
     protected:
@@ -150,19 +137,27 @@ template < typename T >
 inline std::size_t cyclic_buffer< T >::capacity() const { return vector_.size(); }
 
 template < typename T >
-inline void cyclic_buffer< T >::push( const T& t )
+inline void cyclic_buffer< T >::push( const T& t, bool force )
 {
-    if( size() == vector_.size() ) { COMMA_THROW( comma::exception, "full" ); }
-    vector_[ end_() ] = t;
+    if( size() == vector_.size() )
+    { 
+        if( !force ) { COMMA_THROW( comma::exception, "full" ); }
+        vector_[ begin_() ] = t;
+        ++begin_;
+    }
+    else
+    {
+        vector_[ end_() ] = t;
+    }
     ++end_;
     empty_ = false;
 }
 
 template < typename T >
 template < typename Iterator >
-inline void cyclic_buffer< T >::push( Iterator begin, Iterator end )
+inline void cyclic_buffer< T >::push( Iterator begin, Iterator end, bool force )
 {
-    for( Iterator it = begin; it != end; ++it ) { push( *it ); }
+    for( Iterator it = begin; it != end; ++it ) { push( *it, force ); }
 }
 
 template < typename T >
diff --git a/containers/test/cyclic_buffer_test.cpp b/containers/test/cyclic_buffer_test.cpp
index 29eb69e8e..cc12f841d 100644
--- a/containers/test/cyclic_buffer_test.cpp
+++ b/containers/test/cyclic_buffer_test.cpp
@@ -29,6 +29,7 @@
 
 
 #include <gtest/gtest.h>
+#include "../../base/exception.h"
 #include "../cyclic_buffer.h"
 
 namespace comma {
@@ -82,8 +83,7 @@ TEST( cyclic_buffer, push_pop )
         EXPECT_EQ( b.size(), 4 - i );
     }
     EXPECT_TRUE( b.empty() );
-    EXPECT_EQ( b.size(), 0u );    
-    
+    EXPECT_EQ( b.size(), 0u );
     for( unsigned int i = 0; i < 5u; ++i )
     {
         b.push( i );
@@ -92,6 +92,28 @@ TEST( cyclic_buffer, push_pop )
     EXPECT_EQ( b.size(), 1u );    
 }
 
+TEST( cyclic_buffer, push_force )
+{
+    cyclic_buffer< unsigned int > b( 3 );
+    b.push( 0 );
+    b.push( 1 );
+    b.push( 2 );
+    EXPECT_EQ( b.front(), 0 );
+    EXPECT_EQ( b.back(), 2 );
+    EXPECT_THROW( b.push( 3 ), comma::exception );
+    b.push( 3, true );
+    EXPECT_EQ( b.front(), 1 );
+    EXPECT_EQ( b.back(), 3 );
+    EXPECT_THROW( b.push( 4 ), comma::exception );
+    b.push( 4, true );
+    EXPECT_EQ( b.front(), 2 );
+    EXPECT_EQ( b.back(), 4 );
+    EXPECT_THROW( b.push( 5 ), comma::exception );
+    b.push( 5, true );
+    EXPECT_EQ( b.front(), 3 );
+    EXPECT_EQ( b.back(), 5 );
+}
+
 TEST( cyclic_buffer, fixed_cyclic_buffer )
 {
     fixed_cyclic_buffer< unsigned int, 3 > b;

From 512c1fd2f59880253f95420422e49b4cd2e3d0d0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 14 May 2024 21:18:45 +1000
Subject: [PATCH 0790/1056] base: variant: in progress...

---
 base/test/base_test.cpp | 37 ++++++++++++++++++++++
 base/variant.h          | 68 +++++++++++++++++++++++++++++++++++++++++
 2 files changed, 105 insertions(+)
 create mode 100644 base/variant.h

diff --git a/base/test/base_test.cpp b/base/test/base_test.cpp
index ea78c602c..7105b1696 100644
--- a/base/test/base_test.cpp
+++ b/base/test/base_test.cpp
@@ -1,6 +1,7 @@
 // Copyright (c) 2023 Vsevolod Vlaskine
 
 #include "../exception.h"
+#include "../variant.h"
 #include <gtest/gtest.h>
 
 namespace comma {
@@ -17,6 +18,42 @@ TEST( base, exception )
     EXPECT_THROW( COMMA_THROW_IF( 2 * 2 == 4, "all bad" ), comma::exception );
 }
 
+TEST( base, variant )
+{
+    {
+        comma::impl::variant< int, float, double > v;
+        v.t = 1;
+        v.values.t = 2;
+        v.values.values.t = 3;
+    }
+    {
+        comma::impl::variant< int, float, double > v;
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< int >( 5 );
+        EXPECT_EQ( *v.t, 5 );
+        EXPECT_TRUE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< float >( 5 );
+        EXPECT_EQ( *v.values.t, 5 );
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_TRUE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< double >( 5 );
+        EXPECT_EQ( *v.values.values.t, 5 );
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_TRUE( v.is< double >() );
+        v.set< int >( 5 );
+        EXPECT_EQ( *v.t, 5 );
+        EXPECT_TRUE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+    }
+}
+
 } // namespace comma {
 
 int main( int argc, char* argv[] )
diff --git a/base/variant.h b/base/variant.h
new file mode 100644
index 000000000..8dfdec3b5
--- /dev/null
+++ b/base/variant.h
@@ -0,0 +1,68 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+// todo
+// #if __cplusplus >= 201703L
+// #include <optional>
+// #else
+// #include <boost/optional.hpp>
+// #endif
+#include <type_traits>
+#include <boost/optional.hpp>
+
+namespace comma {
+
+// todo
+//   ? use tuple instead?
+//   - check that types don't repeat
+
+namespace impl {
+
+template < typename T, bool B > struct variant_traits
+{
+    template < typename S > static void set( boost::optional< T >& t, const S& ) { t.reset(); }
+    template < typename S > static void set( boost::optional< T >& t, const boost::optional< S >& ) { t.reset(); }
+};
+
+template < typename T > struct variant_traits< T, true >
+{
+    template < typename S > static void set( boost::optional< T >& t, const S& s ) { t = s; }
+    template < typename S > static void set( boost::optional< T >& t, const boost::optional< S >& s ) { t = s; }
+};
+
+template < typename T, typename... Args > struct variant  // todo? use tuple instead?
+{
+    boost::optional< T > t;
+    variant< Args... > values;
+ 
+    template < typename S > bool is() const { return ( std::is_same< T, S >::value && bool( t ) ) || values.template is< S >(); }
+    operator bool() const { return bool( t ) || bool( values ); }
+    template < typename S > void set( const S& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); values.set( s ); }
+    template < typename S > void set( const boost::optional< S >& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); values.set( s ); }
+};
+
+template < typename T > struct variant< T >  // todo? use tuple instead?
+{
+    boost::optional< T > t;
+
+    template < typename S > bool is() const { return std::is_same< T, S >::value && bool( t ); }
+    operator bool() const { return bool( t ); }
+    template < typename S > void set( const S& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); }
+    template < typename S > void set( const boost::optional< S >& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); }
+};
+
+} // namespace impl {
+
+template < typename... Args >
+class variant
+{
+    public:
+        // todo
+    private:
+        impl::variant< Args... > _values;
+};
+
+} // namespace comma {

From 4327923a72dbad22c788b15d10046b86792fa324 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 14 May 2024 21:52:26 +1000
Subject: [PATCH 0791/1056] base: variant: first cut implemented and tested;
 todo: traits...

---
 base/test/base_test.cpp | 43 +++++++++++++++++++++++++++++++++++++++++
 base/variant.h          | 24 ++++++++++++++++++++---
 2 files changed, 64 insertions(+), 3 deletions(-)

diff --git a/base/test/base_test.cpp b/base/test/base_test.cpp
index 7105b1696..704eafb53 100644
--- a/base/test/base_test.cpp
+++ b/base/test/base_test.cpp
@@ -52,6 +52,49 @@ TEST( base, variant )
         EXPECT_FALSE( v.is< float >() );
         EXPECT_FALSE( v.is< double >() );
     }
+    {
+        comma::variant< int, float, double > v;
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< int >( 5 );
+        EXPECT_EQ( v.get< int >(), 5 );
+        EXPECT_TRUE( v.optional< int >() );
+        EXPECT_FALSE( v.optional< float >() );
+        EXPECT_FALSE( v.optional< double >() );
+        EXPECT_EQ( *v.optional< int >(), 5 );
+        EXPECT_TRUE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< float >( 5 );
+        EXPECT_EQ( v.get< float >(), 5 );
+        EXPECT_FALSE( v.optional< int >() );
+        EXPECT_TRUE( v.optional< float >() );
+        EXPECT_FALSE( v.optional< double >() );
+        EXPECT_EQ( *v.optional< float >(), 5 );
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_TRUE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< double >( 5 );
+        EXPECT_EQ( v.get< double >(), 5 );
+        EXPECT_FALSE( v.optional< int >() );
+        EXPECT_FALSE( v.optional< float >() );
+        EXPECT_TRUE( v.optional< double >() );
+        EXPECT_EQ( *v.optional< double >(), 5 );
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_TRUE( v.is< double >() );
+        v.set< int >( 5 );
+        EXPECT_EQ( v.get< int >(), 5 );
+        EXPECT_TRUE( v.optional< int >() );
+        EXPECT_FALSE( v.optional< float >() );
+        EXPECT_FALSE( v.optional< double >() );
+        EXPECT_TRUE( bool( v ) ); // never dereference optional< float >() here: it was just asserted empty, so operator* would be undefined behaviour
+        EXPECT_EQ( *v.optional< int >(), 5 );
+        EXPECT_TRUE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+    }
 }
 
 } // namespace comma {
diff --git a/base/variant.h b/base/variant.h
index 8dfdec3b5..b3bfc263e 100644
--- a/base/variant.h
+++ b/base/variant.h
@@ -18,30 +18,41 @@ namespace comma {
 // todo
 //   ? use tuple instead?
 //   - check that types don't repeat
+//   - visiting traits
 
 namespace impl {
 
-template < typename T, bool B > struct variant_traits
+struct type_is_not_on_type_list{}; // quick and dirty, a tag struct
+
+template < typename T, bool B > struct variant_traits;
+
+template < typename T > struct variant_traits< T, false >
 {
     template < typename S > static void set( boost::optional< T >& t, const S& ) { t.reset(); }
     template < typename S > static void set( boost::optional< T >& t, const boost::optional< S >& ) { t.reset(); }
+    template < typename S, typename V > static const S& get( const boost::optional< T >&, const V& v ) { return v.template get< S >(); }
+    template < typename S, typename V > static const boost::optional< S >& optional( const boost::optional< T >&, const V& v ) { return v.template optional< S >(); }
 };
 
 template < typename T > struct variant_traits< T, true >
 {
     template < typename S > static void set( boost::optional< T >& t, const S& s ) { t = s; }
     template < typename S > static void set( boost::optional< T >& t, const boost::optional< S >& s ) { t = s; }
+    template < typename S, typename V > static const S& get( const boost::optional< T >& t, const V& ) { return *t; }
+    template < typename S, typename V > static const boost::optional< S >& optional( const boost::optional< T >& t, const V& ) { return t; }
 };
 
 template < typename T, typename... Args > struct variant  // todo? use tuple instead?
 {
     boost::optional< T > t;
     variant< Args... > values;
- 
+
     template < typename S > bool is() const { return ( std::is_same< T, S >::value && bool( t ) ) || values.template is< S >(); }
     operator bool() const { return bool( t ) || bool( values ); }
     template < typename S > void set( const S& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); values.set( s ); }
     template < typename S > void set( const boost::optional< S >& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); values.set( s ); }
+    template < typename S > const S& get() const { return variant_traits< T, std::is_same< T, S >::value >::template get< S >( t, values ); }
+    template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, values ); }
 };
 
 template < typename T > struct variant< T >  // todo? use tuple instead?
@@ -52,6 +63,8 @@ template < typename T > struct variant< T >  // todo? use tuple instead?
     operator bool() const { return bool( t ); }
     template < typename S > void set( const S& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); }
     template < typename S > void set( const boost::optional< S >& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); }
+    template < typename S > const S& get() const { return variant_traits< T, std::is_same< T, S >::value >::template get< S >( t, type_is_not_on_type_list() ); }
+    template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, type_is_not_on_type_list() ); }
 };
 
 } // namespace impl {
@@ -60,7 +73,12 @@ template < typename... Args >
 class variant
 {
     public:
-        // todo
+        template < typename S > bool is() const { return _values.template is< S >(); }
+        operator bool() const { return bool( _values ); }
+        template < typename S > void set( const S& s ) { _values.set( s ); }
+        template < typename S > void set( const boost::optional< S >& s ) { _values.set( s ); }
+        template < typename S > const S& get() const { return _values.template get< S >(); }
+        template < typename S > const boost::optional< S >& optional() const { return _values.template optional< S >(); }
     private:
         impl::variant< Args... > _values;
 };

From 802e6f3c1402194b17b54e3fd17015ab052cf0d4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 14 May 2024 21:58:35 +1000
Subject: [PATCH 0792/1056] base: variant: traits: in progress...

---
 visiting/traits.h | 30 ++++++++++++++++++++++++++++++
 1 file changed, 30 insertions(+)

diff --git a/visiting/traits.h b/visiting/traits.h
index d8ecdcaac..4fff090d7 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -20,6 +20,7 @@
 #include <boost/array.hpp>
 #include "../base/none.h"
 #include "../base/optional.h"
+#include "../base/variant.h"
 
 namespace comma { namespace visiting {
 
@@ -70,6 +71,35 @@ struct traits< comma::optional< T > >
     }    
 };
 
+template < typename T, typename... Args >
+struct traits< comma::variant< T, Args... > >
+{
+    template < typename K, typename V > static void visit( const K& key, comma::variant< T, Args... >& t, V& v )
+    {
+        // todo
+    }
+    
+    template < typename K, typename V > static void visit( const K& key, const comma::variant< T, Args... >& t, V& v )
+    {
+        // todo
+    }    
+};
+
+//template < typename T > struct variant< T >
+template < typename T >
+struct traits< comma::variant< T > >
+{
+    template < typename K, typename V > static void visit( const K& key, comma::variant< T >& t, V& v )
+    {
+        // todo
+    }
+    
+    template < typename K, typename V > static void visit( const K& key, const comma::variant< T >& t, V& v )
+    {
+        // todo
+    }    
+};
+
 template < typename T >
 struct traits< std::complex< T > >
 {

From 1289981b20e20b130a6c5db542e995d202a65dcb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 14 May 2024 22:08:57 +1000
Subject: [PATCH 0793/1056] base: variant: traits: in progress...

---
 visiting/traits.h | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/visiting/traits.h b/visiting/traits.h
index 4fff090d7..8237a609b 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -81,11 +81,10 @@ struct traits< comma::variant< T, Args... > >
     
     template < typename K, typename V > static void visit( const K& key, const comma::variant< T, Args... >& t, V& v )
     {
-        // todo
+        if( t.template is< T >() ) { traits< T >::visit( key, t.template get< T >(), v ); }
     }    
 };
 
-//template < typename T > struct variant< T >
 template < typename T >
 struct traits< comma::variant< T > >
 {
@@ -96,7 +95,7 @@ struct traits< comma::variant< T > >
     
     template < typename K, typename V > static void visit( const K& key, const comma::variant< T >& t, V& v )
     {
-        // todo
+        if( t.template is< T >() ) { traits< T >::visit( key, t.template get< T >(), v ); }
     }    
 };
 

From 3ba697e82090a73b47cbd282371a69181f5386e4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 14 May 2024 22:10:59 +1000
Subject: [PATCH 0794/1056] base: variant: traits: in progress...

---
 visiting/traits.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/visiting/traits.h b/visiting/traits.h
index 8237a609b..47fa670a0 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -81,7 +81,7 @@ struct traits< comma::variant< T, Args... > >
     
     template < typename K, typename V > static void visit( const K& key, const comma::variant< T, Args... >& t, V& v )
     {
-        if( t.template is< T >() ) { traits< T >::visit( key, t.template get< T >(), v ); }
+        // todo if( t.template is< T >() ) { traits< T >::visit( key, t.template get< T >(), v ); }
     }    
 };
 
@@ -95,7 +95,7 @@ struct traits< comma::variant< T > >
     
     template < typename K, typename V > static void visit( const K& key, const comma::variant< T >& t, V& v )
     {
-        if( t.template is< T >() ) { traits< T >::visit( key, t.template get< T >(), v ); }
+        // if( t.template is< T >() ) { traits< T >::visit( key, t.template get< T >(), v ); }
     }    
 };
 

From e9c6acb619d8bb40fe108ae89b90083b4e79d9e1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 14 May 2024 23:34:16 +1000
Subject: [PATCH 0795/1056] base: variant: visiting traits implemented;
 debugging and testing...

---
 base/variant.h    |  4 +++
 visiting/traits.h | 62 ++++++++++++++++++++++++++++++++++++++---------
 2 files changed, 54 insertions(+), 12 deletions(-)

diff --git a/base/variant.h b/base/variant.h
index b3bfc263e..e50dcd43e 100644
--- a/base/variant.h
+++ b/base/variant.h
@@ -53,6 +53,7 @@ template < typename T, typename... Args > struct variant  // todo? use tuple ins
     template < typename S > void set( const boost::optional< S >& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); values.set( s ); }
     template < typename S > const S& get() const { return variant_traits< T, std::is_same< T, S >::value >::template get< S >( t, values ); }
     template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, values ); }
+    void reset() { t.reset(); values.reset(); }
 };
 
 template < typename T > struct variant< T >  // todo? use tuple instead?
@@ -65,6 +66,7 @@ template < typename T > struct variant< T >  // todo? use tuple instead?
     template < typename S > void set( const boost::optional< S >& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); }
     template < typename S > const S& get() const { return variant_traits< T, std::is_same< T, S >::value >::template get< S >( t, type_is_not_on_type_list() ); }
     template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, type_is_not_on_type_list() ); }
+    void reset() { t.reset(); }
 };
 
 } // namespace impl {
@@ -73,12 +75,14 @@ template < typename... Args >
 class variant
 {
     public:
+        // todo: template constructor
         template < typename S > bool is() const { return _values.template is< S >(); }
         operator bool() const { return bool( _values ); }
         template < typename S > void set( const S& s ) { _values.set( s ); }
         template < typename S > void set( const boost::optional< S >& s ) { _values.set( s ); }
         template < typename S > const S& get() const { return _values.template get< S >(); }
         template < typename S > const boost::optional< S >& optional() const { return _values.template optional< S >(); }
+        void reset() { _values.reset(); }
     private:
         impl::variant< Args... > _values;
 };
diff --git a/visiting/traits.h b/visiting/traits.h
index 47fa670a0..7870c69a7 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -18,6 +18,7 @@
 #include <unordered_set>
 #include <vector>
 #include <boost/array.hpp>
+#include "../base/exception.h"
 #include "../base/none.h"
 #include "../base/optional.h"
 #include "../base/variant.h"
@@ -71,32 +72,69 @@ struct traits< comma::optional< T > >
     }    
 };
 
-template < typename T, typename... Args >
-struct traits< comma::variant< T, Args... > >
+template < typename... Args >
+struct traits< comma::variant< Args... > > // todo? should it be in the visitors instead?
 {
-    template < typename K, typename V > static void visit( const K& key, comma::variant< T, Args... >& t, V& v )
+    typedef comma::variant< Args... > variant_t;
+
+    template < typename S, Args... > struct _variant_traits // todo
+    {
+        template < typename K, typename V > void _visit( const K& key, variant_t& t, V& v, bool is_set )
+        {
+            boost::optional< S > s = t.template optional< S >();
+            v.apply( key, s );
+            COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+            if( s ) { t.set( s ); }
+            _variant_traits< Args... >::_visit( key, t, v, bool( s ) );
+        }
+        template < typename K, typename V > void _visit( const K& key, const variant_t& t, V& v )
+        {
+            const boost::optional< S >& s = t.template optional< S >();
+            if( s ) { v.apply( key, *s ); } else { _variant_traits< Args... >::_visit( key, t, v ); }
+        }
+    };
+
+    template < typename K, typename V > static void visit( const K& key, variant_t& t, V& v )
     {
-        // todo
+        _variant_traits< Args... >::visit( key, t, v, false );
     }
     
-    template < typename K, typename V > static void visit( const K& key, const comma::variant< T, Args... >& t, V& v )
+    template < typename K, typename V > static void visit( const K& key, const variant_t& t, V& v )
     {
-        // todo if( t.template is< T >() ) { traits< T >::visit( key, t.template get< T >(), v ); }
-    }    
+        _variant_traits< Args... >::visit( key, t, v );
+    }
 };
 
 template < typename T >
 struct traits< comma::variant< T > >
 {
-    template < typename K, typename V > static void visit( const K& key, comma::variant< T >& t, V& v )
+    typedef comma::variant< T > variant_t;
+
+    template < typename S > struct _variant_traits // todo
+    {
+        template < typename K, typename V > void _visit( const K& key, variant_t& t, V& v, bool is_set )
+        {
+            boost::optional< S > s = t.template optional< S >();
+            v.apply( key, s );
+            COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+            if( s ) { t.set( s ); }
+        }
+        template < typename K, typename V > void _visit( const K& key, const variant_t& t, V& v )
+        {
+            const boost::optional< S >& s = t.template optional< S >();
+            if( s ) { v.apply( key, *s ); }
+        }
+    };
+
+    template < typename K, typename V > static void visit( const K& key, variant_t& t, V& v )
     {
-        // todo
+        _variant_traits< T >::visit( key, t, v, false );
     }
     
-    template < typename K, typename V > static void visit( const K& key, const comma::variant< T >& t, V& v )
+    template < typename K, typename V > static void visit( const K& key, const variant_t& t, V& v )
     {
-        // if( t.template is< T >() ) { traits< T >::visit( key, t.template get< T >(), v ); }
-    }    
+        _variant_traits< T >::visit( key, t, v );
+    }
 };
 
 template < typename T >

From 7497a3f552f940e47a8c05479a662300bda6ae39 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 14 May 2024 23:56:27 +1000
Subject: [PATCH 0796/1056] base: variant: constructors implemented; debugging
 and testing...

---
 base/variant.h | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/base/variant.h b/base/variant.h
index e50dcd43e..c437f55f6 100644
--- a/base/variant.h
+++ b/base/variant.h
@@ -75,7 +75,8 @@ template < typename... Args >
 class variant
 {
     public:
-        // todo: template constructor
+        variant() = default;
+        template < typename S > variant( const S& s ) { set( s ); }
         template < typename S > bool is() const { return _values.template is< S >(); }
         operator bool() const { return bool( _values ); }
         template < typename S > void set( const S& s ) { _values.set( s ); }

From 1d2725a66e81c7fb051bb8f09b5643db87ab9bee Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 15 May 2024 13:09:33 +1000
Subject: [PATCH 0797/1056] base: named_variant: implemented; visiting traits
 implemented; unit test: in progress...

---
 base/variant.h                     | 16 +++++-
 name_value/test/serialise_test.cpp | 91 +++++++++++++++++++++++++++++
 visiting/traits.h                  | 92 ++++++++++++++++++++++++++++--
 visiting/visit.h                   |  8 +--
 4 files changed, 193 insertions(+), 14 deletions(-)

diff --git a/base/variant.h b/base/variant.h
index c437f55f6..b623620fc 100644
--- a/base/variant.h
+++ b/base/variant.h
@@ -18,7 +18,6 @@ namespace comma {
 // todo
 //   ? use tuple instead?
 //   - check that types don't repeat
-//   - visiting traits
 
 namespace impl {
 
@@ -84,8 +83,21 @@ class variant
         template < typename S > const S& get() const { return _values.template get< S >(); }
         template < typename S > const boost::optional< S >& optional() const { return _values.template optional< S >(); }
         void reset() { _values.reset(); }
-    private:
+    protected:
         impl::variant< Args... > _values;
 };
 
+template < typename Names, typename... Args >
+struct named_variant : public variant< Args... >, public Names
+{
+    typedef Names names_t;
+    typedef variant< Args... > variant_t;
+};
+
+template < typename Names >
+struct make_named_variant
+{
+    template < typename... Args > struct variant { typedef named_variant< Names, Args... > type; };
+};
+
 } // namespace comma {
diff --git a/name_value/test/serialise_test.cpp b/name_value/test/serialise_test.cpp
index a2f5c2276..a5ae4a828 100644
--- a/name_value/test/serialise_test.cpp
+++ b/name_value/test/serialise_test.cpp
@@ -29,6 +29,7 @@
 
 
 #include <gtest/gtest.h>
+#include "../../base/variant.h"
 #include "../../name_value/serialize.h"
 #include "../../visiting/traits.h"
 #include "../../xpath/xpath.h"
@@ -366,3 +367,93 @@ TEST( serialise, path_value )
 }
 
 } } } // namespace comma { namespace test { namespace serialise {
+
+struct forest
+{
+    struct chirp { int a{1}; int b{2}; };
+    struct whistle { int a{3}; int b{4}; };
+    struct warble { int x{5}; int y{6}; };
+
+    struct naming { static std::array< std::string, 3 > names() { return { "chirp", "whistle", "warble" }; } };
+
+    typedef comma::named_variant< naming, chirp, whistle, warble > variant_t;
+    comma::make_named_variant< naming >::variant< chirp, whistle, warble >::type madeup;
+    comma::named_variant< naming, chirp, whistle, warble > sound;
+    std::array< variant_t, 3 > sounds;
+};
+
+namespace comma { namespace visiting {
+
+template <> struct traits< forest::chirp >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest::chirp& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+    template < typename Key, class Visitor > static void visit( Key, const forest::chirp& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+};
+
+template <> struct traits< forest::whistle >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest::whistle& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+    template < typename Key, class Visitor > static void visit( Key, const forest::whistle& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+};
+
+template <> struct traits< forest::warble >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest::warble& t, Visitor& v ) { v.apply( "x", t.x ); v.apply( "y", t.y ); }
+    template < typename Key, class Visitor > static void visit( Key, const forest::warble& t, Visitor& v ) { v.apply( "x", t.x ); v.apply( "y", t.y ); }
+};
+
+template <> struct traits< forest >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest& t, Visitor& v )
+    {
+        v.apply( "madeup", t.madeup );
+        v.apply( "sound", t.sound );
+        v.apply( "sounds", t.sounds );
+    }
+    template < typename Key, class Visitor > static void visit( Key, const forest& t, Visitor& v )
+    {
+        v.apply( "madeup", t.madeup );
+        v.apply( "sound", t.sound );
+        v.apply( "sounds", t.sounds );
+    }
+};
+
+} } // namespace comma { namespace visiting {
+
+TEST( DISABLED_serialise, variant )
+{
+    forest f;
+    std::cerr << "=================================" << std::endl;
+
+
+    std::cerr << "=== chirp ===" << std::endl;
+
+    f.sound.set( forest::chirp() );
+    comma::write_json( f, std::cerr ); // comma::write_json( f, std::cerr, false );
+
+    std::cerr << std::endl;
+
+
+    std::cerr << "=== whistle ===" << std::endl;
+
+    f.sound.set( forest::whistle() );
+    f.madeup.set( forest::warble{555, 666} );
+    comma::write_json( f, std::cerr ); // comma::write_json( f, std::cerr, false );
+    
+    std::cerr << std::endl;
+
+
+    std::cerr << "=== warble ===" << std::endl;
+
+    f.sound.set( forest::warble() );
+    f.sounds[2].set( forest::whistle() );
+    f.madeup.reset();
+    comma::write_json( f, std::cerr ); // comma::write_json( f, std::cerr, false );
+    std::cerr << "-------------------" << std::endl;
+    comma::write_xml( f, std::cerr ); // comma::write_json( f, std::cerr, false );
+    std::cerr << "-------------------" << std::endl;
+    comma::write_path_value( f, std::cerr ); // comma::write_json( f, std::cerr, false );
+
+    std::cerr << std::endl;
+    std::cerr << "=================================" << std::endl;
+}
diff --git a/visiting/traits.h b/visiting/traits.h
index 7870c69a7..780b63c55 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -73,7 +73,7 @@ struct traits< comma::optional< T > >
 };
 
 template < typename... Args >
-struct traits< comma::variant< Args... > > // todo? should it be in the visitors instead?
+struct traits< comma::variant< Args... > > // todo? should it be in the visitors instead? todo!
 {
     typedef comma::variant< Args... > variant_t;
 
@@ -82,7 +82,7 @@ struct traits< comma::variant< Args... > > // todo? should it be in the visitors
         template < typename K, typename V > void _visit( const K& key, variant_t& t, V& v, bool is_set )
         {
             boost::optional< S > s = t.template optional< S >();
-            v.apply( key, s );
+            traits< boost::optional< S > >::visit( key, s, v );
             COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
             if( s ) { t.set( s ); }
             _variant_traits< Args... >::_visit( key, t, v, bool( s ) );
@@ -90,7 +90,7 @@ struct traits< comma::variant< Args... > > // todo? should it be in the visitors
         template < typename K, typename V > void _visit( const K& key, const variant_t& t, V& v )
         {
             const boost::optional< S >& s = t.template optional< S >();
-            if( s ) { v.apply( key, *s ); } else { _variant_traits< Args... >::_visit( key, t, v ); }
+            if( s ) { traits< S >::visit( key, *s, v ); } else { _variant_traits< Args... >::_visit( key, t, v ); }
         }
     };
 
@@ -115,14 +115,14 @@ struct traits< comma::variant< T > >
         template < typename K, typename V > void _visit( const K& key, variant_t& t, V& v, bool is_set )
         {
             boost::optional< S > s = t.template optional< S >();
-            v.apply( key, s );
+            traits< boost::optional< S > >::visit( key, s, v );
             COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
             if( s ) { t.set( s ); }
         }
         template < typename K, typename V > void _visit( const K& key, const variant_t& t, V& v )
         {
             const boost::optional< S >& s = t.template optional< S >();
-            if( s ) { v.apply( key, *s ); }
+            if( s ) { traits< S >::visit( key, *s, v ); }
         }
     };
 
@@ -137,6 +137,88 @@ struct traits< comma::variant< T > >
     }
 };
 
+template < typename Names, typename... NArgs >
+struct traits< comma::named_variant< Names, NArgs... > > // todo? should it be in the visitors instead?
+{
+    typedef comma::named_variant< Names, NArgs... > named_variant_t;
+    typedef comma::variant< NArgs... > variant_t;
+
+    template < typename S, typename... Args > struct _variant_traits // todo
+    {
+        template < typename V > static void visit( variant_t& t, V& v, unsigned int i, bool is_set )
+        {
+            boost::optional< S > s = t.template optional< S >();
+            v.apply( named_variant_t::names()[i], s );
+            COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+            if( s ) { t.set( s ); }
+            _variant_traits< Args... >::visit( t, v, ++i, bool( s ) );
+        }
+        template < typename V > static void visit( const variant_t& t, V& v, unsigned int i )
+        {
+            const boost::optional< S >& s = t.template optional< S >();
+            if( s ) { v.apply( named_variant_t::names()[i], *s ); } else { _variant_traits< Args... >::visit( t, v, ++i ); }
+        }
+    };
+
+    template < typename S > struct _variant_traits< S > // todo
+    {
+        template < typename V > static void visit( variant_t& t, V& v, bool is_set, unsigned int i )
+        {
+            boost::optional< S > s = t.template optional< S >();
+            v.apply( named_variant_t::names()[i], s );
+            COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+            if( s ) { t.set( s ); }
+        }
+        template < typename V > static void visit( const variant_t& t, V& v, unsigned int i )
+        {
+            const boost::optional< S >& s = t.template optional< S >();
+            if( s ) { v.apply( named_variant_t::names()[i], *s ); }
+        }
+    };
+
+    template < typename K, typename V > static void visit( const K&, named_variant_t& t, V& v )
+    {
+        _variant_traits< NArgs... >::visit( static_cast< variant_t& >( t ), v, 0, false );
+    }
+    
+    template < typename K, typename V > static void visit( const K& key, const named_variant_t& t, V& v )
+    {
+        _variant_traits< NArgs... >::visit( static_cast< const variant_t& >( t ), v, 0 );
+    }
+};
+
+// template < typename Names, typename T >
+// struct traits< comma::named_variant< T > >
+// {
+//     typedef typename comma::variant< T >::variant_t variant_t;
+
+//     template < typename S > struct _variant_traits // todo
+//     {
+//         template < typename K, typename V > void _visit( const K& key, variant_t& t, V& v, bool is_set, unsigned int i )
+//         {
+//             boost::optional< S > s = t.template optional< S >();
+//             v.apply( variant_t::names()[i], s );
+//             COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+//             if( s ) { t.set( s ); }
+//         }
+//         template < typename K, typename V > void _visit( const K& key, const variant_t& t, V& v, unsigned int i )
+//         {
+//             const boost::optional< S >& s = t.template optional< S >();
+//             if( s ) { v.apply( variant_t::names()[i], *s ); }
+//         }
+//     };
+
+//     template < typename K, typename V > static void visit( const K& key, variant_t& t, V& v )
+//     {
+//         _variant_traits< T >::visit( key, t, v, false );
+//     }
+    
+//     template < typename K, typename V > static void visit( const K& key, const variant_t& t, V& v )
+//     {
+//         _variant_traits< T >::visit( key, t, v );
+//     }
+// };
+
 template < typename T >
 struct traits< std::complex< T > >
 {
diff --git a/visiting/visit.h b/visiting/visit.h
index 09d23246b..f799b3ccf 100644
--- a/visiting/visit.h
+++ b/visiting/visit.h
@@ -27,24 +27,18 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_VISITING_VISIT_HEADER_GUARD_
-#define COMMA_VISITING_VISIT_HEADER_GUARD_
+#pragma once
 
 #include "traits.h"
 
 namespace comma { namespace visiting {
     
-/// visit
 template < typename K, typename T, typename V >
 inline void visit( const K& key, T& t, V& v ) { traits< T >::visit( key, t, v ); }
 
-/// visit const
 template < typename K, typename T, typename V >
 inline void visit( const K& key, const T& t, V& v ) { traits< T >::visit( key, t, v ); }
     
 } } // namespace comma { namespace visiting {
-
-#endif // COMMA_VISITING_VISIT_HEADER_GUARD_

From f6b05ed88680f8b3c56e5542c4d43a73142185e6 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 15 May 2024 15:06:41 +1000
Subject: [PATCH 0798/1056] name_value: test: basic named_variant test cases
 added

---
 name_value/test/serialise_test.cpp | 64 ++++++++++++++----------------
 1 file changed, 30 insertions(+), 34 deletions(-)

diff --git a/name_value/test/serialise_test.cpp b/name_value/test/serialise_test.cpp
index a5ae4a828..0eefeb736 100644
--- a/name_value/test/serialise_test.cpp
+++ b/name_value/test/serialise_test.cpp
@@ -420,40 +420,36 @@ template <> struct traits< forest >
 
 } } // namespace comma { namespace visiting {
 
-TEST( DISABLED_serialise, variant )
+TEST( serialise, variant )
 {
     forest f;
-    std::cerr << "=================================" << std::endl;
-
-
-    std::cerr << "=== chirp ===" << std::endl;
-
-    f.sound.set( forest::chirp() );
-    comma::write_json( f, std::cerr ); // comma::write_json( f, std::cerr, false );
-
-    std::cerr << std::endl;
-
-
-    std::cerr << "=== whistle ===" << std::endl;
-
-    f.sound.set( forest::whistle() );
-    f.madeup.set( forest::warble{555, 666} );
-    comma::write_json( f, std::cerr ); // comma::write_json( f, std::cerr, false );
-    
-    std::cerr << std::endl;
-
-
-    std::cerr << "=== warble ===" << std::endl;
-
-    f.sound.set( forest::warble() );
-    f.sounds[2].set( forest::whistle() );
-    f.madeup.reset();
-    comma::write_json( f, std::cerr ); // comma::write_json( f, std::cerr, false );
-    std::cerr << "-------------------" << std::endl;
-    comma::write_xml( f, std::cerr ); // comma::write_json( f, std::cerr, false );
-    std::cerr << "-------------------" << std::endl;
-    comma::write_path_value( f, std::cerr ); // comma::write_json( f, std::cerr, false );
-
-    std::cerr << std::endl;
-    std::cerr << "=================================" << std::endl;
+    {
+        std::ostringstream oss;
+        comma::write_json( f, oss, false );
+        EXPECT_EQ( oss.str(), "{}" );
+    }
+    {
+        f.sound.set( forest::chirp{11, 22} );
+        std::ostringstream oss;
+        comma::write_json( f, oss, false );
+        EXPECT_EQ( oss.str(), "{\"sound\":{\"chirp\":{\"a\":11,\"b\":22}}}" );
+    }
+    {
+        f.sound.set( forest::whistle{33, 44} );
+        std::ostringstream oss;
+        comma::write_json( f, oss, false );
+        EXPECT_EQ( oss.str(), "{\"sound\":{\"whistle\":{\"a\":33,\"b\":44}}}" );
+    }
+    {
+        f.sound.set( forest::warble{55, 66} );
+        std::ostringstream oss;
+        comma::write_json( f, oss, false );
+        EXPECT_EQ( oss.str(), "{\"sound\":{\"warble\":{\"x\":55,\"y\":66}}}" );
+    }
+    {
+        f.sound.reset();
+        std::ostringstream oss;
+        comma::write_json( f, oss, false );
+        EXPECT_EQ( oss.str(), "{}" );
+    }
 }

From f64015aa8c70caec869d22d138e882fdf6839afb Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 15 May 2024 15:09:23 +1000
Subject: [PATCH 0799/1056] base: variant, named_variant: basic usage examples
 added

---
 base/variant.h | 16 ++++++++++++++++
 1 file changed, 16 insertions(+)

diff --git a/base/variant.h b/base/variant.h
index b623620fc..0bc4548c4 100644
--- a/base/variant.h
+++ b/base/variant.h
@@ -70,6 +70,11 @@ template < typename T > struct variant< T >  // todo? use tuple instead?
 
 } // namespace impl {
 
+/// @example
+///     struct chirp { int a{1}; int b{2}; };
+///     struct whistle { int a{3}; int b{4}; };
+///     struct warble { int x{5}; int y{6}; };
+///     comma::named_variant< naming, chirp, whistle, warble > sound;
 template < typename... Args >
 class variant
 {
@@ -87,6 +92,17 @@ class variant
         impl::variant< Args... > _values;
 };
 
+/// @example
+///     struct forest
+///     {
+///         struct chirp { int a{1}; int b{2}; };
+///         struct whistle { int a{3}; int b{4}; };
+///         struct warble { int x{5}; int y{6}; };
+///
+///         struct naming { static std::array< std::string, 3 > names() { return { "chirp", "whistle", "warble" }; } };
+///
+///         comma::named_variant< naming, chirp, whistle, warble > sound;
+/// };
 template < typename Names, typename... Args >
 struct named_variant : public variant< Args... >, public Names
 {

From 153a9b4d3f1ee46abe5d4130d4de8a66c244b7cd Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 15 May 2024 18:08:52 +1000
Subject: [PATCH 0800/1056] visiting: traits: named_variant: typo fixed in
 non-const traits, basic unit tests added

---
 name_value/test/serialise_test.cpp | 71 ++++++++++++++++++++----------
 visiting/traits.h                  |  6 +--
 2 files changed, 51 insertions(+), 26 deletions(-)

diff --git a/name_value/test/serialise_test.cpp b/name_value/test/serialise_test.cpp
index 0eefeb736..f6911ec9c 100644
--- a/name_value/test/serialise_test.cpp
+++ b/name_value/test/serialise_test.cpp
@@ -370,51 +370,54 @@ TEST( serialise, path_value )
 
 struct forest
 {
-    struct chirp { int a{1}; int b{2}; };
-    struct whistle { int a{3}; int b{4}; };
-    struct warble { int x{5}; int y{6}; };
+    struct sounds
+    {
+        struct chirp { int a{1}; int b{2}; };
+        struct whistle { int a{3}; int b{4}; };
+        struct warble { int x{5}; int y{6}; };
+    };
 
     struct naming { static std::array< std::string, 3 > names() { return { "chirp", "whistle", "warble" }; } };
 
-    typedef comma::named_variant< naming, chirp, whistle, warble > variant_t;
-    comma::make_named_variant< naming >::variant< chirp, whistle, warble >::type madeup;
-    comma::named_variant< naming, chirp, whistle, warble > sound;
-    std::array< variant_t, 3 > sounds;
+    typedef comma::named_variant< naming, sounds::chirp, sounds::whistle, sounds::warble > variant_t;
+    comma::make_named_variant< naming >::variant< sounds::chirp, sounds::whistle, sounds::warble >::type madeup;
+    std::array< variant_t, 3 > choir;
+    comma::named_variant< naming, sounds::chirp, sounds::whistle, sounds::warble > sound;    
 };
 
 namespace comma { namespace visiting {
 
-template <> struct traits< forest::chirp >
+template <> struct traits< forest::sounds::chirp >
 {
-    template < typename Key, class Visitor > static void visit( Key, forest::chirp& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
-    template < typename Key, class Visitor > static void visit( Key, const forest::chirp& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+    template < typename Key, class Visitor > static void visit( Key, forest::sounds::chirp& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+    template < typename Key, class Visitor > static void visit( Key, const forest::sounds::chirp& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
 };
 
-template <> struct traits< forest::whistle >
+template <> struct traits< forest::sounds::whistle >
 {
-    template < typename Key, class Visitor > static void visit( Key, forest::whistle& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
-    template < typename Key, class Visitor > static void visit( Key, const forest::whistle& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+    template < typename Key, class Visitor > static void visit( Key, forest::sounds::whistle& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+    template < typename Key, class Visitor > static void visit( Key, const forest::sounds::whistle& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
 };
 
-template <> struct traits< forest::warble >
+template <> struct traits< forest::sounds::warble >
 {
-    template < typename Key, class Visitor > static void visit( Key, forest::warble& t, Visitor& v ) { v.apply( "x", t.x ); v.apply( "y", t.y ); }
-    template < typename Key, class Visitor > static void visit( Key, const forest::warble& t, Visitor& v ) { v.apply( "x", t.x ); v.apply( "y", t.y ); }
+    template < typename Key, class Visitor > static void visit( Key, forest::sounds::warble& t, Visitor& v ) { v.apply( "x", t.x ); v.apply( "y", t.y ); }
+    template < typename Key, class Visitor > static void visit( Key, const forest::sounds::warble& t, Visitor& v ) { v.apply( "x", t.x ); v.apply( "y", t.y ); }
 };
 
 template <> struct traits< forest >
 {
     template < typename Key, class Visitor > static void visit( Key, forest& t, Visitor& v )
     {
-        v.apply( "madeup", t.madeup );
+        v.apply( "madeup", t.madeup ); // todo
+        v.apply( "choir", t.choir ); // todo
         v.apply( "sound", t.sound );
-        v.apply( "sounds", t.sounds );
     }
     template < typename Key, class Visitor > static void visit( Key, const forest& t, Visitor& v )
     {
-        v.apply( "madeup", t.madeup );
+        v.apply( "madeup", t.madeup ); // todo
+        v.apply( "choir", t.choir ); // todo
         v.apply( "sound", t.sound );
-        v.apply( "sounds", t.sounds );
     }
 };
 
@@ -429,19 +432,19 @@ TEST( serialise, variant )
         EXPECT_EQ( oss.str(), "{}" );
     }
     {
-        f.sound.set( forest::chirp{11, 22} );
+        f.sound.set( forest::sounds::chirp{11, 22} );
         std::ostringstream oss;
         comma::write_json( f, oss, false );
         EXPECT_EQ( oss.str(), "{\"sound\":{\"chirp\":{\"a\":11,\"b\":22}}}" );
     }
     {
-        f.sound.set( forest::whistle{33, 44} );
+        f.sound.set( forest::sounds::whistle{33, 44} );
         std::ostringstream oss;
         comma::write_json( f, oss, false );
         EXPECT_EQ( oss.str(), "{\"sound\":{\"whistle\":{\"a\":33,\"b\":44}}}" );
     }
     {
-        f.sound.set( forest::warble{55, 66} );
+        f.sound.set( forest::sounds::warble{55, 66} );
         std::ostringstream oss;
         comma::write_json( f, oss, false );
         EXPECT_EQ( oss.str(), "{\"sound\":{\"warble\":{\"x\":55,\"y\":66}}}" );
@@ -453,3 +456,25 @@ TEST( serialise, variant )
         EXPECT_EQ( oss.str(), "{}" );
     }
 }
+
+TEST( deserialise, variant )
+{
+    {
+        forest g;
+        {
+            std::istringstream iss( "{\"sound\":{\"warble\":{\"x\":55,\"y\":66}}}" );
+            comma::read_json( g, iss );
+            EXPECT_TRUE( g.sound.is< forest::sounds::warble >() );
+            EXPECT_EQ( g.sound.get< forest::sounds::warble >().x, 55 );
+            EXPECT_EQ( g.sound.get< forest::sounds::warble >().y, 66 );
+            
+        }
+        {
+            std::istringstream iss( "{\"sound\":{\"chirp\":{\"a\":77,\"b\":88}}}" );
+            comma::read_json( g, iss );
+            EXPECT_TRUE( g.sound.is< forest::sounds::chirp >() );
+            EXPECT_EQ( g.sound.get< forest::sounds::chirp >().a, 77 );
+            EXPECT_EQ( g.sound.get< forest::sounds::chirp >().b, 88 );
+        }
+    }
+}
diff --git a/visiting/traits.h b/visiting/traits.h
index 780b63c55..2d96b5b35 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -143,7 +143,7 @@ struct traits< comma::named_variant< Names, NArgs... > > // todo? should it be i
     typedef comma::named_variant< Names, NArgs... > named_variant_t;
     typedef comma::variant< NArgs... > variant_t;
 
-    template < typename S, typename... Args > struct _variant_traits // todo
+    template < typename S, typename... Args > struct _variant_traits
     {
         template < typename V > static void visit( variant_t& t, V& v, unsigned int i, bool is_set )
         {
@@ -160,9 +160,9 @@ struct traits< comma::named_variant< Names, NArgs... > > // todo? should it be i
         }
     };
 
-    template < typename S > struct _variant_traits< S > // todo
+    template < typename S > struct _variant_traits< S >
     {
-        template < typename V > static void visit( variant_t& t, V& v, bool is_set, unsigned int i )
+        template < typename V > static void visit( variant_t& t, V& v, unsigned int i, bool is_set )
         {
             boost::optional< S > s = t.template optional< S >();
             v.apply( named_variant_t::names()[i], s );

From f3b562274d841cc4f2d439a56057fc46b8504419 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 15 May 2024 18:54:08 +1000
Subject: [PATCH 0801/1056] csv::split: tentative placeholder implemented -
 should it be called something like stream_split instead?

---
 csv/split.cpp | 10 ++++++++++
 csv/split.h   | 51 +++++++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 61 insertions(+)
 create mode 100644 csv/split.cpp
 create mode 100644 csv/split.h

diff --git a/csv/split.cpp b/csv/split.cpp
new file mode 100644
index 000000000..f5dd7f5d0
--- /dev/null
+++ b/csv/split.cpp
@@ -0,0 +1,10 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#include "split.h"
+
+namespace comma { namespace csv {
+
+
+} } // namespace comma { namespace csv {
diff --git a/csv/split.h b/csv/split.h
new file mode 100644
index 000000000..4953f6068
--- /dev/null
+++ b/csv/split.h
@@ -0,0 +1,51 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <fstream>
+#include "options.h"
+#include "stream.h"
+
+namespace comma { namespace csv {
+
+template < typename T, typename How >
+class split
+{
+    public:
+        split( const How& how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) { _init(); }
+        split( How&& how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) { _init(); }
+        split& operator<<( const T& t );
+
+    protected:
+        How _how;
+        options _options;
+        T _sample;
+        std::ostream* _os{nullptr};
+        std::unique_ptr< output_stream< T > > _ostream;
+        void _init();
+
+};
+
+template < typename T, typename How > inline void split< T, How >::_init()
+{
+    // todo: validate options
+    // todo: init
+}
+
+template < typename T, typename How > inline split< T, How >& split< T, How >::operator<<( const T& t )
+{
+    std::ostream* os = _how.stream( t );
+    if( _os != os )
+    {
+        _os->flush(); // paranoia
+        _ostream.reset();
+        _os = os;
+        _ostream = std::make_unique< output_stream< T > >( *_os, _options, _sample );
+    }
+    _ostream.write( t );
+    return *this;
+}
+
+} } // namespace comma { namespace csv {

From 744d02eecc136bc8e55214a68c0926061d1fd3ed Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 15 May 2024 20:23:34 +1000
Subject: [PATCH 0802/1056] base: variant::index_of() and
 named_variant::name_of() implemented and tested

---
 base/test/base_test.cpp | 23 +++++++++++++++++++++++
 base/variant.h          |  8 ++++++++
 2 files changed, 31 insertions(+)

diff --git a/base/test/base_test.cpp b/base/test/base_test.cpp
index 704eafb53..5e1df090c 100644
--- a/base/test/base_test.cpp
+++ b/base/test/base_test.cpp
@@ -95,6 +95,29 @@ TEST( base, variant )
         EXPECT_FALSE( v.is< float >() );
         EXPECT_FALSE( v.is< double >() );
     }
+    {
+        { auto size = comma::variant< int >::size; EXPECT_EQ( size, 1 ); }
+        { auto size = comma::variant< int, float >::size; EXPECT_EQ( size, 2 ); }
+        { auto size = comma::variant< int, float, double >::size; EXPECT_EQ( size, 3 ); }
+    }
+    {
+        typedef comma::variant< int, float, double > variant_t;
+        EXPECT_EQ( variant_t::index_of< int >(), 0 );
+        EXPECT_EQ( variant_t::index_of< float >(), 1 );
+        EXPECT_EQ( variant_t::index_of< double >(), 2 );
+    }
+}
+
+TEST( base, named_variant )
+{
+    {
+        struct naming { static std::array< std::string, 3 > names() { return { "a", "b", "c" }; } };
+        typedef comma::named_variant< naming, int, float, double > variant_t;
+        variant_t v;
+        EXPECT_EQ( variant_t::name_of< int >(), "a" );
+        EXPECT_EQ( variant_t::name_of< float >(), "b" );
+        EXPECT_EQ( variant_t::name_of< double >(), "c" );
+    }
 }
 
 } // namespace comma {
diff --git a/base/variant.h b/base/variant.h
index 0bc4548c4..27be453bd 100644
--- a/base/variant.h
+++ b/base/variant.h
@@ -12,6 +12,7 @@
 // #endif
 #include <type_traits>
 #include <boost/optional.hpp>
+#include "exception.h"
 
 namespace comma {
 
@@ -43,6 +44,7 @@ template < typename T > struct variant_traits< T, true >
 
 template < typename T, typename... Args > struct variant  // todo? use tuple instead?
 {
+    enum { size = variant< Args... >::size + 1 };
     boost::optional< T > t;
     variant< Args... > values;
 
@@ -53,10 +55,12 @@ template < typename T, typename... Args > struct variant  // todo? use tuple ins
     template < typename S > const S& get() const { return variant_traits< T, std::is_same< T, S >::value >::template get< S >( t, values ); }
     template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, values ); }
     void reset() { t.reset(); values.reset(); }
+    template < typename S > static unsigned int rindex() { return std::is_same< T, S >::value ? size - 1 : variant< Args... >::template rindex< S >(); }
 };
 
 template < typename T > struct variant< T >  // todo? use tuple instead?
 {
+    enum { size = 1 };
     boost::optional< T > t;
 
     template < typename S > bool is() const { return std::is_same< T, S >::value && bool( t ); }
@@ -66,6 +70,7 @@ template < typename T > struct variant< T >  // todo? use tuple instead?
     template < typename S > const S& get() const { return variant_traits< T, std::is_same< T, S >::value >::template get< S >( t, type_is_not_on_type_list() ); }
     template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, type_is_not_on_type_list() ); }
     void reset() { t.reset(); }
+    template < typename S > static unsigned int rindex() { bool same_type = std::is_same< T, S >::value; COMMA_ASSERT( same_type, "type not found in type list" ); return 0; }
 };
 
 } // namespace impl {
@@ -79,6 +84,7 @@ template < typename... Args >
 class variant
 {
     public:
+        enum { size = impl::variant< Args... >::size };
         variant() = default;
         template < typename S > variant( const S& s ) { set( s ); }
         template < typename S > bool is() const { return _values.template is< S >(); }
@@ -88,6 +94,7 @@ class variant
         template < typename S > const S& get() const { return _values.template get< S >(); }
         template < typename S > const boost::optional< S >& optional() const { return _values.template optional< S >(); }
         void reset() { _values.reset(); }
+        template < typename S > static unsigned int index_of() { return impl::variant< Args... >::size - impl::variant< Args... >::template rindex< S >() - 1; }
     protected:
         impl::variant< Args... > _values;
 };
@@ -108,6 +115,7 @@ struct named_variant : public variant< Args... >, public Names
 {
     typedef Names names_t;
     typedef variant< Args... > variant_t;
+    template < typename S > static std::string name_of() { return Names::names()[ variant_t::template index_of< S >() ]; } // returned by value: Names::names() may return a temporary, so a reference into it would dangle
 };
 
 template < typename Names >

From 4ac1052ac93243c2a3e2c611d824ed96e9c386d3 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 11:07:55 +1000
Subject: [PATCH 0803/1056] csv::split: in progress...

---
 csv/split.h | 68 +++++++++++++++++++++++++++++++++++++++++++++--------
 1 file changed, 58 insertions(+), 10 deletions(-)

diff --git a/csv/split.h b/csv/split.h
index 4953f6068..bd81a13fb 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -5,41 +5,89 @@
 #pragma once
 
 #include <fstream>
+#include "../base/exception.h"
+#include "../io/stream.h"
+#include "../timing/duration.h"
 #include "options.h"
 #include "stream.h"
 
 namespace comma { namespace csv {
 
+namespace splitting {
+
+class none
+{
+    public:
+        none( const std::string& address ): _ostream( address ) {}
+        template < typename T >
+        std::ostream* stream( const T& t ) { return _ostream(); }
+
+    private:
+        io::ostream _ostream;
+};
+
+class by_time
+{
+    public:
+        by_time( boost::posix_time::time_duration period ): _period( period ) {}
+        by_time( double period ): _period( timing::duration::from_seconds( period ) ) {}
+        template < typename T >
+        std::ostream* stream( const T& t );
+
+    private:
+        boost::posix_time::ptime _deadline;
+        boost::posix_time::time_duration _period;
+        std::unique_ptr< std::ofstream > _ofs;
+};
+
+class by_size
+{
+    public:
+        by_size( std::size_t size ): _size( size ) {}
+        template < typename T >
+        std::ostream* stream( const T& t );
+
+    private:
+        std::size_t _size{0};
+        std::size_t _remaining{0};
+        std::unique_ptr< std::ofstream > _ofs;
+};
+
+class by_id; // todo
+
+} // namespace splitting {
+
 template < typename T, typename How >
 class split
 {
     public:
-        split( const How& how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) { _init(); }
-        split( How&& how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) { _init(); }
+        split( const How& how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) {}
+        split( How&& how, const options& csv, const T& sample = T() ): _how( static_cast< How&& >( how ) ), _options( csv ), _sample( sample ) {} // moves how: a named rvalue reference is an lvalue and would otherwise be copied, which move-only policies do not allow
         split& operator<<( const T& t );
+        bool eof() const { return _eof; }
 
     protected:
         How _how;
         options _options;
         T _sample;
+        bool _eof{false};
         std::ostream* _os{nullptr};
         std::unique_ptr< output_stream< T > > _ostream;
         void _init();
-
 };
 
-template < typename T, typename How > inline void split< T, How >::_init()
-{
-    // todo: validate options
-    // todo: init
-}
-
 template < typename T, typename How > inline split< T, How >& split< T, How >::operator<<( const T& t )
 {
+    COMMA_ASSERT( !_eof, "end of stream" );
     std::ostream* os = _how.stream( t );
+    if( !os )
+    {
+        _eof = true;
+        _os = nullptr;
+        return *this;
+    }
     if( _os != os )
     {
-        _os->flush(); // paranoia
         _ostream.reset();
         _os = os;
         _ostream = std::make_unique< output_stream< T > >( *_os, _options, _sample );

From db859f0050b21887c43dea4a588ba80b8a5f11d1 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 12:14:48 +1000
Subject: [PATCH 0804/1056] csv::split: in progress...

---
 csv/split.cpp | 28 +++++++++++++++++++++--
 csv/split.h   | 61 +++++++++++++++++++++++++++++++++++++++++++--------
 2 files changed, 78 insertions(+), 11 deletions(-)

diff --git a/csv/split.cpp b/csv/split.cpp
index f5dd7f5d0..46b7197b6 100644
--- a/csv/split.cpp
+++ b/csv/split.cpp
@@ -4,7 +4,31 @@
 
 #include "split.h"
 
-namespace comma { namespace csv {
+namespace comma { namespace csv { namespace splitting {
 
+bool by_time::_is_due( boost::posix_time::ptime t ) const
+{
+    // todo
+    return false;
+}
 
-} } // namespace comma { namespace csv {
+by_size::by_size( std::size_t size, const std::string& dir, const options& csv )
+    : _ofs( dir, csv )
+    , _size( size )
+    , _record_size( csv.binary() ? csv.format().size() : 0 )
+{
+}
+
+bool by_size::_is_due() const
+{
+    // todo
+    return false;
+}
+
+bool by_block::_is_due( unsigned int block ) const
+{
+    // todo
+    return false;
+}
+
+} } } // namespace comma { namespace csv { namespace splitting {
diff --git a/csv/split.h b/csv/split.h
index bd81a13fb..4c467e44e 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -6,6 +6,7 @@
 
 #include <fstream>
 #include "../base/exception.h"
+#include "../base/none.h"
 #include "../io/stream.h"
 #include "../timing/duration.h"
 #include "options.h"
@@ -15,6 +16,14 @@ namespace comma { namespace csv {
 
 namespace splitting {
 
+template < typename T >
+struct type_traits
+{
+    static boost::posix_time::ptime time( const T& t ) { return t.t; }
+    static unsigned int block( const T& t ) { return t.block; }
+    static unsigned int id( const T& t ) { return t.id; }
+};
+
 class none
 {
     public:
@@ -26,31 +35,65 @@ class none
         io::ostream _ostream;
 };
 
+class ofstream
+{
+    public:
+        ofstream( const std::string& dir, const std::string& suffix ): _dir( dir ), _suffix( suffix ) {}
+        ofstream( const std::string& dir, const options& csv ): _dir( dir ), _suffix( csv.binary() ? "bin" : "csv" ) {}
+        ofstream* update( boost::posix_time::ptime t );
+        template < typename T > ofstream* update( const T& t ) { return update( splitting::type_traits< T >::time( t ) ); }
+        std::ofstream* operator()() { return _ofs.get(); }
+    protected:
+        std::string _dir;
+        std::string _suffix;
+        std::unique_ptr< std::ofstream > _ofs;
+};
+
 class by_time
 {
     public:
-        by_time( boost::posix_time::time_duration period ): _period( period ) {}
-        by_time( double period ): _period( timing::duration::from_seconds( period ) ) {}
-        template < typename T >
-        std::ostream* stream( const T& t );
+        by_time( boost::posix_time::time_duration period, const std::string& dir, const options& csv ): _ofs( dir, csv ), _period( period ) {}
+        by_time( double period, const std::string& dir, const options& csv ): by_time( timing::duration::from_seconds( period ), dir, csv ) {}
+        template < typename T > std::ostream* stream( const T& t ) { auto d = splitting::type_traits< T >::time( t ); return _is_due( d ) ? _ofs.update( d ) : _ofs(); }
 
     private:
-        boost::posix_time::ptime _deadline;
+        splitting::ofstream _ofs;
         boost::posix_time::time_duration _period;
-        std::unique_ptr< std::ofstream > _ofs;
+        boost::posix_time::ptime _deadline;
+
+        bool _is_due( boost::posix_time::ptime t ) const;
 };
 
 class by_size
 {
     public:
-        by_size( std::size_t size ): _size( size ) {}
+        by_size( std::size_t size, const std::string& dir, const options& csv );
         template < typename T >
-        std::ostream* stream( const T& t );
+        std::ostream* stream( const T& t ) { return _is_due() ? _ofs.update( t ) : _ofs(); }
 
     private:
+        splitting::ofstream _ofs;
         std::size_t _size{0};
+        std::size_t _record_size{0};
+        std::size_t _estimated_record_size{0};
         std::size_t _remaining{0};
-        std::unique_ptr< std::ofstream > _ofs;
+
+        bool _is_due() const;
+        
+};
+
+class by_block
+{
+    public:
+        by_block( const std::string& dir, const options& csv ): _ofs( dir, csv ), _block( silent_none< unsigned int >() ) {}
+        template < typename T >
+        std::ostream* stream( const T& t ) { return _is_due( splitting::type_traits< T >::block( t ) ) ? _ofs.update( t ) : _ofs(); }
+
+    private:
+        splitting::ofstream _ofs;
+        boost::optional< unsigned int > _block;
+
+        bool _is_due( unsigned int block ) const;
 };
 
 class by_id; // todo

From d024f38a77b33eaa23f3321ee93e3e6b6cdf0018 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 13:04:58 +1000
Subject: [PATCH 0805/1056] timing/conversions: timing::to_iso_string()
 implemented, circular dependency on csv removed; csv/split: in progress...

---
 csv/CMakeLists.txt     |  2 +-
 csv/split.cpp          | 10 ++++++++++
 csv/split.h            |  5 ++---
 timing/CMakeLists.txt  |  2 +-
 timing/conversions.cpp | 19 +++++++++++++++++++
 timing/conversions.h   | 19 +++++++++++++++++++
 timing/stats.cpp       | 11 ++++++-----
 timing/tai.cpp         |  2 +-
 8 files changed, 59 insertions(+), 11 deletions(-)
 create mode 100644 timing/conversions.cpp
 create mode 100644 timing/conversions.h

diff --git a/csv/CMakeLists.txt b/csv/CMakeLists.txt
index 3de46ff97..ec9d76ec4 100644
--- a/csv/CMakeLists.txt
+++ b/csv/CMakeLists.txt
@@ -11,7 +11,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} )
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_source} ${impl_includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
+target_link_libraries( ${TARGET_NAME} comma_application comma_timing comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
diff --git a/csv/split.cpp b/csv/split.cpp
index 46b7197b6..eb2089bd1 100644
--- a/csv/split.cpp
+++ b/csv/split.cpp
@@ -3,9 +3,19 @@
 /// @author vsevolod vlaskine
 
 #include "split.h"
+#include "../timing/conversions.h"
 
 namespace comma { namespace csv { namespace splitting {
 
+std::ofstream* ofstream::update( boost::posix_time::ptime t )
+{
+    if( _ofs ) { _ofs.reset(); }
+    std::string filename = _dir + "/" + timing::to_iso_string( t ) + "." + _suffix;
+    _ofs = std::make_unique< std::ofstream >( filename );
+    COMMA_ASSERT( _ofs->is_open(), "failed to open '" << filename << "'" );
+    return _ofs.get();
+}
+
 bool by_time::_is_due( boost::posix_time::ptime t ) const
 {
     // todo
diff --git a/csv/split.h b/csv/split.h
index 4c467e44e..11c67f044 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -40,8 +40,8 @@ class ofstream
     public:
         ofstream( const std::string& dir, const std::string& suffix ): _dir( dir ), _suffix( suffix ) {}
         ofstream( const std::string& dir, const options& csv ): _dir( dir ), _suffix( csv.binary() ? "bin" : "csv" ) {}
-        ofstream* update( boost::posix_time::ptime t );
-        template < typename T > ofstream* update( const T& t ) { return update( splitting::type_traits< T >::time( t ) ); }
+        std::ofstream* update( boost::posix_time::ptime t );
+        template < typename T > std::ofstream* update( const T& t ) { return update( splitting::type_traits< T >::time( t ) ); }
         std::ofstream* operator()() { return _ofs.get(); }
     protected:
         std::string _dir;
@@ -79,7 +79,6 @@ class by_size
         std::size_t _remaining{0};
 
         bool _is_due() const;
-        
 };
 
 class by_block
diff --git a/timing/CMakeLists.txt b/timing/CMakeLists.txt
index 3029a3fc4..61fd19ea4 100644
--- a/timing/CMakeLists.txt
+++ b/timing/CMakeLists.txt
@@ -8,7 +8,7 @@ FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
 SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
-target_link_libraries( ${TARGET_NAME} comma_csv comma_name_value comma_string )
+target_link_libraries( ${TARGET_NAME} comma_string ) # target_link_libraries( ${TARGET_NAME} comma_csv comma_name_value comma_string )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
diff --git a/timing/conversions.cpp b/timing/conversions.cpp
new file mode 100644
index 000000000..0e70f0acf
--- /dev/null
+++ b/timing/conversions.cpp
@@ -0,0 +1,19 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#include "../base/exception.h"
+#include "conversions.h"
+
+namespace comma { namespace timing {
+
+std::string to_iso_string( boost::posix_time::ptime t, unsigned int fraction_digits, bool strict )
+{
+    std::string s = boost::posix_time::to_iso_string( t ); // YYYYMMDDTHHMMSS[.fraction]: boost omits the fraction altogether when it is zero
+    if( t.is_not_a_date_time() || t.is_neg_infinity() || t.is_infinity() ) { COMMA_THROW_IF( strict, "expected valid time; got: '" << s << "'" ); return s; } // special values: throw if strict, otherwise return boost's text unpadded
+    if( s.size() == 15 ) { s += '.'; } // whole seconds: add the separator, so that the zero padding below forms a fraction
+    s.resize( fraction_digits == 0 ? 15 : 16 + fraction_digits, '0' ); return s; // pad with '0' or truncate to the requested digits; no trailing '.' if no fraction digits requested
+}
+
+} } // namespace comma { namespace timing {
diff --git a/timing/conversions.h b/timing/conversions.h
new file mode 100644
index 000000000..1fa02a02a
--- /dev/null
+++ b/timing/conversions.h
@@ -0,0 +1,19 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <boost/date_time/posix_time/posix_time.hpp>
+#include "duration.h"
+
+namespace comma { namespace timing {
+
+/// same as boost::posix_time::to_iso_string, but pads second fractions with zeroes
+/// @param t: time
+/// @param fraction_digits: number of second fraction digits
+/// @param strict: throw on uninitialised time and infinity
+std::string to_iso_string( boost::posix_time::ptime t, unsigned int fraction_digits = 6, bool strict = false );
+
+} } // namespace comma { namespace timing {
diff --git a/timing/stats.cpp b/timing/stats.cpp
index 773dc5dc6..6e3e8a318 100644
--- a/timing/stats.cpp
+++ b/timing/stats.cpp
@@ -3,10 +3,10 @@
 
 /// @author vsevolod vlaskine
 
-#include "../csv/ascii.h" // quick and dirty
+// introduces circular dependencies: #include "../csv/ascii.h" // quick and dirty
 #include "../name_value/ptree.h"
 #include "../timing/stats.h"
-#include "../timing/traits.h"
+//#include "../timing/traits.h"
 
 namespace comma { namespace timing {
 
@@ -39,10 +39,11 @@ void stats::output( std::ostream& os, const std::string& prefix, bool csv ) // t
     os.setf( std::ios::fixed, std::ios::floatfield );
     os << std::setprecision( 6 ) << prefix;
     std::cerr << std::setprecision( 6 );
-    if( csv )
+    if( csv ) // quick and dirty for now to avoid circular dependencies; todo? csv::timing::stats wrapper or something along those lines
     {
-        static comma::csv::ascii< stats > ascii;
-        os << ascii.put( *this ) << std::endl;
+        //static comma::csv::ascii< stats > ascii; // introduces circular dependencies
+        //os << ascii.put( *this ) << std::endl;
+        os << elapsed() << ',' << count() << ',' << rate() << ',' << min() << ',' << max() << ',' << ema() << std::endl;
     }
     else
     {
diff --git a/timing/tai.cpp b/timing/tai.cpp
index 49fd26648..39a45a369 100644
--- a/timing/tai.cpp
+++ b/timing/tai.cpp
@@ -21,9 +21,9 @@
 
 /// @author dave jennings
 
-#include "tai.h"
 #include <utility>
 #include <vector>
+#include "tai.h"
 
 namespace comma { namespace timing { namespace tai {
 

From c55d103ec6882b6e93c64c126543410486e6e762 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 14:00:10 +1000
Subject: [PATCH 0806/1056] csv::output_stream::last_size() implemented

---
 csv/stream.h | 21 +++++++++++++++++----
 1 file changed, 17 insertions(+), 4 deletions(-)

diff --git a/csv/stream.h b/csv/stream.h
index b1e92116a..51d5df091 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -134,8 +134,11 @@ class ascii_output_stream : public boost::noncopyable
         /// return fields
         const std::vector< std::string >& fields() const { return fields_; }
 
+        /// return size of last output record in bytes
+        unsigned int last_size() const { return _last_size; }
+
     private:
-        friend class output_stream<S>;
+        friend class output_stream< S >;
         template < typename W, typename T>
         friend class tied;
         template < typename V, typename T, typename Data >
@@ -144,6 +147,7 @@ class ascii_output_stream : public boost::noncopyable
         std::ostream& os_;
         csv::ascii< S > ascii_;
         std::vector< std::string > fields_;
+        unsigned int _last_size{0};
 };
 
 /// binary csv input stream
@@ -224,6 +228,9 @@ class binary_output_stream : public boost::noncopyable
         /// return fields
         const std::vector< std::string >& fields() const { return fields_; }
 
+        /// record size
+        unsigned int size() const { return _size; }
+
     private:
         template < typename W, typename T>
         friend class tied;
@@ -240,6 +247,7 @@ class binary_output_stream : public boost::noncopyable
         //char* cur_;
         std::vector< std::string > fields_;
         bool flush_;
+        unsigned int _size{};
         /// bool is_stdout;
 };
 
@@ -345,6 +353,9 @@ class output_stream : public boost::noncopyable
 
         std::ostream& os() { return binary_ ? binary_->os_ : ascii_->os_; }
 
+        /// return size of last output record in bytes
+        unsigned int last_size() const { return binary_ ? binary_->size() : ascii_->last_size(); }
+
     private:
         boost::scoped_ptr< ascii_output_stream< S > > ascii_;
         boost::scoped_ptr< binary_output_stream< S > > binary_;
@@ -634,8 +645,7 @@ inline void ascii_output_stream< S >::write( const S& s )
 template < typename S >
 inline void ascii_output_stream< S >::write( const S& s, const std::string& line )
 {
-    write( s, split
-( line, ascii_.delimiter() ) );
+    write( s, split( line, ascii_.delimiter() ) );
 }
 
 template < typename S >
@@ -651,7 +661,8 @@ inline void ascii_output_stream< S >::write( const S& s, std::vector< std::strin
     ascii_.put( s, v );
     if( v.empty() ) { return; } // never here, though
     os_ << v[0];
-    for( std::size_t i = 1; i < v.size(); ++i ) { os_ << ascii_.delimiter() << v[i]; }
+    _last_size = v[0].size() + 1; // first field, plus one byte for the end of line written below; delimiters and remaining fields are added in the loop
+    for( std::size_t i = 1; i < v.size(); ++i ) { os_ << ascii_.delimiter() << v[i]; _last_size += v[i].size() + 1; }
     os_ << std::endl;
 }
 
@@ -715,6 +726,7 @@ inline binary_output_stream< S >::binary_output_stream( std::ostream& os, const
     //, cur_( begin_ )
     , fields_( split( column_names, ',' ) )
     , flush_( flush )
+    , _size( binary_.format().size() )
     /// , is_stdout( os_.rdbuf() == std::cout.rdbuf() )
 {
     #ifdef WIN32
@@ -735,6 +747,7 @@ inline binary_output_stream< S >::binary_output_stream( std::ostream& os, const
     , fields_( split( o.fields, ',' ) )
     , flush_( o.flush )
     /// , is_stdout( os_.rdbuf() == std::cout.rdbuf() )
+    , _size( binary_.format().size() )
 {
     #ifdef WIN32
     if( &os == &std::cout ) { _setmode( _fileno( stdout ), _O_BINARY ); }

From 3a4e300210d9ea1a0ec5b5b7d8adde0c90c50da2 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 14:00:28 +1000
Subject: [PATCH 0807/1056] csv::split: first cut implemented; debugging...

---
 csv/split.cpp | 26 +++++++++++++++++---------
 csv/split.h   | 17 +++++++++++------
 2 files changed, 28 insertions(+), 15 deletions(-)

diff --git a/csv/split.cpp b/csv/split.cpp
index eb2089bd1..9cd2ea9c4 100644
--- a/csv/split.cpp
+++ b/csv/split.cpp
@@ -16,10 +16,11 @@ std::ofstream* ofstream::update( boost::posix_time::ptime t )
     return _ofs.get();
 }
 
-bool by_time::_is_due( boost::posix_time::ptime t ) const
+bool by_time::_is_due( boost::posix_time::ptime t )
 {
-    // todo
-    return false;
+    if( !_deadline.is_not_a_date_time() && t < _deadline ) { return false; }
+    _deadline = t + _max_duration;
+    return true;
 }
 
 by_size::by_size( std::size_t size, const std::string& dir, const options& csv )
@@ -29,16 +30,23 @@ by_size::by_size( std::size_t size, const std::string& dir, const options& csv )
 {
 }
 
-bool by_size::_is_due() const
+bool by_size::_is_due()
 {
-    // todo
-    return false;
+    if( _estimated_record_size <= _remaining ) { return false; }
+    _remaining = _size;
+    return true;
 }
 
-bool by_block::_is_due( unsigned int block ) const
+void by_size::wrote( unsigned int size )
 {
-    // todo
-    return false;
+    _remaining = _remaining > size ? _remaining - size : 0;
+}
+
+bool by_block::_is_due( unsigned int block )
+{
+    if( _block && *_block == block ) { return false; }
+    _block = block;
+    return true;
 }
 
 } } } // namespace comma { namespace csv { namespace splitting {
diff --git a/csv/split.h b/csv/split.h
index 11c67f044..f68faa698 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -30,6 +30,7 @@ class none
         none( const std::string& address ): _ostream( address ) {}
         template < typename T >
         std::ostream* stream( const T& t ) { return _ostream(); }
+        void wrote( unsigned int ) {}
 
     private:
         io::ostream _ostream;
@@ -52,16 +53,17 @@ class ofstream
 class by_time
 {
     public:
-        by_time( boost::posix_time::time_duration period, const std::string& dir, const options& csv ): _ofs( dir, csv ), _period( period ) {}
-        by_time( double period, const std::string& dir, const options& csv ): by_time( timing::duration::from_seconds( period ), dir, csv ) {}
+        by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv ): _ofs( dir, csv ), _max_duration( max_duration ) {}
+        by_time( double max_duration, const std::string& dir, const options& csv ): by_time( timing::duration::from_seconds( max_duration ), dir, csv ) {}
         template < typename T > std::ostream* stream( const T& t ) { auto d = splitting::type_traits< T >::time( t ); return _is_due( d ) ? _ofs.update( d ) : _ofs(); }
+        void wrote( unsigned int ) {}
 
     private:
         splitting::ofstream _ofs;
-        boost::posix_time::time_duration _period;
+        boost::posix_time::time_duration _max_duration;
         boost::posix_time::ptime _deadline;
 
-        bool _is_due( boost::posix_time::ptime t ) const;
+        bool _is_due( boost::posix_time::ptime t );
 };
 
 class by_size
@@ -70,6 +72,7 @@ class by_size
         by_size( std::size_t size, const std::string& dir, const options& csv );
         template < typename T >
         std::ostream* stream( const T& t ) { return _is_due() ? _ofs.update( t ) : _ofs(); }
+        void wrote( unsigned int size );
 
     private:
         splitting::ofstream _ofs;
@@ -78,7 +81,7 @@ class by_size
         std::size_t _estimated_record_size{0};
         std::size_t _remaining{0};
 
-        bool _is_due() const;
+        bool _is_due();
 };
 
 class by_block
@@ -87,12 +90,13 @@ class by_block
         by_block( const std::string& dir, const options& csv ): _ofs( dir, csv ), _block( silent_none< unsigned int >() ) {}
         template < typename T >
         std::ostream* stream( const T& t ) { return _is_due( splitting::type_traits< T >::block( t ) ) ? _ofs.update( t ) : _ofs(); }
+        void wrote( unsigned int ) {}
 
     private:
         splitting::ofstream _ofs;
         boost::optional< unsigned int > _block;
 
-        bool _is_due( unsigned int block ) const;
+        bool _is_due( unsigned int block );
 };
 
 class by_id; // todo
@@ -135,6 +139,7 @@ template < typename T, typename How > inline split< T, How >& split< T, How >::o
         _ostream = std::make_unique< output_stream< T > >( *_os, _options, _sample );
     }
     _ostream.write( t );
+    _how.wrote( _ostream.last_size() );
     return *this;
 }
 

From 692638d90c279522a29d0f70376d1af5d9f20cc1 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 15:58:53 +1000
Subject: [PATCH 0808/1056] csv::splitting::usage() implemented;
 io::stream::usage(): verbose flag added

---
 csv/split.cpp | 31 ++++++++++++++++++++++++++++++-
 csv/split.h   |  7 +++++--
 io/stream.cpp | 50 ++++++++++++++++++++++++--------------------------
 io/stream.h   |  6 +++---
 4 files changed, 62 insertions(+), 32 deletions(-)

diff --git a/csv/split.cpp b/csv/split.cpp
index 9cd2ea9c4..1ff2bfb8b 100644
--- a/csv/split.cpp
+++ b/csv/split.cpp
@@ -2,11 +2,32 @@
 
 /// @author vsevolod vlaskine
 
-#include "split.h"
+#include <sstream>
 #include "../timing/conversions.h"
+#include "split.h"
 
 namespace comma { namespace csv { namespace splitting {
 
+std::string usage( unsigned int size, bool verbose )
+{
+    std::string indent( size, ' ' );
+    std::ostringstream oss;
+    oss << indent << "split:<options>      : todo" << std::endl;
+    oss << indent << "log:<dir>;<options>  : log in timestamped files" << std::endl;
+    if( verbose )
+    {
+        oss << indent << "    <options>: <how>[;<parameters>]" << std::endl;
+        oss << indent << "        by-time;period=<seconds>[;align]" << std::endl;
+        oss << indent << "        by-size;size=<bytes>" << std::endl;
+        oss << indent << "        by-block" << std::endl;
+    }
+    else
+    {
+        oss << indent << "    run --help --verbose for details..." << std::endl;
+    }
+    return oss.str();
+}
+
 std::ofstream* ofstream::update( boost::posix_time::ptime t )
 {
     if( _ofs ) { _ofs.reset(); }
@@ -16,6 +37,14 @@ std::ofstream* ofstream::update( boost::posix_time::ptime t )
     return _ofs.get();
 }
 
+by_time::by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv, bool align )
+    : _ofs( dir, csv )
+    , _max_duration( max_duration )
+    , _align( align )
+{
+    COMMA_THROW_IF( align, "align: todo" );
+}
+
 bool by_time::_is_due( boost::posix_time::ptime t )
 {
     if( !_deadline.is_not_a_date_time() && t < _deadline ) { return false; }
diff --git a/csv/split.h b/csv/split.h
index f68faa698..cf6553dcb 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -16,6 +16,8 @@ namespace comma { namespace csv {
 
 namespace splitting {
 
+std::string usage( unsigned int indent = 0, bool verbose = false );
+
 template < typename T >
 struct type_traits
 {
@@ -53,14 +55,15 @@ class ofstream
 class by_time
 {
     public:
-        by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv ): _ofs( dir, csv ), _max_duration( max_duration ) {}
-        by_time( double max_duration, const std::string& dir, const options& csv ): by_time( timing::duration::from_seconds( max_duration ), dir, csv ) {}
+        by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv, bool align = false );
+        by_time( double max_duration, const std::string& dir, const options& csv, bool align ): by_time( timing::duration::from_seconds( max_duration ), dir, csv, align ) {}
         template < typename T > std::ostream* stream( const T& t ) { auto d = splitting::type_traits< T >::time( t ); return _is_due( d ) ? _ofs.update( d ) : _ofs(); }
         void wrote( unsigned int ) {}
 
     private:
         splitting::ofstream _ofs;
         boost::posix_time::time_duration _max_duration;
+        bool _align{false};
         boost::posix_time::ptime _deadline;
 
         bool _is_due( boost::posix_time::ptime t );
diff --git a/io/stream.cpp b/io/stream.cpp
index 604b14763..d0db2bfae 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -39,11 +39,9 @@ namespace comma { namespace io {
 
 namespace impl {
 
-template < typename S >
-struct traits {};
+template < typename S > struct traits {};
 
-template <>
-struct traits < std::istream >
+template <> struct traits < std::istream >
 {
     typedef std::ifstream file_stream;
     static bool is_standard( const std::istream* is ) { return is == &std::cin; }
@@ -69,8 +67,7 @@ struct traits < std::istream >
     #endif
 };
 
-template <>
-struct traits < std::ostream >
+template <> struct traits < std::ostream >
 {
     typedef std::ofstream file_stream;
     static bool is_standard( const std::ostream* is ) { return is == &std::cout || is == &std::cerr; }
@@ -104,8 +101,7 @@ struct traits < std::ostream >
     #endif
 };
 
-template <>
-struct traits < std::iostream >
+template <> struct traits < std::iostream >
 {
     typedef std::fstream file_stream; // quick and dirty, does not matter for now
     static bool is_standard( const std::iostream* ) { return false; }
@@ -130,8 +126,7 @@ template < typename S > void close_file_stream( typename traits< S >::file_strea
 
 } // namespace impl
 
-template < typename S >
-stream< S >::~stream()
+template < typename S > stream< S >::~stream()
 {
     if( stream_ == NULL || impl::traits< S >::is_standard( stream_ ) ) { return; }
     delete stream_;
@@ -139,8 +134,7 @@ stream< S >::~stream()
     close_ = NULL;
 }
 
-template < typename S >
-S* stream< S >::lazily_make_stream_()
+template < typename S > S* stream< S >::lazily_make_stream_()
 {
     #ifndef WIN32
     if( stream_ == NULL ) // quick and dirty: if fstream, cannot open on construction, as pipe might block
@@ -185,8 +179,7 @@ static void set_non_blocking_flags_( io::file_descriptor fd )
 #endif // #ifndef WIN32
 }
 
-template < typename S >
-comma::io::file_descriptor stream< S >::fd() const
+template < typename S > comma::io::file_descriptor stream< S >::fd() const
 {
     #ifdef WIN32
     if( fd_ == io::invalid_file_descriptor )
@@ -200,8 +193,7 @@ comma::io::file_descriptor stream< S >::fd() const
     return fd_;
 }
 
-template < typename S >
-std::size_t stream< S >::available_on_file_descriptor() const
+template < typename S > std::size_t stream< S >::available_on_file_descriptor() const
 {
     int count = 0;
 #ifdef WIN32
@@ -215,8 +207,7 @@ std::size_t stream< S >::available_on_file_descriptor() const
 
 template < typename S > const std::string& stream< S >::name() const { return name_; }
 
-template < typename S >
-stream< S >::stream( const std::string& name, mode::value m, mode::blocking_value blocking )
+template < typename S > stream< S >::stream( const std::string& name, mode::value m, mode::blocking_value blocking )
     : name_( name )
     , mode_( m )
     , stream_( NULL )
@@ -362,23 +353,30 @@ stream< S >::stream( const std::string& name, mode::value m, mode::blocking_valu
 
 namespace impl {
 
-static std::string usage( const std::string& what, const std::string& dash, unsigned int indent )
+static std::string usage( const std::string& what, const std::string& dash, unsigned int indent, bool verbose )
 {
     std::string i( indent, ' ' );
     std::ostringstream oss;
     oss << i << "<" << what << ">" << std::endl;
-    oss << i << "    '-'                  : " << dash << std::endl;
-    oss << i << "    <path>               : path to input file or named pipe" << std::endl;
-    oss << i << "    local:<path>         : local linux socket" << std::endl;
-    oss << i << "    tcp:<address>:<port> : tcp socket" << std::endl;
+    if( verbose )
+    {
+        oss << i << "    '-'                  : " << dash << std::endl;
+        oss << i << "    <path>               : path to input file or named pipe" << std::endl;
+        oss << i << "    local:<path>         : local linux socket" << std::endl;
+        oss << i << "    tcp:<address>:<port> : tcp socket" << std::endl;
+    }
+    else
+    {
+        oss << i << "    run --help --verbose for details" << std::endl;
+    }
     return oss.str();
 }
 
 } // namespace impl {
 
-std::string istream::usage( unsigned int indent ) { return impl::usage( "input", "stdin", indent ); }
-std::string ostream::usage( unsigned int indent ) { return impl::usage( "output", "stdout", indent ); }
-std::string iostream::usage( unsigned int indent ) { return impl::usage( "input/output", "n/a", indent ); }
+std::string istream::usage( unsigned int indent, bool verbose ) { return impl::usage( "input", "stdin", indent, verbose ); }
+std::string ostream::usage( unsigned int indent, bool verbose ) { return impl::usage( "output", "stdout", indent, verbose ); }
+std::string iostream::usage( unsigned int indent, bool verbose ) { return impl::usage( "input/output", "n/a", indent, verbose ); }
 
 template class stream< std::istream >;
 template class stream< std::ostream >;
diff --git a/io/stream.h b/io/stream.h
index 9c028fd01..227fc9af1 100644
--- a/io/stream.h
+++ b/io/stream.h
@@ -93,7 +93,7 @@ struct istream : public stream< std::istream >
     istream( const std::string& name, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
     istream( std::istream* s, io::file_descriptor fd, mode::value mode, boost::function< void() > close );
     istream( std::istream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close );
-    static std::string usage( unsigned int indent = 0 );
+    static std::string usage( unsigned int indent = 0, bool verbose = false );
 };
 
 /// output stream owner
@@ -102,14 +102,14 @@ struct ostream : public stream< std::ostream >
     ostream( const std::string& name, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
     ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, boost::function< void() > close );
     ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close );
-    static std::string usage( unsigned int indent = 0 );
+    static std::string usage( unsigned int indent = 0, bool verbose = false );
 };
 
 /// input/output stream owner
 struct iostream : public stream< std::iostream >
 {
     iostream( const std::string& name, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
-    static std::string usage( unsigned int indent = 0 );
+    static std::string usage( unsigned int indent = 0, bool verbose = false );
 };
 
 } } // namespace comma { namespace io {

From b78de3ad11970e20f2d91b2f7906075dc8927c16 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 16:26:26 +1000
Subject: [PATCH 0809/1056] csv::splitting::by_size: average record size
 calculation implemented

---
 csv/split.cpp | 13 ++++++++++++-
 csv/split.h   |  3 ++-
 2 files changed, 14 insertions(+), 2 deletions(-)

diff --git a/csv/split.cpp b/csv/split.cpp
index 1ff2bfb8b..4f565e302 100644
--- a/csv/split.cpp
+++ b/csv/split.cpp
@@ -18,7 +18,13 @@ std::string usage( unsigned int size, bool verbose )
     {
         oss << indent << "    <options>: <how>[;<parameters>]" << std::endl;
         oss << indent << "        by-time;period=<seconds>[;align]" << std::endl;
+        oss << indent << "            period=<seconds>: create a new file if next" << std::endl;
+        oss << indent << "                              timestamp passes <seconds> deadline" << std::endl;
+        oss << indent << "            align : align deadline timestamp and respective filename" << std::endl;
+        oss << indent << "                    exactly with the period (todo, just ask)" << std::endl;
         oss << indent << "        by-size;size=<bytes>" << std::endl;
+        oss << indent << "            size=<bytes>: create files not larger than <bytes>" << std::endl;
+        oss << indent << "                          may not be exact on ascii output" << std::endl;
         oss << indent << "        by-block" << std::endl;
     }
     else
@@ -61,7 +67,7 @@ by_size::by_size( std::size_t size, const std::string& dir, const options& csv )
 
 bool by_size::_is_due()
 {
-    if( _estimated_record_size <= _remaining ) { return false; }
+    if( ( _record_size ? _record_size : ( unsigned int )( _average_record_size ) ) <= _remaining ) { return false; }
     _remaining = _size;
     return true;
 }
@@ -69,6 +75,11 @@ bool by_size::_is_due()
 void by_size::wrote( unsigned int size )
 {
     _remaining = _remaining > size ? _remaining - size : 0;
+    if( _record_size ) { return; }
+    ++_count;
+    if( _count == 1 ) { _average_record_size = size; return; }
+    double r = 1. / _count;
+    _average_record_size = ( 1 - r ) * _average_record_size + r * size; // quick and dirty
 }
 
 bool by_block::_is_due( unsigned int block )
diff --git a/csv/split.h b/csv/split.h
index cf6553dcb..9d777f7c3 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -81,7 +81,8 @@ class by_size
         splitting::ofstream _ofs;
         std::size_t _size{0};
         std::size_t _record_size{0};
-        std::size_t _estimated_record_size{0};
+        double _average_record_size{0};
+        std::size_t _count{0};
         std::size_t _remaining{0};
 
         bool _is_due();

From 119269bca3ae6c8a05195def356f475944a02ada Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 17:44:22 +1000
Subject: [PATCH 0810/1056] csv::split::write() implemented; make(): in
 progress...

---
 csv/split.cpp |  46 -------------------
 csv/split.h   | 125 +++++++++++++++++++++++++++++++++++++++-----------
 2 files changed, 98 insertions(+), 73 deletions(-)

diff --git a/csv/split.cpp b/csv/split.cpp
index 4f565e302..64838cbe1 100644
--- a/csv/split.cpp
+++ b/csv/split.cpp
@@ -43,50 +43,4 @@ std::ofstream* ofstream::update( boost::posix_time::ptime t )
     return _ofs.get();
 }
 
-by_time::by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv, bool align )
-    : _ofs( dir, csv )
-    , _max_duration( max_duration )
-    , _align( align )
-{
-    COMMA_THROW_IF( align, "align: todo" );
-}
-
-bool by_time::_is_due( boost::posix_time::ptime t )
-{
-    if( !_deadline.is_not_a_date_time() && t < _deadline ) { return false; }
-    _deadline = t + _max_duration;
-    return true;
-}
-
-by_size::by_size( std::size_t size, const std::string& dir, const options& csv )
-    : _ofs( dir, csv )
-    , _size( size )
-    , _record_size( csv.binary() ? csv.format().size() : 0 )
-{
-}
-
-bool by_size::_is_due()
-{
-    if( ( _record_size ? _record_size : ( unsigned int )( _average_record_size ) ) <= _remaining ) { return false; }
-    _remaining = _size;
-    return true;
-}
-
-void by_size::wrote( unsigned int size )
-{
-    _remaining = _remaining > size ? _remaining - size : 0;
-    if( _record_size ) { return; }
-    ++_count;
-    if( _count == 1 ) { _average_record_size = size; return; }
-    double r = 1. / _count;
-    _average_record_size = ( 1 - r ) * _average_record_size + r * size; // quick and dirty
-}
-
-bool by_block::_is_due( unsigned int block )
-{
-    if( _block && *_block == block ) { return false; }
-    _block = block;
-    return true;
-}
-
 } } } // namespace comma { namespace csv { namespace splitting {
diff --git a/csv/split.h b/csv/split.h
index 9d777f7c3..7e4b1f5a6 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -19,21 +19,28 @@ namespace splitting {
 std::string usage( unsigned int indent = 0, bool verbose = false );
 
 template < typename T >
-struct type_traits
+struct method
+{
+    virtual ~method() {}
+    virtual void wrote( unsigned int size ) {}
+    virtual std::ostream* stream( const T& t, unsigned int size = 0 ) = 0;
+};
+
+template < typename T >
+struct type_traits: public method< T >
 {
     static boost::posix_time::ptime time( const T& t ) { return t.t; }
     static unsigned int block( const T& t ) { return t.block; }
     static unsigned int id( const T& t ) { return t.id; }
 };
 
-class none
+template < typename T >
+class none: public method< T >
 {
     public:
         none( const std::string& address ): _ostream( address ) {}
-        template < typename T >
-        std::ostream* stream( const T& t ) { return _ostream(); }
-        void wrote( unsigned int ) {}
-
+        std::ostream* stream( const T&, unsigned int ) { return _ostream(); }
+    
     private:
         io::ostream _ostream;
 };
@@ -46,20 +53,21 @@ class ofstream
         std::ofstream* update( boost::posix_time::ptime t );
         template < typename T > std::ofstream* update( const T& t ) { return update( splitting::type_traits< T >::time( t ) ); }
         std::ofstream* operator()() { return _ofs.get(); }
+    
     protected:
         std::string _dir;
         std::string _suffix;
         std::unique_ptr< std::ofstream > _ofs;
 };
 
-class by_time
+template < typename T >
+class by_time: public method< T >
 {
     public:
         by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv, bool align = false );
         by_time( double max_duration, const std::string& dir, const options& csv, bool align ): by_time( timing::duration::from_seconds( max_duration ), dir, csv, align ) {}
-        template < typename T > std::ostream* stream( const T& t ) { auto d = splitting::type_traits< T >::time( t ); return _is_due( d ) ? _ofs.update( d ) : _ofs(); }
-        void wrote( unsigned int ) {}
-
+        std::ostream* stream( const T& t, unsigned int ) { auto d = splitting::type_traits< T >::time( t ); return _is_due( d ) ? _ofs.update( d ) : _ofs(); }
+    
     private:
         splitting::ofstream _ofs;
         boost::posix_time::time_duration _max_duration;
@@ -69,12 +77,12 @@ class by_time
         bool _is_due( boost::posix_time::ptime t );
 };
 
-class by_size
+template < typename T >
+class by_size: public method< T >
 {
     public:
         by_size( std::size_t size, const std::string& dir, const options& csv );
-        template < typename T >
-        std::ostream* stream( const T& t ) { return _is_due() ? _ofs.update( t ) : _ofs(); }
+        std::ostream* stream( const T& t, unsigned int size = 0 ) { return _is_due( size ) ? _ofs.update( t ) : _ofs(); }
         void wrote( unsigned int size );
 
     private:
@@ -85,16 +93,15 @@ class by_size
         std::size_t _count{0};
         std::size_t _remaining{0};
 
-        bool _is_due();
+        bool _is_due( unsigned int extra_size );
 };
 
+template < typename T >
 class by_block
 {
     public:
         by_block( const std::string& dir, const options& csv ): _ofs( dir, csv ), _block( silent_none< unsigned int >() ) {}
-        template < typename T >
-        std::ostream* stream( const T& t ) { return _is_due( splitting::type_traits< T >::block( t ) ) ? _ofs.update( t ) : _ofs(); }
-        void wrote( unsigned int ) {}
+        std::ostream* stream( const T& t, unsigned int ) { return _is_due( splitting::type_traits< T >::block( t ) ) ? _ofs.update( t ) : _ofs(); }
 
     private:
         splitting::ofstream _ofs;
@@ -103,21 +110,23 @@ class by_block
         bool _is_due( unsigned int block );
 };
 
+template < typename T >
 class by_id; // todo
 
 } // namespace splitting {
 
-template < typename T, typename How >
+template < typename T >
 class split
 {
     public:
-        split( const How& how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) {}
-        split( How&& how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) {}
-        split& operator<<( const T& t );
-        bool eof() const { return _eof; }
+        split( splitting::method< T >* how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) {}
+        split& write( const T& t, const char* buf, unsigned int size );
+        split& operator<<( const T& t ) { return write( t, nullptr, 0 ); }
+        bool eof() const { return _eof || ( _os && _os->eof() ); }
+        static split< T >* make( const std::string& options, const csv::options& csv );
 
     protected:
-        How _how;
+        std::unique_ptr< splitting::method< T > > _how;
         options _options;
         T _sample;
         bool _eof{false};
@@ -126,11 +135,11 @@ class split
         void _init();
 };
 
-template < typename T, typename How > inline split< T, How >& split< T, How >::operator<<( const T& t )
+template < typename T > inline split< T >& split< T >::write( const T& t, const char* buf, unsigned int size )
 {
     COMMA_ASSERT( !_eof, "end of stream" );
-    std::ostream* os = _how.stream( t );
-    if( !os )
+    std::ostream* os = _how->stream( t );
+    if( !os || os->eof() )
     {
         _eof = true;
         _os = nullptr;
@@ -143,8 +152,70 @@ template < typename T, typename How > inline split< T, How >& split< T, How >::o
         _ostream = std::make_unique< output_stream< T > >( *_os, _options, _sample );
     }
     _ostream.write( t );
-    _how.wrote( _ostream.last_size() );
+    if( buf ) { _os->write( buf, size ); }
+    _how->wrote( _ostream.last_size() + size );
     return *this;
 }
 
+template < typename T > inline split< T >* split< T >::make( const std::string& options, const csv::options& csv )
+{
+    return nullptr; // todo
+}
+
+namespace splitting {
+
+template < typename T >
+inline by_time< T >::by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv, bool align )
+    : _ofs( dir, csv )
+    , _max_duration( max_duration )
+    , _align( align )
+{
+    COMMA_THROW_IF( align, "align: todo, just ask" );
+}
+
+template < typename T >
+inline bool by_time< T >::_is_due( boost::posix_time::ptime t )
+{
+    if( !_deadline.is_not_a_date_time() && t < _deadline ) { return false; }
+    _deadline = t + _max_duration;
+    return true;
+}
+
+template < typename T >
+inline by_size< T >::by_size( std::size_t size, const std::string& dir, const options& csv )
+    : _ofs( dir, csv )
+    , _size( size )
+    , _record_size( csv.binary() ? csv.format().size() : 0 )
+{
+}
+
+template < typename T >
+inline bool by_size< T >::_is_due( unsigned int extra_size )
+{
+    if( ( _record_size ? _record_size + extra_size : ( unsigned int )( _average_record_size ) ) <= _remaining ) { return false; }
+    _remaining = _size + extra_size;
+    return true;
+}
+
+template < typename T >
+inline void by_size< T >::wrote( unsigned int size )
+{
+    _remaining = _remaining > size ? _remaining - size : 0;
+    if( _record_size ) { return; }
+    ++_count;
+    if( _count == 1 ) { _average_record_size = size; return; }
+    double r = 1. / _count;
+    _average_record_size = ( 1 - r ) * _average_record_size + r * size; // quick and dirty
+}
+
+template < typename T >
+inline bool by_block< T >::_is_due( unsigned int block )
+{
+    if( _block && *_block == block ) { return false; }
+    _block = block;
+    return true;
+}
+
+} // namespace splitting {
+
 } } // namespace comma { namespace csv {

From 24d13754ee1da1d73108e40cd370beb4cbf1ae6b Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 18:23:23 +1000
Subject: [PATCH 0811/1056] csv::split::make(): in progress...

---
 csv/split.h | 30 +++++++++++++++++++++++++++---
 1 file changed, 27 insertions(+), 3 deletions(-)

diff --git a/csv/split.h b/csv/split.h
index 7e4b1f5a6..aeb7e11e9 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -8,6 +8,7 @@
 #include "../base/exception.h"
 #include "../base/none.h"
 #include "../io/stream.h"
+#include "../string/string.h"
 #include "../timing/duration.h"
 #include "options.h"
 #include "stream.h"
@@ -123,7 +124,7 @@ class split
         split& write( const T& t, const char* buf, unsigned int size );
         split& operator<<( const T& t ) { return write( t, nullptr, 0 ); }
         bool eof() const { return _eof || ( _os && _os->eof() ); }
-        static split< T >* make( const std::string& options, const csv::options& csv );
+        static split< T >* make( const std::string& options, const csv::options& csv, bool permissive = false, const T& sample = T() );
 
     protected:
         std::unique_ptr< splitting::method< T > > _how;
@@ -157,9 +158,32 @@ template < typename T > inline split< T >& split< T >::write( const T& t, const
     return *this;
 }
 
-template < typename T > inline split< T >* split< T >::make( const std::string& options, const csv::options& csv )
+template < typename T > inline split< T >* split< T >::make( const std::string& options, const csv::options& csv, bool permissive, const T& sample )
 {
-    return nullptr; // todo
+    const auto& v = comma::split_head( options, 1, ':' );
+    if( v[0] == "split" ) { COMMA_THROW( comma::exception, "on '" << options << "': 'split': todo, just ask" ); }
+    if( v[0] == "log" ) // todo: reimplement using comma::variant
+    {
+        const auto& w = comma::split( v[1], ';' );
+        COMMA_ASSERT( w.size() >= 2, "expected log:<dir>;<method>[;<options>]; got: '" << options );
+        std::string dir = w[0];
+        std::string method = w[1];
+        if( method == "by-time" ) { return nullptr; } // todo
+        if( method == "by-size" )
+        {
+            for( unsigned int i = 2; i < w.size(); ++i )
+            {
+                const auto& s = comma::split( w[i], '=' );
+                if( s[0] == "size" && s.size() == 2 ) { return new split< T >( new splitting::by_size< T >( boost::lexical_cast< unsigned int >( s[1] ), dir, csv ), csv, sample ); }
+            }
+            COMMA_THROW( comma::exception, "expected 'log:<dir>;by-size;size=<bytes>'" );
+        }
+        if( method == "by-block" ) { return new split< T >( new splitting::by_block< T >( dir, csv ), csv, sample ); }
+        if( permissive ) { return nullptr; }
+        COMMA_THROW( comma::exception, "expected 'by-time', 'by-size' or 'by-block', got: '" << v[0] << " in '" << options << "'" );
+    }
+    if( permissive ) { return nullptr; }
+    COMMA_THROW( comma::exception, "expected 'split' or 'log', got: '" << v[0] << " in '" << options << "'" );
 }
 
 namespace splitting {

From 7e1c0bcb7464d07ed4541ba90dd8f33e4b2dbd3e Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 16 May 2024 19:14:43 +1000
Subject: [PATCH 0812/1056] name_value::parser::mangled() method implemented

---
 name_value/parser.cpp | 18 ++++++++++++++++++
 name_value/parser.h   | 14 ++++++++++++++
 2 files changed, 32 insertions(+)
 create mode 100644 name_value/parser.cpp

diff --git a/name_value/parser.cpp b/name_value/parser.cpp
new file mode 100644
index 000000000..da6138e3a
--- /dev/null
+++ b/name_value/parser.cpp
@@ -0,0 +1,18 @@
+// Copyright (c) 2011 The University of Sydney
+
+#include "parser.h"
+
+namespace comma { namespace name_value {
+
+std::string parser::mangled( const std::string& line, const std::string& prefix, char delimiter )
+{
+    const auto& s = comma::split( line, delimiter, true );
+    if( s.empty() ) { return line; }
+    std::string p = prefix.empty() ? s[0] : prefix;
+    std::string r;
+    std::string d;
+    for( unsigned int i = prefix.empty() ? 1 : 0; i < s.size(); ++i ) { r += d + p + '/' + s[i]; d = delimiter; }
+    return r;
+}
+
+} } // namespace comma { namespace name_value {
diff --git a/name_value/parser.h b/name_value/parser.h
index 9cb4e16aa..23f112c28 100644
--- a/name_value/parser.h
+++ b/name_value/parser.h
@@ -42,6 +42,20 @@ class parser
     template < typename S >
     void put( std::string& line, const S& s ) const;
 
+    /// mangle string as in following examples
+    ///     - prefix: "abc"; line: "x=1;y/z=2"; mangled: "abc/x=1;abc/y/z=2"
+    ///     - self-mangled (prefix: ""); line: "my-operation;x=1;y/z=2"; mangled: "my-operation/x=1;my-operation/y/z=2"
+    /// usage example
+    ///     struct naming { static std::array< std::string, 2 > names() { return { "some-operation", "another-operation" }; } };
+    ///     struct some_operation { int a; float b; };
+    ///     struct another_operation { double c; std::string d; };
+    ///     typedef comma::named_variant< naming, some_operation, another_operation > operation_t;
+    ///     operation_t operation = parser().get< operation_t >( parser::mangled( operation_options ) );
+    ///     if( operation.is< some_operation >() ) { /* handle */ }
+    ///     else if( operation.is< another_operation >() ) { /* handle */ }
+    ///     etc
+    static std::string mangled( const std::string& line, const std::string& prefix = "", char delimiter = ';' );
+
 private:
     impl::options _options;
 };

From 9c2367f20e72db4fcf01430c0d321e24f307235b Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 17 May 2024 13:49:25 +1000
Subject: [PATCH 0813/1056] csv::split::make(): first cut implemented;
 debugging...

---
 csv/split.h                        | 49 ++++++++++++-----
 name_value/test/serialise_test.cpp | 84 +++++++++++++++++++-----------
 2 files changed, 88 insertions(+), 45 deletions(-)

diff --git a/csv/split.h b/csv/split.h
index aeb7e11e9..a5931e186 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -20,19 +20,19 @@ namespace splitting {
 std::string usage( unsigned int indent = 0, bool verbose = false );
 
 template < typename T >
-struct method
+struct type_traits
 {
-    virtual ~method() {}
-    virtual void wrote( unsigned int size ) {}
-    virtual std::ostream* stream( const T& t, unsigned int size = 0 ) = 0;
+    static boost::posix_time::ptime time( const T& t ) { return t.t; }
+    static unsigned int block( const T& t ) { return t.block; }
+    static unsigned int id( const T& t ) { return t.id; }
 };
 
 template < typename T >
-struct type_traits: public method< T >
+struct method
 {
-    static boost::posix_time::ptime time( const T& t ) { return t.t; }
-    static unsigned int block( const T& t ) { return t.block; }
-    static unsigned int id( const T& t ) { return t.id; }
+    virtual ~method() {}
+    virtual void wrote( unsigned int size ) {}
+    virtual std::ostream* stream( const T& t, unsigned int size = 0 ) = 0;
 };
 
 template < typename T >
@@ -98,7 +98,7 @@ class by_size: public method< T >
 };
 
 template < typename T >
-class by_block
+class by_block: public method< T >
 {
     public:
         by_block( const std::string& dir, const options& csv ): _ofs( dir, csv ), _block( silent_none< unsigned int >() ) {}
@@ -165,20 +165,41 @@ template < typename T > inline split< T >* split< T >::make( const std::string&
     if( v[0] == "log" ) // todo: reimplement using comma::variant
     {
         const auto& w = comma::split( v[1], ';' );
-        COMMA_ASSERT( w.size() >= 2, "expected log:<dir>;<method>[;<options>]; got: '" << options );
+        COMMA_ASSERT( w.size() >= 2, "expected log:<dir>;<method>[;<options>]; got: '" << options << "'" );
         std::string dir = w[0];
         std::string method = w[1];
-        if( method == "by-time" ) { return nullptr; } // todo
+        if( method == "by-time" )
+        {
+            boost::optional< double > period = silent_none< double >();
+            bool align{false};
+            for( unsigned int i = 2; i < w.size(); ++i )
+            {
+                const auto& s = comma::split( w[i], '=' );
+                if( s[0] == "period" && s.size() == 2 ) { period = boost::lexical_cast< double >( s[1] ); }
+                else if( ( s[0] == "align" && s.size() == 1 ) || w[i] == "align=true" || w[i] == "align=1" ) { align = true; }
+            }
+            if( period ) { return new split< T >( new splitting::by_time< T >( *period, dir, csv, align ), csv, sample ); }
+            if( permissive ) { return nullptr; }
+            COMMA_THROW( comma::exception, "expected 'log:<dir>;by-time;period=<seconds>[;align]'; got: '" << options << "'" );
+        }
         if( method == "by-size" )
         {
             for( unsigned int i = 2; i < w.size(); ++i )
             {
                 const auto& s = comma::split( w[i], '=' );
-                if( s[0] == "size" && s.size() == 2 ) { return new split< T >( new splitting::by_size< T >( boost::lexical_cast< unsigned int >( s[1] ), dir, csv ), csv, sample ); }
+                if( s[0] == "size" && s.size() == 2 )
+                { 
+                    if( permissive ) { return nullptr; }
+                    return new split< T >( new splitting::by_size< T >( boost::lexical_cast< unsigned int >( s[1] ), dir, csv ), csv, sample );
+                }
             }
-            COMMA_THROW( comma::exception, "expected 'log:<dir>;by-size;size=<bytes>'" );
+            if( permissive ) { return nullptr; }
+            COMMA_THROW( comma::exception, "expected 'log:<dir>;by-size;size=<bytes>'; got: '" << options << "'" );
+        }
+        if( method == "by-block" )
+        {
+            return new split< T >( new splitting::by_block< T >( dir, csv ), csv, sample );
         }
-        if( method == "by-block" ) { return new split< T >( new splitting::by_block< T >( dir, csv ), csv, sample ); }
         if( permissive ) { return nullptr; }
         COMMA_THROW( comma::exception, "expected 'by-time', 'by-size' or 'by-block', got: '" << v[0] << " in '" << options << "'" );
     }
diff --git a/name_value/test/serialise_test.cpp b/name_value/test/serialise_test.cpp
index f6911ec9c..7ae8f8e79 100644
--- a/name_value/test/serialise_test.cpp
+++ b/name_value/test/serialise_test.cpp
@@ -375,14 +375,17 @@ struct forest
         struct chirp { int a{1}; int b{2}; };
         struct whistle { int a{3}; int b{4}; };
         struct warble { int x{5}; int y{6}; };
+        struct silence {};
     };
 
     struct naming { static std::array< std::string, 3 > names() { return { "chirp", "whistle", "warble" }; } };
 
     typedef comma::named_variant< naming, sounds::chirp, sounds::whistle, sounds::warble > variant_t;
-    comma::make_named_variant< naming >::variant< sounds::chirp, sounds::whistle, sounds::warble >::type madeup;
-    std::array< variant_t, 3 > choir;
-    comma::named_variant< naming, sounds::chirp, sounds::whistle, sounds::warble > sound;    
+    comma::make_named_variant< naming >::variant< sounds::chirp, sounds::whistle, sounds::warble >::type madeup; // todo
+    std::array< variant_t, 3 > choir; // todo
+    comma::named_variant< naming, sounds::chirp, sounds::whistle, sounds::warble, sounds::silence > maybesound; // todo
+    comma::named_variant< naming, sounds::chirp, sounds::whistle, sounds::warble > sound;
+    
 };
 
 namespace comma { namespace visiting {
@@ -405,18 +408,26 @@ template <> struct traits< forest::sounds::warble >
     template < typename Key, class Visitor > static void visit( Key, const forest::sounds::warble& t, Visitor& v ) { v.apply( "x", t.x ); v.apply( "y", t.y ); }
 };
 
+template <> struct traits< forest::sounds::silence >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest::sounds::silence& t, Visitor& v ) {}
+    template < typename Key, class Visitor > static void visit( Key, const forest::sounds::silence& t, Visitor& v ) {}
+};
+
 template <> struct traits< forest >
 {
     template < typename Key, class Visitor > static void visit( Key, forest& t, Visitor& v )
     {
         v.apply( "madeup", t.madeup ); // todo
         v.apply( "choir", t.choir ); // todo
+        v.apply( "maybesound", t.maybesound ); // todo
         v.apply( "sound", t.sound );
     }
     template < typename Key, class Visitor > static void visit( Key, const forest& t, Visitor& v )
     {
         v.apply( "madeup", t.madeup ); // todo
         v.apply( "choir", t.choir ); // todo
+        v.apply( "maybesound", t.maybesound ); // todo
         v.apply( "sound", t.sound );
     }
 };
@@ -425,36 +436,47 @@ template <> struct traits< forest >
 
 TEST( serialise, variant )
 {
-    forest f;
-    {
-        std::ostringstream oss;
-        comma::write_json( f, oss, false );
-        EXPECT_EQ( oss.str(), "{}" );
-    }
-    {
-        f.sound.set( forest::sounds::chirp{11, 22} );
-        std::ostringstream oss;
-        comma::write_json( f, oss, false );
-        EXPECT_EQ( oss.str(), "{\"sound\":{\"chirp\":{\"a\":11,\"b\":22}}}" );
-    }
-    {
-        f.sound.set( forest::sounds::whistle{33, 44} );
-        std::ostringstream oss;
-        comma::write_json( f, oss, false );
-        EXPECT_EQ( oss.str(), "{\"sound\":{\"whistle\":{\"a\":33,\"b\":44}}}" );
-    }
-    {
-        f.sound.set( forest::sounds::warble{55, 66} );
-        std::ostringstream oss;
-        comma::write_json( f, oss, false );
-        EXPECT_EQ( oss.str(), "{\"sound\":{\"warble\":{\"x\":55,\"y\":66}}}" );
-    }
     {
-        f.sound.reset();
-        std::ostringstream oss;
-        comma::write_json( f, oss, false );
-        EXPECT_EQ( oss.str(), "{}" );
+        forest f;
+        {
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{}" );
+        }
+        {
+            f.sound.set( forest::sounds::chirp{11, 22} );
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{\"sound\":{\"chirp\":{\"a\":11,\"b\":22}}}" );
+        }
+        {
+            f.sound.set( forest::sounds::whistle{33, 44} );
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{\"sound\":{\"whistle\":{\"a\":33,\"b\":44}}}" );
+        }
+        {
+            f.sound.set( forest::sounds::warble{55, 66} );
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{\"sound\":{\"warble\":{\"x\":55,\"y\":66}}}" );
+        }
+        {
+            f.sound.reset();
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{}" );
+        }
     }
+    // { // todo?
+    //     forest f;
+    //     std::ostringstream oss;
+    //     comma::write_json( f, oss, false );
+    //     EXPECT_EQ( oss.str(), "{}" );
+    //     f.maybesound.set( forest::sounds::silence() );
+    //     comma::write_json( f, oss, false );
+    //     //EXPECT_EQ( oss.str(), "{\"sound\":{\"silence\":\"\"}}" );
+    // }
 }
 
 TEST( deserialise, variant )

From 9a196d6601f47c71a22f042479d4f85956c5a96d Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 17 May 2024 15:40:47 +1000
Subject: [PATCH 0814/1056] csv::split: typo fixed; debugging...

---
 csv/split.h | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/csv/split.h b/csv/split.h
index a5931e186..bd52ed6ce 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -152,9 +152,9 @@ template < typename T > inline split< T >& split< T >::write( const T& t, const
         _os = os;
         _ostream = std::make_unique< output_stream< T > >( *_os, _options, _sample );
     }
-    _ostream.write( t );
+    _ostream->write( t );
     if( buf ) { _os->write( buf, size ); }
-    _how->wrote( _ostream.last_size() + size );
+    _how->wrote( _ostream->last_size() + size );
     return *this;
 }
 

From f82b3f172e0cc13761ba06b2ee65fe87d510ccd2 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 17 May 2024 15:53:19 +1000
Subject: [PATCH 0815/1056] csv::split: another typo fixed; debugging...

---
 csv/split.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/split.h b/csv/split.h
index bd52ed6ce..d1e89ef85 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -160,7 +160,7 @@ template < typename T > inline split< T >& split< T >::write( const T& t, const
 
 template < typename T > inline split< T >* split< T >::make( const std::string& options, const csv::options& csv, bool permissive, const T& sample )
 {
-    const auto& v = comma::split_head( options, 1, ':' );
+    const auto& v = comma::split_head( options, 2, ':' );
     if( v[0] == "split" ) { COMMA_THROW( comma::exception, "on '" << options << "': 'split': todo, just ask" ); }
     if( v[0] == "log" ) // todo: reimplement using comma::variant
     {

From cbe844d9b576e02f31efa53a268a8558ecf0bf68 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 20 May 2024 10:42:54 +1000
Subject: [PATCH 0816/1056] csv::split: by-size::wrote(): bug fixed: reset once
 size is reached

---
 csv/split.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/split.h b/csv/split.h
index d1e89ef85..f654d6513 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -245,7 +245,7 @@ inline bool by_size< T >::_is_due( unsigned int extra_size )
 template < typename T >
 inline void by_size< T >::wrote( unsigned int size )
 {
-    _remaining = _remaining > size ? _remaining - size : 0;
+    _remaining = _remaining >= size ? _remaining - size : 0;
     if( _record_size ) { return; }
     ++_count;
     if( _count == 1 ) { _average_record_size = size; return; }

From 21d7a7abdb59ecf30c8758e3a513222881496536 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 29 May 2024 14:50:57 +1000
Subject: [PATCH 0817/1056] csv::split::write(): flush flag added

---
 csv/split.h | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/csv/split.h b/csv/split.h
index f654d6513..f58918025 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -121,7 +121,8 @@ class split
 {
     public:
         split( splitting::method< T >* how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) {}
-        split& write( const T& t, const char* buf, unsigned int size );
+        split& write( const T& t, const char* buf, unsigned int size, bool flush = false );
+        void flush() { if( _os ) { _os->flush(); } }
         split& operator<<( const T& t ) { return write( t, nullptr, 0 ); }
         bool eof() const { return _eof || ( _os && _os->eof() ); }
         static split< T >* make( const std::string& options, const csv::options& csv, bool permissive = false, const T& sample = T() );
@@ -136,7 +137,7 @@ class split
         void _init();
 };
 
-template < typename T > inline split< T >& split< T >::write( const T& t, const char* buf, unsigned int size )
+template < typename T > inline split< T >& split< T >::write( const T& t, const char* buf, unsigned int size, bool flusj )
 {
     COMMA_ASSERT( !_eof, "end of stream" );
     std::ostream* os = _how->stream( t );
@@ -154,6 +155,7 @@ template < typename T > inline split< T >& split< T >::write( const T& t, const
     }
     _ostream->write( t );
     if( buf ) { _os->write( buf, size ); }
+    if( flush ) { _os->flush(); }
     _how->wrote( _ostream->last_size() + size );
     return *this;
 }

From b8287f17c75e3cb8c60d5b555cf6282258267ae5 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 29 May 2024 14:53:42 +1000
Subject: [PATCH 0818/1056] csv::split::write(): flush flag: trivial typo

---
 csv/split.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/split.h b/csv/split.h
index f58918025..472732566 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -137,7 +137,7 @@ class split
         void _init();
 };
 
-template < typename T > inline split< T >& split< T >::write( const T& t, const char* buf, unsigned int size, bool flusj )
+template < typename T > inline split< T >& split< T >::write( const T& t, const char* buf, unsigned int size, bool flush )
 {
     COMMA_ASSERT( !_eof, "end of stream" );
     std::ostream* os = _how->stream( t );

From c8f843e0e1a2aa501b004715caf2727e9ae4adae Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 29 May 2024 17:22:32 +1000
Subject: [PATCH 0819/1056] util/applications/comma-top

---
 util/applications/comma-top | 121 ++++++++++++++++--------------------
 1 file changed, 54 insertions(+), 67 deletions(-)

diff --git a/util/applications/comma-top b/util/applications/comma-top
index 55cf66aef..43d9d702c 100755
--- a/util/applications/comma-top
+++ b/util/applications/comma-top
@@ -29,32 +29,15 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-name=$( basename $0 )
-
-source $( which comma-application-util ) 2>/dev/null || { echo "$name: could not source 'comma-application-util'" >&2; exit 1; }
-
-function description()
-{
-    cat <<EOF
---help,-h; show this help
---accumulated; if present for --io, passed to iotop
---debug; much more debug output
---io; if present, run iotop instead of top
---output-fields; output the field names to stdout and exit
---num-procs=[<N>]; output the top N processes (default: totals)
---num-samples=[<N>]; number of samples to take, default: forever, until terminated
---sampling-interval,--delay=[<time>]; sampling interval, see '-d' option of top (1), default: defined by top (1)
---top-options=[<options>]; extra command line argument(s) pass to the top (1) utility
-EOF
-}
+source $( type -p comma-application-util ) 2>/dev/null || { echo "io-top: could not source 'comma-application-util'" >&2; exit 1; }
 
 function usage()
 {
-    cat >&2 <<EOF
+    cat <<eof
 Invokes the performance monitoring utility top (1) or iotop in continuous mode, parses
 top (1) output, and collects the results into CVS file (sent to stdout).
 
-Usage: ${name} <options> [ > output_file.csv ]
+Usage: io-top <options> [ > output_file.csv ]
 
 Note: top (1) output is affected by its global and user configuration files.
 There is no option to ignore those files. This utility assumes the default format
@@ -62,29 +45,36 @@ of top (1) output and will fail if alternative output layout is enforced through
 the configuration file(s). It shall be possible to explicitly mandate the desired
 output layout through command-line switches to top that override configuration
 files. This is a possible future extension.
+eof
+}
 
-Options:
-EOF
-    description | sed 's/^/    /g' >&2
-    cat >&2 <<EOF
-
-Examples:
-
-    Collect data until terminated by the user:
-
-        $name > results.csv
-
-    Take 1000 samples and quit (default sampling interval of top (1) is 3s; thus,
+function epilogue()
+{
+    cat << eof
+examples
+    collect data until terminated by the user:
+        io-top > results.csv
+    take 1000 samples and quit (default sampling interval of top (1) is 3s; thus,
     collect 3000s of data):
+        io-top --num-samples=1000 > results.csv
+    facilitate parsing io-top output:
+        io-top --output-fields
+eof
+}
 
-        $name --num-samples=1000 > results.csv
-
-    Facilitate parsing $name output:
-
-        $name --output-fields
-
-EOF
-    exit 0
+function options-description()
+{
+    cat <<eof
+--help,-h; show this help
+--accumulated; if present for --io, passed to iotop
+--debug; much more debug output
+--io; if present, run iotop instead of top
+--num-procs,--number-of-processes,--processes=[<N>]; output the top N processes (default: totals)
+--num-samples,--number-of-samples,--samples=[<N>]; number of samples to take, default: forever, until terminated
+--output-fields; output the field names to stdout and exit
+--sampling-interval,--delay=[<time>]; sampling interval, see '-d' option of top (1), default: defined by top (1)
+--top-options=[<options>]; extra command line argument(s) pass to the top (1) utility
+eof
 }
 
 function feeder()
@@ -93,9 +83,7 @@ function feeder()
     local extra_opts=$2
     local top_opts="-b $extra_opts"
     [[ -n "$num" ]] && top_opts="$top_opts -n $num"
-    
-    # make all buffering per-line
-    stdbuf -oL -eL top $top_opts 
+    stdbuf -oL -eL top $top_opts # make all buffering per-line
 }
 
 function extract_cpus()
@@ -123,6 +111,7 @@ function parser_totals()
     local timestamp line first shared
     first="true"
     grep --line-buffered -A 4 '^top' \
+    | tee 0.csv \
     | while true ; do
         read line
         [[ -z "$line" ]] && break
@@ -136,33 +125,36 @@ function parser_totals()
         [[ "$line" = "KiB Swap"* ]] && { extract_mem  "$line" ; echo ; }
         [[ "$line" = "--" ]] && first="true"
     done \
-    | sed -u -n '1!p'
+    | tee 1.csv \
+    | sed -u -n '1!p' \
+    | tee 2.csv
 }
 
 function parser_num_procs()
 {
-    grep --line-buffered -E -A $((num_procs + 1)) '^[ ]+PID ' \
+    grep --line-buffered -E -A $((options_num_procs + 1)) '^[ ]+PID ' \
     | sed -r -u -n 's/[[:blank:]]+/,/g ; s/^,// ; /^[0-9]+,/p'
 }
 
 io_payload_fields="total/read,total/write,actual/read,actual/write"
 io_fields="timestamp,$io_payload_fields"
-total_fields="timestamp,cpu/user,cpu/system,cpu/total,memory/ram,memory/shared,memory/swap"
+all_fields="timestamp,cpu/user,cpu/system,cpu/total,memory/ram,memory/shared,memory/swap"
 procs_fields="timestamp,pid,user,priority,nice,memory/virtual,memory/physical,memory/shared,status,cpu/percent,memory/percent,uptime,command"
 
-function output_fields()
+function maybe_output_fields()
 {
-    if (( $( comma_options_has --io $@ ) )) ; then echo $io_fields
-    elif (( $(comma_options_has --num-procs $@ ) )); then echo $procs_fields
-    else echo "$total_fields" ; fi
+    (( options_output_fields )) || return
+    if (( options_io )) ; then echo $io_fields; exit; fi
+    if (( options_num_procs )); then echo $procs_fields; exit; fi
+    echo "$all_fields"; exit
 }
 
 function run_iotop()
 {
     local total actual
-    [[ -z "$sampling_interval" ]] || delay="--delay=$sampling_interval"
-    [[ -z "$accumulated" ]] || accumulated="--accumulated"
-    sudo iotop --batch --kilobytes -o $delay $accumulated $top_options \
+    [[ -z "$options_sampling_interval" ]] || delay="--delay=$options_sampling_interval"
+    [[ -z "$options_accumulated" ]] || options_accumulated="--accumulated"
+    sudo iotop --batch --kilobytes -o $delay $options_accumulated $options_top_options \
         | egrep -e 'Total DISK|Actual DISK' --line-buffered \
         | sed -u -e 's#[a-zA-Z:/ ]##g' -e 's/|/,/g' \
         | while read total ; do
@@ -173,22 +165,17 @@ function run_iotop()
         | csv-time-stamp 2>/dev/null
 }
 
-if (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )) ; then usage ; exit ; fi
-if (( $( comma_options_has --output-fields "$@" ) )) ; then output_fields "$@" ; exit ; fi
-
-debug=0
-
-description | comma-options-validate "$@"
-comma_path_value_to_var --export < <( description | comma-options-to-name-value "$@" )
-
-if [[ -n "$io" ]] ; then
+options-description | comma-options-validate "$@"
+comma-application-init $@ < <( options-description ) || die "failed" # comma_path_value_to_var --export < <( description | comma-options-to-name-value "$@" )
+maybe_output_fields
+if [[ -n "$options_io" ]] ; then
     [[ -n "$( sudo which iotop )" ]] || { echo "comma-top: make sure iotop installed" >&2 ; exit 1 ; }
     run_iotop
 else
     feeder_opts=""
-    [[ -n "$sampling_interval" ]] && feeder_opts="-d $sampling_interval"
-    [[ -n "$top_options" ]] && feeder_opts="$feeder_opts $top_options"
-    [[ -n "$num_samples" && -z "$num_procs" ]] && (( ++num_samples )) # first line will be ignored, leaving num_samples lines
-    if [[ -n "$num_procs" ]]; then parser="parser_num_procs"; else parser="parser_totals"; fi
-    feeder "$num_samples" "$feeder_opts" "$num_procs" | $parser | csv-time-stamp 2>/dev/null 
+    [[ -n "$options_sampling_interval" ]] && feeder_opts="-d $options_sampling_interval"
+    [[ -n "$options_top_options" ]] && feeder_opts="$feeder_opts $options_top_options"
+    [[ -n "$options_num_samples" && -z "$options_num_procs" ]] && (( ++options_num_samples )) # first line will be ignored, leaving options_num_samples lines
+    if [[ -n "$options_num_procs" ]]; then parser="parser_num_procs"; else parser="parser_totals"; fi
+    feeder "$options_num_samples" "$feeder_opts" "$options_num_procs" | $parser | tee 3.csv | csv-time-stamp 2>/dev/null
 fi

From 6729f9280c0f04471bd2dd5bafaeeecd7297b309 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 29 May 2024 17:36:30 +1000
Subject: [PATCH 0820/1056] comma-top: brushed up, default mode: bug fixed in
 quick and dirty top output parsing

---
 util/applications/comma-top | 15 +++++----------
 1 file changed, 5 insertions(+), 10 deletions(-)

diff --git a/util/applications/comma-top b/util/applications/comma-top
index 43d9d702c..bf55b082d 100755
--- a/util/applications/comma-top
+++ b/util/applications/comma-top
@@ -31,14 +31,12 @@
 
 source $( type -p comma-application-util ) 2>/dev/null || { echo "io-top: could not source 'comma-application-util'" >&2; exit 1; }
 
-function usage()
+function prologue()
 {
     cat <<eof
 Invokes the performance monitoring utility top (1) or iotop in continuous mode, parses
 top (1) output, and collects the results into CVS file (sent to stdout).
 
-Usage: io-top <options> [ > output_file.csv ]
-
 Note: top (1) output is affected by its global and user configuration files.
 There is no option to ignore those files. This utility assumes the default format
 of top (1) output and will fail if alternative output layout is enforced through
@@ -108,8 +106,7 @@ function extract_mem()
 function parser_totals()
 {
     shopt -s extglob
-    local timestamp line first shared
-    first="true"
+    local timestamp line first="true" shared
     grep --line-buffered -A 4 '^top' \
     | tee 0.csv \
     | while true ; do
@@ -120,9 +117,8 @@ function parser_totals()
             first="false"
         }
         [[ "$line" = "%Cpu(s)"* ]]  && extract_cpus "$line"
-        [[ "$line" = "KiB Mem"* ]]  && { extract_mem  "$line" ; echo -n ",$shared" ; }
-        # swap is last, finish the line
-        [[ "$line" = "KiB Swap"* ]] && { extract_mem  "$line" ; echo ; }
+        [[ "$line" = [KMG]"iB Mem"* || "$line" = [KMG]"iB Mem"* ]]  && { extract_mem  "$line" ; echo -n ",$shared" ; }
+        [[ "$line" = [KMG]"iB Swap"* || "$line" = [KMG]"iB Swap"* ]] && { extract_mem  "$line" ; echo ; } # swap is last, finish the line
         [[ "$line" = "--" ]] && first="true"
     done \
     | tee 1.csv \
@@ -133,7 +129,7 @@ function parser_totals()
 function parser_num_procs()
 {
     grep --line-buffered -E -A $((options_num_procs + 1)) '^[ ]+PID ' \
-    | sed -r -u -n 's/[[:blank:]]+/,/g ; s/^,// ; /^[0-9]+,/p'
+        | sed -r -u -n 's/[[:blank:]]+/,/g ; s/^,// ; /^[0-9]+,/p'
 }
 
 io_payload_fields="total/read,total/write,actual/read,actual/write"
@@ -165,7 +161,6 @@ function run_iotop()
         | csv-time-stamp 2>/dev/null
 }
 
-options-description | comma-options-validate "$@"
 comma-application-init $@ < <( options-description ) || die "failed" # comma_path_value_to_var --export < <( description | comma-options-to-name-value "$@" )
 maybe_output_fields
 if [[ -n "$options_io" ]] ; then

From 2592263880a1ea04ccef3580266f0216092975c9 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 3 Jun 2024 17:15:51 +1000
Subject: [PATCH 0821/1056] name-value-from-csv: unnamed: bug fixed:
 --unquote-numbers added to the list of valueless options

---
 name_value/applications/name-value-from-csv.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/name_value/applications/name-value-from-csv.cpp b/name_value/applications/name-value-from-csv.cpp
index a5cb18ffc..eddcd99cd 100644
--- a/name_value/applications/name-value-from-csv.cpp
+++ b/name_value/applications/name-value-from-csv.cpp
@@ -105,7 +105,7 @@ int main( int ac, char** av )
         
         if( fields.empty() )
         { 
-            const std::vector< std::string >& unnamed = options.unnamed( "--strict,--no-brackets,--output-line-number,--line-number,-n,--indices", "-.*" );
+            const std::vector< std::string >& unnamed = options.unnamed( "--strict,--no-brackets,--output-line-number,--line-number,-n,--indices,--unquote-numbers", "-.*" );
             if( unnamed.empty() || unnamed[0].empty() ) { std::cerr << "name-value-from-csv: please specify fields" << std::endl; return 1; }
             fields = unnamed[0];
         }

From ff38e79c310a30d2bf2e7c09e8eb069e388a1b47 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 6 Jun 2024 16:59:15 +1000
Subject: [PATCH 0822/1056] csv-time-join: --output-diff implemented

---
 csv/applications/csv-time-join.cpp | 847 +++++++++++++++--------------
 1 file changed, 433 insertions(+), 414 deletions(-)

diff --git a/csv/applications/csv-time-join.cpp b/csv/applications/csv-time-join.cpp
index 290cbeeff..227f8fea0 100644
--- a/csv/applications/csv-time-join.cpp
+++ b/csv/applications/csv-time-join.cpp
@@ -1,414 +1,433 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-
-/// @author vsevolod vlaskine
-
-#include <deque>
-#include <iostream>
-#include <string>
-#include <boost/date_time/posix_time/posix_time.hpp>
-#include <boost/optional.hpp>
-#include "../../application/command_line_options.h"
-#include "../../application/signal_flag.h"
-#include "../../base/types.h"
-#include "../../csv/stream.h"
-#include "../../io/stream.h"
-#include "../../csv/traits.h"
-#include "../../io/select.h"
-#include "../../name_value/parser.h"
-#include "../../string/string.h"
-#include "../../visiting/traits.h"
-
-static void bash_completion( unsigned const ac, char const * const * av )
-{
-    static const char* completion_options =
-        " --help --verbose"
-        " --by-lower --by-upper --nearest --realtime"
-        " --binary --delimiter --fields"
-        " --bound --do-not-append --select --timestamp-only"
-        " --buffer --discard-bounding"
-        ;
-    std::cout << completion_options << std::endl;
-    exit( 0 );
-}
-
-static void usage( bool verbose )
-{
-    std::cerr << std::endl;
-    std::cerr << "join timestamped data from stdin with corresponding timestamped data from the" << std::endl;
-    std::cerr << "second input" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "timestamps are expected to be fully ordered" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "note: on windows only files are supported as bounding data" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: cat a.csv | csv-time-join <how> [<options>] bounding.csv [-] > joined.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<how>" << std::endl;
-    std::cerr << "    --by-lower: join by lower timestamp (default)" << std::endl;
-    std::cerr << "    --by-upper: join by upper timestamp" << std::endl;
-    std::cerr << "    --nearest:  join by nearest timestamp" << std::endl;
-    std::cerr << "                if 'block' given in --fields, output the whole block" << std::endl;
-    std::cerr << "    --realtime: (streams only) output input immediately joined with current" << std::endl;
-    std::cerr << "                latest bounding timestamp. The joined bounding timestamp may" << std::endl;
-    std::cerr << "                be less than or greater than the timestamp from stdin." << std::endl;
-    std::cerr << "                No timestamp comparisons are made before outputting a record." << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<input/output options>" << std::endl;
-    std::cerr << "    -: if csv-time-join - b.csv, concatenate output as: <stdin><b.csv>" << std::endl;
-    std::cerr << "       if csv-time-join b.csv -, concatenate output as: <b.csv><stdin>" << std::endl;
-    std::cerr << "       default: csv-time-join - b.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    --help,-h:                  this help" << std::endl;
-    std::cerr << "    --verbose,-v:               more output" << std::endl;
-    std::cerr << "    --binary,-b <format>:       binary format" << std::endl;
-    std::cerr << "    --delimiter,-d <delimiter>: ascii only; default ','" << std::endl;
-    std::cerr << "    --fields,-f <fields>:       input fields; default: t" << std::endl;
-    std::cerr << "    --bound=[<seconds>]:        output only points within given bound" << std::endl;
-    std::cerr << "    --do-not-append,--select:   do not append any field from the second input" << std::endl;
-    std::cerr << "    --timestamp-only:           append only timestamp from the second input" << std::endl;
-    std::cerr << "    --buffer=[<records>]:       bounding data buffer size; default: infinite" << std::endl;
-    std::cerr << "    --discard-bounding:         discard bounding data if buffer size reached;" << std::endl;
-    std::cerr << "                                default is to block until stdin catches up" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << "    first field on stdin is timestamp, the first field of filter is timestamp" << std::endl;
-    std::cerr << "        - default:" << std::endl;
-    std::cerr << "            cat a.csv | csv-time-join b.csv" << std::endl;
-    std::cerr << "        - explicit:" << std::endl;
-    std::cerr << "            cat a.csv | csv-time-join --fields=t \"b.csv;fields=t\"" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    3rd field on stdin is timestamp, the 2nd field of filter is timestamp" << std::endl;
-    std::cerr << "        cat a.csv | csv-time-join --fields=,,t \"b.csv;fields=,t\"" << std::endl;
-    std::cerr << std::endl;
-    if( verbose )
-    {
-        std::cerr << "    echo \"20170101T115955,a\" >  a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120001,b\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120002,c\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120007,d\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120012,e\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120015,f\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120000,y\" >  b.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120010,z\" >> b.csv" << std::endl;
-        std::cerr << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --by-upper" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2 --select" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2 --timestamp-only" << std::endl;
-        std::cerr << std::endl;
-        std::cerr << "    ( sleep 1; cat a.csv ) | csv-play |" << std::endl;
-        std::cerr << "        csv-time-join --realtime <( cat b.csv | csv-play )" << std::endl;
-}
-    else
-    {
-        std::cerr << "    try --help --verbose for more examples" << std::endl;
-    }
-    std::cerr << std::endl;
-    std::cerr << std::endl;
-    exit( 0 );
-}
-
-struct Point
-{
-    boost::optional<boost::posix_time::ptime> timestamp;
-    Point() {}
-    Point( const boost::posix_time::ptime& timestamp ) : timestamp( timestamp ) {}
-};
-
-namespace comma { namespace visiting {
-
-template <> struct traits< Point >
-{
-    template < typename K, typename V > static void visit( const K&, const Point& p, V& v ) { v.apply( "t", p.timestamp ); }
-    template < typename K, typename V > static void visit( const K&, Point& p, V& v ) { v.apply( "t", p.timestamp ); }
-};
-    
-} } // namespace comma { namespace visiting {
-
-enum class how { by_lower, by_upper, nearest, realtime };
-how method = how::by_lower;
-bool timestamp_only;
-bool select_only;
-comma::csv::options stdin_csv;
-comma::csv::options bounding_csv;
-boost::optional< boost::posix_time::time_duration > bound;
-typedef std::pair< boost::posix_time::ptime, std::string > timestring_t;
-
-boost::posix_time::ptime get_time( const Point& p ) { return p.timestamp ? *p.timestamp : boost::posix_time::microsec_clock::universal_time(); }
-
-static void output_bounding( std::ostream& os, const timestring_t& bounding, bool stdin_first )
-{
-    if( !select_only )
-    {
-        if( stdin_csv.binary() )
-        {
-            if( timestamp_only )
-            {
-                static const unsigned int time_size = comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::size;
-                static char timestamp[ time_size ];
-                comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::to_bin( bounding.first, timestamp );
-                os.write( (char*)&timestamp, time_size );
-            }
-            else
-            {
-                os.write( &bounding.second[0], bounding.second.size() );
-            }
-        }
-        else
-        {
-            if( stdin_first ) { os << stdin_csv.delimiter; }
-            os << ( timestamp_only ? boost::posix_time::to_iso_string( bounding.first ) : bounding.second );
-            if( !stdin_first ) { os << stdin_csv.delimiter; }
-        }
-    }
-}
-
-static void output_input( std::ostream& os, const timestring_t& input )
-{
-    if( stdin_csv.binary() ) { os.write( &input.second[0], stdin_csv.format().size() ); } else { os << input.second; }
-}
-
-static void output( const timestring_t& input, const timestring_t& bounding, bool stdin_first )
-{
-    if( bounding.first.is_infinity() ) { return; }
-    if( bound && ( input.first - bounding.first > bound || bounding.first - input.first > bound )) { return; }
-    if( stdin_first )
-    {
-        output_input( std::cout, input );
-        output_bounding( std::cout, bounding, stdin_first );
-    }
-    else
-    {
-        output_bounding( std::cout, bounding, stdin_first );
-        output_input( std::cout, input );
-    }
-    if( !stdin_csv.binary() ) { std::cout << '\n'; }
-    std::cout.flush();
-}
-
-int main( int ac, char** av )
-{
-    try
-    {
-        comma::signal_flag is_shutdown(comma::signal_flag::hard);
-        comma::command_line_options options( ac, av, usage );
-        if( options.exists( "--bash-completion" )) bash_completion( ac, av );
-        options.assert_mutually_exclusive( "--by-lower,--by-upper,--nearest,--realtime" );
-        if( options.exists( "--by-upper" )) { method = how::by_upper; }
-        if( options.exists( "--nearest" )) { method = how::nearest; }
-        if( options.exists( "--realtime" )) { method = how::realtime; }
-        timestamp_only = options.exists( "--timestamp-only,--time-only" );
-        select_only = options.exists( "--do-not-append,--select" );
-        if( select_only && timestamp_only ) { std::cerr << "csv-time-join: --timestamp-only specified with --select, ignoring --timestamp-only" << std::endl; }
-        bool discard_bounding = options.exists( "--discard-bounding" );
-        boost::optional< unsigned int > buffer_size = options.optional< unsigned int >( "--buffer" );
-        if( options.exists( "--bound" ) ) { bound = boost::posix_time::microseconds( static_cast<unsigned int>(options.value< double >( "--bound" ) * 1000000 )); }
-        stdin_csv = comma::csv::options( options, "t" );
-        std::vector< std::string > unnamed = options.unnamed(
-            "--by-lower,--by-upper,--nearest,--realtime,--select,--do-not-append,--timestamp-only,--time-only,--discard-bounding",
-            "--binary,-b,--delimiter,-d,--fields,-f,--bound,--buffer,--verbose,-v" );
-        std::string properties;
-        bool stdin_first = true;
-        switch( unnamed.size() )
-        {
-            case 0:
-                std::cerr << "csv-time-join: please specify bounding source" << std::endl;
-                return 1;
-            case 1:
-                properties = unnamed[0];
-                break;
-            case 2:
-                if( unnamed[0] == "-" ) { properties = unnamed[1]; }
-                else if( unnamed[1] == "-" ) { properties = unnamed[0]; stdin_first = false; }
-                else { std::cerr << "csv-time-join: expected either '- <bounding>' or '<bounding> -'; got : " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
-                break;
-            default:
-                std::cerr << "csv-time-join: expected either '- <bounding>' or '<bounding> -'; got : " << comma::join( unnamed, ' ' ) << std::endl;
-                return 1;
-        }
-        comma::name_value::parser parser( "filename" );
-        bounding_csv = parser.get< comma::csv::options >( properties );
-        if( bounding_csv.fields.empty() ) { bounding_csv.fields = "t"; }
-
-        comma::csv::input_stream< Point > stdin_stream( std::cin, stdin_csv );
-        #ifdef WIN32
-        if( stdin_csv.binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
-        #endif // #ifdef WIN32
-
-        comma::io::istream bounding_istream( comma::split( properties, ';' )[0], bounding_csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii );
-        comma::csv::input_stream< Point > bounding_stream( *bounding_istream, bounding_csv );
-
-        #ifndef WIN32
-        comma::io::select select;
-        comma::io::select bounding_stream_select;
-        select.read().add( 0 );
-        select.read().add( bounding_istream.fd() );
-        bounding_stream_select.read().add( bounding_istream.fd() );
-        #endif // #ifndef WIN32
-
-        const Point* p = NULL;
-        if( method == how::realtime )
-        {
-            #ifdef WIN32
-            COMMA_THROW( comma::exception, "--realtime mode not supported in WIN32" );
-            #else
-            bool end_of_input = false;
-            bool end_of_bounds = false;
-            boost::optional< timestring_t > joined_line;
-            while( !is_shutdown && !end_of_input )
-            {
-                if( !bounding_stream.ready() && !stdin_stream.ready() ) { select.wait(boost::posix_time::milliseconds(1)); }
-                if( !is_shutdown && !end_of_input && ( stdin_stream.ready() || ( select.check() && select.read().ready( comma::io::stdin_fd ) ) ) )
-                {
-                    p = stdin_stream.read();
-                    if( p )
-                    {
-                        timestring_t input_line = std::make_pair( get_time( *p ), stdin_stream.last() );
-                        if( joined_line ) { output( input_line, *joined_line, stdin_first ); }
-                    }
-                    else
-                    {
-                        comma::verbose << "end of input stream" << std::endl;
-                        end_of_input = true;
-                    }
-                }
-                if( !is_shutdown && !end_of_bounds && ( bounding_stream.ready() || ( select.check() && select.read().ready( bounding_istream.fd() ) ) ) )
-                {
-                    p = bounding_stream.read();
-                    if( p )
-                    {
-                        joined_line = std::make_pair( get_time( *p ), bounding_stream.last() );
-                    }
-                    else
-                    {
-                        comma::verbose << "end of bounding stream" << std::endl;
-                        end_of_bounds = true;
-                    }
-                }
-            }
-            if( is_shutdown ) { comma::verbose << "got a signal" << std::endl; return 0; }
-            #endif // #ifdef WIN32
-        }
-        else
-        {
-            std::deque< timestring_t > bounding_queue;
-            bool next = true;
-            bool bounding_data_available;
-            bool upper_bound_added = false;
-            bounding_queue.push_back( std::make_pair( boost::posix_time::neg_infin, "" ) ); // add a fake entry for an lower bound to allow stdin before first bound to match
-            while( stdin_stream.ready() || ( std::cin.good() && !std::cin.eof() ) )
-            {
-                if( !std::cin.good() ) { select.read().remove( 0 ); }
-                if( !bounding_istream->good() ) { select.read().remove( bounding_istream.fd() ); }
-                bounding_data_available = bounding_stream.ready() || ( bounding_istream->good() && !bounding_istream->eof() );
-                #ifdef WIN32
-                bool bounding_stream_ready = true;
-                bool stdin_stream_ready = true;
-                #else // #ifdef WIN32
-                //check so we do not block
-                bool bounding_stream_ready = bounding_stream.ready();
-                bool stdin_stream_ready = stdin_stream.ready();
-                if( next )
-                {
-                    if( !bounding_stream_ready || !stdin_stream_ready )
-                    {
-                        if( !bounding_stream_ready && !stdin_stream_ready ) { select.wait( boost::posix_time::milliseconds( 10 ) ); }
-                        else { select.check(); }
-                        if( select.read().ready( bounding_istream.fd() )) { bounding_stream_ready = true; }
-                        if( select.read().ready(0) ) { stdin_stream_ready = true; }
-                    }
-                }
-                else
-                {
-                    if( !bounding_stream_ready )
-                    {
-                        bounding_stream_select.wait( boost::posix_time::milliseconds( 10 ) );
-                        if( bounding_stream_select.read().ready( bounding_istream.fd() )) { bounding_stream_ready=true; }
-                    }
-                }
-                #endif //#ifdef WIN32
-                //keep storing available bounding data
-                if( bounding_stream_ready )
-                {
-                    if( !buffer_size || bounding_queue.size() < *buffer_size || discard_bounding )
-                    {
-                        const Point* q = bounding_stream.read();
-                        if( q ) { bounding_queue.push_back( std::make_pair( get_time( *q ), bounding_stream.last() )); }
-                        else { bounding_data_available = false; }
-                    }
-                    if( buffer_size && bounding_queue.size() > *buffer_size && discard_bounding ) { bounding_queue.pop_front(); }
-                }
-                if( !upper_bound_added && bounding_istream->eof() )
-                {
-                    // add a fake entry for an upper bound to allow stdin data above last bound to match
-                    bounding_queue.push_back( std::make_pair( boost::posix_time::pos_infin, "" ));
-                    upper_bound_added = true;
-                }
-                //if we are done with the last bounded point get next
-                if( next )
-                {
-                    if( !stdin_stream_ready ) { continue; }
-                    p = stdin_stream.read();
-                    if( !p ) { break; }
-                }
-                boost::posix_time::ptime t = get_time( *p );
-                //get bound
-                for( ; bounding_queue.size() >= 2 && t >= bounding_queue[1].first; bounding_queue.pop_front() );
-                if( bounding_queue.size() < 2 )
-                {
-                    //bound not found
-                    //do we have more data?
-                    if( !bounding_data_available ) { break; }
-                    next = false;
-                    continue;
-                }
-                //bound available
-                if( method == how::by_lower && t < bounding_queue.front().first )
-                {
-                    next = true;
-                    continue;
-                }
-                bool is_first = ( method == how::by_lower )
-                    || ( method == how::nearest && ( t - bounding_queue[0].first ) < ( bounding_queue[1].first - t ));
-                const timestring_t& chosen_bound = is_first ? bounding_queue[0] : bounding_queue[1];;
-                timestring_t input_line = std::make_pair( t, stdin_stream.last() );
-                output( input_line, chosen_bound, stdin_first );
-                next = true;
-            }
-        }
-        return 0;     
-    }
-    catch( std::exception& ex ) { std::cerr << "csv-time-join: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-time-join: unknown exception" << std::endl; }
-    return 1;
-}
+// This file is part of comma, a generic and flexible library
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+
+/// @author vsevolod vlaskine
+
+#include <cmath>
+#include <deque>
+#include <iostream>
+#include <string>
+#include <boost/date_time/posix_time/posix_time.hpp>
+#include <boost/optional.hpp>
+#include "../../application/command_line_options.h"
+#include "../../application/signal_flag.h"
+#include "../../base/types.h"
+#include "../../csv/stream.h"
+#include "../../io/stream.h"
+#include "../../csv/traits.h"
+#include "../../io/select.h"
+#include "../../name_value/parser.h"
+#include "../../string/string.h"
+#include "../../visiting/traits.h"
+
+static void bash_completion( unsigned const ac, char const * const * av ) // print the long options for shell completion to stdout and exit; ac and av are not used
+{
+    static const char* completion_options = // space-separated list; keep in sync with the options parsed in main()
+        " --help --verbose"
+        " --by-lower --by-upper --nearest --realtime"
+        " --binary --delimiter --fields"
+        " --bound --do-not-append --select --timestamp-only --time-only"
+        " --buffer --discard-bounding --output-diff --diff --output-diff-abs --abs-diff"
+        ;
+    std::cout << completion_options << std::endl;
+    exit( 0 ); // terminates the process with status 0, so this function never returns
+}
+
+static void usage( bool verbose ) // print the help text to stderr and exit with status 0; verbose adds a worked example
+{
+    std::cerr << std::endl;
+    std::cerr << "join timestamped data from stdin with corresponding timestamped data from the" << std::endl;
+    std::cerr << "second input" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "timestamps are expected to be fully ordered" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "note: on windows only files are supported as bounding data" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: cat a.csv | csv-time-join <how> [<options>] bounding.csv [-] > joined.csv" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "<how>" << std::endl;
+    std::cerr << "    --by-lower: join by lower timestamp (default)" << std::endl;
+    std::cerr << "    --by-upper: join by upper timestamp" << std::endl;
+    std::cerr << "    --nearest:  join by nearest timestamp" << std::endl;
+    std::cerr << "                if 'block' given in --fields, output the whole block" << std::endl;
+    std::cerr << "    --realtime: (streams only) output input immediately joined with current" << std::endl;
+    std::cerr << "                latest bounding timestamp. The joined bounding timestamp may" << std::endl;
+    std::cerr << "                be less than or greater than the timestamp from stdin." << std::endl;
+    std::cerr << "                No timestamp comparisons are made before outputting a record." << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "<input/output options>" << std::endl;
+    std::cerr << "    -: if csv-time-join - b.csv, concatenate output as: <stdin><b.csv>" << std::endl;
+    std::cerr << "       if csv-time-join b.csv -, concatenate output as: <b.csv><stdin>" << std::endl;
+    std::cerr << "       default: csv-time-join - b.csv" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    --help,-h:                    this help" << std::endl;
+    std::cerr << "    --verbose,-v:                 more output" << std::endl;
+    std::cerr << "    --binary,-b <format>:         binary format" << std::endl;
+    std::cerr << "    --delimiter,-d <delimiter>:   ascii only; default ','" << std::endl;
+    std::cerr << "    --fields,-f <fields>:         input fields; default: t" << std::endl;
+    std::cerr << "    --bound=[<seconds>]:          output only points within given bound" << std::endl;
+    std::cerr << "    --buffer=[<records>]:         bounding data buffer size; default: infinite" << std::endl;
+    std::cerr << "    --discard-bounding:           discard bounding data if buffer size reached;" << std::endl;
+    std::cerr << "                                  default is to block until stdin catches up" << std::endl;
+    std::cerr << "    --do-not-append,--select:     do not append any field from the second input" << std::endl;
+    std::cerr << "    --output-diff-abs,--abs-diff: append abs difference between first and second input" << std::endl;
+    std::cerr << "                                  input timestamps as seconds (double)" << std::endl;
+    std::cerr << "    --output-diff,--diff:         append difference between first and second input" << std::endl;
+    std::cerr << "                                  input timestamps as seconds (double)" << std::endl;
+    std::cerr << "    --timestamp-only,--time-only: append only timestamp from the second input" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "examples" << std::endl;
+    std::cerr << "    first field on stdin is timestamp, the first field of filter is timestamp" << std::endl;
+    std::cerr << "        - default:" << std::endl;
+    std::cerr << "            cat a.csv | csv-time-join b.csv" << std::endl;
+    std::cerr << "        - explicit:" << std::endl;
+    std::cerr << "            cat a.csv | csv-time-join --fields=t \"b.csv;fields=t\"" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    3rd field on stdin is timestamp, the 2nd field of filter is timestamp" << std::endl;
+    std::cerr << "        cat a.csv | csv-time-join --fields=,,t \"b.csv;fields=,t\"" << std::endl;
+    std::cerr << std::endl;
+    if( verbose ) // the worked example is printed only for --help --verbose
+    {
+        std::cerr << "    echo \"20170101T115955,a\" >  a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120001,b\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120002,c\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120007,d\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120012,e\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120015,f\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120000,y\" >  b.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120010,z\" >> b.csv" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --by-upper" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2 --select" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2 --timestamp-only" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    ( sleep 1; cat a.csv ) | csv-play |" << std::endl;
+        std::cerr << "        csv-time-join --realtime <( cat b.csv | csv-play )" << std::endl;
+    }
+    else
+    {
+        std::cerr << "    try --help --verbose for more examples" << std::endl;
+    }
+    std::cerr << std::endl;
+    std::cerr << std::endl;
+    exit( 0 ); // help is not an error: the process ends with status 0 and this function never returns
+}
+
+struct Point // record read from either input; only the timestamp is kept
+{
+    boost::optional<boost::posix_time::ptime> timestamp; // empty when default-constructed; get_time() substitutes the current time for an empty value
+    Point() {} // leaves timestamp empty
+    Point( const boost::posix_time::ptime& timestamp ) : timestamp( timestamp ) {} // non-explicit: a ptime converts implicitly to Point
+};
+
+namespace comma { namespace visiting {
+
+template <> struct traits< Point > // visiting traits for Point: exposes the timestamp under the field name "t"
+{
+    template < typename K, typename V > static void visit( const K&, const Point& p, V& v ) { v.apply( "t", p.timestamp ); } // overload for const Point; the key argument is ignored
+    template < typename K, typename V > static void visit( const K&, Point& p, V& v ) { v.apply( "t", p.timestamp ); } // overload for mutable Point; the key argument is ignored
+};
+    
+} } // namespace comma { namespace visiting {
+
+enum class how { by_lower, by_upper, nearest, realtime }; // join method, one per --by-lower, --by-upper, --nearest, --realtime
+how method = how::by_lower; // stays by_lower unless main() sees one of the other method flags
+static bool timestamp_only; // set from --timestamp-only,--time-only: append only the bounding timestamp
+static bool output_diff_abs; // set from --output-diff-abs,--abs-diff: append the absolute time difference
+static bool output_diff; // set from --output-diff,--diff: append the signed time difference
+static bool select_only; // set from --do-not-append,--select: append nothing from the bounding input
+static comma::csv::options stdin_csv; // csv options of stdin; they also decide the output format (binary or ascii, delimiter)
+static comma::csv::options bounding_csv; // csv options of the bounding input, parsed from its name-value string in main()
+static boost::optional< boost::posix_time::time_duration > bound; // set from --bound; when set, output() drops pairs further apart than this
+typedef std::pair< boost::posix_time::ptime, std::string > timestring_t; // timestamp of a record paired with the record as read
+
+static boost::posix_time::ptime get_time( const Point& p ) { return p.timestamp ? *p.timestamp : boost::posix_time::microsec_clock::universal_time(); } // timestamp of the record if present, otherwise the current universal time from the microsecond clock
+
+static void output_bounding( std::ostream& os, const timestring_t& bounding, bool stdin_first ) // write the bounding part of a joined record to os; writes nothing when select_only is set
+{
+    if( !select_only )
+    {
+        if( stdin_csv.binary() ) // the output mode follows the stdin options, not bounding_csv
+        {
+            if( timestamp_only )
+            {
+                static const unsigned int time_size = comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::size;
+                static char timestamp[ time_size ]; // static scratch buffer, overwritten on every call
+                comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::to_bin( bounding.first, timestamp );
+                os.write( ( const char* )( &timestamp ), time_size );
+            }
+            else
+            {
+                os.write( &bounding.second[0], bounding.second.size() ); // the whole bounding record as stored
+            }
+        }
+        else
+        {
+            if( stdin_first ) { os << stdin_csv.delimiter; } // the bounding part follows the stdin part: delimiter goes before it
+            os << ( timestamp_only ? boost::posix_time::to_iso_string( bounding.first ) : bounding.second );
+            if( !stdin_first ) { os << stdin_csv.delimiter; } // the bounding part precedes the stdin part: delimiter goes after it
+        }
+    }
+}
+
+static void _output_diff( std::ostream& os, boost::posix_time::ptime bounded, boost::posix_time::ptime bounding ) // append bounded minus bounding, in seconds, to os when a diff option is set
+{
+    if( !output_diff && !output_diff_abs ) { return; } // neither diff option given: nothing to append
+    double diff = double( ( bounded - bounding ).total_microseconds() ) * 1e-6; // microseconds to seconds
+    if( output_diff_abs ) { diff = std::abs( diff ); }
+    if( stdin_csv.binary() ) { os.write( reinterpret_cast< const char* >( &diff ), sizeof( double ) ); } else { os << stdin_csv.delimiter << diff; }    // binary: the raw bytes of the double; ascii: delimiter, then the value with the stream's current formatting
+}
+
+static void output_input( std::ostream& os, const timestring_t& input ) // write the stdin part of a joined record to os
+{
+    if( stdin_csv.binary() ) { os.write( &input.second[0], stdin_csv.format().size() ); } else { os << input.second; } // binary: exactly one record of the stdin format size; ascii: the stored line
+}
+
+static void output( const timestring_t& input, const timestring_t& bounding, bool stdin_first ) // write one joined record to stdout, unless it is filtered out by the checks below
+{
+    if( bounding.first.is_infinity() ) { return; } // the fake -infinity/+infinity queue entries added in main() never produce output
+    if( bound && ( input.first - bounding.first > bound || bounding.first - input.first > bound )) { return; } // further apart than --bound in either direction
+    if( stdin_first )
+    {
+        output_input( std::cout, input );
+        output_bounding( std::cout, bounding, stdin_first );
+    }
+    else
+    {
+        output_bounding( std::cout, bounding, stdin_first );
+        output_input( std::cout, input );
+    }
+    _output_diff( std::cout, input.first, bounding.first ); // the diff is always appended last, regardless of stdin_first
+    if( !stdin_csv.binary() ) { std::cout << '\n'; }
+    std::cout.flush(); // flush after every record
+}
+
+int main( int ac, char** av ) // parse options, open the bounding source, then join stdin against it; returns 0 on success, 1 on bad arguments or an exception
+{
+    try
+    {
+        comma::signal_flag is_shutdown(comma::signal_flag::hard);
+        comma::command_line_options options( ac, av, usage );
+        if( options.exists( "--bash-completion" )) bash_completion( ac, av );
+        options.assert_mutually_exclusive( "--by-lower,--by-upper,--nearest,--realtime" );
+        options.assert_mutually_exclusive( "--output-diff,--diff", "--output-diff-abs,--abs-diff" );
+        if( options.exists( "--by-upper" )) { method = how::by_upper; }
+        if( options.exists( "--nearest" )) { method = how::nearest; }
+        if( options.exists( "--realtime" )) { method = how::realtime; }
+        timestamp_only = options.exists( "--timestamp-only,--time-only" );
+        output_diff = options.exists( "--output-diff,--diff" );
+        output_diff_abs = options.exists( "--output-diff-abs,--abs-diff" );
+        select_only = options.exists( "--do-not-append,--select" );
+        if( select_only && timestamp_only ) { std::cerr << "csv-time-join: --timestamp-only specified with --select, ignoring --timestamp-only" << std::endl; }
+        bool discard_bounding = options.exists( "--discard-bounding" );
+        boost::optional< unsigned int > buffer_size = options.optional< unsigned int >( "--buffer" );
+        if( options.exists( "--bound" ) ) { bound = boost::posix_time::microseconds( static_cast< long long >( options.value< double >( "--bound" ) * 1000000 ) ); } // seconds to microseconds; 64-bit so that bounds above ~4294 seconds do not overflow
+        stdin_csv = comma::csv::options( options, "t" );
+        std::vector< std::string > unnamed = options.unnamed( // first list: flags without a value; second list: options that take a value; a flag put in the second list would swallow the argument after it
+            "--by-lower,--by-upper,--nearest,--realtime,--select,--do-not-append,--timestamp-only,--time-only,--discard-bounding,--verbose,-v,--output-diff,--diff,--output-diff-abs,--abs-diff,--diff-abs",
+            "--binary,-b,--delimiter,-d,--fields,-f,--bound,--buffer" );
+        std::string properties; // name-value string describing the bounding source
+        bool stdin_first = true; // false only for '<bounding> -': bounding fields are then written before stdin fields
+        switch( unnamed.size() )
+        {
+            case 0:
+                std::cerr << "csv-time-join: please specify bounding source" << std::endl;
+                return 1;
+            case 1:
+                properties = unnamed[0];
+                break;
+            case 2:
+                if( unnamed[0] == "-" ) { properties = unnamed[1]; }
+                else if( unnamed[1] == "-" ) { properties = unnamed[0]; stdin_first = false; }
+                else { std::cerr << "csv-time-join: expected either '- <bounding>' or '<bounding> -'; got : " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
+                break;
+            default:
+                std::cerr << "csv-time-join: expected either '- <bounding>' or '<bounding> -'; got : " << comma::join( unnamed, ' ' ) << std::endl;
+                return 1;
+        }
+        comma::name_value::parser parser( "filename" );
+        bounding_csv = parser.get< comma::csv::options >( properties );
+        if( bounding_csv.fields.empty() ) { bounding_csv.fields = "t"; } // same default as for stdin
+
+        comma::csv::input_stream< Point > stdin_stream( std::cin, stdin_csv );
+        #ifdef WIN32
+        if( stdin_csv.binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        #endif // #ifdef WIN32
+
+        comma::io::istream bounding_istream( comma::split( properties, ';' )[0], bounding_csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii ); // the text before the first ';' is the stream name
+        comma::csv::input_stream< Point > bounding_stream( *bounding_istream, bounding_csv );
+
+        #ifndef WIN32
+        comma::io::select select; // watches both stdin (fd 0) and the bounding source
+        comma::io::select bounding_stream_select; // watches the bounding source only
+        select.read().add( 0 );
+        select.read().add( bounding_istream.fd() );
+        bounding_stream_select.read().add( bounding_istream.fd() );
+        #endif // #ifndef WIN32
+
+        const Point* p = NULL; // last record read; in the non-realtime loop it is kept across iterations while next is false
+        if( method == how::realtime )
+        {
+            #ifdef WIN32
+            COMMA_THROW( comma::exception, "--realtime mode not supported in WIN32" );
+            #else
+            bool end_of_input = false;
+            bool end_of_bounds = false;
+            boost::optional< timestring_t > joined_line; // latest bounding record seen so far; empty until the first one arrives
+            while( !is_shutdown && !end_of_input )
+            {
+                if( !bounding_stream.ready() && !stdin_stream.ready() ) { select.wait(boost::posix_time::milliseconds(1)); }
+                if( !is_shutdown && !end_of_input && ( stdin_stream.ready() || ( select.check() && select.read().ready( comma::io::stdin_fd ) ) ) )
+                {
+                    p = stdin_stream.read();
+                    if( p )
+                    {
+                        timestring_t input_line = std::make_pair( get_time( *p ), stdin_stream.last() );
+                        if( joined_line ) { output( input_line, *joined_line, stdin_first ); } // stdin records read before any bounding record are not output
+                    }
+                    else
+                    {
+                        comma::verbose << "end of input stream" << std::endl;
+                        end_of_input = true;
+                    }
+                }
+                if( !is_shutdown && !end_of_bounds && ( bounding_stream.ready() || ( select.check() && select.read().ready( bounding_istream.fd() ) ) ) )
+                {
+                    p = bounding_stream.read();
+                    if( p )
+                    {
+                        joined_line = std::make_pair( get_time( *p ), bounding_stream.last() );
+                    }
+                    else
+                    {
+                        comma::verbose << "end of bounding stream" << std::endl;
+                        end_of_bounds = true; // the loop keeps going: later stdin records are joined with the last bounding record
+                    }
+                }
+            }
+            if( is_shutdown ) { comma::verbose << "got a signal" << std::endl; return 0; }
+            #endif // #ifdef WIN32
+        }
+        else
+        {
+            std::deque< timestring_t > bounding_queue; // buffered bounding records; front and second entry bracket the current stdin record
+            bool next = true; // true: read a new stdin record; false: the current record is still waiting for more bounding data
+            bool bounding_data_available;
+            bool upper_bound_added = false;
+            bounding_queue.push_back( std::make_pair( boost::posix_time::neg_infin, "" ) ); // add a fake entry for an lower bound to allow stdin before first bound to match
+            while( stdin_stream.ready() || ( std::cin.good() && !std::cin.eof() ) )
+            {
+                if( !std::cin.good() ) { select.read().remove( 0 ); }
+                if( !bounding_istream->good() ) { select.read().remove( bounding_istream.fd() ); }
+                bounding_data_available = bounding_stream.ready() || ( bounding_istream->good() && !bounding_istream->eof() );
+                #ifdef WIN32
+                bool bounding_stream_ready = true;
+                bool stdin_stream_ready = true;
+                #else // #ifdef WIN32
+                //check so we do not block
+                bool bounding_stream_ready = bounding_stream.ready();
+                bool stdin_stream_ready = stdin_stream.ready();
+                if( next )
+                {
+                    if( !bounding_stream_ready || !stdin_stream_ready )
+                    {
+                        if( !bounding_stream_ready && !stdin_stream_ready ) { select.wait( boost::posix_time::milliseconds( 10 ) ); }
+                        else { select.check(); }
+                        if( select.read().ready( bounding_istream.fd() )) { bounding_stream_ready = true; }
+                        if( select.read().ready(0) ) { stdin_stream_ready = true; }
+                    }
+                }
+                else
+                {
+                    if( !bounding_stream_ready )
+                    {
+                        bounding_stream_select.wait( boost::posix_time::milliseconds( 10 ) ); // only bounding data can unblock a pending stdin record
+                        if( bounding_stream_select.read().ready( bounding_istream.fd() )) { bounding_stream_ready=true; }
+                    }
+                }
+                #endif //#ifdef WIN32
+                //keep storing available bounding data
+                if( bounding_stream_ready )
+                {
+                    if( !buffer_size || bounding_queue.size() < *buffer_size || discard_bounding ) // with --buffer and no --discard-bounding, reading stops while the queue is full
+                    {
+                        const Point* q = bounding_stream.read();
+                        if( q ) { bounding_queue.push_back( std::make_pair( get_time( *q ), bounding_stream.last() )); }
+                        else { bounding_data_available = false; }
+                    }
+                    if( buffer_size && bounding_queue.size() > *buffer_size && discard_bounding ) { bounding_queue.pop_front(); } // --discard-bounding: drop the oldest entry once over the buffer size
+                }
+                if( !upper_bound_added && bounding_istream->eof() )
+                {
+                    // add a fake entry for an upper bound to allow stdin data above last bound to match
+                    bounding_queue.push_back( std::make_pair( boost::posix_time::pos_infin, "" ));
+                    upper_bound_added = true;
+                }
+                //if we are done with the last bounded point get next
+                if( next )
+                {
+                    if( !stdin_stream_ready ) { continue; }
+                    p = stdin_stream.read();
+                    if( !p ) { break; }
+                }
+                boost::posix_time::ptime t = get_time( *p );
+                //get bound
+                for( ; bounding_queue.size() >= 2 && t >= bounding_queue[1].first; bounding_queue.pop_front() ); // drop entries until t lies between the first two, or fewer than two remain
+                if( bounding_queue.size() < 2 )
+                {
+                    //bound not found
+                    //do we have more data?
+                    if( !bounding_data_available ) { break; }
+                    next = false;
+                    continue;
+                }
+                //bound available
+                if( method == how::by_lower && t < bounding_queue.front().first )
+                {
+                    next = true;
+                    continue;
+                }
+                bool is_first = ( method == how::by_lower )
+                    || ( method == how::nearest && ( t - bounding_queue[0].first ) < ( bounding_queue[1].first - t )); // nearest: a tie goes to the upper entry
+                const timestring_t& chosen_bound = is_first ? bounding_queue[0] : bounding_queue[1];
+                timestring_t input_line = std::make_pair( t, stdin_stream.last() );
+                output( input_line, chosen_bound, stdin_first );
+                next = true;
+            }
+        }
+        return 0;     
+    }
+    catch( std::exception& ex ) { std::cerr << "csv-time-join: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-time-join: unknown exception" << std::endl; }
+    return 1;
+}

From 74c23881815ea3fb5cc674a2fa46a8567c35c13b Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 6 Jun 2024 16:59:41 +1000
Subject: [PATCH 0823/1056] io::istreams: in progress...

---
 io/stream.cpp | 12 ++++++++++--
 io/stream.h   | 35 +++++++++++++++++++++++++++++++++++
 2 files changed, 45 insertions(+), 2 deletions(-)

diff --git a/io/stream.cpp b/io/stream.cpp
index d0db2bfae..ba9e31baa 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -17,16 +17,15 @@
 #include <fcntl.h>
 #include <fstream>
 #include <sstream>
-#include <vector>
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/ip/udp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
 #include <boost/bind/bind.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
-#include "impl/filesystem.h"
 #include "../base/exception.h"
 #include "../string/string.h"
+#include "impl/filesystem.h"
 #include "file_descriptor.h"
 #include "select.h"
 #include "stream.h"
@@ -377,6 +376,7 @@ static std::string usage( const std::string& what, const std::string& dash, unsi
 std::string istream::usage( unsigned int indent, bool verbose ) { return impl::usage( "input", "stdin", indent, verbose ); }
 std::string ostream::usage( unsigned int indent, bool verbose ) { return impl::usage( "output", "stdout", indent, verbose ); }
 std::string iostream::usage( unsigned int indent, bool verbose ) { return impl::usage( "input/output", "n/a", indent, verbose ); }
+std::string istreams::usage( unsigned int indent, bool verbose ) { return impl::usage( "input", "stdin", indent, verbose ); } // todo: improve; kinda bogus: reuses the single-input usage text ("input", "stdin") as is
 
 template class stream< std::istream >;
 template class stream< std::ostream >;
@@ -390,4 +390,12 @@ ostream::ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, boo
 ostream::ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close ) : stream< std::ostream >( s, fd, mode, blocking, close ) {}
 iostream::iostream( const std::string& name, mode::value mode , mode::blocking_value blocking ) : stream< std::iostream >( name, mode, blocking ) {}
 
+istreams::istreams( const std::vector< std::string >& names, mode::value mode, mode::blocking_value blocking ): _istream( std::make_unique< istream >( names.at( 0 ), mode, blocking ) ), _names( names ), _index( 0 ) {} // at(): throws std::out_of_range on empty names instead of undefined behaviour
+
+stream< std::istream >& istreams::operator++()
+{
+    // todo: not implemented yet; for now this operator only raises the "todo" exception
+    COMMA_THROW( comma::exception, "todo" );
+}
+
 } } // namespace comma { namespace io {
diff --git a/io/stream.h b/io/stream.h
index 227fc9af1..90b4d04ab 100644
--- a/io/stream.h
+++ b/io/stream.h
@@ -6,7 +6,9 @@
 #pragma once
 
 #include <iostream>
+#include <memory>
 #include <string>
+#include <vector>
 #include <boost/function.hpp>
 #include <boost/noncopyable.hpp>
 #include "file_descriptor.h"
@@ -64,6 +66,12 @@ class stream : boost::noncopyable
         /// @return stream name
         const std::string& name() const;
 
+        /// @return stream mode
+        io::mode::value mode() const { return mode_; }
+
+        /// @return true if stream is blocking
+        bool blocking() const { return blocking_; }
+
     protected:
         stream( const std::string& name, mode::value mode, mode::blocking_value blocking );
         template < typename T >
@@ -112,4 +120,31 @@ struct iostream : public stream< std::iostream >
     static std::string usage( unsigned int indent = 0, bool verbose = false );
 };
 
+/// convenience class: multiple input streams read one by one
+/// use case
+///     - we have log files split by size, e.g. 1MB each: 0.bin, 1.bin, 2.bin, etc
+///     - we want to read records from those files seamlessly
+/// @todo currently, we assume a record is never split across two input files
+///       support for split records: todo, just ask
+/// @todo derive from std::istream (kinda super-fiddly, forwarding lots of methods...)
+/// @todo support constructing from a directory name
+class istreams
+{
+    public:
+        // todo: istreams( const std::string& dir...
+        istreams( const std::vector< std::string >& names, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
+        static std::string usage( unsigned int indent = 0, bool verbose = false );
+        bool eof() const { return _index + 1 >= _names.size() && ( *_istream )->eof(); } // true only once the last stream has hit end of file
+        void read( char* buf, std::size_t size );
+        std::string getline();
+        void seek( std::uint64_t offset );
+        stream< std::istream >& operator()() { return *_istream; } // the stream currently open
+        const stream< std::istream >& operator()() const { return *_istream; }
+        stream< std::istream >& operator++(); // todo: not implemented yet
+    protected:
+        std::unique_ptr< istream > _istream; // the stream currently open
+        std::vector< std::string > _names; // names of all the streams, in reading order
+        unsigned int _index{0}; // index in _names of the stream currently open
+};
+
 } } // namespace comma { namespace io {

From 70d2fae7a1c7c3ea138b7ad5fd9f0edf97bc7889 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 6 Jun 2024 17:00:12 +1000
Subject: [PATCH 0824/1056] timing: timestamped: moved here from snark

---
 timing/timestamped.h | 57 ++++++++++++++++++++++++++++++++++++++++++++
 timing/traits.h      | 16 +++++++++++++
 2 files changed, 73 insertions(+)
 create mode 100644 timing/timestamped.h

diff --git a/timing/timestamped.h b/timing/timestamped.h
new file mode 100644
index 000000000..988e38cfa
--- /dev/null
+++ b/timing/timestamped.h
@@ -0,0 +1,66 @@
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+#pragma once
+
+#include <type_traits>
+#include <utility>
+#include <boost/date_time/posix_time/posix_time.hpp>
+
+namespace comma {
+
+/// a value of type T together with its timestamp
+template < typename T >
+struct timestamped
+{
+    boost::posix_time::ptime t;
+
+    T data;
+
+    timestamped() {}
+
+    /// copy data, stamp it with the current utc time
+    timestamped( const T& data ) : t( boost::posix_time::microsec_clock::universal_time() ), data( data ) {}
+
+    /// move data in (rather than copying it), stamp it with the current utc time
+    timestamped( T&& data ) : t( boost::posix_time::microsec_clock::universal_time() ), data( std::move( data ) ) {}
+
+    /// copy data, stamp it with t
+    timestamped( boost::posix_time::ptime t, const T& data ) : t( t ), data( data ) {}
+
+    /// move data in (rather than copying it), stamp it with t
+    timestamped( boost::posix_time::ptime t, T&& data ) : t( t ), data( std::move( data ) ) {}
+};
+
+/// @return data stamped with the current utc time; T is decayed, so that lvalues are copied and rvalues are moved
+template < typename T > inline timestamped< typename std::decay< T >::type > make_timestamped( T&& data ) { return timestamped< typename std::decay< T >::type >( std::forward< T >( data ) ); }
+
+/// @return data stamped with t; T is decayed, so that lvalues are copied and rvalues are moved
+template < typename T > inline timestamped< typename std::decay< T >::type > make_timestamped( boost::posix_time::ptime t, T&& data ) { return timestamped< typename std::decay< T >::type >( t, std::forward< T >( data ) ); }
+
+} // namespace comma {
diff --git a/timing/traits.h b/timing/traits.h
index 83b82cae6..7ba90b210 100644
--- a/timing/traits.h
+++ b/timing/traits.h
@@ -4,6 +4,7 @@
 /// @author vsevolod vlaskine
 
 #include "../timing/stats.h"
+#include "../timing/timestamped.h"
 #include "../visiting/traits.h"
 
 namespace comma { namespace visiting {
@@ -21,4 +22,19 @@ template <> struct traits< comma::timing::stats > // quick and dirty
     }
 };
 
+template < typename T > struct traits< comma::timestamped< T > > // visiting traits: present timestamped as two fields, "t" and "data"
+{
+    template< typename K, typename V > static void visit( const K&, comma::timestamped< T >& p, V& v ) // mutable overload; the key is ignored
+    {
+        v.apply( "t", p.t );
+        v.apply( "data", p.data );
+    }
+
+    template< typename K, typename V > static void visit( const K&, const comma::timestamped< T >& p, V& v ) // const overload; the key is ignored
+    {
+        v.apply( "t", p.t );
+        v.apply( "data", p.data );
+    }
+};
+
 } } // namespace comma { namespace visiting {

From 2b415129eb44ecc95e78a26976dc745b2c9c9840 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 6 Jun 2024 17:58:47 +1000
Subject: [PATCH 0825/1056] csv::split: refactoring to add optional logging to
 index file

---
 csv/split.cpp |  7 +++---
 csv/split.h   | 69 +++++++++++++++++++++++++++++++--------------------
 2 files changed, 46 insertions(+), 30 deletions(-)

diff --git a/csv/split.cpp b/csv/split.cpp
index 64838cbe1..bd63fb87f 100644
--- a/csv/split.cpp
+++ b/csv/split.cpp
@@ -37,9 +37,10 @@ std::string usage( unsigned int size, bool verbose )
 std::ofstream* ofstream::update( boost::posix_time::ptime t )
 {
     if( _ofs ) { _ofs.reset(); }
-    std::string filename = _dir + "/" + timing::to_iso_string( t ) + "." + _suffix;
-    _ofs = std::make_unique< std::ofstream >( filename );
-    COMMA_ASSERT( _ofs->is_open(), "failed to open '" << filename << "'" );
+    _time = t; // keep the timestamp the new file is named after, reported by time()
+    _filename = _dir + "/" + timing::to_iso_string( t ) + "." + _suffix; // <dir>/<iso time>.<suffix>
+    _ofs = std::make_unique< std::ofstream >( _filename );
+    COMMA_ASSERT( _ofs->is_open(), "failed to open '" << _filename << "'" );
     return _ofs.get();
 }
 
diff --git a/csv/split.h b/csv/split.h
index 472732566..a0d7bea0a 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -27,12 +27,45 @@ struct type_traits
     static unsigned int id( const T& t ) { return t.id; }
 };
 
+class ofstream // output file named <dir>/<iso timestamp>.<suffix>; each update() opens a new file
+{
+    public:
+        ofstream( const std::string& dir, const std::string& suffix ): _dir( dir ), _suffix( suffix ) {}
+        ofstream( const std::string& dir, const options& csv ): _dir( dir ), _suffix( csv.binary() ? "bin" : "csv" ) {} // suffix picked from csv options: "bin" if binary, "csv" otherwise
+        std::ofstream* update( boost::posix_time::ptime t );
+        template < typename T > std::ofstream* update( const T& t ) { return update( splitting::type_traits< T >::time( t ) ); } // timestamp is taken from the record via type_traits
+        std::ofstream* operator()() { return _ofs.get(); } // current file stream; null before the first update()
+        boost::posix_time::ptime time() const { return _time; } // timestamp passed to the latest update()
+        const std::string& dir() const { return _dir; }
+        const std::string& filename() const { return _filename; } // path used by the latest update(); empty before that
+    
+    protected:
+        std::string _dir;
+        std::string _suffix;
+        std::string _filename;
+        boost::posix_time::ptime _time;
+        std::unique_ptr< std::ofstream > _ofs;
+};
+
 template < typename T >
 struct method
 {
     virtual ~method() {}
     virtual void wrote( unsigned int size ) {}
     virtual std::ostream* stream( const T& t, unsigned int size = 0 ) = 0;
+    virtual boost::posix_time::ptime time() const { return boost::posix_time::ptime(); } // quick and dirty for now
+};
+
+template < typename T >
+class to_timestamped_files: public method< T > // common base for splitting methods that write to a splitting::ofstream, i.e. to timestamped files in a directory
+{
+    public:
+        to_timestamped_files( const std::string& dir, const options& csv ): _ofs( dir, csv ) {}
+        boost::posix_time::ptime time() const { return _ofs.time(); }
+        const splitting::ofstream& ofs() const { return _ofs; }
+
+    protected:
+        splitting::ofstream _ofs;
 };
 
 template < typename T >
@@ -46,31 +79,15 @@ class none: public method< T >
         io::ostream _ostream;
 };
 
-class ofstream
-{
-    public:
-        ofstream( const std::string& dir, const std::string& suffix ): _dir( dir ), _suffix( suffix ) {}
-        ofstream( const std::string& dir, const options& csv ): _dir( dir ), _suffix( csv.binary() ? "bin" : "csv" ) {}
-        std::ofstream* update( boost::posix_time::ptime t );
-        template < typename T > std::ofstream* update( const T& t ) { return update( splitting::type_traits< T >::time( t ) ); }
-        std::ofstream* operator()() { return _ofs.get(); }
-    
-    protected:
-        std::string _dir;
-        std::string _suffix;
-        std::unique_ptr< std::ofstream > _ofs;
-};
-
 template < typename T >
-class by_time: public method< T >
+class by_time: public to_timestamped_files< T >
 {
     public:
         by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv, bool align = false );
         by_time( double max_duration, const std::string& dir, const options& csv, bool align ): by_time( timing::duration::from_seconds( max_duration ), dir, csv, align ) {}
-        std::ostream* stream( const T& t, unsigned int ) { auto d = splitting::type_traits< T >::time( t ); return _is_due( d ) ? _ofs.update( d ) : _ofs(); }
+        std::ostream* stream( const T& t, unsigned int ) { auto d = splitting::type_traits< T >::time( t ); return _is_due( d ) ? this->_ofs.update( d ) : this->_ofs(); }
     
     private:
-        splitting::ofstream _ofs;
         boost::posix_time::time_duration _max_duration;
         bool _align{false};
         boost::posix_time::ptime _deadline;
@@ -79,15 +96,14 @@ class by_time: public method< T >
 };
 
 template < typename T >
-class by_size: public method< T >
+class by_size: public to_timestamped_files< T >
 {
     public:
         by_size( std::size_t size, const std::string& dir, const options& csv );
-        std::ostream* stream( const T& t, unsigned int size = 0 ) { return _is_due( size ) ? _ofs.update( t ) : _ofs(); }
+        std::ostream* stream( const T& t, unsigned int size = 0 ) { return _is_due( size ) ? this->_ofs.update( t ) : this->_ofs(); }
         void wrote( unsigned int size );
 
     private:
-        splitting::ofstream _ofs;
         std::size_t _size{0};
         std::size_t _record_size{0};
         double _average_record_size{0};
@@ -98,14 +114,13 @@ class by_size: public method< T >
 };
 
 template < typename T >
-class by_block: public method< T >
+class by_block: public to_timestamped_files< T >
 {
     public:
-        by_block( const std::string& dir, const options& csv ): _ofs( dir, csv ), _block( silent_none< unsigned int >() ) {}
-        std::ostream* stream( const T& t, unsigned int ) { return _is_due( splitting::type_traits< T >::block( t ) ) ? _ofs.update( t ) : _ofs(); }
+        by_block( const std::string& dir, const options& csv ): to_timestamped_files< T >( dir, csv ), _block( silent_none< unsigned int >() ) {}
+        std::ostream* stream( const T& t, unsigned int ) { return _is_due( splitting::type_traits< T >::block( t ) ) ? this->_ofs.update( t ) : this->_ofs(); }
 
     private:
-        splitting::ofstream _ofs;
         boost::optional< unsigned int > _block;
 
         bool _is_due( unsigned int block );
@@ -213,7 +228,7 @@ namespace splitting {
 
 template < typename T >
 inline by_time< T >::by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv, bool align )
-    : _ofs( dir, csv )
+    : to_timestamped_files< T >( dir, csv )
     , _max_duration( max_duration )
     , _align( align )
 {
@@ -230,7 +245,7 @@ inline bool by_time< T >::_is_due( boost::posix_time::ptime t )
 
 template < typename T >
 inline by_size< T >::by_size( std::size_t size, const std::string& dir, const options& csv )
-    : _ofs( dir, csv )
+    : to_timestamped_files< T >( dir, csv )
     , _size( size )
     , _record_size( csv.binary() ? csv.format().size() : 0 )
 {

From b715dddfc7b8f6bd064662e012430687fb034bf8 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 6 Jun 2024 18:39:43 +1000
Subject: [PATCH 0826/1056] csv::split::how() method added

---
 csv/split.h | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/csv/split.h b/csv/split.h
index a0d7bea0a..cdb346ab0 100644
--- a/csv/split.h
+++ b/csv/split.h
@@ -54,6 +54,7 @@ struct method
     virtual void wrote( unsigned int size ) {}
     virtual std::ostream* stream( const T& t, unsigned int size = 0 ) = 0;
     virtual boost::posix_time::ptime time() const { return boost::posix_time::ptime(); } // quick and dirty for now
+    virtual const std::string& address() const { static const std::string empty; return empty; } // default: no address; a declaration without a body left the vtable with an undefined reference
 };
 
 template < typename T >
@@ -63,6 +64,7 @@ class to_timestamped_files: public method< T >
         to_timestamped_files( const std::string& dir, const options& csv ): _ofs( dir, csv ) {}
         boost::posix_time::ptime time() const { return _ofs.time(); }
         const splitting::ofstream& ofs() const { return _ofs; }
+        const std::string& address() const { return _ofs.dir(); }
 
     protected:
         splitting::ofstream _ofs;
@@ -72,10 +74,12 @@ template < typename T >
 class none: public method< T >
 {
     public:
-        none( const std::string& address ): _ostream( address ) {}
+        none( const std::string& address ): _address( address ), _ostream( address ) {} // initializers listed in member declaration order (_address is declared before _ostream)
         std::ostream* stream( const T&, unsigned int ) { return _ostream(); }
+        const std::string& address() const { return _address; }
     
     private:
+        std::string _address;
         io::ostream _ostream;
 };
 
@@ -141,6 +145,7 @@ class split
         split& operator<<( const T& t ) { return write( t, nullptr, 0 ); }
         bool eof() const { return _eof || ( _os && _os->eof() ); }
         static split< T >* make( const std::string& options, const csv::options& csv, bool permissive = false, const T& sample = T() );
+        const splitting::method< T >& how() const { return *_how; } // read-only access to the splitting method in use; const, so it also works on a const split
 
     protected:
         std::unique_ptr< splitting::method< T > > _how;

From e18241c4be4ef7cd56cfdd6e795361acd2c3620a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 11 Jun 2024 11:21:17 +1000
Subject: [PATCH 0827/1056] synchronized::multiqueue moved to
 ordered::multiqueue

---
 .../{synchronized => ordered}/multiqueue.h    | 12 ++++++++--
 ...e_test.cpp => ordered_multiqueue_test.cpp} | 22 +++++++++----------
 2 files changed, 21 insertions(+), 13 deletions(-)
 rename containers/{synchronized => ordered}/multiqueue.h (84%)
 rename containers/test/{synchronized_multiqueue_test.cpp => ordered_multiqueue_test.cpp} (88%)

diff --git a/containers/synchronized/multiqueue.h b/containers/ordered/multiqueue.h
similarity index 84%
rename from containers/synchronized/multiqueue.h
rename to containers/ordered/multiqueue.h
index 85a9aab70..f72c171d5 100644
--- a/containers/synchronized/multiqueue.h
+++ b/containers/ordered/multiqueue.h
@@ -1,8 +1,14 @@
+// Copyright (c) 2024 Mission Systems
+
+/// @authors aspen eyers, vsevolod vlaskine
+
+#pragma once
+
 #include <queue>
 #include <tuple>
 #include <boost/date_time/posix_time/posix_time.hpp>
 
-namespace comma { namespace containers { namespace synchronized {
+namespace comma { namespace containers { namespace ordered {
 
 namespace impl {
 
@@ -11,6 +17,8 @@ template <> struct traits< boost::posix_time::ptime > { typedef boost::posix_tim
 
 }
 
+/// @todo variadic types
+/// @todo don't use std::pair, use traits instead?
 template < typename K, typename T, typename S >
 class multiqueue
 {
@@ -49,4 +57,4 @@ inline void multiqueue<K, T, S>::purge()
     }
 }
 
-} } } // namespace comma { namespace containers { namespace synchronized {
+} } } // namespace comma { namespace containers { namespace ordered {
diff --git a/containers/test/synchronized_multiqueue_test.cpp b/containers/test/ordered_multiqueue_test.cpp
similarity index 88%
rename from containers/test/synchronized_multiqueue_test.cpp
rename to containers/test/ordered_multiqueue_test.cpp
index f78cfcf4c..cd74666b5 100644
--- a/containers/test/synchronized_multiqueue_test.cpp
+++ b/containers/test/ordered_multiqueue_test.cpp
@@ -1,11 +1,11 @@
 // Copyright (c) 2023 Mission Systems Pty Ltd
 
 #include <gtest/gtest.h>
-#include "../synchronized/multiqueue.h"
-#include <boost/date_time/posix_time/posix_time.hpp>
+#include "../ordered/multiqueue.h"
 
-TEST( multiqueue, usage ){
-    typedef comma::containers::synchronized::multiqueue< int, int, int > multiqueue_t;
+TEST( multiqueue, usage )
+{
+    typedef comma::containers::ordered::multiqueue< int, int, int > multiqueue_t;
     multiqueue_t q{ 2 /*timeout*/  };
 
     EXPECT_EQ( std::get<0>(q.queues).size(), 0 );
@@ -34,7 +34,7 @@ TEST( multiqueue, usage ){
 }
 
 TEST( multiqueue, sync_first_to_second ){
-    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
     multiqueue_t q{ 2 /*timeout*/  };
 
     std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {0, 0}, {2, 0}, {4, 5} });
@@ -52,7 +52,7 @@ TEST( multiqueue, sync_first_to_second ){
 }
 
 TEST( multiqueue, sync_second_to_first ){
-    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
     multiqueue_t q{ 2 /*timeout*/  };
 
     std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
@@ -70,7 +70,7 @@ TEST( multiqueue, sync_second_to_first ){
 }
 
 TEST( multiqueue, empty_list_before_sync ){
-    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
     multiqueue_t q{ 2 /*timeout*/ };
     std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {0, 0}, {1, 0}, {2, 5} });
     std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
@@ -81,7 +81,7 @@ TEST( multiqueue, empty_list_before_sync ){
 }
 
 TEST( multiqueue, max_time_offset ){
-    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
     multiqueue_t q{ 2 /*timeout*/ };
     std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {3, 5} });
     std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
@@ -96,7 +96,7 @@ TEST( multiqueue, max_time_offset ){
 }
 
 TEST( multiqueue, floating_point_error ){
-    typedef comma::containers::synchronized::multiqueue< float, int, int > multiqueue_t;
+    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
     {
     multiqueue_t q{ 2 /*timeout*/ };
     std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {3.000001, 5} });
@@ -148,14 +148,14 @@ TEST( multiqueue, floating_point_error ){
 }
 
 TEST( multiqueue, type_difference ){
-    typedef comma::containers::synchronized::multiqueue< float, int, double > multiqueue_t;
+    typedef comma::containers::ordered::multiqueue< float, int, double > multiqueue_t;
     multiqueue_t q{ 2 /*timeout*/ };
     std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {0, 1} });
     std::get<1>(q.queues) = std::queue< std::pair< float, double > >({ {0, 1.0} });
 }
 
 TEST( multiqueue, boost_time ){
-    typedef comma::containers::synchronized::multiqueue< boost::posix_time::ptime, double, double > multiqueue_t;
+    typedef comma::containers::ordered::multiqueue< boost::posix_time::ptime, double, double > multiqueue_t;
     multiqueue_t q{boost::posix_time::seconds( 2 /*timeout*/  ) };
 
     boost::posix_time::ptime t( boost::gregorian::date( 2023, 1, 1 ) );

From ba1b17b8af54b089e235877f6cd2cfd8cc2ff694 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 11 Jun 2024 11:33:28 +1000
Subject: [PATCH 0828/1056] ordered::multiqueue: renamed to queues simplified

---
 containers/ordered/{multiqueue.h => queues.h} |  29 ++-
 containers/test/ordered_multiqueue_test.cpp   | 167 ------------------
 containers/test/ordered_queues_test.cpp       | 167 ++++++++++++++++++
 3 files changed, 181 insertions(+), 182 deletions(-)
 rename containers/ordered/{multiqueue.h => queues.h} (50%)
 delete mode 100644 containers/test/ordered_multiqueue_test.cpp
 create mode 100644 containers/test/ordered_queues_test.cpp

diff --git a/containers/ordered/multiqueue.h b/containers/ordered/queues.h
similarity index 50%
rename from containers/ordered/multiqueue.h
rename to containers/ordered/queues.h
index f72c171d5..f5aa3a6e0 100644
--- a/containers/ordered/multiqueue.h
+++ b/containers/ordered/queues.h
@@ -20,12 +20,11 @@ template <> struct traits< boost::posix_time::ptime > { typedef boost::posix_tim
 /// @todo variadic types
 /// @todo don't use std::pair, use traits instead?
 template < typename K, typename T, typename S >
-class multiqueue
+class queues: public std::tuple< std::queue< std::pair< K, T > >, std::queue< std::pair< K, S > > >
 {
     public:
-        std::tuple< std::queue< std::pair< K, T > >, std::queue< std::pair< K, S > > > queues;
-
-        multiqueue( typename impl::traits< K >::diff_type max_diff ): _max_diff( max_diff ) {}
+        typedef std::tuple< std::queue< std::pair< K, T > >, std::queue< std::pair< K, S > > > queues_t;
+        queues( typename impl::traits< K >::diff_type max_diff ): _max_diff( max_diff ) {}
         bool ready() const;
         void purge();
 
@@ -35,25 +34,25 @@ class multiqueue
 };
 
 template < typename K, typename T, typename S >
-inline bool multiqueue<K, T, S>::ready() const
+inline bool queues<K, T, S>::ready() const // true if both queues are non-empty and _abs_diff of their front keys does not exceed _max_diff
 {
-    if( std::get<0>(queues).empty() || std::get<1>(queues).empty() ) { return false; }
-    return _abs_diff( std::get<1>(queues).front().first, std::get<0>(queues).front().first ) <= _max_diff;
+    if( std::get<0>(*this).empty() || std::get<1>(*this).empty() ) { return false; }
+    return _abs_diff( std::get<1>(*this).front().first, std::get<0>(*this).front().first ) <= _max_diff;
 }
 
 template < typename K, typename T, typename S >
-inline void multiqueue<K, T, S>::purge()
+inline void queues<K, T, S>::purge()
 {
-    if( std::get<1>(queues).empty() || std::get<0>(queues).empty() ) { return; }
-    while( std::get<0>(queues).front().first - std::get<1>(queues).front().first > _max_diff ) 
+    if( std::get<1>(*this).empty() || std::get<0>(*this).empty() ) { return; }
+    while( std::get<0>(*this).front().first - std::get<1>(*this).front().first > _max_diff ) 
     { 
-        if( std::get<1>(queues).empty() ) { return; }
-        std::get<1>(queues).pop(); 
+        std::get<1>(*this).pop(); // non-empty here: checked on entry and after every pop
+        if( std::get<1>(*this).empty() ) { return; } // check after pop, so that the loop condition never calls front() on an empty queue
     }
-    while( std::get<1>(queues).front().first - std::get<0>(queues).front().first > _max_diff ) 
+    while( std::get<1>(*this).front().first - std::get<0>(*this).front().first > _max_diff ) 
     { 
-        if( std::get<0>(queues).empty() ) { return; }
-        std::get<0>(queues).pop(); 
+        std::get<0>(*this).pop(); // non-empty here: checked on entry and after every pop
+        if( std::get<0>(*this).empty() ) { return; } // check after pop, so that the loop condition never calls front() on an empty queue
     }
 }
 
diff --git a/containers/test/ordered_multiqueue_test.cpp b/containers/test/ordered_multiqueue_test.cpp
deleted file mode 100644
index cd74666b5..000000000
--- a/containers/test/ordered_multiqueue_test.cpp
+++ /dev/null
@@ -1,167 +0,0 @@
-// Copyright (c) 2023 Mission Systems Pty Ltd
-
-#include <gtest/gtest.h>
-#include "../ordered/multiqueue.h"
-
-TEST( multiqueue, usage )
-{
-    typedef comma::containers::ordered::multiqueue< int, int, int > multiqueue_t;
-    multiqueue_t q{ 2 /*timeout*/  };
-
-    EXPECT_EQ( std::get<0>(q.queues).size(), 0 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 0 );
-    EXPECT_EQ( q.ready(), false );
-
-    std::get<0>(q.queues).push( std::make_pair( 0, 1 ) );
-    EXPECT_EQ( std::get<0>(q.queues).front().second, 1 );
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 0 );
-    EXPECT_EQ( q.ready(), false );
-
-    std::get<1>(q.queues).push( std::make_pair( 0, 1 ) );
-    EXPECT_EQ( std::get<1>(q.queues).front().second, 1 );
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( q.ready(), true );
-
-    // Purge should only remove items if they are unsynced
-    q.purge();
-    EXPECT_EQ( std::get<0>(q.queues).front().second, 1 );
-    EXPECT_EQ( std::get<1>(q.queues).front().second, 1 );
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( q.ready(), true );
-}
-
-TEST( multiqueue, sync_first_to_second ){
-    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
-    multiqueue_t q{ 2 /*timeout*/  };
-
-    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {0, 0}, {2, 0}, {4, 5} });
-    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
-    EXPECT_EQ( q.ready(), false );
-    q.purge();
-    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<0>(q.queues).front().first, 4 );
-    EXPECT_EQ( std::get<1>(q.queues).front().first, 5 );    
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( q.ready(), true );
-
-}
-
-TEST( multiqueue, sync_second_to_first ){
-    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
-    multiqueue_t q{ 2 /*timeout*/  };
-
-    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
-    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {1, 0}, {2, 0}, {4, 5} });
-    EXPECT_EQ( q.ready(), false );
-    q.purge();
-    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<0>(q.queues).front().first, 5 );
-    EXPECT_EQ( std::get<1>(q.queues).front().first, 4 );    
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( q.ready(), true );
-
-}
-
-TEST( multiqueue, empty_list_before_sync ){
-    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
-    multiqueue_t q{ 2 /*timeout*/ };
-    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {0, 0}, {1, 0}, {2, 5} });
-    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
-    q.purge();
-    EXPECT_EQ( std::get<0>(q.queues).size(), 0 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( q.ready(), false );
-}
-
-TEST( multiqueue, max_time_offset ){
-    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
-    multiqueue_t q{ 2 /*timeout*/ };
-    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {3, 5} });
-    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
-    q.purge();
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<0>(q.queues).front().first, 3 );
-    EXPECT_EQ( std::get<1>(q.queues).front().first, 5 );        
-    EXPECT_EQ( q.ready(), true );
-}
-
-TEST( multiqueue, floating_point_error ){
-    typedef comma::containers::ordered::multiqueue< float, int, int > multiqueue_t;
-    {
-    multiqueue_t q{ 2 /*timeout*/ };
-    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {3.000001, 5} });
-    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
-    q.purge();
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
-    EXPECT_NEAR( std::get<0>(q.queues).front().first, 3.000001, 1e-6 );
-    EXPECT_EQ( std::get<1>(q.queues).front().first, 5 );        
-    EXPECT_EQ( q.ready(), true );
-    }
-    {
-    multiqueue_t q{ 2 /*timeout*/ };
-    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {2.999999, 5} });
-    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
-    q.purge();
-    EXPECT_EQ( std::get<0>(q.queues).size(), 0 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<1>(q.queues).front().first, 5 );        
-    EXPECT_EQ( q.ready(), false );
-    }
-    {
-    multiqueue_t q{ 2 /*timeout*/ };
-    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
-    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {3.000001, 5} });
-    q.purge();
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<1>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<0>(q.queues).front().first, 5 );
-    EXPECT_NEAR( std::get<1>(q.queues).front().first, 3.000001, 1e-6 );
-    EXPECT_EQ( q.ready(), true );
-    }
-    {
-    multiqueue_t q{ 2 /*timeout*/ };
-    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {5, 5} });
-    std::get<1>(q.queues) = std::queue< std::pair< float, int > >({ {2.999999, 5} });
-    q.purge();
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 0 );
-    EXPECT_EQ( std::get<0>(q.queues).front().second, 5 );
-    EXPECT_EQ( std::get<0>(q.queues).front().first, 5 );
-    EXPECT_EQ( q.ready(), false );
-    }    
-}
-
-TEST( multiqueue, type_difference ){
-    typedef comma::containers::ordered::multiqueue< float, int, double > multiqueue_t;
-    multiqueue_t q{ 2 /*timeout*/ };
-    std::get<0>(q.queues) = std::queue< std::pair< float, int > >({ {0, 1} });
-    std::get<1>(q.queues) = std::queue< std::pair< float, double > >({ {0, 1.0} });
-}
-
-TEST( multiqueue, boost_time ){
-    typedef comma::containers::ordered::multiqueue< boost::posix_time::ptime, double, double > multiqueue_t;
-    multiqueue_t q{boost::posix_time::seconds( 2 /*timeout*/  ) };
-
-    boost::posix_time::ptime t( boost::gregorian::date( 2023, 1, 1 ) );
-    std::get<0>(q.queues) = std::queue< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
-    std::get<1>(q.queues) = std::queue< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
-    EXPECT_EQ( std::get<0>(q.queues).size(), 1 );
-    EXPECT_EQ( std::get<1>(q.queues).size(), 1 );
-    EXPECT_EQ( q.ready(), true );
-}
diff --git a/containers/test/ordered_queues_test.cpp b/containers/test/ordered_queues_test.cpp
new file mode 100644
index 000000000..090a11af8
--- /dev/null
+++ b/containers/test/ordered_queues_test.cpp
@@ -0,0 +1,167 @@
+// Copyright (c) 2023 Mission Systems Pty Ltd
+
+#include <gtest/gtest.h>
+#include "../ordered/queues.h"
+
+TEST( queues, usage )
+{
+    typedef comma::containers::ordered::queues< int, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/  };
+
+    EXPECT_EQ( std::get<0>(q).size(), 0 );
+    EXPECT_EQ( std::get<1>(q).size(), 0 );
+    EXPECT_EQ( q.ready(), false );
+
+    std::get<0>(q).push( std::make_pair( 0, 1 ) );
+    EXPECT_EQ( std::get<0>(q).front().second, 1 );
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 0 );
+    EXPECT_EQ( q.ready(), false );
+
+    std::get<1>(q).push( std::make_pair( 0, 1 ) );
+    EXPECT_EQ( std::get<1>(q).front().second, 1 );
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+
+    // Purge should only remove items if they are unsynced
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).front().second, 1 );
+    EXPECT_EQ( std::get<1>(q).front().second, 1 );
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+}
+
+TEST( queues, sync_first_to_second ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/  };
+
+    std::get<0>(q) = std::queue< std::pair< float, int > >({ {0, 0}, {2, 0}, {4, 5} });
+    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    EXPECT_EQ( q.ready(), false );
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 4 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );    
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+
+}
+
+TEST( queues, sync_second_to_first ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/  };
+
+    std::get<0>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q) = std::queue< std::pair< float, int > >({ {1, 0}, {2, 0}, {4, 5} });
+    EXPECT_EQ( q.ready(), false );
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 5 );
+    EXPECT_EQ( std::get<1>(q).front().first, 4 );    
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+
+}
+
+TEST( queues, empty_list_before_sync ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::queue< std::pair< float, int > >({ {0, 0}, {1, 0}, {2, 5} });
+    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 0 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), false );
+}
+
+TEST( queues, max_time_offset ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::queue< std::pair< float, int > >({ {3, 5} });
+    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 3 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );        
+    EXPECT_EQ( q.ready(), true );
+}
+
+TEST( queues, floating_point_error ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    {
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::queue< std::pair< float, int > >({ {3.000001, 5} });
+    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_NEAR( std::get<0>(q).front().first, 3.000001, 1e-6 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );        
+    EXPECT_EQ( q.ready(), true );
+    }
+    {
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::queue< std::pair< float, int > >({ {2.999999, 5} });
+    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 0 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );        
+    EXPECT_EQ( q.ready(), false );
+    }
+    {
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q) = std::queue< std::pair< float, int > >({ {3.000001, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 5 );
+    EXPECT_NEAR( std::get<1>(q).front().first, 3.000001, 1e-6 );
+    EXPECT_EQ( q.ready(), true );
+    }
+    {
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q) = std::queue< std::pair< float, int > >({ {2.999999, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 0 );
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 5 );
+    EXPECT_EQ( q.ready(), false );
+    }    
+}
+
+TEST( queues, type_difference ){
+    typedef comma::containers::ordered::queues< float, int, double > queues_t;
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::queue< std::pair< float, int > >({ {0, 1} });
+    std::get<1>(q) = std::queue< std::pair< float, double > >({ {0, 1.0} });
+}
+
+TEST( queues, boost_time ){
+    typedef comma::containers::ordered::queues< boost::posix_time::ptime, double, double > queues_t;
+    queues_t q{boost::posix_time::seconds( 2 /*timeout*/  ) };
+
+    boost::posix_time::ptime t( boost::gregorian::date( 2023, 1, 1 ) );
+    std::get<0>(q) = std::queue< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
+    std::get<1>(q) = std::queue< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+}

From 5049273612b631684735cb1e89e08329eefc7d54 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 11 Jun 2024 11:50:28 +1000
Subject: [PATCH 0829/1056] containers::ordered::queues: simplified: type
 traits torn down

---
 containers/ordered/queues.h | 16 +++++-----------
 1 file changed, 5 insertions(+), 11 deletions(-)

diff --git a/containers/ordered/queues.h b/containers/ordered/queues.h
index f5aa3a6e0..2902f1835 100644
--- a/containers/ordered/queues.h
+++ b/containers/ordered/queues.h
@@ -10,27 +10,21 @@
 
 namespace comma { namespace containers { namespace ordered {
 
-namespace impl {
-
-template < typename K > struct traits { typedef K diff_type; };
-template <> struct traits< boost::posix_time::ptime > { typedef boost::posix_time::time_duration diff_type; };
-
-}
-
 /// @todo variadic types
 /// @todo don't use std::pair, use traits instead?
 template < typename K, typename T, typename S >
 class queues: public std::tuple< std::queue< std::pair< K, T > >, std::queue< std::pair< K, S > > >
 {
     public:
-        typedef std::tuple< std::queue< std::pair< K, T > >, std::queue< std::pair< K, S > > > queues_t;
-        queues( typename impl::traits< K >::diff_type max_diff ): _max_diff( max_diff ) {}
+        typedef std::tuple< std::queue< std::pair< K, T > >, std::queue< std::pair< K, S > > > queues_type;
+        typedef decltype( K() - K() ) diff_type;
+        queues( diff_type max_diff ): _max_diff( max_diff ) {}
         bool ready() const;
         void purge();
 
     private:
-        typename impl::traits< K >::diff_type _max_diff;
-        static typename impl::traits< K >::diff_type _abs_diff(K lhs, K rhs) { return lhs < rhs ? (rhs - lhs) : (lhs - rhs); }
+        diff_type _max_diff;
+        static diff_type _abs_diff(K lhs, K rhs) { return lhs < rhs ? (rhs - lhs) : (lhs - rhs); }
 };
 
 template < typename K, typename T, typename S >

From 0b4140402436b617ccf8f25d49457512a53bcede Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 11 Jun 2024 11:54:06 +1000
Subject: [PATCH 0830/1056] containers::ordered::queues: dependency on
 boost::posix_time removed

---
 containers/ordered/queues.h             | 1 -
 containers/test/ordered_queues_test.cpp | 7 +++++--
 2 files changed, 5 insertions(+), 3 deletions(-)

diff --git a/containers/ordered/queues.h b/containers/ordered/queues.h
index 2902f1835..aba3e3dbb 100644
--- a/containers/ordered/queues.h
+++ b/containers/ordered/queues.h
@@ -6,7 +6,6 @@
 
 #include <queue>
 #include <tuple>
-#include <boost/date_time/posix_time/posix_time.hpp>
 
 namespace comma { namespace containers { namespace ordered {
 
diff --git a/containers/test/ordered_queues_test.cpp b/containers/test/ordered_queues_test.cpp
index 090a11af8..925edc262 100644
--- a/containers/test/ordered_queues_test.cpp
+++ b/containers/test/ordered_queues_test.cpp
@@ -1,6 +1,7 @@
 // Copyright (c) 2023 Mission Systems Pty Ltd
 
 #include <gtest/gtest.h>
+#include <boost/date_time/posix_time/posix_time.hpp>
 #include "../ordered/queues.h"
 
 TEST( queues, usage )
@@ -147,14 +148,16 @@ TEST( queues, floating_point_error ){
     }    
 }
 
-TEST( queues, type_difference ){
+TEST( queues, type_difference )
+{
     typedef comma::containers::ordered::queues< float, int, double > queues_t;
     queues_t q{ 2 /*timeout*/ };
     std::get<0>(q) = std::queue< std::pair< float, int > >({ {0, 1} });
     std::get<1>(q) = std::queue< std::pair< float, double > >({ {0, 1.0} });
 }
 
-TEST( queues, boost_time ){
+TEST( queues, boost_time )
+{
     typedef comma::containers::ordered::queues< boost::posix_time::ptime, double, double > queues_t;
     queues_t q{boost::posix_time::seconds( 2 /*timeout*/  ) };
 

From b3c6cc3f8cc11dd82a2f4bda204ac1cb6f16b97d Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 11 Jun 2024 16:17:38 +1000
Subject: [PATCH 0831/1056] io::istreams::read() and ::operator++() implemented

---
 io/stream.cpp | 31 +++++++++++++++++++++++++++----
 io/stream.h   |  6 ++++--
 2 files changed, 31 insertions(+), 6 deletions(-)

diff --git a/io/stream.cpp b/io/stream.cpp
index ba9e31baa..f48f38bc9 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -390,12 +390,35 @@ ostream::ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, boo
 ostream::ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close ) : stream< std::ostream >( s, fd, mode, blocking, close ) {}
 iostream::iostream( const std::string& name, mode::value mode , mode::blocking_value blocking ) : stream< std::iostream >( name, mode, blocking ) {}
 
-istreams::istreams( const std::vector< std::string >& names, mode::value mode, mode::blocking_value blocking ): _istream( std::make_unique< istream >( names[0], mode, blocking ) ), _names( names ), _index( 0 ) {}
+istreams::istreams( const std::vector< std::string >& names, mode::value mode, mode::blocking_value blocking ): _istream( std::make_unique< istream >( names[0], mode, blocking ) ), _names( names ), _index( 0 ), _mode( mode ), _blocking( blocking ) {}
 
-stream< std::istream >& istreams::operator++()
+istreams& istreams::operator++()
 {
-    // todo
-    COMMA_THROW( comma::exception, "todo" );
+    ++_index;
+    if( _index < _names.size() ) { _istream.reset(); _istream.reset( new istream( _names[_index], _mode, _blocking ) ); }
+    return *this;
+}
+
+bool istreams::read( char* buf, std::size_t size )
+{
+    std::size_t s = size;
+    for( char* p = buf; s > 0 && !eof(); ++( *this ) )
+    {
+        auto& is = *( *_istream );
+        is.read( p, s );
+        if( is.gcount() > 0 ) { s -= is.gcount(); p += is.gcount(); }
+    }
+    return s == 0;
+}
+
+std::string istreams::getline()
+{
+    COMMA_THROW( comma::exception, "todo, just ask" );
+}
+
+void seek( std::uint64_t offset )
+{
+    COMMA_THROW( comma::exception, "todo, just ask" );
 }
 
 } } // namespace comma { namespace io {
diff --git a/io/stream.h b/io/stream.h
index 90b4d04ab..d1837a5e9 100644
--- a/io/stream.h
+++ b/io/stream.h
@@ -135,16 +135,18 @@ class istreams
         istreams( const std::vector< std::string >& names, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
         static std::string usage( unsigned int indent = 0, bool verbose = false );
         bool eof() const { return _index + 1 < _names.size() || ( *_istream )->eof(); }
-        void read( char* buf, std::size_t size );
+        bool read( char* buf, std::size_t size );
         std::string getline();
         void seek( std::uint64_t offset );
         stream< std::istream >& operator()() { return *_istream; }
         const stream< std::istream >& operator()() const { return *_istream; }
-        stream< std::istream >& operator++();
+        istreams& operator++();
     protected:
         std::unique_ptr< istream > _istream;
         std::vector< std::string > _names;
         unsigned int _index{0};
+        mode::value _mode;
+        mode::blocking_value _blocking;
 };
 
 } } // namespace comma { namespace io {

From cc545891ffb04f6fab60cdb408982b80d4a85496 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 12 Jun 2024 16:19:24 +1000
Subject: [PATCH 0832/1056] io::istreams::eof(): bug fixed

---
 io/stream.cpp | 12 +++++++++++-
 io/stream.h   |  2 +-
 2 files changed, 12 insertions(+), 2 deletions(-)

diff --git a/io/stream.cpp b/io/stream.cpp
index f48f38bc9..92ea7bdc0 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -390,10 +390,20 @@ ostream::ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, boo
 ostream::ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close ) : stream< std::ostream >( s, fd, mode, blocking, close ) {}
 iostream::iostream( const std::string& name, mode::value mode , mode::blocking_value blocking ) : stream< std::iostream >( name, mode, blocking ) {}
 
-istreams::istreams( const std::vector< std::string >& names, mode::value mode, mode::blocking_value blocking ): _istream( std::make_unique< istream >( names[0], mode, blocking ) ), _names( names ), _index( 0 ), _mode( mode ), _blocking( blocking ) {}
+istreams::istreams( const std::vector< std::string >& names, mode::value mode, mode::blocking_value blocking )
+    : _istream( std::make_unique< istream >( names[0], mode, blocking ) )
+    , _names( names )
+    , _index( 0 )
+    , _mode( mode )
+    , _blocking( blocking )
+{
+}
+
+bool istreams::eof() const { return _index >= _names.size() || _index == _names.size() - 1 || ( *_istream )->eof(); }
 
 istreams& istreams::operator++()
 {
+    if( _index >= _names.size() ) { return *this; }
     ++_index;
     if( _index < _names.size() ) { _istream.reset(); _istream.reset( new istream( _names[_index], _mode, _blocking ) ); }
     return *this;
diff --git a/io/stream.h b/io/stream.h
index d1837a5e9..70e3ff013 100644
--- a/io/stream.h
+++ b/io/stream.h
@@ -134,7 +134,7 @@ class istreams
         // todo: istreams( const std::string& dir...
         istreams( const std::vector< std::string >& names, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
         static std::string usage( unsigned int indent = 0, bool verbose = false );
-        bool eof() const { return _index + 1 < _names.size() || ( *_istream )->eof(); }
+        bool eof() const;
         bool read( char* buf, std::size_t size );
         std::string getline();
         void seek( std::uint64_t offset );

From cc5a6087fa103cca9e92cab65321298373b72874 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 18 Jun 2024 17:54:14 +1000
Subject: [PATCH 0833/1056] bash/comma-application-util: swiss: optional usage
 function check added

---
 bash/comma-application-util | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 8d8d72703..397265145 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -307,7 +307,7 @@ function comma-application-swiss-usage()
 {
     local common_options=$( cat )
     echo
-    echo "usage: $( basename "$0" ) <operation> <options>"
+    if [[ $( type -t usage ) == "function" ]]; then usage; else echo "usage: $( basename "$0" ) <operation> <options>"; fi
     echo; echo "common options"
     { [[ -z "$common_options" ]] || echo "$common_options"; comma-application-common-options; } | sed 's#^#   #'
     echo; echo "available operations: ${operations[@]}"

From 962a89295785d4caa7421d650a3e60c8a0ad68a9 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 18 Jun 2024 19:33:43 +1000
Subject: [PATCH 0834/1056] bash/comma-application-util: comma-source-relative
 implemented

---
 bash/comma-application-util | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 397265145..998a1137e 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -19,6 +19,17 @@ readonly comma_application_util_include_guard_=1
 
 source $( type -p comma-name-value-util ) || { echo "$comma_application_name: cannot source 'comma-name-value-util' from '$BASH_SOURCE'" >&2; exit 1; }
 
+## @page comma-source-relative comma-source-relative
+# @section comma-source-relative
+# @description source relative to the location of the calling
+#              script/subshell (a trivial convenience wrapper)
+# @param relative path to source
+function comma-source-relative()
+{
+    source "$( realpath $( dirname $0 ) )"/$1
+}
+export -f comma-source-relative
+
 ## @page comma_options_from_name_value comma_options_from_name_value
 # @section comma_options_from_name_value
 # @description convert path-value pairs to bash variables

From b6c56f96b065ce7fb9f9c8267413416a57fdbc52 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 20 Jun 2024 12:32:53 +1000
Subject: [PATCH 0835/1056] comma-application-util: comma-source-relative:
 support for wildcards and multiple sources implemented and tested

---
 bash/comma-application-util                         | 11 +++++++++--
 .../comma-source-relative/a/b/x                     |  3 +++
 .../comma-source-relative/a/b/y                     |  3 +++
 .../comma-source-relative/a/z                       |  3 +++
 .../comma-source-relative/expected                  | 13 +++++++++++++
 .../comma-source-relative/test                      |  9 +++++++++
 6 files changed, 40 insertions(+), 2 deletions(-)
 create mode 100644 bash/test/comma-application-util/comma-source-relative/a/b/x
 create mode 100644 bash/test/comma-application-util/comma-source-relative/a/b/y
 create mode 100644 bash/test/comma-application-util/comma-source-relative/a/z
 create mode 100644 bash/test/comma-application-util/comma-source-relative/expected
 create mode 100755 bash/test/comma-application-util/comma-source-relative/test

diff --git a/bash/comma-application-util b/bash/comma-application-util
index 998a1137e..4f6ff584b 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -23,10 +23,17 @@ source $( type -p comma-name-value-util ) || { echo "$comma_application_name: ca
 # @section comma-source-relative
 # @description source relative to the location of the calling
 #              script/subshell (a trivial convenience wrapper)
-# @param relative path to source
+# @param whitespace-separated relative paths to source
+#        regular expressions permitted, e.g. my/sources/*
+#        as well as directory names, e.g. my/sources, which is the
+#        same as my/sources/*
 function comma-source-relative()
 {
-    source "$( realpath $( dirname $0 ) )"/$1
+    local dir="$( realpath $( dirname $0 ) )"
+    for s in "$@"; do
+        if [[ -d "$s" ]]; then for t in "$s"/*; do comma-source-relative "$t" || return 1; done
+        else source "$dir/$s" || return 1; fi
+    done
 }
 export -f comma-source-relative
 
diff --git a/bash/test/comma-application-util/comma-source-relative/a/b/x b/bash/test/comma-application-util/comma-source-relative/a/b/x
new file mode 100644
index 000000000..b2b26ad4d
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/a/b/x
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+echo "a/b/x/sourced=1"
diff --git a/bash/test/comma-application-util/comma-source-relative/a/b/y b/bash/test/comma-application-util/comma-source-relative/a/b/y
new file mode 100644
index 000000000..57886fadc
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/a/b/y
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+echo "a/b/y/sourced=1"
diff --git a/bash/test/comma-application-util/comma-source-relative/a/z b/bash/test/comma-application-util/comma-source-relative/a/z
new file mode 100644
index 000000000..c117c82e6
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/a/z
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+echo "a/z/sourced=1"
diff --git a/bash/test/comma-application-util/comma-source-relative/expected b/bash/test/comma-application-util/comma-source-relative/expected
new file mode 100644
index 000000000..930585d1c
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/expected
@@ -0,0 +1,13 @@
+once/a/b/x/sourced=1
+multiple/a/b/x/sourced=1
+multiple/a/b/y/sourced=1
+multiple/a/z/sourced=1
+wildcard/a/b/x/sourced=1
+wildcard/a/b/y/sourced=1
+directory/a/b/x/sourced=1
+directory/a/b/y/sourced=1
+directories/a/b/x/sourced=1
+directories/a/b/y/sourced=1
+directories/a/b/x/sourced=1
+directories/a/b/y/sourced=1
+directories/a/z/sourced=1
diff --git a/bash/test/comma-application-util/comma-source-relative/test b/bash/test/comma-application-util/comma-source-relative/test
new file mode 100755
index 000000000..5b8a9e95c
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/test
@@ -0,0 +1,9 @@
+#!/bin/bash
+
+source ../../../comma-application-util || exit 1
+
+comma-source-relative a/b/x | sed 's#^#once/#'
+comma-source-relative a/b/x a/b/y a/z | sed 's#^#multiple/#'
+comma-source-relative a/b/* | sed 's#^#wildcard/#'
+comma-source-relative a/b | sed 's#^#directory/#'
+comma-source-relative a/b a | sed 's#^#directories/#'

From a6579f0564f9e916ae910838bbe3e73fda960827 Mon Sep 17 00:00:00 2001
From: aspen <aspen@aspen>
Date: Tue, 9 Jul 2024 12:11:10 +1000
Subject: [PATCH 0836/1056] containers/CMakeLists.txt: Added ordered queues to
 install

---
 containers/CMakeLists.txt | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/containers/CMakeLists.txt b/containers/CMakeLists.txt
index c809b3809..1e9d5a730 100644
--- a/containers/CMakeLists.txt
+++ b/containers/CMakeLists.txt
@@ -4,15 +4,16 @@ SET( TARGET_NAME comma_${PROJECT} )
 FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
 FILE( GLOB multidimensional_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/multidimensional/*.h )
+FILE( GLOB ordered_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/ordered/*.h )
 
-SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${multidimensional_includes} )
-
-add_custom_target( ${TARGET_NAME} ${source} ${includes} ${multidimensional_includes} ) # ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_includes} )
+SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${multidimensional_includes} ${ordered_includes} )
+add_custom_target( ${TARGET_NAME} ${source} ${includes} ${multidimensional_includes} ${ordered_includes} ) # ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_includes} )
 #SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 #TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_base )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL( FILES ${multidimensional_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/multidimensional )
+INSTALL( FILES ${ordered_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ordered )
 #INSTALL(
 #    TARGETS ${TARGET_NAME}
 #    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll

From a9fd6f7a38efed2f11b4a72c713e81f41b107424 Mon Sep 17 00:00:00 2001
From: aspen <aspen@aspen>
Date: Tue, 9 Jul 2024 13:09:13 +1000
Subject: [PATCH 0837/1056] containers/ordered/queues.h

Switch to deque for flexibility.
Add convenience function pop_all() to pop the front element of both queues.
---
 containers/ordered/queues.h             | 35 ++++++++++--
 containers/test/ordered_queues_test.cpp | 76 ++++++++++++++++++-------
 2 files changed, 84 insertions(+), 27 deletions(-)

diff --git a/containers/ordered/queues.h b/containers/ordered/queues.h
index aba3e3dbb..27580392a 100644
--- a/containers/ordered/queues.h
+++ b/containers/ordered/queues.h
@@ -4,26 +4,35 @@
 
 #pragma once
 
-#include <queue>
+#include <deque>
 #include <tuple>
 
 namespace comma { namespace containers { namespace ordered {
 
 /// @todo variadic types
 /// @todo don't use std::pair, use traits instead?
+/// @todo max_diff, grater or grater_equal? & document; unit test on ints; unit test on max diff 0]
+/// @todo pop_all will remove the first elements from both queues, but we may want to pop just one element and still keep the other one
+///       Use case: we want to get every (valid) element from both queues with its corresponding element from the other queue and process them
+///       independently. If we pop both elements, we may lose the correspondence between the elements from the two queues. 
 template < typename K, typename T, typename S >
-class queues: public std::tuple< std::queue< std::pair< K, T > >, std::queue< std::pair< K, S > > >
+class queues: public std::tuple< std::deque< std::pair< K, T > >, std::deque< std::pair< K, S > > >
 {
     public:
-        typedef std::tuple< std::queue< std::pair< K, T > >, std::queue< std::pair< K, S > > > queues_type;
+        typedef std::tuple< std::deque< std::pair< K, T > >, std::deque< std::pair< K, S > > > queues_type;
+        typedef std::tuple< std::pair< K, T >, std::pair< K, S > > values_type;
+        typedef std::tuple< const std::pair< K, T >&, const std::pair< K, S >& > ref_type;
         typedef decltype( K() - K() ) diff_type;
         queues( diff_type max_diff ): _max_diff( max_diff ) {}
         bool ready() const;
         void purge();
+        void pop_all();
+        ref_type front() const;
 
     private:
         diff_type _max_diff;
         static diff_type _abs_diff(K lhs, K rhs) { return lhs < rhs ? (rhs - lhs) : (lhs - rhs); }
+        template < unsigned int I, unsigned int J > bool _purge();
 };
 
 template < typename K, typename T, typename S >
@@ -37,16 +46,32 @@ template < typename K, typename T, typename S >
 inline void queues<K, T, S>::purge()
 {
     if( std::get<1>(*this).empty() || std::get<0>(*this).empty() ) { return; }
+    // If not purge 0,1, then purge 1,0
     while( std::get<0>(*this).front().first - std::get<1>(*this).front().first > _max_diff ) 
     { 
         if( std::get<1>(*this).empty() ) { return; }
-        std::get<1>(*this).pop(); 
+        std::get<1>(*this).pop_front();
     }
     while( std::get<1>(*this).front().first - std::get<0>(*this).front().first > _max_diff ) 
     { 
         if( std::get<0>(*this).empty() ) { return; }
-        std::get<0>(*this).pop(); 
+        std::get<0>(*this).pop_front();
     }
 }
 
+template < typename K, typename T, typename S >
+void queues<K, T, S>::pop_all()
+{
+    std::get<0>(*this).pop_front();
+    std::get<1>(*this).pop_front();
+    return;
+}
+
+
+template < typename K, typename T, typename S >
+inline typename queues<K, T, S>::ref_type queues<K, T, S>::front() const
+{
+    return { std::get<0>(*this).front(), std::get<1>(*this).front() };
+}
+
 } } } // namespace comma { namespace containers { namespace ordered {
diff --git a/containers/test/ordered_queues_test.cpp b/containers/test/ordered_queues_test.cpp
index 925edc262..923197ea7 100644
--- a/containers/test/ordered_queues_test.cpp
+++ b/containers/test/ordered_queues_test.cpp
@@ -13,13 +13,13 @@ TEST( queues, usage )
     EXPECT_EQ( std::get<1>(q).size(), 0 );
     EXPECT_EQ( q.ready(), false );
 
-    std::get<0>(q).push( std::make_pair( 0, 1 ) );
+    std::get<0>(q).push_back( std::make_pair( 0, 1 ) );
     EXPECT_EQ( std::get<0>(q).front().second, 1 );
     EXPECT_EQ( std::get<0>(q).size(), 1 );
     EXPECT_EQ( std::get<1>(q).size(), 0 );
     EXPECT_EQ( q.ready(), false );
 
-    std::get<1>(q).push( std::make_pair( 0, 1 ) );
+    std::get<1>(q).push_back( std::make_pair( 0, 1 ) );
     EXPECT_EQ( std::get<1>(q).front().second, 1 );
     EXPECT_EQ( std::get<0>(q).size(), 1 );
     EXPECT_EQ( std::get<1>(q).size(), 1 );
@@ -38,8 +38,8 @@ TEST( queues, sync_first_to_second ){
     typedef comma::containers::ordered::queues< float, int, int > queues_t;
     queues_t q{ 2 /*timeout*/  };
 
-    std::get<0>(q) = std::queue< std::pair< float, int > >({ {0, 0}, {2, 0}, {4, 5} });
-    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {0, 0}, {2, 0}, {4, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
     EXPECT_EQ( q.ready(), false );
     q.purge();
     EXPECT_EQ( std::get<0>(q).front().second, 5 );
@@ -56,8 +56,8 @@ TEST( queues, sync_second_to_first ){
     typedef comma::containers::ordered::queues< float, int, int > queues_t;
     queues_t q{ 2 /*timeout*/  };
 
-    std::get<0>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
-    std::get<1>(q) = std::queue< std::pair< float, int > >({ {1, 0}, {2, 0}, {4, 5} });
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {1, 0}, {2, 0}, {4, 5} });
     EXPECT_EQ( q.ready(), false );
     q.purge();
     EXPECT_EQ( std::get<0>(q).front().second, 5 );
@@ -73,19 +73,51 @@ TEST( queues, sync_second_to_first ){
 TEST( queues, empty_list_before_sync ){
     typedef comma::containers::ordered::queues< float, int, int > queues_t;
     queues_t q{ 2 /*timeout*/ };
-    std::get<0>(q) = std::queue< std::pair< float, int > >({ {0, 0}, {1, 0}, {2, 5} });
-    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {0, 0}, {1, 0}, {2, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
     q.purge();
     EXPECT_EQ( std::get<0>(q).size(), 0 );
     EXPECT_EQ( std::get<1>(q).size(), 1 );
     EXPECT_EQ( q.ready(), false );
 }
 
+TEST( queues, sync_and_pop ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 0.9 /*timeout*/ };
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {0, 1}, {1, 1}, {2, 1}, {3, 1}, {4, 1}, {5, 1} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {3, 2}, {5, 2}});
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 3 ); // {3, 1}, {4, 1}, {5, 1} });
+    EXPECT_EQ( std::get<1>(q).size(), 2 ); // {3, 2}, {5, 2}});
+    EXPECT_EQ( std::get<0>(q).front().first, 3 );
+    EXPECT_EQ( std::get<1>(q).front().first, 3 );
+    EXPECT_EQ( q.ready(), true );
+
+    auto data = q.front();
+    q.pop_all();
+    EXPECT_EQ( std::get<0>(data).first, 3 );
+    EXPECT_EQ( std::get<1>(data).first, 3 );
+    EXPECT_EQ( std::get<0>(q).size(), 2 ); // {4, 1}, {5, 1} });
+    EXPECT_EQ( std::get<1>(q).size(), 1 ); // {5, 2}});
+    EXPECT_EQ( std::get<0>(q).front().first, 4 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );
+
+    EXPECT_EQ( q.ready(), false );
+    q.purge();
+    EXPECT_EQ( q.ready(), true );
+
+    EXPECT_EQ( std::get<0>(q).size(), 1 ); // {5, 1} });
+    EXPECT_EQ( std::get<1>(q).size(), 1 ); // {5, 2}});
+    EXPECT_EQ( std::get<0>(q).front().first, 5 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );
+    EXPECT_EQ( q.ready(), true );
+}
+
 TEST( queues, max_time_offset ){
     typedef comma::containers::ordered::queues< float, int, int > queues_t;
     queues_t q{ 2 /*timeout*/ };
-    std::get<0>(q) = std::queue< std::pair< float, int > >({ {3, 5} });
-    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {3, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
     q.purge();
     EXPECT_EQ( std::get<0>(q).size(), 1 );
     EXPECT_EQ( std::get<1>(q).size(), 1 );
@@ -100,8 +132,8 @@ TEST( queues, floating_point_error ){
     typedef comma::containers::ordered::queues< float, int, int > queues_t;
     {
     queues_t q{ 2 /*timeout*/ };
-    std::get<0>(q) = std::queue< std::pair< float, int > >({ {3.000001, 5} });
-    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {3.000001, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
     q.purge();
     EXPECT_EQ( std::get<0>(q).size(), 1 );
     EXPECT_EQ( std::get<1>(q).size(), 1 );
@@ -113,8 +145,8 @@ TEST( queues, floating_point_error ){
     }
     {
     queues_t q{ 2 /*timeout*/ };
-    std::get<0>(q) = std::queue< std::pair< float, int > >({ {2.999999, 5} });
-    std::get<1>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {2.999999, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
     q.purge();
     EXPECT_EQ( std::get<0>(q).size(), 0 );
     EXPECT_EQ( std::get<1>(q).size(), 1 );
@@ -124,8 +156,8 @@ TEST( queues, floating_point_error ){
     }
     {
     queues_t q{ 2 /*timeout*/ };
-    std::get<0>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
-    std::get<1>(q) = std::queue< std::pair< float, int > >({ {3.000001, 5} });
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {3.000001, 5} });
     q.purge();
     EXPECT_EQ( std::get<0>(q).size(), 1 );
     EXPECT_EQ( std::get<1>(q).size(), 1 );
@@ -137,8 +169,8 @@ TEST( queues, floating_point_error ){
     }
     {
     queues_t q{ 2 /*timeout*/ };
-    std::get<0>(q) = std::queue< std::pair< float, int > >({ {5, 5} });
-    std::get<1>(q) = std::queue< std::pair< float, int > >({ {2.999999, 5} });
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {2.999999, 5} });
     q.purge();
     EXPECT_EQ( std::get<0>(q).size(), 1 );
     EXPECT_EQ( std::get<1>(q).size(), 0 );
@@ -152,8 +184,8 @@ TEST( queues, type_difference )
 {
     typedef comma::containers::ordered::queues< float, int, double > queues_t;
     queues_t q{ 2 /*timeout*/ };
-    std::get<0>(q) = std::queue< std::pair< float, int > >({ {0, 1} });
-    std::get<1>(q) = std::queue< std::pair< float, double > >({ {0, 1.0} });
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {0, 1} });
+    std::get<1>(q) = std::deque< std::pair< float, double > >({ {0, 1.0} });
 }
 
 TEST( queues, boost_time )
@@ -162,8 +194,8 @@ TEST( queues, boost_time )
     queues_t q{boost::posix_time::seconds( 2 /*timeout*/  ) };
 
     boost::posix_time::ptime t( boost::gregorian::date( 2023, 1, 1 ) );
-    std::get<0>(q) = std::queue< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
-    std::get<1>(q) = std::queue< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
+    std::get<0>(q) = std::deque< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
+    std::get<1>(q) = std::deque< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
     EXPECT_EQ( std::get<0>(q).size(), 1 );
     EXPECT_EQ( std::get<1>(q).size(), 1 );
     EXPECT_EQ( q.ready(), true );

From c103b9c3c84a3e777411f0824b0d2b9ae183c241 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 23 Jul 2024 16:56:41 +1000
Subject: [PATCH 0838/1056] containers/test/multidimensional_array_test.cpp:
 quick and dirty: cache miss slowdown: added and commented out

---
 .../test/multidimensional_array_test.cpp      | 29 ++++++++++++++++++-
 1 file changed, 28 insertions(+), 1 deletion(-)

diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index a48b25cf8..93b476201 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -1,6 +1,8 @@
 // Copyright (c) 2023 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
+// #include <numeric>
+// #include <boost/date_time/posix_time/posix_time.hpp>
 #include "../multidimensional/array.h"
 
 namespace cmd = comma::containers::multidimensional; 
@@ -213,4 +215,29 @@ TEST( multidimensional_array, grid_interpolate )
         //EXPECT_EQ( g.interpolated( {1, 0} ), 2 );
         //EXPECT_EQ( g.interpolated( {1, 1} ), 3 );
     }
-}
\ No newline at end of file
+}
+
+// TEST( vector_of_vectors, performance )
+// {
+//     //std::pair< unsigned int, unsigned int > size{ 10000000, 4 };
+//     std::pair< unsigned int, unsigned int > size{ 4096, 8 };
+//     std::vector< std::vector< float > > a( size.first, std::vector< float >( size.second, 0 ) );
+//     std::vector< float > b( size.first * size.second, 0 );
+//     auto t0 = boost::posix_time::microsec_clock::universal_time();
+//     for( auto& c: a )
+//     {
+//         for( auto& d: c )
+//         {
+//             d += 10;
+//         }
+//     }
+//     auto t1 = boost::posix_time::microsec_clock::universal_time();
+//     for( auto& d: b )
+//     {
+//         d += 10;
+//     }
+//     auto t2 = boost::posix_time::microsec_clock::universal_time();
+//     auto e0 = double( ( t1 - t0 ).total_microseconds() ) / 1e6;
+//     auto e1 = double( ( t2 - t1 ).total_microseconds() ) / 1e6;
+//     std::cerr << "==> speedup: " << ( e0 / e1 ) << "\tvector of vectors: elapsed: " << e0 << "\tvector: elapsed: " << e1 << std::endl;
+// }

From 54cd161145473359c91f9a296fe60dca4970afd5 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 23 Jul 2024 18:09:31 +1000
Subject: [PATCH 0839/1056] containers/test/multidimensional_array_test.cpp:
 quick and dirty: memcpy speedup: added and commented out

---
 .../test/multidimensional_array_test.cpp      | 50 ++++++++++++++-----
 1 file changed, 38 insertions(+), 12 deletions(-)

diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 93b476201..e33ddd596 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -1,8 +1,7 @@
 // Copyright (c) 2023 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
-// #include <numeric>
-// #include <boost/date_time/posix_time/posix_time.hpp>
+//#include <boost/date_time/posix_time/posix_time.hpp>
 #include "../multidimensional/array.h"
 
 namespace cmd = comma::containers::multidimensional; 
@@ -223,21 +222,48 @@ TEST( multidimensional_array, grid_interpolate )
 //     std::pair< unsigned int, unsigned int > size{ 4096, 8 };
 //     std::vector< std::vector< float > > a( size.first, std::vector< float >( size.second, 0 ) );
 //     std::vector< float > b( size.first * size.second, 0 );
-//     auto t0 = boost::posix_time::microsec_clock::universal_time();
-//     for( auto& c: a )
 //     {
-//         for( auto& d: c )
+//         auto t0 = boost::posix_time::microsec_clock::universal_time();
+//         for( auto& c: a )
+//         {
+//             for( auto& d: c )
+//             {
+//                 d += 10;
+//             }
+//         }
+//         auto t1 = boost::posix_time::microsec_clock::universal_time();
+//         for( auto& d: b )
 //         {
 //             d += 10;
 //         }
+//         auto t2 = boost::posix_time::microsec_clock::universal_time();
+//         auto e0 = double( ( t1 - t0 ).total_microseconds() ) / 1e6;
+//         auto e1 = double( ( t2 - t1 ).total_microseconds() ) / 1e6;
+//         //std::cerr << "==> cashe hits:\tspeedup: " << ( e0 / e1 ) << "\tvector of vectors: elapsed: " << e0 << "\tvector: elapsed: " << e1 << std::endl;
+//         std::cerr << "==> cashe hits:\tspeedup: " << ( e0 / e1 ) << std::endl;
+//     }
+//     {
+//         std::vector< float > z( size.first * size.second, 0 );
+//         auto t0 = boost::posix_time::microsec_clock::universal_time();
+//         for( unsigned int i = 0; i < b.size(); ++i ) { z[i] = b[i]; }
+//         auto t1 = boost::posix_time::microsec_clock::universal_time();
+//         std::memcpy( reinterpret_cast< char* >( &z[0] ), reinterpret_cast< const char* >( &b[0] ), b.size() * sizeof( b[0] ) );
+//         auto t2 = boost::posix_time::microsec_clock::universal_time();
+//         auto e0 = double( ( t1 - t0 ).total_microseconds() ) / 1e6;
+//         auto e1 = double( ( t2 - t1 ).total_microseconds() ) / 1e6;
+//         //std::cerr << "==> memcpy:\tspeedup: " << ( e0 / e1 ) << "\tvector of vectors: elapsed: " << e0 << "\tvector: elapsed: " << e1 << std::endl;
+//         std::cerr << "==> memcpy vs element-wise assignment:\tspeedup: " << ( e0 / e1 ) << std::endl;
 //     }
-//     auto t1 = boost::posix_time::microsec_clock::universal_time();
-//     for( auto& d: b )
 //     {
-//         d += 10;
+//         std::vector< float > z( size.first * size.second, 0 );
+//         auto t0 = boost::posix_time::microsec_clock::universal_time();
+//         std::copy( b.begin(), b.end(), z.begin() );
+//         auto t1 = boost::posix_time::microsec_clock::universal_time();
+//         std::memcpy( reinterpret_cast< char* >( &z[0] ), reinterpret_cast< const char* >( &b[0] ), b.size() * sizeof( b[0] ) );
+//         auto t2 = boost::posix_time::microsec_clock::universal_time();
+//         auto e0 = double( ( t1 - t0 ).total_microseconds() ) / 1e6;
+//         auto e1 = double( ( t2 - t1 ).total_microseconds() ) / 1e6;
+//         //std::cerr << "==> memcpy:\tspeedup: " << ( e0 / e1 ) << "\tvector of vectors: elapsed: " << e0 << "\tvector: elapsed: " << e1 << std::endl;
+//         std::cerr << "==> memcpy vs std::copy:\tspeedup: " << ( e0 / e1 ) << std::endl;
 //     }
-//     auto t2 = boost::posix_time::microsec_clock::universal_time();
-//     auto e0 = double( ( t1 - t0 ).total_microseconds() ) / 1e6;
-//     auto e1 = double( ( t2 - t1 ).total_microseconds() ) / 1e6;
-//     std::cerr << "==> speedup: " << ( e0 / e1 ) << "\tvector of vectors: elapsed: " << e0 << "\tvector: elapsed: " << e1 << std::endl;
 // }

From e0b9972e2cd3849a04a6f5540a1437109e8508a0 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 25 Jul 2024 15:04:26 +1000
Subject: [PATCH 0840/1056] csv::write() implemented

---
 csv/stream.h | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)

diff --git a/csv/stream.h b/csv/stream.h
index 51d5df091..93a829353 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -44,6 +44,10 @@ template < typename V > V read_as( const std::string& filename, const options& o
 template < typename V > V read_as( std::istream& is, const options& o, const typename V::value_type& default_value, std::size_t size = 0 );
 template < typename V > V read_as( const std::string& filename, const options& o, const typename V::value_type& default_value, std::size_t size = 0 );
 
+/// convenience functions: write to output stream from a non-mapped container
+template < typename V > void write( const V& v, std::ostream& os, const options& o, const typename V::value_type& default_value );
+template < typename V > void write( const V& v, std::ostream& os, const options& o = options() );
+
 /// ascii csv input stream
 template < typename S >
 class ascii_input_stream : public boost::noncopyable
@@ -851,6 +855,20 @@ inline void output_stream< S >::append_output( input_stream< T >& is, const S& s
     }
 }*/
 
+template < typename V > inline void write( const V& v, std::ostream& os, const options& o ) { if( !v.empty() ) { write( v, os, o, typename V::value_type() ); } }
+
+template < typename V > inline void write( const V& v, std::ostream& os, const options& o, const typename V::value_type& default_value )
+{
+    if( v.empty() ) { return; }
+    output_stream< typename V::value_type > ostream( os, o, default_value );
+    for( const auto& e: v )
+    {
+        COMMA_ASSERT( os.good(), "output stream not good" );
+        ostream.write( e );
+    }
+    if( o.flush ) { os.flush(); }
+}
+
 template < typename V > inline V read_as( std::istream& is, const options& o, const typename V::value_type& default_value, std::size_t size )
 {
     input_stream< typename V::value_type > istream( is, o, default_value );

From 8f3a067d69a6d0081f87b631e3360e716af434ef Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 25 Jul 2024 17:42:34 +1000
Subject: [PATCH 0841/1056] containers::multidimensional::index: implemented
 and tested

---
 containers/multidimensional/array.h           | 55 +++++++++++
 .../test/multidimensional_array_test.cpp      | 98 ++++++++++++++++---
 2 files changed, 141 insertions(+), 12 deletions(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index 8667f2fc1..43811c66a 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -5,11 +5,27 @@
 #pragma once
 
 #include <array>
+#include <cstring>
 #include "../../base/types.h"
 #include "array_traits.h"
 
 namespace comma { namespace containers { namespace multidimensional {
 
+template < unsigned int D >
+struct index: public std::array< std::size_t, D >
+{
+    typedef std::array< std::size_t, D > base_t;
+
+    //index() { std::memset( reinterpret_cast< char* >( this ), 0, sizeof( std::size_t ) * D ); }
+    template < typename... Args > index( Args... args ): base_t( { args... } ) {}
+    bool operator<( const index& rhs ) const;
+    bool operator==( const index& rhs ) const;
+    bool operator!=( const index& rhs ) const { return !operator==( rhs ); }
+    index& increment( const index& sizes );
+
+    class iterator;
+};
+
 template < typename V, unsigned int D >
 class slice
 {
@@ -310,4 +326,43 @@ inline bool grid< V, D, P, Traits, S >::has( const P& point ) const // quick and
     return true;
 }
 
+template < unsigned int D > inline bool index< D >::operator<( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
+{
+    for( unsigned int i = 0; i < D; ++i )
+    {
+        if( ( *this )[i] < rhs[i] ) { return true; }
+    }
+    return false;
+}
+
+template < unsigned int D > inline bool index< D >::operator==( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
+{
+    return std::memcmp( reinterpret_cast< const char* >( this ), reinterpret_cast< const char* >( &rhs ), sizeof( std::size_t ) * D ) == 0;
+}
+
+template < unsigned int D > inline index< D >& index< D >::increment( const index< D >& sizes ) // todo: unravel in compile time (compiler probably will do it anyway)
+{
+    for( unsigned int i{0}, j{D - 1}; i < D; ++i, --j )
+    {
+        if( ++( *this )[j] < sizes[j] ) { return *this; }
+        ( *this )[j] = 0;
+    }
+    return *this;
+}
+
+template < unsigned int D >
+class index< D >::iterator
+{
+    public:
+        iterator( const index< D >& shape ): _shape( shape ) {}
+        iterator& operator++() { _valid = _index.increment( _shape ) != index< D >{}; return *this; }
+        operator bool() const { return _valid; }
+        const index< D >& operator*() const { return _index; }
+
+    private:
+        index< D > _index;
+        index< D > _shape;
+        bool _valid{true};
+};
+
 } } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index e33ddd596..3e2879c72 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -45,7 +45,7 @@ TEST( multidimensional_array, iteration )
 {
     {
         typedef std::array< std::size_t, 3 > array_t;
-        comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
+        cmd::array< int, 3 > a( {2, 3, 4}, 0 );
         { array_t s{2, 3, 4}; EXPECT_EQ( a.shape(), s ); EXPECT_EQ( a.data().size(), 2 * 3 * 4 ); }
         unsigned int i = 0;
         for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
@@ -83,10 +83,10 @@ TEST( multidimensional_array, iteration )
 TEST( multidimensional_array, array )
 {
     {
-        comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
+        cmd::array< int, 3 > a( {2, 3, 4}, 0 );
         unsigned int i = 0;
         for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
-        typedef comma::containers::multidimensional::array< int, 3 >::index_type index_t;
+        typedef cmd::array< int, 3 >::index_type index_t;
         { index_t i{0, 0, 0}; EXPECT_EQ( a[i], 0 ); }
         { index_t i{0, 1, 0}; EXPECT_EQ( a[i], 4 ); }
         { index_t i{1, 2, 3}; EXPECT_EQ( a[i], 23 ); }
@@ -100,11 +100,11 @@ TEST( multidimensional_array, slice )
 {
     {
         {
-            comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
+            cmd::array< int, 3 > a( {2, 3, 4}, 0 );
             unsigned int i = 0;
             for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
-            typedef comma::containers::multidimensional::array< int, 2 >::index_type index_t;
-            comma::containers::multidimensional::slice< int, 2 > s = a.at( 0 );
+            typedef cmd::array< int, 2 >::index_type index_t;
+            cmd::slice< int, 2 > s = a.at( 0 );
             { index_t i{0, 0}; EXPECT_EQ( s[i], 0 ); }
             { index_t i{0, 1}; EXPECT_EQ( s[i], 1 ); }
             { index_t i{0, 2}; EXPECT_EQ( s[i], 2 ); }
@@ -119,7 +119,7 @@ TEST( multidimensional_array, slice )
             { index_t i{2, 3}; EXPECT_EQ( s[i], 11 ); }
             {
                 auto t = s.at( 0 );
-                typedef comma::containers::multidimensional::array< int, 1 >::index_type index_t;
+                typedef cmd::array< int, 1 >::index_type index_t;
                 { index_t i{0}; EXPECT_EQ( t[i], 0 ); }
                 { index_t i{1}; EXPECT_EQ( t[i], 1 ); }
                 { index_t i{2}; EXPECT_EQ( t[i], 2 ); }
@@ -146,12 +146,12 @@ TEST( multidimensional_array, slice )
             { s[{1, 3}] = 111; std::array< std::size_t, 3 > i{1, 1, 3}; EXPECT_EQ( a[i], 111 ); }
         }
         {
-            comma::containers::multidimensional::array< int, 3 > a( {2, 3, 4}, 0 );
+            cmd::array< int, 3 > a( {2, 3, 4}, 0 );
             unsigned int i = 0;
             for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
-            typedef comma::containers::multidimensional::array< int, 1 >::index_type index_t;
+            typedef cmd::array< int, 1 >::index_type index_t;
             {
-                comma::containers::multidimensional::slice< int, 1 > s = a.at< 2 >( {0, 0} ); // todo! super-ugly! improve templating!
+                cmd::slice< int, 1 > s = a.at< 2 >( {0, 0} ); // todo! super-ugly! improve templating!
                 { index_t i{0}; EXPECT_EQ( s[i], 0 ); } // todo: improve usage on 1-dimensional slices
                 { index_t i{1}; EXPECT_EQ( s[i], 1 ); }
                 { index_t i{2}; EXPECT_EQ( s[i], 2 ); }
@@ -189,7 +189,7 @@ TEST( multidimensional_array, slice )
 TEST( multidimensional_array, grid_index )
 {
     {
-        comma::containers::multidimensional::grid< double, 2 > g( {0, 0}, {1, 1}, {2, 3}, 0 );
+        cmd::grid< double, 2 > g( {0, 0}, {1, 1}, {2, 3}, 0 );
         typedef std::array< std::size_t, 2 > index_t;
         int i = 0;
         for( auto it = g.begin(); it != g.end(); ++it ) { *it = i++; }
@@ -205,7 +205,7 @@ TEST( multidimensional_array, grid_index )
 TEST( multidimensional_array, grid_interpolate )
 {
     {
-        comma::containers::multidimensional::grid< double, 2 > g( {0, 0}, {1, 1}, {2, 2}, 0 );
+        cmd::grid< double, 2 > g( {0, 0}, {1, 1}, {2, 2}, 0 );
         g[{0, 0}] = 0; g[{0, 1}] = 1; g[{1, 0}] = 0; g[{1, 1}] = 1;
         EXPECT_EQ( g.interpolated( {0, 0} ), 0 );
         EXPECT_EQ( g.interpolated( {0, 0.5} ), 0.5 );
@@ -216,6 +216,79 @@ TEST( multidimensional_array, grid_interpolate )
     }
 }
 
+TEST( multidimensional_array, index )
+{
+    {
+        cmd::index< 4 > i;
+        EXPECT_EQ( i[0], 0 );
+        EXPECT_EQ( i[1], 0 );
+        EXPECT_EQ( i[2], 0 );
+        EXPECT_EQ( i[3], 0 );
+    }
+    {
+        cmd::index< 4 > i{};
+        EXPECT_EQ( i[0], 0 );
+        EXPECT_EQ( i[1], 0 );
+        EXPECT_EQ( i[2], 0 );
+        EXPECT_EQ( i[3], 0 );
+    }
+    {
+        cmd::index< 4 > i{0u, 1u, 2u, 3u};
+        EXPECT_EQ( i[0], 0 );
+        EXPECT_EQ( i[1], 1 );
+        EXPECT_EQ( i[2], 2 );
+        EXPECT_EQ( i[3], 3 );
+    }
+    {
+        cmd::index< 1 > i;
+        cmd::index< 1 > j{5u};
+        EXPECT_TRUE( i < j );
+        EXPECT_TRUE( i != j );
+        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{1u} );
+        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{2u} );
+    }
+    {
+        cmd::index< 2 > i;
+        cmd::index< 2 > j{3u, 2u};
+        EXPECT_EQ( i               , ( cmd::index< 2 >{0u, 0u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0u, 1u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1u, 0u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1u, 1u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2u, 0u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2u, 1u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0u, 0u} ) );
+        EXPECT_TRUE( i == cmd::index< 2 >{} );
+    }
+    {
+        cmd::index< 2 >::iterator i{{3u, 2u}};
+        EXPECT_TRUE( bool( i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 0u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 1u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{1u, 0u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{1u, 1u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{2u, 0u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{2u, 1u} ) );
+        EXPECT_FALSE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 0u} ) );
+    }
+    {
+        unsigned int count{0};
+        for( cmd::index< 2 >::iterator i{{3u, 2u}}; i; ++i, ++count );
+        EXPECT_EQ( count, 6 );
+    }
+}
+
 // TEST( vector_of_vectors, performance )
 // {
 //     //std::pair< unsigned int, unsigned int > size{ 10000000, 4 };
@@ -266,4 +339,5 @@ TEST( multidimensional_array, grid_interpolate )
 //         //std::cerr << "==> memcpy:\tspeedup: " << ( e0 / e1 ) << "\tvector of vectors: elapsed: " << e0 << "\tvector: elapsed: " << e1 << std::endl;
 //         std::cerr << "==> memcpy vs std::copy:\tspeedup: " << ( e0 / e1 ) << std::endl;
 //     }
+//     // todo! multidimensional::array performance
 // }

From 26efa9e4fcc84cbe56f8da65b02979d8e8bd2318 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 25 Jul 2024 17:47:49 +1000
Subject: [PATCH 0842/1056] containers::multidimensional::index: added
 standalone index.h; tests moved to multidimensional_index_test.cpp

---
 containers/multidimensional/index.h           | 70 ++++++++++++++++
 .../test/multidimensional_array_test.cpp      | 73 -----------------
 .../test/multidimensional_index_test.cpp      | 80 +++++++++++++++++++
 3 files changed, 150 insertions(+), 73 deletions(-)
 create mode 100644 containers/multidimensional/index.h
 create mode 100644 containers/test/multidimensional_index_test.cpp

diff --git a/containers/multidimensional/index.h b/containers/multidimensional/index.h
new file mode 100644
index 000000000..9dfd2e820
--- /dev/null
+++ b/containers/multidimensional/index.h
@@ -0,0 +1,70 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <array>
+#include <cstring>
+#include "../../base/types.h"
+
+namespace comma { namespace containers { namespace multidimensional {
+
+template < unsigned int D >
+struct index: public std::array< std::size_t, D >
+{
+    typedef std::array< std::size_t, D > base_t;
+
+    template < typename... Args > index( Args... args ): base_t( { args... } ) {}
+
+    bool operator<( const index& rhs ) const;
+
+    bool operator==( const index& rhs ) const;
+
+    bool operator!=( const index& rhs ) const { return !operator==( rhs ); }
+
+    index& increment( const index& sizes );
+
+    class iterator
+    {
+        public:
+            iterator( const index< D >& shape ): _shape( shape ) {}
+
+            iterator& operator++() { _valid = _index.increment( _shape ) != index< D >{}; return *this; }
+
+            operator bool() const { return _valid; }
+            
+            const index< D >& operator*() const { return _index; }
+
+        private:
+            index< D > _index;
+            index< D > _shape;
+            bool _valid{true};
+    };
+};
+
+template < unsigned int D > inline bool index< D >::operator<( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
+{
+    for( unsigned int i = 0; i < D; ++i )
+    {
+        if( ( *this )[i] < rhs[i] ) { return true; }
+    }
+    return false;
+}
+
+template < unsigned int D > inline bool index< D >::operator==( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
+{
+    return std::memcmp( reinterpret_cast< const char* >( this ), reinterpret_cast< const char* >( &rhs ), sizeof( std::size_t ) * D ) == 0;
+}
+
+template < unsigned int D > inline index< D >& index< D >::increment( const index< D >& sizes ) // todo: unravel in compile time (compiler probably will do it anyway)
+{
+    for( unsigned int i{0}, j{D - 1}; i < D; ++i, --j )
+    {
+        if( ++( *this )[j] < sizes[j] ) { return *this; }
+        ( *this )[j] = 0;
+    }
+    return *this;
+}
+
+} } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 3e2879c72..4641933a6 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -216,79 +216,6 @@ TEST( multidimensional_array, grid_interpolate )
     }
 }
 
-TEST( multidimensional_array, index )
-{
-    {
-        cmd::index< 4 > i;
-        EXPECT_EQ( i[0], 0 );
-        EXPECT_EQ( i[1], 0 );
-        EXPECT_EQ( i[2], 0 );
-        EXPECT_EQ( i[3], 0 );
-    }
-    {
-        cmd::index< 4 > i{};
-        EXPECT_EQ( i[0], 0 );
-        EXPECT_EQ( i[1], 0 );
-        EXPECT_EQ( i[2], 0 );
-        EXPECT_EQ( i[3], 0 );
-    }
-    {
-        cmd::index< 4 > i{0u, 1u, 2u, 3u};
-        EXPECT_EQ( i[0], 0 );
-        EXPECT_EQ( i[1], 1 );
-        EXPECT_EQ( i[2], 2 );
-        EXPECT_EQ( i[3], 3 );
-    }
-    {
-        cmd::index< 1 > i;
-        cmd::index< 1 > j{5u};
-        EXPECT_TRUE( i < j );
-        EXPECT_TRUE( i != j );
-        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{1u} );
-        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{2u} );
-    }
-    {
-        cmd::index< 2 > i;
-        cmd::index< 2 > j{3u, 2u};
-        EXPECT_EQ( i               , ( cmd::index< 2 >{0u, 0u} ) );
-        EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0u, 1u} ) );
-        EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1u, 0u} ) );
-        EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1u, 1u} ) );
-        EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2u, 0u} ) );
-        EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2u, 1u} ) );
-        EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0u, 0u} ) );
-        EXPECT_TRUE( i == cmd::index< 2 >{} );
-    }
-    {
-        cmd::index< 2 >::iterator i{{3u, 2u}};
-        EXPECT_TRUE( bool( i ) );
-        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 0u} ) );
-        EXPECT_TRUE( bool( ++i ) );
-        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 1u} ) );
-        EXPECT_TRUE( bool( ++i ) );
-        EXPECT_EQ( *i, ( cmd::index< 2 >{1u, 0u} ) );
-        EXPECT_TRUE( bool( ++i ) );
-        EXPECT_EQ( *i, ( cmd::index< 2 >{1u, 1u} ) );
-        EXPECT_TRUE( bool( ++i ) );
-        EXPECT_EQ( *i, ( cmd::index< 2 >{2u, 0u} ) );
-        EXPECT_TRUE( bool( ++i ) );
-        EXPECT_EQ( *i, ( cmd::index< 2 >{2u, 1u} ) );
-        EXPECT_FALSE( bool( ++i ) );
-        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 0u} ) );
-    }
-    {
-        unsigned int count{0};
-        for( cmd::index< 2 >::iterator i{{3u, 2u}}; i; ++i, ++count );
-        EXPECT_EQ( count, 6 );
-    }
-}
-
 // TEST( vector_of_vectors, performance )
 // {
 //     //std::pair< unsigned int, unsigned int > size{ 10000000, 4 };
diff --git a/containers/test/multidimensional_index_test.cpp b/containers/test/multidimensional_index_test.cpp
new file mode 100644
index 000000000..7178a41d2
--- /dev/null
+++ b/containers/test/multidimensional_index_test.cpp
@@ -0,0 +1,80 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include <gtest/gtest.h>
+//#include <boost/date_time/posix_time/posix_time.hpp>
+#include "../multidimensional/index.h"
+
+namespace cmd = comma::containers::multidimensional; 
+
+TEST( multidimensional_array, index )
+{
+    {
+        cmd::index< 4 > i;
+        EXPECT_EQ( i[0], 0 );
+        EXPECT_EQ( i[1], 0 );
+        EXPECT_EQ( i[2], 0 );
+        EXPECT_EQ( i[3], 0 );
+    }
+    {
+        cmd::index< 4 > i{};
+        EXPECT_EQ( i[0], 0 );
+        EXPECT_EQ( i[1], 0 );
+        EXPECT_EQ( i[2], 0 );
+        EXPECT_EQ( i[3], 0 );
+    }
+    {
+        cmd::index< 4 > i{0u, 1u, 2u, 3u};
+        EXPECT_EQ( i[0], 0 );
+        EXPECT_EQ( i[1], 1 );
+        EXPECT_EQ( i[2], 2 );
+        EXPECT_EQ( i[3], 3 );
+    }
+    {
+        cmd::index< 1 > i;
+        cmd::index< 1 > j{5u};
+        EXPECT_TRUE( i < j );
+        EXPECT_TRUE( i != j );
+        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{1u} );
+        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{2u} );
+    }
+    {
+        cmd::index< 2 > i;
+        cmd::index< 2 > j{3u, 2u};
+        EXPECT_EQ( i               , ( cmd::index< 2 >{0u, 0u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0u, 1u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1u, 0u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1u, 1u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2u, 0u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2u, 1u} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0u, 0u} ) );
+        EXPECT_TRUE( i == cmd::index< 2 >{} );
+    }
+    {
+        cmd::index< 2 >::iterator i{{3u, 2u}};
+        EXPECT_TRUE( bool( i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 0u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 1u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{1u, 0u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{1u, 1u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{2u, 0u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{2u, 1u} ) );
+        EXPECT_FALSE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 0u} ) );
+    }
+    {
+        unsigned int count{0};
+        for( cmd::index< 2 >::iterator i{{3u, 2u}}; i; ++i, ++count );
+        EXPECT_EQ( count, 6 );
+    }
+}

From 15fee76ce90a7e21ae257994be813f82cefa2a7f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 25 Jul 2024 20:13:18 +1000
Subject: [PATCH 0843/1056] name-value-convert: quoting inf and nan implemented
 and tested

---
 name_value/impl/json_writer.h               | 4 +++-
 name_value/ptree.cpp                        | 2 +-
 name_value/test/name-value-convert/expected | 2 ++
 name_value/test/name-value-convert/input    | 2 ++
 4 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/name_value/impl/json_writer.h b/name_value/impl/json_writer.h
index 857acc87d..4afcfc3ea 100644
--- a/name_value/impl/json_writer.h
+++ b/name_value/impl/json_writer.h
@@ -42,8 +42,10 @@ template< typename C > inline void json_remove_quotes( std::basic_string< C >& j
         bool quoted = true;
         if( ':' != *next_token )
         {
-            auto const value = std::string( value_begin + 1, value_end );
+            auto value = std::string( value_begin + 1, value_end );
+            for( char& c: value ) { c = std::tolower( c ); } // quick and dirty, watch performance
             if( true_str == value || false_str == value ) { quoted = false; }
+            else if( value == "nan" || value == "inf" ) { quoted = true; } // lexical cast thinks it's a number
             else if( !boost::regex_match( value, number_like_string ) ) { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} } // todo? try to avoid lexical_cast+exception to improve performace?
         }
         if( !quoted ) { value_begin++; }
diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index 2c9d2c4dd..cc8b56e02 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -110,7 +110,7 @@ boost::optional< std::string > property_tree::get( const boost::property_tree::p
 
 namespace comma { namespace impl {
 
-static void ptree_output_value_( std::ostream& os, const std::string& value, bool is_begin, const xpath& path, char equal_sign, char delimiter, const std::string& root, bool const unquote_numbers )
+static void ptree_output_value_( std::ostream& os, const std::string& value, bool is_begin, const xpath& path, char equal_sign, char delimiter, const std::string& root, bool unquote_numbers )
 {
     static boost::regex number_like_string( "^0[0-9][0-9]*$" );
     if( !is_begin ) { os << delimiter; }
diff --git a/name_value/test/name-value-convert/expected b/name_value/test/name-value-convert/expected
index 14ceb85d1..7c0fd180a 100644
--- a/name_value/test/name-value-convert/expected
+++ b/name_value/test/name-value-convert/expected
@@ -7,6 +7,8 @@ quoting[6]/output='a=1'
 quoting[4]/output='{"a":"1"}'
 quoting[5]/output='a="1"'
 quoting[6]/output='a=1'
+quoting[7]/output='{"a":"inf","b":"iNf","c":"nan","d":"NaN"}'
+quoting[8]/output='{"a":"inf","b":"iNf","c":"nan","d":"NaN"}'
 
 paths[0]/output='a/b="1";a/c="2";x/y="3";x/z="4"'
 paths[1]/output='b="1";c="2"'
diff --git a/name_value/test/name-value-convert/input b/name_value/test/name-value-convert/input
index 90557b5d0..84597767d 100644
--- a/name_value/test/name-value-convert/input
+++ b/name_value/test/name-value-convert/input
@@ -7,6 +7,8 @@ quoting[6]="echo a=1 | name-value-convert --to json --minify | name-value-conver
 quoting[4]="echo a=1 | name-value-convert --to json --quote-numbers --minify"
 quoting[5]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert"
 quoting[6]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert --unquote-numbers"
+quoting[7]="( echo a=inf; echo b=iNf; echo c=nan; echo d=NaN ) | name-value-convert --to json --minify"
+quoting[8]="( echo a=inf; echo b=iNf; echo c=nan; echo d=NaN ) | name-value-convert --to json --minify --unquote-numbers"
 
 paths[0]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --delimiter=';'"
 paths[1]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path a --delimiter=';'"

From c8147899218732c07e168cedd8a3db0e47305261 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 31 Jul 2024 14:19:55 +1000
Subject: [PATCH 0844/1056] containers/multidimensional/array: made compatible
 with multidimensional::index; todo: make array::index_type
 multidimensional::index

---
 containers/multidimensional/array.h           | 57 +------------------
 containers/multidimensional/array_traits.h    |  1 +
 containers/multidimensional/index.h           | 52 ++++++++++++++---
 .../test/multidimensional_array_test.cpp      | 29 +++++++---
 .../test/multidimensional_index_test.cpp      | 26 ++++-----
 5 files changed, 83 insertions(+), 82 deletions(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index 43811c66a..00f161a58 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -8,29 +8,15 @@
 #include <cstring>
 #include "../../base/types.h"
 #include "array_traits.h"
+#include "index.h"
 
 namespace comma { namespace containers { namespace multidimensional {
 
-template < unsigned int D >
-struct index: public std::array< std::size_t, D >
-{
-    typedef std::array< std::size_t, D > base_t;
-
-    //index() { std::memset( reinterpret_cast< char* >( this ), 0, sizeof( std::size_t ) * D ); }
-    template < typename... Args > index( Args... args ): base_t( { args... } ) {}
-    bool operator<( const index& rhs ) const;
-    bool operator==( const index& rhs ) const;
-    bool operator!=( const index& rhs ) const { return !operator==( rhs ); }
-    index& increment( const index& sizes );
-
-    class iterator;
-};
-
 template < typename V, unsigned int D >
 class slice
 {
     public:
-        typedef std::array< std::size_t, D > index_type;
+        typedef std::array< std::size_t, D > index_type; // todo: typedef multidimensional::index< D > index_type;
 
         typedef V value_type;
 
@@ -326,43 +312,4 @@ inline bool grid< V, D, P, Traits, S >::has( const P& point ) const // quick and
     return true;
 }
 
-template < unsigned int D > inline bool index< D >::operator<( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
-{
-    for( unsigned int i = 0; i < D; ++i )
-    {
-        if( ( *this )[i] < rhs[i] ) { return true; }
-    }
-    return false;
-}
-
-template < unsigned int D > inline bool index< D >::operator==( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
-{
-    return std::memcmp( reinterpret_cast< const char* >( this ), reinterpret_cast< const char* >( &rhs ), sizeof( std::size_t ) * D ) == 0;
-}
-
-template < unsigned int D > inline index< D >& index< D >::increment( const index< D >& sizes ) // todo: unravel in compile time (compiler probably will do it anyway)
-{
-    for( unsigned int i{0}, j{D - 1}; i < D; ++i, --j )
-    {
-        if( ++( *this )[j] < sizes[j] ) { return *this; }
-        ( *this )[j] = 0;
-    }
-    return *this;
-}
-
-template < unsigned int D >
-class index< D >::iterator
-{
-    public:
-        iterator( const index< D >& shape ): _shape( shape ) {}
-        iterator& operator++() { _valid = _index.increment( _shape ) != index< D >{}; return *this; }
-        operator bool() const { return _valid; }
-        const index< D >& operator*() const { return _index; }
-
-    private:
-        index< D > _index;
-        index< D > _shape;
-        bool _valid{true};
-};
-
 } } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
index 4122d7358..8998461d8 100644
--- a/containers/multidimensional/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -8,6 +8,7 @@
 #include <cmath>
 #include <type_traits>
 #include "../../math/compare.h"
+#include "index.h"
 
 template< typename T, std::size_t D, typename S >
 inline std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] *= rhs; } return lhs; } // quick and dirty; let compiler optimize
diff --git a/containers/multidimensional/index.h b/containers/multidimensional/index.h
index 9dfd2e820..6df4a3430 100644
--- a/containers/multidimensional/index.h
+++ b/containers/multidimensional/index.h
@@ -10,12 +10,18 @@
 
 namespace comma { namespace containers { namespace multidimensional {
 
-template < unsigned int D >
-struct index: public std::array< std::size_t, D >
+template < unsigned int D, typename T = std::size_t >
+struct index: public std::array< T, D >
 {
-    typedef std::array< std::size_t, D > base_t;
+    typedef T value_t;
 
-    template < typename... Args > index( Args... args ): base_t( { args... } ) {}
+    typedef std::array< T, D > base_t;
+
+    index(): base_t{} {}
+
+    index( const index& rhs ): base_t( static_cast< const base_t& >( rhs ) ) {}
+
+    template < typename... Args > index( T t, Args... args ); // quick and dirty for now to avoid compile warning // template < typename... Args > index( Args... args ): base_t( { args... } ) {}
 
     bool operator<( const index& rhs ) const;
 
@@ -23,6 +29,14 @@ struct index: public std::array< std::size_t, D >
 
     bool operator!=( const index& rhs ) const { return !operator==( rhs ); }
 
+    index& operator=( const index& rhs ) = default;
+
+    index& operator=( const base_t& rhs ) { static_cast< base_t& >( *this ) = rhs; }
+
+    operator base_t() { return static_cast< base_t& >( *this ); }
+
+    operator base_t() const { return static_cast< const base_t& >( *this ); }
+
     index& increment( const index& sizes );
 
     class iterator
@@ -43,7 +57,31 @@ struct index: public std::array< std::size_t, D >
     };
 };
 
-template < unsigned int D > inline bool index< D >::operator<( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
+namespace impl {
+
+template < typename T, unsigned int D, unsigned int I > struct type_cast
+{
+    template < typename... Args > static void assign( index< D, T >& i, T v, Args... args )
+    {
+        i[ D - I ] = v;
+        type_cast< T, D, I - 1 >::assign( i, args... );
+    }
+};
+
+template < typename T, unsigned int D > struct type_cast< T, D, 1 >
+{
+    static void assign( index< D, T >& i, T v ) { i[ D - 1 ] = v; }
+};
+
+} // namespace impl {
+
+template < unsigned int D, typename T > 
+template < typename... Args > inline index< D, T >::index( T t, Args... args )
+{
+    impl::type_cast< T, D, D >::assign( *this, t, args... );
+}
+
+template < unsigned int D, typename T > inline bool index< D, T >::operator<( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
 {
     for( unsigned int i = 0; i < D; ++i )
     {
@@ -52,12 +90,12 @@ template < unsigned int D > inline bool index< D >::operator<( const index& rhs
     return false;
 }
 
-template < unsigned int D > inline bool index< D >::operator==( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
+template < unsigned int D, typename T > inline bool index< D, T >::operator==( const index& rhs ) const // todo: unravel in compile time (compiler probably will do it anyway)
 {
     return std::memcmp( reinterpret_cast< const char* >( this ), reinterpret_cast< const char* >( &rhs ), sizeof( std::size_t ) * D ) == 0;
 }
 
-template < unsigned int D > inline index< D >& index< D >::increment( const index< D >& sizes ) // todo: unravel in compile time (compiler probably will do it anyway)
+template < unsigned int D, typename T > inline index< D, T >& index< D, T >::increment( const index< D, T >& sizes ) // todo: unravel in compile time (compiler probably will do it anyway)
 {
     for( unsigned int i{0}, j{D - 1}; i < D; ++i, --j )
     {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index 4641933a6..df423855e 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -41,6 +41,22 @@ TEST( multidimensional_array, impl_index_inverted_value )
     // todo: way more tests
 }
 
+TEST( multidimensional_array, index )
+{
+    {
+        cmd::array< int, 3 > a( {2, 3, 4}, 0 );
+        unsigned int i = 0;
+        for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
+        typedef cmd::array< int, 3 >::index_type array_index_t;
+        typedef cmd::index< 3 > index_t;
+        EXPECT_EQ( ( array_index_t{1, 2, 3} ), ( index_t{1, 2, 3} ) );
+        EXPECT_EQ( ( index_t{1, 2, 3} ), ( array_index_t{1, 2, 3} ) );
+        EXPECT_EQ( ( a[{1, 2, 3}]), 23 );
+        EXPECT_EQ( ( a[ index_t( {1, 2, 3} )] ), 23 );
+        EXPECT_EQ( ( a[ index_t( {1, 2, 3} )] ), 23 );
+    }
+}
+
 TEST( multidimensional_array, iteration )
 {
     {
@@ -86,13 +102,12 @@ TEST( multidimensional_array, array )
         cmd::array< int, 3 > a( {2, 3, 4}, 0 );
         unsigned int i = 0;
         for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
-        typedef cmd::array< int, 3 >::index_type index_t;
-        { index_t i{0, 0, 0}; EXPECT_EQ( a[i], 0 ); }
-        { index_t i{0, 1, 0}; EXPECT_EQ( a[i], 4 ); }
-        { index_t i{1, 2, 3}; EXPECT_EQ( a[i], 23 ); }
-        { index_t i{0, 0, 0}; a[{0, 0, 0}] = 111; EXPECT_EQ( a[i], 111 ); }
-        { index_t i{1, 1, 2}; a[{1, 1, 2}] = 222; EXPECT_EQ( a[i], 222 ); }
-        { index_t i{1, 2, 3}; a[{1, 2, 3}] = 333; EXPECT_EQ( a[i], 333 ); }
+        EXPECT_EQ( ( a[{0, 0, 0}] ), 0 );
+        EXPECT_EQ( ( a[{0, 1, 0}] ), 4 );
+        EXPECT_EQ( ( a[{1, 2, 3}] ), 23 );
+        a[{0, 0, 0}] = 111; EXPECT_EQ( ( a[{0, 0, 0}] ), 111 );
+        a[{1, 1, 2}] = 222; EXPECT_EQ( ( a[{1, 1, 2}] ), 222 );
+        a[{1, 2, 3}] = 333; EXPECT_EQ( ( a[{1, 2, 3}] ), 333 );
     }
 }
 
diff --git a/containers/test/multidimensional_index_test.cpp b/containers/test/multidimensional_index_test.cpp
index 7178a41d2..186ac816b 100644
--- a/containers/test/multidimensional_index_test.cpp
+++ b/containers/test/multidimensional_index_test.cpp
@@ -6,7 +6,7 @@
 
 namespace cmd = comma::containers::multidimensional; 
 
-TEST( multidimensional_array, index )
+TEST( multidimentional_index, basics )
 {
     {
         cmd::index< 4 > i;
@@ -23,7 +23,7 @@ TEST( multidimensional_array, index )
         EXPECT_EQ( i[3], 0 );
     }
     {
-        cmd::index< 4 > i{0u, 1u, 2u, 3u};
+        cmd::index< 4 > i{0, 1, 2, 3};
         EXPECT_EQ( i[0], 0 );
         EXPECT_EQ( i[1], 1 );
         EXPECT_EQ( i[2], 2 );
@@ -31,28 +31,28 @@ TEST( multidimensional_array, index )
     }
     {
         cmd::index< 1 > i;
-        cmd::index< 1 > j{5u};
+        cmd::index< 1 > j{5};
         EXPECT_TRUE( i < j );
         EXPECT_TRUE( i != j );
-        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{1u} );
-        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{2u} );
+        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{1} );
+        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{2} );
     }
     {
         cmd::index< 2 > i;
-        cmd::index< 2 > j{3u, 2u};
-        EXPECT_EQ( i               , ( cmd::index< 2 >{0u, 0u} ) );
+        cmd::index< 2 > j{3, 2};
+        EXPECT_EQ( i               , ( cmd::index< 2 >{0, 0} ) );
         EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0u, 1u} ) );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0, 1} ) );
         EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1u, 0u} ) );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1, 0} ) );
         EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1u, 1u} ) );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1, 1} ) );
         EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2u, 0u} ) );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2, 0} ) );
         EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2u, 1u} ) );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2, 1} ) );
         EXPECT_TRUE( i < j );
-        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0u, 0u} ) );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0, 0} ) );
         EXPECT_TRUE( i == cmd::index< 2 >{} );
     }
     {

From 82087f9553707bac1e42703acd0f2d35bad3bf8d Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 31 Jul 2024 16:29:59 +1000
Subject: [PATCH 0845/1056] containers::multidimensional::array::index_type:
 using multidimensional::index now

---
 containers/applications/math-lookup.cpp       |  4 +--
 containers/multidimensional/array.h           | 26 +++++++++----------
 containers/multidimensional/array_traits.h    | 12 ++++++---
 containers/multidimensional/traits.h          | 25 ++++++++++++++++++
 .../test/multidimensional_array_test.cpp      |  2 +-
 5 files changed, 49 insertions(+), 20 deletions(-)
 create mode 100644 containers/multidimensional/traits.h

diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
index d41783eeb..fd8886204 100644
--- a/containers/applications/math-lookup.cpp
+++ b/containers/applications/math-lookup.cpp
@@ -10,8 +10,8 @@
 #include "../../csv/stream.h"
 #include "../../csv/traits.h"
 #include "../../name_value/parser.h"
-#include "../../visiting/traits.h"
 #include "../multidimensional/array.h"
+#include "../multidimensional/traits.h"
 
 void usage( bool verbose )
 {
@@ -79,7 +79,7 @@ template < typename T, std::size_t D, std::size_t E >
 struct lut
 {
     typedef std::array< double, D > point_t;
-    typedef std::array< std::size_t, D > index_t;
+    typedef comma::containers::multidimensional::index< D > index_t; // typedef std::array< std::size_t, D > index_t;
     typedef std::array< T, E > value_t;
     typedef comma::containers::multidimensional::grid< value_t, D, point_t > grid_t;
     typedef _array< double, D > input_t;
diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index 00f161a58..0e3b895f0 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -16,7 +16,7 @@ template < typename V, unsigned int D >
 class slice
 {
     public:
-        typedef std::array< std::size_t, D > index_type; // todo: typedef multidimensional::index< D > index_type;
+        typedef multidimensional::index< D > index_type; // typedef std::array< std::size_t, D > index_type; // todo: typedef multidimensional::index< D > index_type;
 
         typedef V value_type;
 
@@ -31,14 +31,14 @@ class slice
         const V& operator[]( const index_type& i ) const { return _data[ _index( i ) ]; }
 
         template < unsigned int I >
-        slice< V, D - I > at( const std::array< std::size_t, I >& i );
+        slice< V, D - I > at( const multidimensional::index< I >& i );
 
         template < unsigned int I >
-        const slice< V, D - I > at( const std::array< std::size_t, I >& i ) const;
+        const slice< V, D - I > at( const multidimensional::index< I >& i ) const;
 
-        slice< V, D - 1 > at( std::size_t i ) { return at< 1 >( std::array< std::size_t, 1 >{i} ); }
+        slice< V, D - 1 > at( std::size_t i ) { return at< 1 >( multidimensional::index< 1 >{i} ); }
 
-        const slice< V, D - 1 > at( std::size_t i ) const { return at< 1 >( std::array< std::size_t, 1 >{i} ); }
+        const slice< V, D - 1 > at( std::size_t i ) const { return at< 1 >( multidimensional::index< 1 >{i} ); }
 
         V* data() { return _data; }
         
@@ -127,10 +127,10 @@ class array
         const V& operator[]( const index_type& i ) const { return _slice[i]; }
 
         template < unsigned int I >
-        multidimensional::slice< V, D - I > at( const std::array< std::size_t, I >& i ) { return _slice.template at< I >( i ); }
+        multidimensional::slice< V, D - I > at( const multidimensional::index< I >& i ) { return _slice.template at< I >( i ); } // todo!
 
         template < unsigned int I >
-        const multidimensional::slice< V, D - I > at( const std::array< std::size_t, I >& i ) const { return _slice.template at< I >( i ); }
+        const multidimensional::slice< V, D - I > at( const multidimensional::index< I >& i ) const { return _slice.template at< I >( i ); } // todo!
 
         multidimensional::slice< V, D - 1 > at( std::size_t i ) { return _slice.at( i ); }
 
@@ -201,15 +201,15 @@ namespace impl {
 template < unsigned int D, unsigned int I = D >
 struct index_traits
 {
-    typedef std::array< std::size_t, D > index_type;
+    typedef comma::containers::multidimensional::index< D > index_type; // typedef std::array< std::size_t, D > index_type;
     static unsigned int value( const index_type& i, const index_type& shape ) { return i[ I - 1 ] + index_traits< D, I - 1 >::value( i, shape ) * shape[ I - 1 ]; }
     static void value( std::size_t j, index_type& i, const index_type& shape ) { i[ I - 1 ] = j % shape[ I - 1 ]; index_traits< D, I - 1 >::value( j / shape[ I - 1 ], i, shape ); }
     static index_type value( std::size_t j, const index_type& shape ) { index_type i; value( j, i, shape ); return i; }
     static std::size_t product( const index_type& i ) { return i[ I - 1 ] * index_traits< D, I - 1 >::product( i ); }
     template < unsigned int J >
-    static std::pair< std::array< std::size_t, J >, std::array< std::size_t, D - J > > split( const index_type& i ) // todo: use metaprogramming, kinda same as product
+    static std::pair< comma::containers::multidimensional::index< J >, comma::containers::multidimensional::index< D - J > > split( const index_type& i ) // todo: use metaprogramming, kinda same as product
     {
-        std::pair< std::array< std::size_t, J >, std::array< std::size_t, D - J > > p;
+        std::pair< comma::containers::multidimensional::index< J >, comma::containers::multidimensional::index< D - J > > p;
         unsigned int k = 0;
         for( unsigned int n = 0; n < J; ++n, ++k ) { p.first[n] = i[k]; }
         for( unsigned int n = 0; n < D - J; ++n, ++k ) { p.second[n] = i[k]; }
@@ -220,7 +220,7 @@ struct index_traits
 template < unsigned int D >
 struct index_traits< D, 1 >
 {
-    typedef std::array< std::size_t, D > index_type;
+    typedef comma::containers::multidimensional::index< D > index_type; // typedef std::array< std::size_t, D > index_type;
     static unsigned int value( const index_type& i, const index_type& ) { return i[0]; }
     static void value( std::size_t j, index_type& i, const index_type& size ) { i[0] = j; }
     static std::size_t product( const index_type& i ) { return i[0]; }
@@ -242,7 +242,7 @@ inline typename slice< V, D >::index_type slice< V, D >::const_iterator::index()
 
 template < typename V, unsigned int D >
 template < unsigned int I >
-inline slice< V, D - I > slice< V, D >::at( const std::array< std::size_t, I >& i )
+inline slice< V, D - I > slice< V, D >::at( const multidimensional::index< I >& i )
 {
     auto s = impl::index_traits< D >::template split< I >( _shape );
     return slice< V, D - I >( s.second, _data + impl::index_traits< I >::value( i, s.first ) * impl::index_traits< D - I >::product( s.second ) );
@@ -250,7 +250,7 @@ inline slice< V, D - I > slice< V, D >::at( const std::array< std::size_t, I >&
 
 template < typename V, unsigned int D >
 template < unsigned int I >
-inline const slice< V, D - I > slice< V, D >::at( const std::array< std::size_t, I >& i ) const
+inline const slice< V, D - I > slice< V, D >::at( const multidimensional::index< I >& i ) const
 {
     auto s = impl::index_traits< D >::template split< I >( _shape );
     return slice< V, D - I >( s.second, _data + impl::index_traits< I >::value( i, s.first ) * impl::index_traits< D - I >::product( s.second ) );
diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
index 8998461d8..59d9eec0e 100644
--- a/containers/multidimensional/array_traits.h
+++ b/containers/multidimensional/array_traits.h
@@ -37,10 +37,14 @@ template < typename T > inline int index( T p, T origin, T resolution )
 template < int Base, unsigned int Pow > static constexpr int pow = Base * pow< Base, Pow - 1 >;
 template < int Base > static constexpr int pow< Base, 0 >{1};
 template < typename I, std::size_t Size > static constexpr std::array< I, Size > neighbours; // quick and dirty, for now leaving it to the enthusiasts to implement it using metaprogramming
-template < typename I > static constexpr std::array< I, 2 > neighbours< I, 1 > = {{ {{ 0 }}, {{ 1 }} }};
-template < typename I > static constexpr std::array< I, 4 > neighbours< I, 2 > = {{ {{ 0, 0 }}, {{ 0, 1 }}, {{ 1, 0 }}, {{ 1, 1 }} }};
-template < typename I > static constexpr std::array< I, 8 > neighbours< I, 3 > = {{ {{ 0, 0, 0 }}, {{ 0, 0, 1 }}, {{ 0, 1, 0 }}, {{ 0, 1, 1 }}, {{ 1, 0, 0 }}, {{ 1, 0, 1 }}, {{ 1, 1, 0 }}, {{ 1, 1, 1 }} }};
-template < typename I > static constexpr std::array< I, 16 > neighbours< I, 4 > = {{ {{ 0, 0, 0, 0 }}, {{ 0, 0, 0, 1 }}, {{ 0, 0, 1, 0 }}, {{ 0, 0, 1, 1 }}, {{ 0, 1, 0, 0 }}, {{ 0, 1, 0, 1 }}, {{ 0, 1, 1, 0 }}, {{ 0, 1, 1, 1 }}, {{ 1, 0, 0, 0 }}, {{ 1, 0, 0, 1 }}, {{ 1, 0, 1, 0 }}, {{ 1, 0, 1, 1 }}, {{ 1, 1, 0, 0 }}, {{ 1, 1, 0, 1 }}, {{ 1, 1, 1, 0 }}, {{ 1, 1, 1, 1 }} }};
+template < typename I > static constexpr std::array< I, 2 > neighbours< I, 1 > = {{ I{ 0 }, I{ 1 } }};
+template < typename I > static std::array< I, 4 > neighbours< I, 2 > = {{ I{ 0, 0 }, I{ 0, 1 }, I{ 1, 0 }, I{ 1, 1 } }};
+template < typename I > static std::array< I, 8 > neighbours< I, 3 > = {{ I{ 0, 0, 0 }, I{ 0, 0, 1 }, I{ 0, 1, 0 }, I{ 0, 1, 1 }, I{ 1, 0, 0 }, I{ 1, 0, 1 }, I{ 1, 1, 0 }, I{ 1, 1, 1 } }};
+template < typename I > static std::array< I, 16 > neighbours< I, 4 > = {{ I{ 0, 0, 0, 0 }, I{ 0, 0, 0, 1 }, I{ 0, 0, 1, 0 }, I{ 0, 0, 1, 1 }, I{ 0, 1, 0, 0 }, I{ 0, 1, 0, 1 }, I{ 0, 1, 1, 0 }, I{ 0, 1, 1, 1 }, I{ 1, 0, 0, 0 }, I{ 1, 0, 0, 1 }, I{ 1, 0, 1, 0 }, I{ 1, 0, 1, 1 }, I{ 1, 1, 0, 0 }, I{ 1, 1, 0, 1 }, I{ 1, 1, 1, 0 }, I{ 1, 1, 1, 1 } }};
+// template < typename I > static constexpr std::array< I, 2 > neighbours< I, 1 > = {{ {{ 0 }}, {{ 1 }} }};
+// template < typename I > static constexpr std::array< I, 4 > neighbours< I, 2 > = {{ {{ 0, 0 }}, {{ 0, 1 }}, {{ 1, 0 }}, {{ 1, 1 }} }};
+// template < typename I > static constexpr std::array< I, 8 > neighbours< I, 3 > = {{ {{ 0, 0, 0 }}, {{ 0, 0, 1 }}, {{ 0, 1, 0 }}, {{ 0, 1, 1 }}, {{ 1, 0, 0 }}, {{ 1, 0, 1 }}, {{ 1, 1, 0 }}, {{ 1, 1, 1 }} }};
+// template < typename I > static constexpr std::array< I, 16 > neighbours< I, 4 > = {{ {{ 0, 0, 0, 0 }}, {{ 0, 0, 0, 1 }}, {{ 0, 0, 1, 0 }}, {{ 0, 0, 1, 1 }}, {{ 0, 1, 0, 0 }}, {{ 0, 1, 0, 1 }}, {{ 0, 1, 1, 0 }}, {{ 0, 1, 1, 1 }}, {{ 1, 0, 0, 0 }}, {{ 1, 0, 0, 1 }}, {{ 1, 0, 1, 0 }}, {{ 1, 0, 1, 1 }}, {{ 1, 1, 0, 0 }}, {{ 1, 1, 0, 1 }}, {{ 1, 1, 1, 0 }}, {{ 1, 1, 1, 1 }} }};
 // todo: add more dimensions as required or write that little metaprogramming piece
 
 template < std::size_t Size > struct operations
diff --git a/containers/multidimensional/traits.h b/containers/multidimensional/traits.h
new file mode 100644
index 000000000..1e32fbff1
--- /dev/null
+++ b/containers/multidimensional/traits.h
@@ -0,0 +1,25 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+#pragma once
+
+#include "../../visiting/traits.h"
+#include "index.h"
+
+namespace comma { namespace visiting {
+
+template < unsigned int D, typename T > struct traits< comma::containers::multidimensional::index< D, T > >
+{
+    typedef comma::containers::multidimensional::index< D, T > value_t;
+
+    template < typename Key, class Visitor > static void visit( const Key& k, value_t& p, Visitor& v )
+    {
+        comma::visiting::traits< std::array< T, D > >::visit( k, static_cast< std::array< T, D >& >( p ), v );
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key& k, const value_t& p, Visitor& v )
+    {
+        comma::visiting::traits< std::array< T, D > >::visit( k, static_cast< const std::array< T, D >& >( p ), v );
+    }
+};
+
+} } // namespace comma { namespace visiting {
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
index df423855e..8a48b321e 100644
--- a/containers/test/multidimensional_array_test.cpp
+++ b/containers/test/multidimensional_array_test.cpp
@@ -158,7 +158,7 @@ TEST( multidimensional_array, slice )
             { index_t i{2, 1}; EXPECT_EQ( s[i], 21 ); }
             { index_t i{2, 2}; EXPECT_EQ( s[i], 22 ); }
             { index_t i{2, 3}; EXPECT_EQ( s[i], 23 ); }
-            { s[{1, 3}] = 111; std::array< std::size_t, 3 > i{1, 1, 3}; EXPECT_EQ( a[i], 111 ); }
+            s[{1, 3}] = 111; EXPECT_EQ( ( a[{1, 1, 3}] ), 111 );
         }
         {
             cmd::array< int, 3 > a( {2, 3, 4}, 0 );

From ab1bed60e9a1305c860e007cd5a8142606d747c1 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 2 Aug 2024 13:29:03 +1000
Subject: [PATCH 0846/1056] 
 containers::multidimensional::array::absolute_index() implemented

---
 containers/multidimensional/array.h | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
index 0e3b895f0..5d08c17d4 100644
--- a/containers/multidimensional/array.h
+++ b/containers/multidimensional/array.h
@@ -97,6 +97,8 @@ class slice
 
         const_iterator end() const { return const_iterator( _size, _data + _size, _shape ); }
 
+        std::size_t absolute_index( const index_type& i ) const { return _index( i ); }
+
     protected:
         index_type _shape;
         std::size_t _size;
@@ -122,9 +124,9 @@ class array
 
         array( const index_type& shape, const V& default_value = V() );
 
-        V& operator[]( const index_type& i ) { return _slice[i]; }
+        V& operator[]( const index_type& i ) { return _slice[i]; } // V& operator[]( const index_type& i ) { return _data[ absolute_index( i ) ]; } //{ return _slice[i]; }
 
-        const V& operator[]( const index_type& i ) const { return _slice[i]; }
+        const V& operator[]( const index_type& i ) const { return _slice[i]; } // const V& operator[]( const index_type& i ) const { return _data[ absolute_index( i ) ]; } //{ return _slice[i]; }
 
         template < unsigned int I >
         multidimensional::slice< V, D - I > at( const multidimensional::index< I >& i ) { return _slice.template at< I >( i ); } // todo!
@@ -142,6 +144,8 @@ class array
 
         const index_type& shape() const { return _slice.shape(); }
 
+        std::size_t absolute_index( const index_type& i ) const { return _slice.absolute_index( i ); }
+
         typedef typename slice_type::iterator iterator;
 
         typedef typename slice_type::const_iterator const_iterator;

From 4ca3cb78b41d355f831f9a2137658d72f21d1832 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 2 Aug 2024 14:00:51 +1000
Subject: [PATCH 0847/1056] csv-shape: sliding-window: ascii implemented; in
 progress...

---
 csv/applications/csv-shape.cpp | 69 +++++++++++++++++++++++++++++-----
 1 file changed, 59 insertions(+), 10 deletions(-)

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index 4f679ee9b..a9fb53be7 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -1,11 +1,11 @@
 // Copyright (c) 2011 The University of Sydney
-// Copyright (c) 2023 Vsevolod Vlaskine
+// Copyright (c) 2023-2024 Vsevolod Vlaskine
 
 /// @author dewey nguyen
 
+#include <deque>
 #include <iostream>
 #include <vector>
-#include <deque>
 #include "../../base/types.h"
 #include "../../application/command_line_options.h"
 #include "../options.h"
@@ -14,18 +14,21 @@
 
 using namespace comma;
 
+namespace comma { namespace csv { namespace applications { namespace shape { namespace operations { namespace sliding_window { static std::string usage( bool verbose ); } } } } } }
+
 static void usage( bool verbose=false )
 {
     std::cerr << "Perform reshaping operations on input data" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
-    std::cerr << "    concatenate: group input records for concatenation into output records." << std::endl;
-    std::cerr << "                 the user can choose non-overlapping or overlapping grouping (sliding window) mode." << std::endl;
-    std::cerr << "    loop:        same as concatenate, but with an additional last record:" << std::endl;
-    std::cerr << "                 last input record concatenated with the first record (hence, 'loop')" << std::endl;
-    std::cerr << "                 this mode always uses the sliding window for overlapping groups" << std::endl;
-    std::cerr << "    repeat:      repeat input given number of times, e.g. csv-shape repeat --size 5" << std::endl;
-    std::cerr << "    split:       csv-only: split line at n-th field, e.g. csv-shape split --size 4" << std::endl;
+    std::cerr << "    concatenate:    group input records for concatenation into output records." << std::endl;
+    std::cerr << "                    the user can choose non-overlapping or overlapping grouping (sliding window) mode." << std::endl;
+    std::cerr << "    loop:           same as concatenate, but with an additional last record:" << std::endl;
+    std::cerr << "                    last input record concatenated with the first record (hence, 'loop')" << std::endl;
+    std::cerr << "                    this mode always uses the sliding window for overlapping groups" << std::endl;
+    std::cerr << "    repeat:         repeat input given number of times, e.g. csv-shape repeat --size 5" << std::endl;
+    std::cerr << "    sliding-window: todo" << std::endl;
+    std::cerr << "    split:          csv-only: split line at n-th field, e.g. csv-shape split --size 4" << std::endl;
     std::cerr << std::endl;
     std::cerr << "Usage: cat data.csv | csv-shape <operation> [<options>]" << std::endl;
     std::cerr << std::endl;
@@ -49,6 +52,7 @@ static void usage( bool verbose=false )
     std::cerr << "                     echo 0,1,2,3,4,5 | csv-shape split -n 2 --repeat will output: 0,1, then 2,3, then 4,5" << std::endl;
     std::cerr << "      --size,-n=<n>; e.g. echo 0,1,2,3,4,5| csv-shape split -n 3 will output" << std::endl;
     std::cerr << "                     two lines: 0,1,2 and 3,4,5" << std::endl;
+    std::cerr << comma::csv::applications::shape::operations::sliding_window::usage( verbose ) << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options" << std::endl;
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
@@ -273,6 +277,50 @@ static int _split( const comma::command_line_options& options, const comma::csv:
     return 0;
 }
 
+namespace comma { namespace csv { namespace applications { namespace shape { namespace operations {
+
+namespace sliding_window {
+
+std::string usage( bool verbose )
+{
+    ( void )verbose;
+    return R"(todo)";
+}
+
+static int run( const comma::command_line_options& options, comma::csv::options& csv )
+{
+    unsigned int size = options.value< unsigned int >( "--size" );
+    std::deque< std::string > deque;
+    if( csv.binary() )
+    {
+        // todo
+    }
+    else
+    {
+        while( std::cin.good() && !std::cin.eof() )
+        {
+            std::string line;
+            std::getline( std::cin, line );
+            if( comma::strip( line ).empty() ) { continue; }
+            deque.push_back( line );
+            if( deque.size() > size )
+            {
+                deque.pop_front();
+                for( const auto& d: deque ) { std::cout << d << std::endl; }
+            }
+            else
+            {
+                std::cout << line << std::endl;
+            }
+        }
+    }
+    return 0;
+}
+
+} // namespace sliding_window {
+
+} } } } } // namespace comma { namespace csv { namespace applications { namespace shape { namespace operations {
+
 int main( int ac, char** av )
 {
     try
@@ -287,8 +335,9 @@ int main( int ac, char** av )
         std::string operation = unnamed[0];
         if( operation == "concatenate" || operation == "loop" ) { return _concatenate().run( options, csv ); }
         if( operation == "repeat" ) { return _repeat( options, csv ); }
+        if( operation == "sliding-window" ) { return comma::csv::applications::shape::operations::sliding_window::run( options, csv ); }
         if( operation == "split" ) { return _split( options, csv ); }
-        std::cerr << comma::verbose.app_name() << ": expected operation; got: '" << operation << '\'' << std::endl;
+        comma::say() << ": expected operation; got: '" << operation << "'" << std::endl;
     }
     catch( std::exception& ex ) { std::cerr << "csv-shape: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-shape: unknown exception" << std::endl; }

From 9fe5e1f17a05d6a59429eafcd3dc06de11854505 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 2 Aug 2024 17:04:45 +1000
Subject: [PATCH 0848/1056] csv-shape: sliding-window: first cut implemented

---
 csv/applications/csv-shape.cpp | 79 +++++++++++++++++++---------------
 1 file changed, 45 insertions(+), 34 deletions(-)

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index a9fb53be7..357be6729 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -39,19 +39,18 @@ static void usage( bool verbose=false )
     std::cerr << "    --verbose,-v: more output to stderr, shows examples with --help,-h" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations options" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "   concatenate" << std::endl;
-    std::cerr << "      --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
-    std::cerr << "      --reverse; output records in reverse order (e.g. b,a)" << std::endl;
-    std::cerr << "      --sliding-window,-w; use a sliding window to group input records, see examples" << std::endl;
-    std::cerr << "   loop" << std::endl;
-    std::cerr << "      --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
-    std::cerr << "      --reverse; output records in reverse order (e.g. b,a)" << std::endl;
-    std::cerr << "   split" << std::endl;
-    std::cerr << "      --repeat; e.g: echo 0,1,2,3,4,5 | csv-shape split -n 2 will output: 0,1 and 2,3,4,5" << std::endl;
-    std::cerr << "                     echo 0,1,2,3,4,5 | csv-shape split -n 2 --repeat will output: 0,1, then 2,3, then 4,5" << std::endl;
-    std::cerr << "      --size,-n=<n>; e.g. echo 0,1,2,3,4,5| csv-shape split -n 3 will output" << std::endl;
-    std::cerr << "                     two lines: 0,1,2 and 3,4,5" << std::endl;
+    std::cerr << "    concatenate" << std::endl;
+    std::cerr << "       --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
+    std::cerr << "       --reverse; output records in reverse order (e.g. b,a)" << std::endl;
+    std::cerr << "       --sliding-window,-w; use a sliding window to group input records, see examples" << std::endl;
+    std::cerr << "    loop" << std::endl;
+    std::cerr << "       --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
+    std::cerr << "       --reverse; output records in reverse order (e.g. b,a)" << std::endl;
+    std::cerr << "    split" << std::endl;
+    std::cerr << "       --repeat; e.g: echo 0,1,2,3,4,5 | csv-shape split -n 2 will output: 0,1 and 2,3,4,5" << std::endl;
+    std::cerr << "                      echo 0,1,2,3,4,5 | csv-shape split -n 2 --repeat will output: 0,1, then 2,3, then 4,5" << std::endl;
+    std::cerr << "       --size,-n=<n>; e.g. echo 0,1,2,3,4,5| csv-shape split -n 3 will output" << std::endl;
+    std::cerr << "                      two lines: 0,1,2 and 3,4,5" << std::endl;
     std::cerr << comma::csv::applications::shape::operations::sliding_window::usage( verbose ) << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options" << std::endl;
@@ -281,38 +280,50 @@ namespace comma { namespace csv { namespace applications { namespace shape { nam
 
 namespace sliding_window {
 
-std::string usage( bool verbose )
+std::string usage( bool )
 {
-    ( void )verbose;
-    return R"(todo)";
+    return R"(    sliding-window
+        --size=<n>; number of input records in each grouping
+        --step=<n>; default=1; sliding window step)";
 }
 
 static int run( const comma::command_line_options& options, comma::csv::options& csv )
 {
-    unsigned int size = options.value< unsigned int >( "--size" );
+    const unsigned int size = options.value< unsigned int >( "--size" );
+    const unsigned int stride = options.value< unsigned int >( "--step,--stride", 1 );
+    COMMA_ASSERT( stride <= size, "stride greater than size currently not supported, just ask; got: size: " << size << " stride: " << stride );
     std::deque< std::string > deque;
-    if( csv.binary() )
-    {
-        // todo
-    }
-    else
+    std::string record = csv.binary() ? std::string( csv.format().size(), 0 ) : std::string();
+    while( std::cin.good() && !std::cin.eof() )
     {
-        while( std::cin.good() && !std::cin.eof() )
+        if( csv.binary() )
         {
-            std::string line;
-            std::getline( std::cin, line );
-            if( comma::strip( line ).empty() ) { continue; }
-            deque.push_back( line );
-            if( deque.size() > size )
-            {
-                deque.pop_front();
-                for( const auto& d: deque ) { std::cout << d << std::endl; }
-            }
-            else
+            std::cin.read( &record[0], record.size() );
+            if( std::cin.gcount() == 0 ) { break; }
+            COMMA_ASSERT( std::cin.gcount() == int( record.size() ), "expected " << record.size() << " bytes; got only: " << std::cin.gcount() );
+        }
+        else
+        {
+            std::getline( std::cin, record );
+            if( comma::strip( record ).empty() ) { continue; }
+        }
+        deque.push_back( record );
+        if( deque.size() > ( size + stride ) )
+        {
+            for( unsigned int i = 0; i < stride; ++i ) { deque.pop_front(); } // quick and dirty
+            for( const auto& d: deque )
             {
-                std::cout << line << std::endl;
+                std::cout.write( &d[0], d.size() );
+                if( !csv.binary() ) { std::cout << std::endl; }
             }
         }
+        else
+        {
+            if( deque.size() > size ) { continue; }
+            std::cout.write( &record[0], record.size() );
+            if( !csv.binary() ) { std::cout << std::endl; }
+        }
+        if( csv.flush ) { std::cout.flush(); }
     }
     return 0;
 }

From 002a4ef9692baebac94055817444e79722d8c309 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 2 Aug 2024 17:22:05 +1000
Subject: [PATCH 0849/1056] csv-shape: sliding-window: --incremental
 implemented

---
 csv/applications/csv-shape.cpp | 19 +++++++++++--------
 1 file changed, 11 insertions(+), 8 deletions(-)

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index 357be6729..e5761e007 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -283,6 +283,7 @@ namespace sliding_window {
 std::string usage( bool )
 {
     return R"(    sliding-window
+        --incremental; output first block incrementally: first record, then first and second, etc
         --size=<n>; number of input records in each grouping
         --step=<n>; default=1; sliding window step)";
 }
@@ -294,6 +295,13 @@ static int run( const comma::command_line_options& options, comma::csv::options&
     COMMA_ASSERT( stride <= size, "stride greater than size currently not supported, just ask; got: size: " << size << " stride: " << stride );
     std::deque< std::string > deque;
     std::string record = csv.binary() ? std::string( csv.format().size(), 0 ) : std::string();
+    bool incremental = options.exists( "--incremental" );
+    auto output_record = [&]( const std::string& record )
+    {
+        std::cout.write( &record[0], record.size() );
+        if( !csv.binary() ) { std::cout << std::endl; }
+    };
+    auto output_all = [&]() { for( const auto& r: deque ) { output_record( r ); } };
     while( std::cin.good() && !std::cin.eof() )
     {
         if( csv.binary() )
@@ -311,17 +319,12 @@ static int run( const comma::command_line_options& options, comma::csv::options&
         if( deque.size() > ( size + stride ) )
         {
             for( unsigned int i = 0; i < stride; ++i ) { deque.pop_front(); } // quick and dirty
-            for( const auto& d: deque )
-            {
-                std::cout.write( &d[0], d.size() );
-                if( !csv.binary() ) { std::cout << std::endl; }
-            }
+            output_all();
         }
         else
         {
             if( deque.size() > size ) { continue; }
-            std::cout.write( &record[0], record.size() );
-            if( !csv.binary() ) { std::cout << std::endl; }
+            if( incremental ) { output_all(); } else { output_record( record ); }
         }
         if( csv.flush ) { std::cout.flush(); }
     }
@@ -337,7 +340,7 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        std::vector< std::string > unnamed = options.unnamed( "--expected-records,--repeat,--sliding-window,-w,--verbose,-v", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--expected-records,--incremental,--repeat,--sliding-window,-w,--verbose,-v", "-.*" );
         comma::csv::options csv( options );
         csv.full_xpath = false;
         if( csv.fields.empty() ) { csv.fields="a"; }

From 83b0f2925a9b461b0893adae0be497d4911bfa86 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 2 Aug 2024 17:45:25 +1000
Subject: [PATCH 0850/1056] csv-shape: sliding-window: bug fixed

---
 csv/applications/csv-shape.cpp | 16 ++++++++++------
 1 file changed, 10 insertions(+), 6 deletions(-)

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index e5761e007..2cc123da7 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -316,16 +316,20 @@ static int run( const comma::command_line_options& options, comma::csv::options&
             if( comma::strip( record ).empty() ) { continue; }
         }
         deque.push_back( record );
-        if( deque.size() > ( size + stride ) )
-        {
-            for( unsigned int i = 0; i < stride; ++i ) { deque.pop_front(); } // quick and dirty
-            output_all();
-        }
-        else
+        // std::cerr << "============" << std::endl;
+        // for( const auto& d: deque ) { std::cerr << " " << d; }
+        // std::cerr << std::endl;
+        // std::cerr << "------------" << std::endl;
+        if( deque.size() < ( size + stride ) )
         {
             if( deque.size() > size ) { continue; }
             if( incremental ) { output_all(); } else { output_record( record ); }
         }
+        else
+        {
+            while( deque.size() > size ) { deque.pop_front(); } // quick and dirty
+            output_all();
+        }        
         if( csv.flush ) { std::cout.flush(); }
     }
     return 0;

From 6c4a0e984f55570e6c38f2e88644506103d1e0c4 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 2 Aug 2024 18:14:13 +1000
Subject: [PATCH 0851/1056] csv-shape: sliding-window: bug fixed

---
 csv/applications/csv-shape.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index 2cc123da7..acb9a24d1 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -323,7 +323,7 @@ static int run( const comma::command_line_options& options, comma::csv::options&
         if( deque.size() < ( size + stride ) )
         {
             if( deque.size() > size ) { continue; }
-            if( incremental ) { output_all(); } else { output_record( record ); }
+            if( incremental ) { if( deque.size() % stride == 0 ) { output_all(); } } else { output_record( record ); }
         }
         else
         {

From 0b8abc2f80e0d2d57cbaa7bc535cadb693104d8a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 2 Aug 2024 20:21:02 +1000
Subject: [PATCH 0852/1056] csv-shape: sliding-window --prepend-block
 implemented

---
 csv/applications/csv-shape.cpp | 31 ++++++++++++++++++++++++++++---
 1 file changed, 28 insertions(+), 3 deletions(-)

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index acb9a24d1..cc099caf2 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -284,10 +284,16 @@ std::string usage( bool )
 {
     return R"(    sliding-window
         --incremental; output first block incrementally: first record, then first and second, etc
+        --prepend-block,--block; prepend each record with block number, ui if binary output
         --size=<n>; number of input records in each grouping
         --step=<n>; default=1; sliding window step)";
 }
 
+// todo
+// - examples
+// - test
+// - notify
+
 static int run( const comma::command_line_options& options, comma::csv::options& csv )
 {
     const unsigned int size = options.value< unsigned int >( "--size" );
@@ -296,12 +302,23 @@ static int run( const comma::command_line_options& options, comma::csv::options&
     std::deque< std::string > deque;
     std::string record = csv.binary() ? std::string( csv.format().size(), 0 ) : std::string();
     bool incremental = options.exists( "--incremental" );
+    bool prepend_block = options.exists( "--prepend-block,--block" );
+    std::uint32_t block = 0;
     auto output_record = [&]( const std::string& record )
     {
+        if( prepend_block )
+        {
+            if( csv.binary() ) { std::cout.write( reinterpret_cast< const char* >( &block ), sizeof( std::uint32_t ) ); }
+            else { std::cout << block << csv.delimiter; }
+        }
         std::cout.write( &record[0], record.size() );
         if( !csv.binary() ) { std::cout << std::endl; }
     };
-    auto output_all = [&]() { for( const auto& r: deque ) { output_record( r ); } };
+    auto output_all = [&]()
+    {
+        for( const auto& r: deque ) { output_record( r ); }
+        ++block;
+    };
     while( std::cin.good() && !std::cin.eof() )
     {
         if( csv.binary() )
@@ -323,7 +340,15 @@ static int run( const comma::command_line_options& options, comma::csv::options&
         if( deque.size() < ( size + stride ) )
         {
             if( deque.size() > size ) { continue; }
-            if( incremental ) { if( deque.size() % stride == 0 ) { output_all(); } } else { output_record( record ); }
+            if( incremental )
+            {
+                if( deque.size() % stride == 0 ) { output_all(); }
+            }
+            else
+            {
+                output_record( record );
+                if( deque.size() == size ) { ++block; } // quick and dirty
+            }
         }
         else
         {
@@ -344,7 +369,7 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        std::vector< std::string > unnamed = options.unnamed( "--expected-records,--incremental,--repeat,--sliding-window,-w,--verbose,-v", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--prepend-block,--block,--expected-records,--incremental,--repeat,--sliding-window,-w,--verbose,-v", "-.*" );
         comma::csv::options csv( options );
         csv.full_xpath = false;
         if( csv.fields.empty() ) { csv.fields="a"; }

From c7167d91b1c0c3e39ad7e3e4ac677c4ccc7b72e5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 2 Aug 2024 20:29:48 +1000
Subject: [PATCH 0853/1056] csv-shape: sliding-window: examples added

---
 csv/applications/csv-shape.cpp | 33 ++++++++++++++++++++++-----------
 1 file changed, 22 insertions(+), 11 deletions(-)

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index cc099caf2..1d9123f86 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -58,22 +58,33 @@ static void usage( bool verbose=false )
     std::cerr << "examples" << std::endl;
     if( verbose )
     {
-        std::cerr << "examples" << std::endl;
-        std::cerr << "   concatenate" << std::endl;
-        std::cerr << "      non-overlapping groups:" << std::endl;
-        std::cerr << "          concatenate each group of 5 input records into one output record." << std::endl;
-        std::cerr << "          input records 1 to 5 create the first output record, input records 6-10 create the second output record, and so forth." << std::endl;
-        std::cerr << "              seq 1 15 | csv-shape concatenate -n 5" << std::endl;
-        std::cerr << "      overlapping groups:" << std::endl;
-        std::cerr << "          move a sliding window of size 5 along the input records, every time the sliding window moves, make an output record from window" << std::endl;
-        std::cerr << "          input records 1 to 5 create the first output record, input records 2 to 6 create the second record, input records 3 to 7 create the third record, and so forth" << std::endl;
-        std::cerr << "              seq 1 10 | csv-shape concatenate -n 5 --sliding-window" << std::endl;
-        std::cerr << std::endl;
+        std::cerr << R"(examples
+    concatenate
+        non-overlapping groups
+            concatenate each group of 5 input records into one output record.
+            input records 1 to 5 create the first output record, input records 6-10 create the second output record, and so forth.
+                seq 1 15 | csv-shape concatenate -n 5
+        overlapping groups
+            move a sliding window of size 5 along the input records, every time the sliding window moves, make an output record from window
+            input records 1 to 5 create the first output record, input records 2 to 6 create the second record, input records 3 to 7 create the third record, and so forth
+                seq 1 10 | csv-shape concatenate -n 5 --sliding-window
+    sliding-window
+        basics
+            for x in a b c d e f g h; do echo $x; done | csv-shape sliding-window --size 4
+            for x in a b c d e f g h; do echo $x; done | csv-shape sliding-window --size 4 --step 2
+        enumerate blocks of records
+            for x in a b c d e f g h; do echo $x; done | csv-shape sliding-window --size 4 --block
+            for x in a b c d e f g h; do echo $x; done | csv-shape sliding-window --size 4 --step 2 --block
+        incrementally output of the records 
+            for x in a b c d e f; do echo $x; done | csv-shape sliding-window --size 4 --incremental --block
+            for x in a b c d e f; do echo $x; done | csv-shape sliding-window --size 4 --incremental --block --step 2
+)";
     }
     else
     {
         std::cerr << "    run csv-shape --help --verbose for more..." << std::endl;
     }
+    std::cerr << std::endl;
     exit( 0 );
 }
 

From d4a912eff6fdc0c2e752d4b0eb65419bc3d3736c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 2 Aug 2024 20:29:53 +1000
Subject: [PATCH 0854/1056] csv-shape: sliding-window: examples added

---
 csv/applications/csv-shape.cpp | 1 -
 1 file changed, 1 deletion(-)

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index 1d9123f86..5d90bf42f 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -301,7 +301,6 @@ std::string usage( bool )
 }
 
 // todo
-// - examples
 // - test
 // - notify
 

From 185757a275536d15603552360b150ab735e25600 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 2 Aug 2024 21:22:04 +1000
Subject: [PATCH 0855/1056] csv-shape: sliding-window: unit test added

---
 csv/applications/csv-shape.cpp             |  4 ---
 csv/test/csv-shape/sliding-window/expected | 26 +++++++++++++++++++
 csv/test/csv-shape/sliding-window/input    | 30 ++++++++++++++++++++++
 3 files changed, 56 insertions(+), 4 deletions(-)
 create mode 100644 csv/test/csv-shape/sliding-window/expected
 create mode 100644 csv/test/csv-shape/sliding-window/input

diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index 5d90bf42f..74d65d009 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -300,10 +300,6 @@ std::string usage( bool )
         --step=<n>; default=1; sliding window step)";
 }
 
-// todo
-// - test
-// - notify
-
 static int run( const comma::command_line_options& options, comma::csv::options& csv )
 {
     const unsigned int size = options.value< unsigned int >( "--size" );
diff --git a/csv/test/csv-shape/sliding-window/expected b/csv/test/csv-shape/sliding-window/expected
new file mode 100644
index 000000000..ee9d13b2d
--- /dev/null
+++ b/csv/test/csv-shape/sliding-window/expected
@@ -0,0 +1,26 @@
+basics[0]/output="a b c d e f "
+basics[1]/output="a b b c c d d e e f "
+basics[2]/output="a b c b c d c d e d e f "
+basics[3]/output="a b c d b c d e c d e f "
+step[0]/output="a b c d c d e f "
+step[1]/output="a b c d e f g h "
+block[0]/output="0,a 1,b 2,c 3,d 4,e 5,f "
+block[1]/output="0,a 0,b 1,b 1,c 2,c 2,d 3,d 3,e 4,e 4,f "
+block[2]/output="0,a 0,b 0,c 1,b 1,c 1,d 2,c 2,d 2,e 3,d 3,e 3,f "
+block[3]/output="0,a 0,b 0,c 0,d 1,b 1,c 1,d 1,e 2,c 2,d 2,e 2,f "
+block[4]/output="0,a 0,b 0,c 0,d 1,c 1,d 1,e 1,f "
+incremental/basic[0]/output="a b c d e f "
+incremental/basic[1]/output="a a b b c c d d e e f "
+incremental/basic[2]/output="a a b a b c b c d c d e d e f "
+incremental/basic[3]/output="a a b a b c a b c d b c d e c d e f "
+incremental/basic[4]/output="a b a b c d c d e f "
+incremental/block[0]/output="0,a 1,b 2,c 3,d 4,e 5,f "
+incremental/block[1]/output="0,a 1,a 1,b 2,b 2,c 3,c 3,d 4,d 4,e 5,e 5,f "
+incremental/block[2]/output="0,a 1,a 1,b 2,a 2,b 2,c 3,b 3,c 3,d 4,c 4,d 4,e 5,d 5,e 5,f "
+incremental/block[3]/output="0,a 1,a 1,b 2,a 2,b 2,c 3,a 3,b 3,c 3,d 4,b 4,c 4,d 4,e 5,c 5,d 5,e 5,f "
+incremental/block[4]/output="0,a 0,b 1,a 1,b 1,c 1,d 2,c 2,d 2,e 2,f "
+binary[0]/output="a b c d e f "
+binary[1]/output="a b c d b c d e c d e f "
+binary[2]/output="0,a 0,b 0,c 0,d 1,b 1,c 1,d 1,e 2,c 2,d 2,e 2,f "
+binary[3]/output="a a b a b c a b c d b c d e c d e f "
+binary[4]/output="0,a 1,a 1,b 2,a 2,b 2,c 3,a 3,b 3,c 3,d 4,b 4,c 4,d 4,e 5,c 5,d 5,e 5,f "
diff --git a/csv/test/csv-shape/sliding-window/input b/csv/test/csv-shape/sliding-window/input
new file mode 100644
index 000000000..b75549129
--- /dev/null
+++ b/csv/test/csv-shape/sliding-window/input
@@ -0,0 +1,30 @@
+basics[0]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 1 | tr '\\n' ' '"
+basics[1]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 2 | tr '\\n' ' '"
+basics[2]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 3 | tr '\\n' ' '"
+basics[3]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 | tr '\\n' ' '"
+
+step[0]="echo a b c d e f g | tr ' ' '\\n' | csv-shape sliding-window --size 4 --step 2 | tr '\\n' ' '"
+step[1]="echo a b c d e f g h i | tr ' ' '\\n' | csv-shape sliding-window --size 4 --step 4 | tr '\\n' ' '"
+
+block[0]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 1 --block | tr '\\n' ' '"
+block[1]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 2 --block | tr '\\n' ' '"
+block[2]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 3 --block | tr '\\n' ' '"
+block[3]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --block | tr '\\n' ' '"
+block[4]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --block --step 2 | tr '\\n' ' '"
+
+incremental/basic[0]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 1 --incremental | tr '\\n' ' '"
+incremental/basic[1]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 2 --incremental | tr '\\n' ' '"
+incremental/basic[2]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 3 --incremental | tr '\\n' ' '"
+incremental/basic[3]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --incremental | tr '\\n' ' '"
+incremental/basic[4]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --incremental --step 2 | tr '\\n' ' '"
+incremental/block[0]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 1 --incremental --block | tr '\\n' ' '"
+incremental/block[1]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 2 --incremental --block | tr '\\n' ' '"
+incremental/block[2]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 3 --incremental --block | tr '\\n' ' '"
+incremental/block[3]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --incremental --block | tr '\\n' ' '"
+incremental/block[4]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --incremental --block --step 2 | tr '\\n' ' '"
+
+binary[0]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 1 | csv-from-bin c | tr '\\n' ' '"
+binary[1]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 4 | csv-from-bin c | tr '\\n' ' '"
+binary[2]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 4 --block | csv-from-bin ui,c | tr '\\n' ' '"
+binary[3]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 4 --incremental | csv-from-bin c | tr '\\n' ' '"
+binary[4]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 4 --incremental --block | csv-from-bin ui,c | tr '\\n' ' '"

From 56656d317f167232b307d1022ac2c5ae0f51b87a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 4 Aug 2024 18:40:58 +1000
Subject: [PATCH 0856/1056] csv-sort: bug fixed: now works for strings with no
 --format option; basic regression/unit test added

---
 csv/applications/csv-sort.cpp   | 25 +++++++++++++++++++------
 csv/test/csv-sort/sort/expected | 11 +++++++++++
 csv/test/csv-sort/sort/input    | 12 ++++++++++++
 3 files changed, 42 insertions(+), 6 deletions(-)

diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index d271b7fb4..b4157c346 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -618,15 +618,21 @@ static int random( const comma::command_line_options& options )
 static int sort( const comma::command_line_options& options )
 {
     input_with_block default_input;
-    std::vector< std::string > v = comma::split( csv.fields, ',' );
-    std::vector< std::string > order = options.exists( "--order" ) ? comma::split( options.value< std::string >( "--order" ), ',' ) : v;
+    std::vector< std::string > v = comma::split( csv.fields, ',', true );
+    std::vector< std::string > order = options.exists( "--order" ) ? comma::split( options.value< std::string >( "--order" ), ',', true ) : v;
     std::vector< std::string > w( v.size() );
     bool unique = options.exists( "--unique,-u" );
     for( std::size_t k = 0; k < v.size(); ++k ) { if( v[k] == "block" ) { w[k] = "block"; } }
     std::string first_line;
     comma::csv::format f;
-    if( csv.binary() ) { f = csv.format(); }
-    else if( options.exists( "--format" ) ) { f = comma::csv::format( options.value< std::string >( "--format" ) ); }
+    if( csv.binary() )
+    {
+        f = csv.format();
+    }
+    else if( options.exists( "--format" ) )
+    {
+        f = comma::csv::format( options.value< std::string >( "--format" ) );
+    }
     else
     {
         while( std::cin.good() && first_line.empty() ) { std::getline( std::cin, first_line ); }
@@ -634,12 +640,19 @@ static int sort( const comma::command_line_options& options )
         f = comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter, options.exists( "--numeric-keys-are-floats,--floats" ) );
         if( verbose ) { std::cerr << "csv-sort: guessed format: " << f.string() << std::endl; }
     }
+    if( order.empty() ) // quick and dirty for now (really should be a method in unstructured or alike)
+    {
+        order.resize( f.count() );
+        for( unsigned int i = 0; i < order.size(); ++i ) { order[i] = std::to_string( i ); }
+        if( v.empty() ) { v = order; w.resize( v.size() ); }
+    }
     for( std::size_t i = 0; i < order.size(); ++i ) // quick and dirty, wasteful, but who cares
     {
         if( order[i].empty() || order[i] == "block" ) { continue; }
         for( std::size_t k = 0; k < v.size(); ++k )
         {
-            if( v[k].empty() || v[k] != order[i] ) { 
+            if( v[k].empty() || v[k] != order[i] )
+            {
                 if( k + 1 == v.size() ) { std::cerr << "csv-sort: order field name \"" << order[i] << "\" not found in input fields \"" << csv.fields << "\"" << std::endl; return 1; }
                 continue; 
             }
@@ -667,7 +680,7 @@ static int sort( const comma::command_line_options& options )
     if( sliding_window ) { return handle_sliding_window( istream, first_line, default_input, reverse, *sliding_window ); }
     input_t::map map;
     if( !first_line.empty() )
-    { 
+    {
         input_with_block input = comma::csv::ascii< input_with_block >( csv, default_input ).get( first_line );
         block.update( input );
         input_t::map::mapped_type& d = map[ input ];
diff --git a/csv/test/csv-sort/sort/expected b/csv/test/csv-sort/sort/expected
index 15c7a5aec..5eadc99aa 100644
--- a/csv/test/csv-sort/sort/expected
+++ b/csv/test/csv-sort/sort/expected
@@ -17,3 +17,14 @@ numeric_keys_are_floats[1]/output/line[1]="3.1"
 numeric_keys_are_floats[1]/output/line[2]="4"
 numeric_keys_are_floats[1]/output/line[3]="5"
 numeric_keys_are_floats[1]/status=0
+
+strings[0]/output="a,z;b,y;b,z;"
+strings[1]/output="a,z;b,y;b,z;"
+strings[2]/output="a,z;b,z;b,y;"
+strings[3]/output="b,y;a,z;b,z;"
+strings[5]/output=",_a;,a_;,aa;"
+strings[6]/output=",_a;,a_;,aa;"
+strings[7]/output="x,aa;y,a_;z,_a;"
+strings[8]/output="x,aa;y,a_;z,_a;"
+strings[9]/output="x,aa;y,a_;z,_a;"
+strings[10]/output="z,_a;y,a_;x,aa;"
diff --git a/csv/test/csv-sort/sort/input b/csv/test/csv-sort/sort/input
index df6282f28..a9ae5a4ed 100644
--- a/csv/test/csv-sort/sort/input
+++ b/csv/test/csv-sort/sort/input
@@ -14,3 +14,15 @@ descending/block[2]="( echo 1,0; echo 0,0; echo 1,0 ; echo 1,1; echo 0,1; echo 1
 
 numeric_keys_are_floats[0]="( echo 5; echo 4; echo 3.1; echo 2 ) | csv-sort --fields a"
 numeric_keys_are_floats[1]="( echo 5; echo 4; echo 3.1; echo 2 ) | csv-sort --fields a --numeric-keys-are-floats"
+
+strings[0]="( echo a,z; echo b,z; echo b,y )     | csv-sort              | tr '\\n' ';'"
+strings[1]="( echo a,z; echo b,z; echo b,y )     | csv-sort --fields a,b | tr '\\n' ';'"
+strings[2]="( echo a,z; echo b,z; echo b,y )     | csv-sort --fields a   | tr '\\n' ';'"
+strings[3]="( echo a,z; echo b,z; echo b,y )     | csv-sort --fields ,a  | tr '\\n' ';'"
+strings[4]="( echo a_; echo aa; echo _a )        | csv-sort              | tr '\\n' ';'"
+strings[5]="( echo ,a_; echo ,aa; echo ,_a )     | csv-sort              | tr '\\n' ';'"
+strings[6]="( echo ,a_; echo ,aa; echo ,_a )     | csv-sort --fields ,a  | tr '\\n' ';'"
+strings[7]="( echo y,a_; echo x,aa; echo z,_a )  | csv-sort              | tr '\\n' ';'"
+strings[8]="( echo y,a_; echo x,aa; echo z,_a )  | csv-sort --fields a,b | tr '\\n' ';'"
+strings[9]="( echo y,a_; echo x,aa; echo z,_a )  | csv-sort --fields a   | tr '\\n' ';'"
+strings[10]="( echo y,a_; echo x,aa; echo z,_a ) | csv-sort --fields ,a  | tr '\\n' ';'"
\ No newline at end of file

From 87b55dd3230be76bd0faaddb2275f1558d56a103 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 5 Aug 2024 13:40:02 +1000
Subject: [PATCH 0857/1056] csv-crc: minor brush-up

---
 csv/applications/csv-crc.cpp | 123 ++++++++++++++++-------------------
 1 file changed, 57 insertions(+), 66 deletions(-)

diff --git a/csv/applications/csv-crc.cpp b/csv/applications/csv-crc.cpp
index 735ab5cee..703bc14a2 100644
--- a/csv/applications/csv-crc.cpp
+++ b/csv/applications/csv-crc.cpp
@@ -45,54 +45,52 @@
 
 static void usage( bool )
 {
-    std::cerr << "\n";
-    std::cerr << "wrap/check crc on fixed-width input (ascii or binary)\n";
-    std::cerr << "\n";
-    std::cerr << "usage: csv-crc <command> [<options>]\n";
-    std::cerr << "\n";
-    std::cerr << "<command>\n";
-    std::cerr << "    wrap:    add crc\n";
-    std::cerr << "    check:   check crc; exit if check fails\n";
-    std::cerr << "    recover: recover with given parameters (see below)\n";
-    std::cerr << "\n";
-    std::cerr << "general options\n";
-    std::cerr << "    --help,-h;    this help\n";
-    std::cerr << "    --verbose,-v: more output\n";
-    std::cerr << "\n";
-    std::cerr << "data options\n";
-    std::cerr << "    --crc-size;      output given crc size to stdout and exit\n";
-    std::cerr << "    --delimiter,-d=[<char>]: ascii csv delimiter\n";
-    std::cerr << "    --size=[<size>]: binary data size; if absent, expect ascii csv\n";
-    std::cerr << "                     for wrap: payload size\n";
-    std::cerr << "                     for check/recover: size including crc\n";
-    std::cerr << "\n";
-    std::cerr << "crc options\n";
-    std::cerr << "    --crc=<which>:\n";
-    std::cerr << "        16:     16-bit, generator 0x8805\n";
-    std::cerr << "        ccitt:  16-bit, generator 0x1021\n";
-    std::cerr << "        xmodem: 16-bit, generator 0x1021\n";
-    std::cerr << "        32:     32-bit, generator 0x04C11DB7\n";
-    //std::cerr << "        checksum16: simple 16-bit checksum (todo)\n";
-    //std::cerr << "        checksum32: simple 32-bit checksum (todo)\n";
-    std::cerr << "        default: ccitt\n";
-    std::cerr << "    --big-endian,--net-byte-order: if binary, crc is big endian\n";
-    std::cerr << "\n";
-    std::cerr << "recover options\n";
-    std::cerr << "    --give-up-after=<n>: if check fails, give up after <n> bytes\n";
-    std::cerr << "                         default: infinity; don't give up\n";
-    std::cerr << "    --recover-after=<n>: if check fails and then new valid crc found\n";
-    std::cerr << "                         make sure that at least <n> subsequent lines (ascii)\n";
-    std::cerr << "                         or packets (binary) are valid, before output;\n";
-    std::cerr << "                         default: 0; recover on the next valid packet\n";
-    std::cerr << "    --discard-on-recovery,--discard: discard packets accumulated when recovering\n";
-    std::cerr << "\n";
-    std::cerr << "    Note that the check command is equivalent to\n";
-    std::cerr << "    csv-crc recover --give-up-after 0\n";
-    std::cerr << "\n";
-    std::cerr << "For a definitive list of 16 bit CRC algorithms see:\n";
-    std::cerr << "http://reveng.sourceforge.net/crc-catalogue/16.htm\n";
-    std::cerr << std::endl;
-    exit( 1 );
+    std::cerr << R"(
+wrap/check crc on fixed-width input (ascii or binary)
+
+usage: csv-crc <command> [<options>]
+
+<command>
+    wrap:    add crc
+    check:   check crc; exit if check fails
+    recover: recover with given parameters (see below)
+
+general options
+    --help,-h;    this help
+    --verbose,-v: more output
+
+data options
+    --crc-size;      output given crc size to stdout and exit
+    --delimiter,-d=[<char>]: ascii csv delimiter
+    --size=[<size>]: binary data size; if absent, expect ascii csv
+                     for wrap: payload size
+                     for check/recover: size including crc
+
+crc options
+    --crc=<which>:
+        16:     16-bit, generator 0x8805
+        ccitt:  16-bit, generator 0x1021
+        xmodem: 16-bit, generator 0x1021
+        32:     32-bit, generator 0x04C11DB7
+        default: ccitt
+    --big-endian,--net-byte-order: if binary, crc is big endian
+
+recover options
+    --give-up-after=<n>: if check fails, give up after <n> bytes
+                         default: infinity; don't give up
+    --recover-after=<n>: if check fails and then new valid crc found
+                         make sure that at least <n> subsequent lines (ascii)
+                         or packets (binary) are valid, before output;
+                         default: 0; recover on the next valid packet
+    --discard-on-recovery,--discard: discard packets accumulated when recovering
+
+    Note that the check command is equivalent to
+    csv-crc recover --give-up-after 0
+
+For a definitive list of 16 bit CRC algorithms see:
+http://reveng.sourceforge.net/crc-catalogue/16.htm
+)";
+    exit( 0 );
 }
 
 static bool verbose;
@@ -173,7 +171,7 @@ static bool run_()
                         {
                             if( recovered_count == recover_after )
                             {
-                                std::cerr << "csv-crc: recovered after " << recovered_byte_count << " byte(s)" << std::endl;
+                                comma::say() << "recovered after " << recovered_byte_count << " byte(s)" << std::endl;
                                 if( !discard_on_recovery ) { std::cout.write( &recovery_buffer[0], recovery_buffer.size() ); }
                                 recovered = true;
                                 recovered_count = 0;
@@ -197,7 +195,7 @@ static bool run_()
                             recovered_count = 0;
                             current_recovered_byte_count = 0;
                         }
-                        if( recovered ) { std::cerr << "csv-crc: crc check failed" << ( !give_up_after || *give_up_after > 0 ? "; recovering..." : "" ) << std::endl; }
+                        if( recovered ) { comma::say() << "crc check failed" << ( !give_up_after || *give_up_after > 0 ? "; recovering..." : "" ) << std::endl; }
                         recovered = false;
                         if( give_up_after && recovered_byte_count >= *give_up_after ) { break; }
                     }
@@ -217,7 +215,7 @@ static bool run_()
             if( r <= 0 ) { break; }
             offset += r;
         }
-        if( offset > 0 && offset < size ) { std::cerr << "csv-crc: expected at least " << size << " byte(s), got only " << offset << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( offset <= 0 || offset >= size, "expected at least " << size << " byte(s), got only " << offset );
     }
     else
     {
@@ -243,7 +241,7 @@ static bool run_()
                 }
                 else
                 {
-                    std::cerr << "csv-crc: check failed (recovery is not implemented for ascii mode, todo)" << std::endl;
+                    comma::say() << "check failed (recovery is not implemented for ascii mode, todo)" << std::endl;
                     return 1;
                 }
             }
@@ -265,10 +263,10 @@ int main( int ac, char** av )
             else if( crc == "ccitt" ) { std::cout << sizeof( boost::crc_ccitt_type::value_type ) << std::endl; }
             else if( crc == "xmodem" ) { std::cout << sizeof( boost::crc_xmodem_type::value_type ) << std::endl; }
             else if( crc == "xmodem-boost" ) { std::cout << sizeof( boost::crc_xmodem_type::value_type ) << std::endl; }
-            else { std::cerr << "csv-crc: expected crc type, got \"" << crc << "\"" << std::endl; return 1; }
+            else { comma::say() << "expected crc type, got \"" << crc << "\"" << std::endl; return 1; }
             return 0;
         }
-        if( wrap && recover ) { std::cerr << "csv-crc: if 'wrap', then no 'check' or 'recover'" << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( !wrap || !recover, "if 'wrap', then no 'check' or 'recover'" );
         verbose = options.exists( "--verbose,-v" );
         give_up_after = options.optional< unsigned int >( "--give-up-after" );
         recover_after = options.value( "--recover-after", 0 );
@@ -278,13 +276,13 @@ int main( int ac, char** av )
         big_endian = options.exists( "--big-endian,--net-byte-order" );
         delimiter = options.value< char >( "--delimiter,-d", ',' );
         std::vector< std::string > commands = options.unnamed( "--discard-on-recovery,--discard,--verbose,-v,--big-endian,--net-byte-order", "--size,--delimiter,-d,--crc,--give-up-after,--recover-after" );
-        if( commands.empty() ) { std::cerr << "csv-crc: specify a command" << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( !commands.empty(), "please specify a command" );
         for( std::size_t i = 0; i < commands.size(); ++i )
         {
             if( commands[i] == "wrap" ) { wrap = true; }
             else if( commands[i] == "check" ) { recover = true; give_up_after = 0; }
             else if( commands[i] == "recover" ) { recover = true; }
-            else { std::cerr << "csv-crc: expected command, got '" << commands[i] << "'" << std::endl; return 1; }
+            else { comma::say() << "expected command, got '" << commands[i] << "'" << std::endl; return 1; }
         }
         // The list of crc versions predefined by boost is given at
         //     http://www.boost.org/doc/libs/1_58_0/libs/crc/crc.html#crc_ex
@@ -300,16 +298,9 @@ int main( int ac, char** av )
         // the following is designated boost::crc_xmodem_t in the git repo for boost/crc.hpp
         else if( crc == "xmodem" ) { return run_< boost::crc_optimal< 16, 0x1021, 0, 0, false, false > >(); }
         else if( crc == "xmodem-boost" ) { return run_< boost::crc_xmodem_type >(); }
-        std::cerr << "csv-crc: expected crc type, got \"" << crc << "\"" << std::endl;
-        return 1;
-    }
-    catch( std::exception& ex )
-    {
-        std::cerr << "csv-crc: " << ex.what() << std::endl;
-    }
-    catch( ... )
-    {
-        std::cerr << "csv-crc: unknown exception" << std::endl;
+        comma::say() << "expected crc type, got '" << crc << "'" << std::endl;
     }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }

From c21015f4d402c5dd4dfa9b68ecc5ce4f1703fd77 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 7 Aug 2024 16:16:12 +1000
Subject: [PATCH 0858/1056] comma-timeout-group.cpp: ignore zombie processes
 when waiting for group

---
 util/applications/comma-timeout-group.cpp | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/util/applications/comma-timeout-group.cpp b/util/applications/comma-timeout-group.cpp
index 9e514e4b8..104f791c9 100644
--- a/util/applications/comma-timeout-group.cpp
+++ b/util/applications/comma-timeout-group.cpp
@@ -276,9 +276,10 @@ int parse_process_tree( bool verbose = false )
     int count = 0;
     while ( readproc( proc, &proc_info ) != NULL ) {
         if ( proc_info.pgrp == ownpid ) {
-            if ( first && verbose ) { std::cerr << "extant processes in group " << ownpid << std::endl; first = 0; }
-            ++count;
-            if ( verbose ) { std::cerr << "    " << proc_info.cmd << ":\t" << proc_info.tid << "\t" << proc_info.pgrp << "\t" << proc_info.state << "\t" << proc_info.start_time << std::endl; }
+            if ( first && verbose ) { comma::say() << "extant processes in group " << ownpid << std::endl; first = 0; }
+            if( proc_info.state == 'Z' ) { comma::say() << "    " << proc_info.cmd << " (pid " << proc_info.tid << ") is a zombie process - ignoring" << std::endl; }
+            else { ++count; }
+            if ( verbose ) { comma::say() << "    " << proc_info.cmd << ":\t" << proc_info.tid << "\t" << proc_info.pgrp << "\t" << proc_info.state << "\t" << proc_info.start_time << std::endl; }
         }
     }
     closeproc(proc);

From 246acf8e815eb5f6d5da4f09b91d49fbe72560cf Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 8 Aug 2024 18:17:31 +1000
Subject: [PATCH 0859/1056] name-value-get <file>:<path> implemented

---
 name_value/applications/name-value-get.cpp | 33 +++++++++++++++++-----
 name_value/test/name-value-get/expected    |  6 ++++
 name_value/test/name-value-get/input       |  4 +++
 3 files changed, 36 insertions(+), 7 deletions(-)

diff --git a/name_value/applications/name-value-get.cpp b/name_value/applications/name-value-get.cpp
index 91ccc79cc..ed5a01710 100644
--- a/name_value/applications/name-value-get.cpp
+++ b/name_value/applications/name-value-get.cpp
@@ -2,16 +2,19 @@
 
 /// @author vsevolod vlaskine
 
+#include <fstream>
 #include <iostream>
 #include <boost/property_tree/info_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/regex.hpp>
-#include "../../base/exception.h"
 #include "../../application/command_line_options.h"
+#include "../../base/exception.h"
+#include "../../base/none.h"
 #include "../../name_value/ptree.h"
 #include "../../name_value/serialize.h"
+#include "../../string/split.h"
 #include "../../xpath/xpath.h"
 
 static const std::string regex_characters_ =  ".{}()\\*+?|^$";
@@ -22,6 +25,7 @@ static void usage( bool verbose = false )
     std::cerr << "take json, xml, or path-value formatted data on stdin and output value at given path on stdout" << std::endl;
     std::cerr << std::endl;
     std::cerr << "usage: cat data.xml | name-value-get <paths> [<options>]" << std::endl;
+    std::cerr << "       name-value-get data.xml:<paths> [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "<paths>: x-path, e.g. \"command/type\" or posix regular expressions" << std::endl;
     std::cerr << "    if <paths> doesn't contain any of regex characters: \"" << regex_characters_ << "\" it will be treated as x-path" << std::endl;
@@ -204,7 +208,7 @@ void match_regex_( std::ostream& os, const boost::property_tree::ptree& ptree )
 static bool is_regex_(const std::string& s)
 {
     std::string regex_characters = regex_characters_;
-    if (option_regex) { regex_characters += "[]"; }
+    if( option_regex ) { regex_characters += "[]"; }
     for( unsigned int k = 0; k < regex_characters.size(); ++k )
     {
         if( s.find_first_of( regex_characters[k] ) != std::string::npos ) { return true; }
@@ -218,15 +222,22 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         path_strings = options.unnamed( "--linewise,-l,--minify,--output-path,--use-buffer,--regex,--quote-numbers,--quote,--unquote-numbers,--unquote", "-.*" );
-        if( path_strings.empty() ) { std::cerr << std::endl << "name-value-get: xpath missing" << std::endl; usage(); }
+        if( path_strings.empty() ) { std::cerr << std::endl << "name-value-get: please specify at least one path" << std::endl; usage(); }
         path_regex.resize( path_strings.size() );
         paths.resize( path_strings.size() );
         bool has_regex = false;
         option_regex = options.exists( "--regex" );
+        std::string filename;
+        if( !option_regex )
+        {
+            const auto& s = comma::split_head( path_strings[0], 2, ':' );
+            COMMA_ASSERT_BRIEF( !option_regex || s.size() == 1 || path_strings.size() == 1, "<filename>:<path> syntax is supported only for a single query path" );
+            if( s.size() == 2 ) { filename = s[0]; path_strings[0] = s[1]; }
+        }
         for( std::size_t i = 0; i < path_strings.size(); ++i )
         {
             if( is_regex_( path_strings[i] ) ) { path_regex[i] = boost::regex( path_strings[i], boost::regex::extended ); has_regex = true; }
-            else {  paths[i] = boost::property_tree::ptree::path_type( path_strings[i], '/' ); }
+            else { paths[i] = boost::property_tree::ptree::path_type( path_strings[i], '/' ); }
         }
         boost::optional< std::string > from = options.optional< std::string >( "--from" );
         std::string to = options.value< std::string >( "--to", "path-value" );
@@ -263,13 +274,21 @@ int main( int ac, char** av )
         else if( to == "path-value" ) { output = &traits< path_value >::output; output_last_line_break = true; }
         else { std::cerr << "name-value-get: expected --to format to be ini, info, json, xml, or path-value, got " << to << std::endl; return 1; }
         indices_mode = options.exists( "--no-brackets" ) ? comma::property_tree::without_brackets : comma::property_tree::with_brackets;
+        //auto ifstream = comma::silent_none< std::ifstream >();
+        std::ifstream ifs;
+        if( !filename.empty() )
+        {
+            ifs.open( filename );
+            COMMA_ASSERT_BRIEF( ifs.is_open(), "failed to open '" << filename << "'" );
+        }
+        std::istream& istream = filename.empty() ? static_cast< std::istream& >( std::cin ) : static_cast< std::istream& >( ifs );
         if( linewise )
         {
             while( std::cout.good() )
             {
                 std::string line;
-                std::getline( std::cin, line );
-                if( !std::cin.good() || std::cin.eof() ) { break; }
+                std::getline( istream, line );
+                if( !istream.good() || istream.eof() ) { break; }
                 std::istringstream iss( line );
                 boost::property_tree::ptree ptree;
                 input( iss, ptree );
@@ -296,7 +315,7 @@ int main( int ac, char** av )
         else
         {
             boost::property_tree::ptree ptree;
-            input( std::cin, ptree );
+            input( istream, ptree );
             if( has_regex ) { match_regex_( std::cout, ptree ); } else { match_( std::cout, ptree ); }
         }
         return 0;
diff --git a/name_value/test/name-value-get/expected b/name_value/test/name-value-get/expected
index 317e32094..e0640a9a9 100644
--- a/name_value/test/name-value-get/expected
+++ b/name_value/test/name-value-get/expected
@@ -26,3 +26,9 @@ regex[2]/output='0;2;'
 
 whitespace[0]/output='2'
 whitespace[1]/output='2'
+
+file[0]/output/line[0]="c=111"
+file[0]/output/line[1]="d=222"
+file[1]/output="111"
+file[2]/output=""
+
diff --git a/name_value/test/name-value-get/input b/name_value/test/name-value-get/input
index e1d56b2df..36a1fce14 100644
--- a/name_value/test/name-value-get/input
+++ b/name_value/test/name-value-get/input
@@ -26,3 +26,7 @@ regex[2]="( echo a/phi=0 ; echo a/psi=1; echo a/rho=2; ) | name-value-get --rege
 
 whitespace[0]="( echo a/b/c=0; echo; echo a/b/d=1; echo; echo a/b/e=2; ) | name-value-get a/b/e"
 whitespace[1]="( echo a/b/c=0; echo a/b/d=1; echo a/b/ e =2; ) | name-value-get 'a/b/ e '"
+
+file[0]="name-value-get <( echo a/b/c=111; echo a/b/d=222 )':a/b' --unquote"
+file[1]="name-value-get <( echo a/b/c=111; echo a/b/d=222 )':a/b/c' --unquote"
+file[2]="name-value-get <( echo a/b/c=111; echo a/b/d=222 )':a/b/c/d' --unquote"

From b9c783acece951ef61584e7773cb89886dbccb0f Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 8 Aug 2024 18:23:18 +1000
Subject: [PATCH 0860/1056] name-value-get <file>:<path> tail instead of head
 of the path is used

---
 name_value/applications/name-value-get.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/name_value/applications/name-value-get.cpp b/name_value/applications/name-value-get.cpp
index ed5a01710..745992e9a 100644
--- a/name_value/applications/name-value-get.cpp
+++ b/name_value/applications/name-value-get.cpp
@@ -230,7 +230,7 @@ int main( int ac, char** av )
         std::string filename;
         if( !option_regex )
         {
-            const auto& s = comma::split_head( path_strings[0], 2, ':' );
+            const auto& s = comma::split_tail( path_strings[0], 2, ':' );
             COMMA_ASSERT_BRIEF( !option_regex || s.size() == 1 || path_strings.size() == 1, "<filename>:<path> syntax is supported only for a single query path" );
             if( s.size() == 2 ) { filename = s[0]; path_strings[0] = s[1]; }
         }

From e22132e7c6f5da25b232a517b86081ac47572a05 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 8 Aug 2024 18:46:45 +1000
Subject: [PATCH 0861/1056] name-value-convert <file>:<path> implemented

---
 .../applications/name-value-convert.cpp       | 34 +++++++++++++++----
 name_value/test/name-value-convert/expected   |  5 +++
 name_value/test/name-value-convert/input      |  4 +++
 3 files changed, 36 insertions(+), 7 deletions(-)

diff --git a/name_value/applications/name-value-convert.cpp b/name_value/applications/name-value-convert.cpp
index d38aaaca8..e61acd5e7 100644
--- a/name_value/applications/name-value-convert.cpp
+++ b/name_value/applications/name-value-convert.cpp
@@ -2,6 +2,7 @@
 
 /// @author vsevolod vlaskine
 
+#include <fstream>
 #include <iostream>
 #include <map>
 #include <boost/property_tree/info_parser.hpp>
@@ -14,6 +15,7 @@
 #include "../../application/command_line_options.h"
 #include "../../name_value/ptree.h"
 #include "../../name_value/serialize.h"
+#include "../../string/split.h"
 #include "../../xpath/xpath.h"
 
 static void usage( bool verbose = false )
@@ -26,9 +28,12 @@ static void usage( bool verbose = false )
     std::cerr << "data options" << std::endl;
     std::cerr << "    --from <format>: input format; if this options is omitted, input format will be guessed; formats: json, xml, path-value/pv" << std::endl;
     std::cerr << "    --to <format>: output format; formats: ini, json, xml, path-value (pv), dot; default: path-value" << std::endl;
-    std::cerr << "    --path=[<path>]; output data at a given path in the input" << std::endl;
-    std::cerr << "                     multiple instances of --path supported" << std::endl;
-    std::cerr << "                     regex expression support: todo" << std::endl;
+    std::cerr << "    --path=[[<filename>:]<path>]; output data at a given path in the input" << std::endl;
+    std::cerr << "                                  multiple instances of --path supported" << std::endl;
+    std::cerr << "                                  <filename> supported only for a single --path" << std::endl;
+    std::cerr << "                                  e.g. --path path/inside/json/file" << std::endl;
+    std::cerr << "                                       --path my-config.json:path/inside/json/file" << std::endl;
+    std::cerr << "                                  regex expression support: todo" << std::endl;
     std::cerr << "    --strict: return error if path specified in --path not found" << std::endl;
     std::cerr << std::endl;
     std::cerr << "formats" << std::endl;
@@ -193,7 +198,22 @@ int main( int ac, char** av )
         xml_writer_settings.indent_count = options.value( "--indent", options.exists( "--indented" ) ? 4 : 0 );
         boost::optional< char > delimiter = options.optional< char >( "--delimiter,-d" );
         path_value_delimiter = delimiter ? *delimiter : ( linewise ? ',' : '\n' );
-        const auto& paths = options.values< std::string >( "--path" );
+        auto paths = options.values< std::string >( "--path" );
+        std::string filename;
+        std::ifstream ifs;
+        if( !paths.empty() )
+        {
+            const auto& s = comma::split_tail( paths[0], 2, ':' );
+            COMMA_ASSERT_BRIEF( paths.size() == 1 || s.size() == 1, "<filename>:<path>: currently supported only for a single --path option" );
+            if( s.size() == 2 )
+            {
+                filename = s[0];
+                paths[0] = s[1];
+                ifs.open( filename );
+                COMMA_ASSERT_BRIEF( ifs.is_open(), "failed to open '" << filename << "'" );
+            }
+        }
+        std::istream& istream = filename.empty() ? static_cast< std::istream& >( std::cin ) : static_cast< std::istream& >( ifs );
         bool strict = options.exists( "--strict" );
         bool output_line_breaks = to == "path-value" && path_value_delimiter != '\n'; // hyper-quick and dirty
         if( from )
@@ -228,8 +248,8 @@ int main( int ac, char** av )
             while( std::cout.good() )
             {
                 std::string line;
-                std::getline( std::cin, line );
-                if( !std::cin.good() || std::cin.eof() ) { break; }
+                std::getline( istream, line );
+                if( !istream.good() || istream.eof() ) { break; }
                 std::istringstream iss( line );
                 boost::property_tree::ptree ptree;
                 input( iss, ptree );
@@ -257,7 +277,7 @@ int main( int ac, char** av )
         else
         {
             boost::property_tree::ptree ptree;
-            input( std::cin, ptree );
+            input( istream, ptree );
             if( paths.empty() )
             {
                 output( std::cout, ptree, indices_mode );
diff --git a/name_value/test/name-value-convert/expected b/name_value/test/name-value-convert/expected
index 7c0fd180a..ba8ce1e95 100644
--- a/name_value/test/name-value-convert/expected
+++ b/name_value/test/name-value-convert/expected
@@ -27,3 +27,8 @@ paths[12]/output='y="3";z="4";b="1";c="2";'
 paths[13]/output='y="3";'
 paths[14]/output='z="4";y="3";'
 paths[15]/output='z="4";y="3";b="1";c="2";'
+
+file[0]/output/line[0]="a=3"
+file[0]/output/line[1]="b=4"
+file[1]/output="a=3"
+file[2]/output=""
diff --git a/name_value/test/name-value-convert/input b/name_value/test/name-value-convert/input
index 84597767d..bc009d1f6 100644
--- a/name_value/test/name-value-convert/input
+++ b/name_value/test/name-value-convert/input
@@ -26,3 +26,7 @@ paths[12]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-conve
 paths[13]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/y | tr '\\n' ';'"
 paths[14]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y | tr '\\n' ';'"
 paths[15]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y --path a | tr '\\n' ';'"
+
+file[0]="name-value-convert --path <( echo x/y/a=3; echo x/y/b=4 )':x/y' --unquote"
+file[1]="name-value-convert --path <( echo x/y/a=3; echo x/y/b=4 )':x/y/a' --unquote"
+file[2]="name-value-convert --path <( echo x/y/a=3; echo x/y/b=4 )':x/y/c' --unquote"

From 628aaf63289303db156abc8abc55c45d4fd80e11 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 8 Aug 2024 19:13:58 +1000
Subject: [PATCH 0862/1056] name_value/serialize: read_*( filename, permissive,
 split_filename ) implemented

---
 name_value/serialize.h | 56 +++++++++++++++++++++++++++++++++++++++---
 1 file changed, 52 insertions(+), 4 deletions(-)

diff --git a/name_value/serialize.h b/name_value/serialize.h
index de99a9c26..9c48b100f 100644
--- a/name_value/serialize.h
+++ b/name_value/serialize.h
@@ -40,10 +40,10 @@
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
 #include "../base/exception.h"
-#include "../xpath/xpath.h"
+#include "../string/split.h"
 #include "../visiting/apply.h"
+#include "../xpath/xpath.h"
 #include "impl/json_writer.h"
-
 #include "ptree.h"
 
 namespace comma {
@@ -54,12 +54,14 @@ template < typename T > T read( const std::string& filename, const xpath& root,
 template < typename T > T read( const std::string& filename, const char* root, bool permissive );
 template < typename T > T read( const std::string& filename, const xpath& root );
 template < typename T > T read( const std::string& filename, const char* root );
+template < typename T > T read( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read( const std::string& filename, bool permissive );
 template < typename T > T read( const std::string& filename );
 template < typename T > void read( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read( T& t, const std::string& filename, const char* root );
+template < typename T > void read( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read( T& t, const std::string& filename, bool permissive );
 template < typename T > void read( T& t, const std::string& filename );
 template < typename T > T read( std::istream& stream, const xpath& root, bool permissive );
@@ -82,12 +84,14 @@ template < typename T > T read_json( const std::string& filename, const char* ro
 template < typename T > T read_json( const std::string& filename, const xpath& root );
 template < typename T > T read_json( const std::string& filename, const char* root );
 template < typename T > T read_json( const std::string& filename, bool permissive );
+template < typename T > T read_json( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read_json( const std::string& filename );
 template < typename T > void read_json( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read_json( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read_json( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read_json( T& t, const std::string& filename, const char* root );
 template < typename T > void read_json( T& t, const std::string& filename, bool permissive );
+template < typename T > void read_json( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read_json( T& t, const std::string& filename );
 template < typename T > T read_json( std::istream& stream, const xpath& root, bool permissive );
 template < typename T > T read_json( std::istream& stream, const char* root, bool permissive );
@@ -108,12 +112,14 @@ template < typename T > T read_xml( const std::string& filename, const xpath& ro
 template < typename T > T read_xml( const std::string& filename, const char* root, bool permissive );
 template < typename T > T read_xml( const std::string& filename, const xpath& root );
 template < typename T > T read_xml( const std::string& filename, const char* root );
+template < typename T > T read_xml( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read_xml( const std::string& filename, bool permissive );
 template < typename T > T read_xml( const std::string& filename );
 template < typename T > void read_xml( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read_xml( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read_xml( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read_xml( T& t, const std::string& filename, const char* root );
+template < typename T > void read_xml( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read_xml( T& t, const std::string& filename, bool permissive );
 template < typename T > void read_xml( T& t, const std::string& filename );
 template < typename T > T read_xml( std::istream& stream, const xpath& root, bool permissive );
@@ -136,11 +142,13 @@ template < typename T > T read_path_value( const std::string& filename, const ch
 template < typename T > T read_path_value( const std::string& filename, const xpath& root );
 template < typename T > T read_path_value( const std::string& filename, const char* root );
 template < typename T > T read_path_value( const std::string& filename, bool permissive );
+template < typename T > T read_path_value( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read_path_value( const std::string& filename );
 template < typename T > void read_path_value( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read_path_value( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read_path_value( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read_path_value( T& t, const std::string& filename, const char* root );
+template < typename T > void read_path_value( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read_path_value( T& t, const std::string& filename, bool permissive );
 template < typename T > void read_path_value( T& t, const std::string& filename );
 template < typename T > T read_path_value( std::istream& stream, const xpath& root, bool permissive );
@@ -162,12 +170,14 @@ template < typename T > T read_ini( const std::string& filename, const xpath& ro
 template < typename T > T read_ini( const std::string& filename, const char* root, bool permissive );
 template < typename T > T read_ini( const std::string& filename, const xpath& root );
 template < typename T > T read_ini( const std::string& filename, const char* root );
+template < typename T > T read_ini( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read_ini( const std::string& filename, bool permissive );
 template < typename T > T read_ini( const std::string& filename );
 template < typename T > void read_ini( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read_ini( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read_ini( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read_ini( T& t, const std::string& filename, const char* root );
+template < typename T > void read_ini( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read_ini( T& t, const std::string& filename, bool permissive );
 template < typename T > void read_ini( T& t, const std::string& filename );
 template < typename T > T read_ini( std::istream& stream, const xpath& root, bool permissive );
@@ -223,6 +233,15 @@ template < typename T > std::ostream& write_ini( const T& t, std::ostream& strea
 template < typename T > std::ostream& write_ini( const T& t, std::ostream& stream, const char* root );
 template < typename T > std::ostream& write_ini( const T& t, std::ostream& stream );
 
+namespace impl {
+
+inline std::pair< std::string, xpath > _split( const std::string& filename )
+{
+    const auto& s = comma::split_tail( filename, 2, ':' );
+    return s.size() == 1 ? std::pair< std::string, xpath >{ filename, xpath() } : std::pair< std::string, xpath >{ s[0], xpath( s[1] ) };
+}
+
+} // namespace impl {
 
 template < typename T > inline void read_json( T& t, const std::string& filename, const xpath& root, bool permissive )
 {
@@ -244,6 +263,7 @@ template < typename T > inline T read_json( const std::string& filename, const x
 template < typename T > inline T read_json( const std::string& filename, const char* root, bool permissive ) { return root ? read_json< T >( filename, xpath( root ), permissive ) : read_json< T >( filename, permissive ); }
 template < typename T > inline T read_json( const std::string& filename, const xpath& root ) { return read_json< T >( filename, root, true ); }
 template < typename T > inline T read_json( const std::string& filename, const char* root ) { return root ? read_json< T >( filename, xpath( root ), true ) : read_json< T >( filename, true ); }
+template < typename T > inline T read_json( const std::string& filename, bool permissive, bool split_filename ) { T t; read_json< T >( t, filename, permissive, split_filename ); return t; }
 template < typename T > inline T read_json( const std::string& filename, bool permissive ) { return read_json< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read_json( const std::string& filename ) { return read_json< T >( filename, xpath(), true ); }
 template < typename T > inline T read_json( std::istream& stream, const xpath& root, bool permissive ) { T t; read_json< T >( t, stream, root, permissive ); return t; }
@@ -255,6 +275,11 @@ template < typename T > inline T read_json( std::istream& stream ) { return read
 template < typename T > inline void read_json( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_json< T >( t, filename, xpath( root ), permissive ); } else { read_json< T >( t, filename, permissive ); } }
 template < typename T > inline void read_json( T& t, const std::string& filename, const xpath& root ) { read_json< T >( t, filename, root, true ); }
 template < typename T > inline void read_json( T& t, const std::string& filename, const char* root ) { if( root ) { read_json< T >( t, filename, xpath( root ), true ); } else { read_json< T >( t, filename, true ); } }
+template < typename T > inline void read_json( T& t, const std::string& filename, bool permissive, bool split_filename )
+{
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_json< T >( t, p.first, p.second, permissive );
+}
 template < typename T > inline void read_json( T& t, const std::string& filename, bool permissive ) { read_json< T >( t, filename, xpath(), permissive ); }
 template < typename T > inline void read_json( T& t, const std::string& filename ) { return read_json< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read_json( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_json< T >( t, stream, xpath( root ), permissive ); } else { read_json< T >( t, stream, permissive ); } }
@@ -283,6 +308,7 @@ template < typename T > inline T read_xml( const std::string& filename, const xp
 template < typename T > inline T read_xml( const std::string& filename, const char* root, bool permissive ) { return root ? read_xml< T >( filename, xpath( root ), permissive ) : read_xml< T >( filename, permissive ); }
 template < typename T > inline T read_xml( const std::string& filename, const xpath& root ) { return read_xml< T >( filename, root, true ); }
 template < typename T > inline T read_xml( const std::string& filename, const char* root ) { return root ? read_xml< T >( filename, xpath( root ), true ) : read_xml< T >( filename, true ); }
+template < typename T > inline T read_xml( const std::string& filename, bool permissive, bool split_filename ) { T t; read_xml< T >( t, filename, permissive, split_filename ); return t; }
 template < typename T > inline T read_xml( const std::string& filename, bool permissive ) { return read_xml< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read_xml( const std::string& filename ) { return read_xml< T >( filename, xpath(), true ); }
 template < typename T > inline T read_xml( std::istream& stream, const xpath& root, bool permissive ) { T t; read_xml< T >( t, stream, root, permissive ); return t; }
@@ -294,8 +320,13 @@ template < typename T > inline T read_xml( std::istream& stream ) { return read_
 template < typename T > inline void read_xml( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_xml< T >( t, filename, xpath( root ), permissive ); } else { read_xml< T >( t, filename, permissive ); } }
 template < typename T > inline void read_xml( T& t, const std::string& filename, const xpath& root ) { read_xml< T >( t, filename, root, true ); }
 template < typename T > inline void read_xml( T& t, const std::string& filename, const char* root ) { if( root ) { read_xml< T >( t, filename, xpath( root ), true ); } else { read_xml< T >( t, filename, true ); } }
+template < typename T > inline void read_xml( T& t, const std::string& filename, bool permissive, bool split_filename )
+{
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_xml< T >( t, p.first, p.second, permissive );
+}
 template < typename T > inline void read_xml( T& t, const std::string& filename, bool permissive ) { read_xml< T >( t, filename, xpath(), permissive ); }
-template < typename T > inline void read_xml( T& t, const std::string& filename ) { return read_xml< T >( t, filename, xpath(), true ); }
+template < typename T > inline void read_xml( T& t, const std::string& filename ) { read_xml< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read_xml( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_xml< T >( t, stream, xpath( root ), permissive ); } else { read_xml< T >( t, stream, permissive ); } }
 template < typename T > inline void read_xml( T& t, std::istream& stream, const xpath& root ) { read_xml< T >( t, stream, root, true ); }
 template < typename T > inline void read_xml( T& t, std::istream& stream, const char* root ) { if( root ) { read_xml< T >( t, stream, xpath( root ), true ); } else { read_xml< T >( t, stream, true ); } }
@@ -322,6 +353,7 @@ template < typename T > inline T read_path_value( const std::string& filename, c
 template < typename T > inline T read_path_value( const std::string& filename, const char* root, bool permissive ) { return root ? read_path_value< T >( filename, xpath( root ), permissive ) : read_path_value< T >( filename, permissive ); }
 template < typename T > inline T read_path_value( const std::string& filename, const xpath& root ) { return read_path_value< T >( filename, root, true ); }
 template < typename T > inline T read_path_value( const std::string& filename, const char* root ) { return root ? read_path_value< T >( filename, xpath( root ), true ) : read_path_value< T >( filename, true ); }
+template < typename T > inline T read_path_value( const std::string& filename, bool permissive, bool split_filename ) { T t; read_path_value< T >( t, filename, permissive, split_filename ); return t; }
 template < typename T > inline T read_path_value( const std::string& filename, bool permissive ) { return read_path_value< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read_path_value( const std::string& filename ) { return read_path_value< T >( filename, xpath(), true ); }
 template < typename T > inline T read_path_value( std::istream& stream, const xpath& root, bool permissive ) { T t; read_path_value< T >( t, stream, root, permissive ); return t; }
@@ -333,6 +365,11 @@ template < typename T > inline T read_path_value( std::istream& stream ) { retur
 template < typename T > inline void read_path_value( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_path_value< T >( t, filename, xpath( root ), permissive ); } else { read_path_value< T >( t, filename, permissive ); } }
 template < typename T > inline void read_path_value( T& t, const std::string& filename, const xpath& root ) { read_path_value< T >( t, filename, root, true ); }
 template < typename T > inline void read_path_value( T& t, const std::string& filename, const char* root ) { if( root ) { read_path_value< T >( t, filename, xpath( root ), true ); } else { read_path_value< T >( t, filename, true ); } }
+template < typename T > inline void read_path_value( T& t, const std::string& filename, bool permissive, bool split_filename )
+{
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_path_value< T >( t, p.first, p.second, permissive );
+}
 template < typename T > inline void read_path_value( T& t, const std::string& filename, bool permissive ) { read_path_value< T >( t, filename, xpath(), permissive ); }
 template < typename T > inline void read_path_value( T& t, const std::string& filename ) { return read_path_value< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read_path_value( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_path_value< T >( t, stream, xpath( root ), permissive ); } else { read_path_value< T >( t, stream, permissive ); } }
@@ -361,6 +398,7 @@ template < typename T > inline T read_ini( const std::string& filename, const xp
 template < typename T > inline T read_ini( const std::string& filename, const char* root, bool permissive ) { return root ? read_ini< T >( filename, xpath( root ), permissive ) : read_ini< T >( filename, permissive ); }
 template < typename T > inline T read_ini( const std::string& filename, const xpath& root ) { return read_ini< T >( filename, root, true ); }
 template < typename T > inline T read_ini( const std::string& filename, const char* root ) { return root ? read_ini< T >( filename, xpath( root ), true ) : read_ini< T >( filename, true ); }
+template < typename T > inline T read_ini( const std::string& filename, bool permissive, bool split_filename ) { T t; read_ini< T >( t, filename, permissive, split_filename ); return t; }
 template < typename T > inline T read_ini( const std::string& filename, bool permissive ) { return read_ini< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read_ini( const std::string& filename ) { return read_ini< T >( filename, xpath(), true ); }
 template < typename T > inline T read_ini( std::istream& stream, const xpath& root, bool permissive ) { T t; read_ini< T >( t, stream, root, permissive ); return t; }
@@ -372,6 +410,11 @@ template < typename T > inline T read_ini( std::istream& stream ) { return read_
 template < typename T > inline void read_ini( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_ini< T >( t, filename, xpath( root ), permissive ); } else { read_ini< T >( t, filename, permissive ); } }
 template < typename T > inline void read_ini( T& t, const std::string& filename, const xpath& root ) { read_ini< T >( t, filename, root, true ); }
 template < typename T > inline void read_ini( T& t, const std::string& filename, const char* root ) { if( root ) { read_ini< T >( t, filename, xpath( root ), true ); } else { read_ini< T >( t, filename, true ); } }
+template < typename T > inline void read_ini( T& t, const std::string& filename, bool permissive, bool split_filename )
+{
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_ini< T >( t, p.first, p.second, permissive );
+}
 template < typename T > inline void read_ini( T& t, const std::string& filename, bool permissive ) { read_ini< T >( t, filename, xpath(), permissive ); }
 template < typename T > inline void read_ini( T& t, const std::string& filename ) { return read_ini< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read_ini( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_ini< T >( t, stream, xpath( root ), permissive ); } else { read_ini< T >( t, stream, permissive ); } }
@@ -482,7 +525,6 @@ template < typename T > inline void write_ini( const T& t, const std::string& fi
 template < typename T > inline std::ostream& write_ini( const T& t, std::ostream& stream, const char* root ) { return write_ini( t, stream, xpath( root ) ); }
 template < typename T > inline std::ostream& write_ini( const T& t, std::ostream& stream ) { return write_ini( t, stream, xpath() ); }
 
-
 template < typename T > inline void read( T& t, std::istream& stream, const xpath& root, bool permissive )
 {
     boost::property_tree::ptree p;
@@ -503,6 +545,7 @@ template < typename T > inline T read( const std::string& filename, const xpath&
 template < typename T > inline T read( const std::string& filename, const char* root, bool permissive ) { return root ? read_json< T >( filename, xpath( root ), permissive ) : read< T >( filename, permissive ); }
 template < typename T > inline T read( const std::string& filename, const xpath& root ) { return read< T >( filename, root, true ); }
 template < typename T > inline T read( const std::string& filename, const char* root ) { return root ? read< T >( filename, xpath( root ), true ) : read< T >( filename, true ); }
+template < typename T > inline T read( const std::string& filename, bool permissive, bool split_filename ) { T t; read< T >( t, filename, permissive, split_filename ); return t; }
 template < typename T > inline T read( const std::string& filename, bool permissive ) { return read< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read( const std::string& filename ) { return read< T >( filename, xpath(), true ); }
 template < typename T > inline T read( std::istream& stream, const xpath& root, bool permissive ) { T t; read< T >( t, stream, root, permissive ); return t; }
@@ -514,6 +557,11 @@ template < typename T > inline T read( std::istream& stream ) { return read< T >
 template < typename T > inline void read( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read< T >( t, filename, xpath( root ), permissive ); } else { read< T >( t, filename, permissive ); } }
 template < typename T > inline void read( T& t, const std::string& filename, const xpath& root ) { read< T >( t, filename, root, true ); }
 template < typename T > inline void read( T& t, const std::string& filename, const char* root ) { if( root ) { read< T >( t, filename, xpath( root ), true ); } else { read< T >( t, filename, true ); } }
+template < typename T > inline void read( T& t, const std::string& filename, bool permissive, bool split_filename )
+{ 
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read< T >( t, p.first, p.second, permissive );
+}
 template < typename T > inline void read( T& t, const std::string& filename, bool permissive ) { read< T >( t, filename, xpath(), permissive ); }
 template < typename T > inline void read( T& t, const std::string& filename ) { return read< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read< T >( t, stream, xpath( root ), permissive ); } else { read< T >( t, stream, permissive ); } }

From 8f5ab73e62b3f21ed5443b0c6921179e89243399 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 13 Aug 2024 15:31:42 +1000
Subject: [PATCH 0863/1056] csv-repeat/period: increase test times by factor of
 ten

to make test runs more reliable and consistent
---
 csv/test/csv-repeat/period/expected | 48 ++++++++++++++++++-----------
 csv/test/csv-repeat/period/input    | 16 +++++-----
 2 files changed, 38 insertions(+), 26 deletions(-)

diff --git a/csv/test/csv-repeat/period/expected b/csv/test/csv-repeat/period/expected
index 3f3faac3c..2a51778fd 100644
--- a/csv/test/csv-repeat/period/expected
+++ b/csv/test/csv-repeat/period/expected
@@ -1,37 +1,49 @@
-ascii[0]/timestamp=0.0 +/- 0.03
+ascii[0]/timestamp=0 +/- 0.1
 ascii[0]/data=123
-ascii[1]/timestamp=0.1 +/- 0.03
+ascii[1]/timestamp=1 +/- 0.1
 ascii[1]/data=456
-ascii[2]/timestamp=0.2 +/- 0.03
+ascii[2]/timestamp=2 +/- 0.1
 ascii[2]/data=789
-ascii[3]/timestamp=0.5 +/- 0.03
+ascii[3]/timestamp=5 +/- 0.1
 ascii[3]/data=789
-ascii[4]/timestamp=0.7 +/- 0.03
+ascii[4]/timestamp=7 +/- 0.1
 ascii[4]/data=789
-ascii[5]/timestamp=0.8 +/- 0.03
+ascii[5]/timestamp=8 +/- 0.1
 ascii[5]/data=123
-ascii[6]/timestamp=0.9 +/- 0.03
+ascii[6]/timestamp=9 +/- 0.1
 ascii[6]/data=456
-ascii[7]/timestamp=1.2 +/- 0.03
+ascii[7]/timestamp=12 +/- 0.1
 ascii[7]/data=456
-ascii[8]/timestamp=1.4 +/- 0.03
+ascii[8]/timestamp=14 +/- 0.1
 ascii[8]/data=456
+ascii[9]/timestamp=16 +/- 0.1
+ascii[9]/data=456
+ascii[10]/timestamp=18 +/- 0.1
+ascii[10]/data=456
+ascii[11]/timestamp=19 +/- 0.1
+ascii[11]/data=999
 
-binary[0]/timestamp=0.0 +/- 0.03
+binary[0]/timestamp=0 +/- 0.1
 binary[0]/data=123
-binary[1]/timestamp=0.1 +/- 0.03
+binary[1]/timestamp=1 +/- 0.1
 binary[1]/data=456
-binary[2]/timestamp=0.2 +/- 0.03
+binary[2]/timestamp=2 +/- 0.1
 binary[2]/data=789
-binary[3]/timestamp=0.5 +/- 0.03
+binary[3]/timestamp=5 +/- 0.1
 binary[3]/data=789
-binary[4]/timestamp=0.7 +/- 0.03
+binary[4]/timestamp=7 +/- 0.1
 binary[4]/data=789
-binary[5]/timestamp=0.8 +/- 0.03
+binary[5]/timestamp=8 +/- 0.1
 binary[5]/data=123
-binary[6]/timestamp=0.9 +/- 0.03
+binary[6]/timestamp=9 +/- 0.1
 binary[6]/data=456
-binary[7]/timestamp=1.2 +/- 0.03
+binary[7]/timestamp=12 +/- 0.1
 binary[7]/data=456
-binary[8]/timestamp=1.4 +/- 0.03
+binary[8]/timestamp=14 +/- 0.1
 binary[8]/data=456
+binary[9]/timestamp=16 +/- 0.1
+binary[9]/data=456
+binary[10]/timestamp=18 +/- 0.1
+binary[10]/data=456
+binary[11]/timestamp=19 +/- 0.1
+binary[11]/data=999
diff --git a/csv/test/csv-repeat/period/input b/csv/test/csv-repeat/period/input
index f2e0a2acc..9919c34f2 100644
--- a/csv/test/csv-repeat/period/input
+++ b/csv/test/csv-repeat/period/input
@@ -1,10 +1,10 @@
-timeout=0.3
-period=0.2
+timeout=3
+period=2
 format=ui
 data="
-0.2,123
-0.1,456
-0.1,789
-0.6,123
-0.1,456
-1.0,999"
+0,123
+1,456
+1,789
+6,123
+1,456
+10,999"

From ce3025e9882d273b96f5db3ff5be925c4bb83d06 Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Wed, 14 Aug 2024 11:58:03 +1000
Subject: [PATCH 0864/1056] csv/applications/csv-seek:

Added a new utility for jumping to
points in files.

This only works for binary files and ASCII input streams at the moment.
---
 csv/applications/CMakeLists.txt |   4 +
 csv/applications/csv-seek.cpp   | 172 ++++++++++++++++++++++++++++++++
 2 files changed, 176 insertions(+)
 create mode 100644 csv/applications/csv-seek.cpp

diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index 1583dfff2..b0d3ed4fe 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -17,6 +17,7 @@ install( TARGETS csv-fields RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONE
 
 add_executable( csv-format ${dir}/csv-format.cpp )
 add_executable( csv-size ${dir}/csv-size.cpp )
+add_executable( csv-seek ${dir}/csv-seek.cpp )
 add_executable( csv-select ${dir}/csv-select.cpp )
 add_executable( csv-bin-cut ${dir}/csv-bin-cut.cpp )
 add_executable( csv-from-columns ${dir}/csv-from-columns.cpp )
@@ -47,6 +48,7 @@ target_link_libraries ( csv-split comma_csv comma_application comma_io comma_str
 target_link_libraries ( csv-from-columns ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string )
 target_link_libraries ( csv-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string comma_name_value )
 target_link_libraries ( csv-sort ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
+target_link_libraries ( csv-seek ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_xpath comma_string comma_name_value )
 target_link_libraries ( csv-select ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_xpath comma_string comma_name_value )
 target_link_libraries ( csv-paste ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv comma_io comma_name_value )
 target_link_libraries ( csv-time ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string comma_timing )
@@ -84,6 +86,7 @@ set_target_properties( csv-play PROPERTIES LINK_FLAGS_RELEASE -s )
 set_target_properties( csv-shape PROPERTIES LINK_FLAGS_RELEASE -s )
 set_target_properties( csv-shuffle PROPERTIES LINK_FLAGS_RELEASE -s )
 set_target_properties( csv-crc PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-seek PROPERTIES LINK_FLAGS_RELEASE -s )
 set_target_properties( csv-select PROPERTIES LINK_FLAGS_RELEASE -s )
 set_target_properties( csv-thin PROPERTIES LINK_FLAGS_RELEASE -s )
 set_target_properties( csv-analyse PROPERTIES LINK_FLAGS_RELEASE -s )
@@ -109,6 +112,7 @@ install( TARGETS csv-bin-cut
                  csv-shape
                  csv-shuffle
                  csv-crc
+                 csv-seek
                  csv-select
                  csv-thin
                  csv-analyse
diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
new file mode 100644
index 000000000..5b3c7e56a
--- /dev/null
+++ b/csv/applications/csv-seek.cpp
@@ -0,0 +1,172 @@
+#include <iostream>
+#include <fstream>
+#include "../../application/command_line_options.h"
+#include "../../csv/traits.h"
+#include "../../name_value/parser.h"
+#include "../../visiting/traits.h"
+#include "../../csv/stream.h"
+#include "../../csv/traits.h"
+
+/// @todo : Handle field name for scrubbing - should i name it selection or target or record or offset or index or grab or seek or cursor or bookmark or needle or marker...?
+///         I'm thinking 'offset'
+/// @todo: Implement index operation as well as percentage operation. I only have percentage implemented.
+
+static void usage( bool verbose = false )
+{
+    std::cerr << std::endl;
+    std::cerr << "seek through a stream to grab selected records" << std::endl;
+    std::cerr << "" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: csv-seek <operation> [<options>] <stream>" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --binary,-b=<format>: data is packets of fixed size given by <format>" << std::endl;
+    std::cerr << "                          alternatively use --size" << std::endl;
+    std::cerr << "    --size,-s=<size>: data is packets of fixed size, otherwise data is expected" << std::endl;
+    std::cerr << "                      line-wise. Alternatively use --binary" << std::endl;
+    std::cerr << "    --scrub,-s:          Input is read as a percentage of the data" << std::endl;
+    std::cerr << "    --index,-i:          grab the record at index <n> through the data" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << "examples setup" << std::endl;
+    std::cerr << "      The following examples assume you have some data to work on." << std::endl;
+    std::cerr << "      Run this to create some data to look at!" << std::endl;
+    std::cerr << "      for i in $( seq 0 1 100  ); do echo $i,$i,$i; done | csv-to-bin 3f > data.bin" << std::endl;
+    std::cerr << "examples" << std::endl;
+    std::cerr << "      Sample the records at 50% and 10% through the data:" << std::endl;
+    std::cerr << "      ( echo 0.5; echo 0.1 ) | csv-seek scrub \"data.bin;binary=3f\" | csv-from-bin 3f" << std::endl;
+    std::cerr << "" << std::endl;
+    std::cerr << "      Sample the 10th record" << std::endl;
+    std::cerr << "      ( echo 0.5; echo 0.1 ) | csv-seek scrub \"data.bin;binary=3f\" | csv-from-bin 3f" << std::endl;
+    std::cerr << "" << std::endl;
+    std::cerr << "      Scrub through a point cloud (note this example requires snark):" << std::endl;
+    std::cerr << "      csv-sliders \"percentage;min=0;max=1\" --on-change --frequency 100 | csv-seek scrub --fields=percent \"data.bin;binary=3f\" | view-points \"-;binary=3f;size=1\" << std::endl;" << std::endl;
+    std::cerr << std::endl;
+    exit( 0 );
+}
+
+std::streampos jump_to_record(const std::string& file_path, double percentage, size_t record_size, std::vector<char>& record_data) 
+{
+    std::ifstream file(file_path, std::ios::binary | std::ios::ate);
+    if (!file.is_open()) {
+        throw std::runtime_error("Unable to open file.");
+    }
+
+    std::streamsize file_size = file.tellg();
+    std::streampos target_offset = static_cast<std::streampos>(file_size * percentage);
+    std::streampos adjusted_offset = (target_offset / record_size) * record_size;
+
+    file.seekg(adjusted_offset);
+    record_data.resize(record_size);
+    file.read(record_data.data(), record_size);
+
+    if (file.gcount() != record_size) {
+        throw std::runtime_error("Unable to read a full record at the adjusted offset.");
+    }
+
+    return adjusted_offset;
+}
+
+namespace comma { namespace csv {
+struct config_t
+{
+    std::string filename;
+    std::string format;
+};
+
+struct input_t
+{
+    double offset;
+};
+
+}} // namespace comma { namespace csv {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::csv::config_t >
+{
+    template < typename K, typename V > static void visit( const K&, comma::csv::config_t& p, V& v )
+    {
+        v.apply( "filename", p.filename );
+        v.apply( "format", p.format );
+    }
+
+    template < typename K, typename V > static void visit( const K&, const comma::csv::config_t& p, V& v )
+    {
+        v.apply( "filename", p.filename );
+        v.apply( "format", p.format );
+    }
+};
+
+template <> struct traits< comma::csv::input_t >
+{
+    template < typename K, typename V > static void visit( const K&, comma::csv::input_t& p, V& v )
+    {
+        v.apply( "offset", p.offset );
+    }
+
+    template < typename K, typename V > static void visit( const K&, const comma::csv::input_t& p, V& v )
+    {
+        v.apply( "offset", p.offset );
+    }
+};
+
+} } // namespace comma { namespace visiting {
+
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        std::vector< std::string > unnamed = options.unnamed( "", "-[^;].*" );
+        comma::csv::options csv( options );
+
+        std::cerr << "unnamed.size(): " << unnamed.size() << std::endl;
+        COMMA_ASSERT( unnamed.size() > 0, "expected operation" );
+        COMMA_ASSERT( unnamed.size() > 1, "expected file" );
+        COMMA_ASSERT( unnamed.size() < 3, "Does not work on multiple streams (yet (shouuld it?))" );
+
+        std::string operation = unnamed[0];
+        COMMA_ASSERT( operation=="scrub" || operation=="index", "expected operation to be scrub or index" );
+        
+        comma::name_value::parser csv_options_parser( "filename", ';', '=', false );
+        auto stream = csv_options_parser.get< comma::csv::config_t >( unnamed[1] );
+        auto stream_csv = csv_options_parser.get< comma::csv::options >( unnamed[1] );
+        std::string filename = stream.filename;
+        COMMA_ASSERT( filename!="-", "expected filename. file scrubbing does not work on streams." );
+        COMMA_ASSERT( stream_csv.binary(), "expected binary file" );
+
+        if( operation=="scrub" ) { std::cerr << "configuring scrub operation... todo" << std::endl; }
+        else if( operation=="index" ) { std::cerr << "configuring index operation... todo" << std::endl; }
+
+        std::ifstream file(filename, std::ios::binary | std::ios::ate);
+        COMMA_ASSERT( file.is_open(), "unable to open file" );
+
+        std::streamsize file_size = file.tellg();
+        std::streampos record_size = stream_csv.format().size();
+
+        comma::csv::input_stream< comma::csv::input_t > istream( std::cin, csv );
+        while( std::cin.good() && !std::cin.eof() )
+        {
+            const comma::csv::input_t* p = istream.read();
+            if( !p ) { break; }
+
+            std::streampos target_offset = static_cast<std::streampos>(file_size * p->offset);
+            std::streampos adjusted_offset = (target_offset / record_size) * record_size;
+
+            std::vector<char> record_data;
+            file.seekg(adjusted_offset);
+            record_data.resize(record_size);
+            file.read(record_data.data(), record_size);
+            std::cout.write(record_data.data(), record_data.size());
+            if( csv.flush ) { std::cout.flush(); }
+        }
+
+        file.close();
+        return 0;
+    }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
+    return 1;
+}

From 79d80ba26d0d670bee7af83319473d73e90c1616 Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Wed, 14 Aug 2024 16:07:08 +1000
Subject: [PATCH 0865/1056] csv/applications/csv-seek:

Updated help, reformatted usage and added seek by index.
---
 csv/applications/csv-seek.cpp | 124 +++++++++++++++-------------------
 1 file changed, 53 insertions(+), 71 deletions(-)

diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
index 5b3c7e56a..0ef3518b2 100644
--- a/csv/applications/csv-seek.cpp
+++ b/csv/applications/csv-seek.cpp
@@ -7,65 +7,44 @@
 #include "../../csv/stream.h"
 #include "../../csv/traits.h"
 
-/// @todo : Handle field name for scrubbing - should i name it selection or target or record or offset or index or grab or seek or cursor or bookmark or needle or marker...?
-///         I'm thinking 'offset'
-/// @todo: Implement index operation as well as percentage operation. I only have percentage implemented.
 
 static void usage( bool verbose = false )
 {
-    std::cerr << std::endl;
-    std::cerr << "seek through a stream to grab selected records" << std::endl;
-    std::cerr << "" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: csv-seek <operation> [<options>] <stream>" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --binary,-b=<format>: data is packets of fixed size given by <format>" << std::endl;
-    std::cerr << "                          alternatively use --size" << std::endl;
-    std::cerr << "    --size,-s=<size>: data is packets of fixed size, otherwise data is expected" << std::endl;
-    std::cerr << "                      line-wise. Alternatively use --binary" << std::endl;
-    std::cerr << "    --scrub,-s:          Input is read as a percentage of the data" << std::endl;
-    std::cerr << "    --index,-i:          grab the record at index <n> through the data" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "csv options" << std::endl;
+    std::cerr << R"(
+seek through a stream to grab selected records
+usage: csv-seek <options> [<stream>]
+options
+    --binary,-b=<format>:  data is packets of fixed size given by <format>
+                           alternatively use --size
+    --fields=[<fields>]:   index(default) - find record by index  
+                           ratio - find record as a proportion of the file size"
+
+    --size,-s=<size>:      [todo] data is packets of fixed size, otherwise data is expected
+                           line-wise. Alternatively use --binary" << std::endl
+csv options
+)";
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
-    std::cerr << "examples setup" << std::endl;
-    std::cerr << "      The following examples assume you have some data to work on." << std::endl;
-    std::cerr << "      Run this to create some data to look at!" << std::endl;
-    std::cerr << "      for i in $( seq 0 1 100  ); do echo $i,$i,$i; done | csv-to-bin 3f > data.bin" << std::endl;
     std::cerr << "examples" << std::endl;
-    std::cerr << "      Sample the records at 50% and 10% through the data:" << std::endl;
-    std::cerr << "      ( echo 0.5; echo 0.1 ) | csv-seek scrub \"data.bin;binary=3f\" | csv-from-bin 3f" << std::endl;
-    std::cerr << "" << std::endl;
-    std::cerr << "      Sample the 10th record" << std::endl;
-    std::cerr << "      ( echo 0.5; echo 0.1 ) | csv-seek scrub \"data.bin;binary=3f\" | csv-from-bin 3f" << std::endl;
-    std::cerr << "" << std::endl;
-    std::cerr << "      Scrub through a point cloud (note this example requires snark):" << std::endl;
-    std::cerr << "      csv-sliders \"percentage;min=0;max=1\" --on-change --frequency 100 | csv-seek scrub --fields=percent \"data.bin;binary=3f\" | view-points \"-;binary=3f;size=1\" << std::endl;" << std::endl;
-    std::cerr << std::endl;
-    exit( 0 );
-}
-
-std::streampos jump_to_record(const std::string& file_path, double percentage, size_t record_size, std::vector<char>& record_data) 
-{
-    std::ifstream file(file_path, std::ios::binary | std::ios::ate);
-    if (!file.is_open()) {
-        throw std::runtime_error("Unable to open file.");
-    }
+    if( verbose ) { std::cerr << R"(    examples setup
+      The following examples assume you have some data to work on.
+      Run this to create some data to look at!
+      csv-paste 'line-number;binary=ui' --head 100 > data.bin
 
-    std::streamsize file_size = file.tellg();
-    std::streampos target_offset = static_cast<std::streampos>(file_size * percentage);
-    std::streampos adjusted_offset = (target_offset / record_size) * record_size;
+      Sample the records at 50% and 10% through the data:
+      ( echo 0.5; echo 0.1 ) | csv-seek --fields=ratio \"data.bin;binary=f\" | csv-from-bin f
 
-    file.seekg(adjusted_offset);
-    record_data.resize(record_size);
-    file.read(record_data.data(), record_size);
+      Sample the 10th record
+      echo 10 | csv-seek \"data.bin;binary=12f\" | csv-from-bin f
 
-    if (file.gcount() != record_size) {
-        throw std::runtime_error("Unable to read a full record at the adjusted offset.");
+      Scrub through a point cloud (note this example requires snark):
+      csv-sliders \"percentage;min=0;max=1\" --on-change --frequency 100 | csv-seek --fields=ratio --flush \"data.bin;binary=ui\" | csv-from-bin ui --flush
+)";
     }
-
-    return adjusted_offset;
+    else
+    {
+        std::cerr << "    see --help --verbose for more help" << std::endl;
+    }
+    exit( 0 );
 }
 
 namespace comma { namespace csv {
@@ -77,7 +56,11 @@ struct config_t
 
 struct input_t
 {
-    double offset;
+    double ratio{0};
+    std::uint32_t index{0};
+    std::uint32_t block{0}; // todo in some vague future
+
+    std::uint32_t get_index( std::size_t size, bool use_ratio ) const { return use_ratio ? static_cast<std::uint32_t>(size * ratio) : index; }
 };
 
 }} // namespace comma { namespace csv {
@@ -103,12 +86,16 @@ template <> struct traits< comma::csv::input_t >
 {
     template < typename K, typename V > static void visit( const K&, comma::csv::input_t& p, V& v )
     {
-        v.apply( "offset", p.offset );
+        v.apply( "ratio", p.ratio );
+        v.apply( "index", p.index );
+        v.apply( "block", p.block );
     }
 
     template < typename K, typename V > static void visit( const K&, const comma::csv::input_t& p, V& v )
     {
-        v.apply( "offset", p.offset );
+        v.apply( "ratio", p.ratio );
+        v.apply( "index", p.index );
+        v.apply( "block", p.block );
     }
 };
 
@@ -119,29 +106,22 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        std::vector< std::string > unnamed = options.unnamed( "", "-[^;].*" );
-        comma::csv::options csv( options );
+        std::vector< std::string > unnamed = options.unnamed( "--flush,-v,--verbose,", "-.*" );
+        comma::csv::options csv( options, "index" );
+        COMMA_ASSERT_BRIEF( csv.has_field( "ratio" ) != csv.has_field( "index" ), "please specify either 'ratio' or 'index' (but not both) in --fields" );
 
-        std::cerr << "unnamed.size(): " << unnamed.size() << std::endl;
-        COMMA_ASSERT( unnamed.size() > 0, "expected operation" );
-        COMMA_ASSERT( unnamed.size() > 1, "expected file" );
-        COMMA_ASSERT( unnamed.size() < 3, "Does not work on multiple streams (yet (shouuld it?))" );
+        COMMA_ASSERT_BRIEF( unnamed.size() > 0, "expected file or stream (todo)" );
+        COMMA_ASSERT_BRIEF( unnamed.size() < 2, "Does not work on multiple streams (yet (shouuld it?))" );
 
-        std::string operation = unnamed[0];
-        COMMA_ASSERT( operation=="scrub" || operation=="index", "expected operation to be scrub or index" );
-        
         comma::name_value::parser csv_options_parser( "filename", ';', '=', false );
-        auto stream = csv_options_parser.get< comma::csv::config_t >( unnamed[1] );
-        auto stream_csv = csv_options_parser.get< comma::csv::options >( unnamed[1] );
+        auto stream = csv_options_parser.get< comma::csv::config_t >( unnamed[0] );
+        auto stream_csv = csv_options_parser.get< comma::csv::options >( unnamed[0] );
         std::string filename = stream.filename;
-        COMMA_ASSERT( filename!="-", "expected filename. file scrubbing does not work on streams." );
-        COMMA_ASSERT( stream_csv.binary(), "expected binary file" );
-
-        if( operation=="scrub" ) { std::cerr << "configuring scrub operation... todo" << std::endl; }
-        else if( operation=="index" ) { std::cerr << "configuring index operation... todo" << std::endl; }
+        COMMA_ASSERT_BRIEF( filename!="-", "expected filename. file scrubbing does not work on streams." );
+        COMMA_ASSERT_BRIEF( stream_csv.binary(), "expected binary file" );
 
         std::ifstream file(filename, std::ios::binary | std::ios::ate);
-        COMMA_ASSERT( file.is_open(), "unable to open file" );
+        COMMA_ASSERT_BRIEF( file.is_open(), "unable to open file" );
 
         std::streamsize file_size = file.tellg();
         std::streampos record_size = stream_csv.format().size();
@@ -152,9 +132,11 @@ int main( int ac, char** av )
             const comma::csv::input_t* p = istream.read();
             if( !p ) { break; }
 
-            std::streampos target_offset = static_cast<std::streampos>(file_size * p->offset);
+            std::uint32_t index = p->get_index( file_size, csv.has_field( "ratio" ) );
+            std::streampos target_offset = index;
             std::streampos adjusted_offset = (target_offset / record_size) * record_size;
 
+            if (adjusted_offset >= file_size) { std::cerr << "index out of bounds" << std::endl; continue; }
             std::vector<char> record_data;
             file.seekg(adjusted_offset);
             record_data.resize(record_size);

From 10b4fcd87f08fc6363d1cc02efed936a3d98498a Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Wed, 14 Aug 2024 16:49:30 +1000
Subject: [PATCH 0866/1056] csv-seek: testing...

---
 csv/test/csv-seek/data.bin | Bin 0 -> 40 bytes
 csv/test/csv-seek/expected |   4 ++++
 csv/test/csv-seek/input    |   8 ++++++++
 3 files changed, 12 insertions(+)
 create mode 100644 csv/test/csv-seek/data.bin
 create mode 100644 csv/test/csv-seek/expected
 create mode 100644 csv/test/csv-seek/input

diff --git a/csv/test/csv-seek/data.bin b/csv/test/csv-seek/data.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2c6aacdecdc212596c5e82ae940eaaa7de2f9437
GIT binary patch
literal 40
fcmWN=i46cC3<RLl`gQ+>g@hy-PRr%?czw1X0=xh&

literal 0
HcmV?d00001

diff --git a/csv/test/csv-seek/expected b/csv/test/csv-seek/expected
new file mode 100644
index 000000000..4e8303fbd
--- /dev/null
+++ b/csv/test/csv-seek/expected
@@ -0,0 +1,4 @@
+index[0]/output/line[0]="0"
+index[0]/output/line[1]="3"
+index[0]/output/line[2]="5"
+index[0]/output/line[3]="9"
diff --git a/csv/test/csv-seek/input b/csv/test/csv-seek/input
new file mode 100644
index 000000000..226c5480b
--- /dev/null
+++ b/csv/test/csv-seek/input
@@ -0,0 +1,8 @@
+#index[0]="( echo 0; echo 3; echo 5; echo 9 ) | csv-seek \'data.bin;binary=ui\'"
+index[0]="( echo 0; echo 3; echo 5; echo 9 ) | csv-seek 'data.bin;binary=ui' | csv-from-bin ui"
+# index[0]="( echo a,0; echo b,1 ) | csv-join <( echo s,0; echo t,0; echo x,1; echo y,1 )';fields=,block'"
+#index[1]="( echo 0; echo 3; echo 5; echo 9 ) | csv-to-bin ui | csv-seek --binary=ui \'data.bin;binary=ui\'"
+#index[2]="( echo a,0; echo b,3; echo c,5 ) | csv-seek --fields ,index \'data.bin;binary=ui\'"
+#index[3]="( echo 0,0; echo 1,3; echo 2,5 ) | csv-to-bin ui | csv-seek --fields ,index --binary=2ui \'data.bin;binary=ui\'"
+
+# todo! ratio tests

From 6dd345f4d2f848b0f5daa089f47f7e01cabdc6dd Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Wed, 14 Aug 2024 16:51:37 +1000
Subject: [PATCH 0867/1056] csv-seek: testing: tests made optional for now
 while debugging

---
 csv/test/csv-seek/expected | 8 ++++----
 csv/test/csv-seek/optional | 0
 2 files changed, 4 insertions(+), 4 deletions(-)
 create mode 100644 csv/test/csv-seek/optional

diff --git a/csv/test/csv-seek/expected b/csv/test/csv-seek/expected
index 4e8303fbd..51eb95386 100644
--- a/csv/test/csv-seek/expected
+++ b/csv/test/csv-seek/expected
@@ -1,4 +1,4 @@
-index[0]/output/line[0]="0"
-index[0]/output/line[1]="3"
-index[0]/output/line[2]="5"
-index[0]/output/line[3]="9"
+# index[0]/output/line[0]="0"
+# index[0]/output/line[1]="3"
+# index[0]/output/line[2]="5"
+# index[0]/output/line[3]="9"
diff --git a/csv/test/csv-seek/optional b/csv/test/csv-seek/optional
new file mode 100644
index 000000000..e69de29bb

From 0fa63d8a6a1a90bc5b5a49b798c2f70d1613a15d Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Wed, 14 Aug 2024 16:52:55 +1000
Subject: [PATCH 0868/1056] csv-seek: testing: expected: uncommented

---
 csv/test/csv-seek/expected | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/csv/test/csv-seek/expected b/csv/test/csv-seek/expected
index 51eb95386..e167096e2 100644
--- a/csv/test/csv-seek/expected
+++ b/csv/test/csv-seek/expected
@@ -1,4 +1,6 @@
-# index[0]/output/line[0]="0"
-# index[0]/output/line[1]="3"
-# index[0]/output/line[2]="5"
-# index[0]/output/line[3]="9"
+index[0]/output/line[0]="0"
+index[0]/output/line[1]="3"
+index[0]/output/line[2]="5"
+index[0]/output/line[3]="9"
+
+

From 40ed6a6bece0ee6f1e163f6b6c44160565c129dd Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 14 Aug 2024 18:12:08 +1000
Subject: [PATCH 0869/1056] comma-test-run: a quick fix added for
 comma-test-run not to stray outside of git repositories

---
 util/applications/comma-test-run | 18 +++++++-----------
 1 file changed, 7 insertions(+), 11 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 2017f1ab9..c36c5b9f0 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -392,19 +392,15 @@ function closest_file_in_path()
 {
     local path="$1"
     local file="$2"
-    
-    # sanity check (and avoid infinite loop)
-    if [[ -z "$path" || -z "$file" ]]; then echo "$name: error: empty path in closest_file_in_path()" >&2; exit 1; fi
-    # get canonical name (so path always starts with "/")
-    path=$( readlink -e "$path" )
-
+    [[ -n "$path" && -n "$file" ]] || { echo "$name: error: empty path in closest_file_in_path()" >&2; exit 1; }
+    path=$( readlink -e "$path" ) # get canonical name (so path always starts with "/")
     while true; do
         if [[ -d "$path/$file" ]]; then
-            echo "$name: warning: \"$path/$file\" is a directory (expected an executable script); ignoring" >&2
+            echo "$name: warning: '$path/$file' is a directory (expected an executable script); ignoring" >&2
         elif [[ -f "$path/$file" ]]; then
-            if [[ $file == "test" && ! -x "$path/$file" ]]; then echo "$name: warning: \"$path/$file\" is not executable; ignoring" >&2 
-            else echo $path/$file; break; fi
-        elif [[ $path == "/" ]]; then break
+            if [[ $file == "test" && ! -x "$path/$file" ]]; then echo "$name: warning: '$path/$file' is not executable; ignoring" >&2 
+            else echo "$path/$file"; break; fi
+        elif [[ "$path" == "/" || -d "$path/.git" ]]; then break # super-quick and dirty: stop on .git directory, otherwise it leads to bizarre errors, e.g. when there is a file 'config' or 'test' outside of git repository 
         fi
         path=$( dirname "$path" )
     done
@@ -803,7 +799,7 @@ function run_single_test()
     elif disabled_ "optional" "$dir" "$options_run_optional" ; then
         warning_ "$name: test $counter: $dir: optional, skipped"
     else
-        test_exec=$( closest_file_in_path "$dir" "test" )
+        test_exec=$( closest_file_in_path "$dir" test )
         if [[ -z "$test_exec" ]]; then
             error_ "$name: error: no \"test\" script found in any parent directory of $dir"
             result=1

From c529e1107d91c3e00b618c571869aa00c8861315 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 14 Aug 2024 18:17:15 +1000
Subject: [PATCH 0870/1056] comma-test-run: --root-path: todo placeholder added

---
 util/applications/comma-test-run | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index c36c5b9f0..dacf9a0b8 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -102,6 +102,7 @@ function description_others()
 --output-junit,--junit=[<file>]; output to file junit record compatible with jenkins for each test
 --output-stdout,--stdout; output test results to stdout as <dir>,<status>, <status>: success, failed, timeout, disabled
 --path=[<dir>]; data-storage directory for tests, default: none, let the tests define it
+--root-path,--root=[<dir>]; todo: do not accend beyond this path while searching for specially-named files, e.g. 'test' or 'config'
 --test-option=[<option>]; extra command line argument(s) pass to "test" script
 
 --quiet,-q; minimize output
@@ -1017,6 +1018,7 @@ comma_path_value_to_var --export --prefix=options < <( default_options )
 options_path_value="$( description | comma-options-to-name-value $@ )"
 comma_path_value_to_var --export --prefix=options <<<"$options_path_value"
 
+[[ -z "$options_root_path" ]] || { error_ "$name: --root-path: todo, just ask"; exit 1; }
 options_test_option=$( echo "$options_path_value" |  grep "^test-option=" | cut -d'=' -f2- | sed 's#^"##;s#"$##' | tr '\n' ' ' )
 
 # and perform sanity check

From f77ee4d486b54f36190866333a2d67c891c96445 Mon Sep 17 00:00:00 2001
From: aspen <aspen@aspen>
Date: Thu, 15 Aug 2024 00:03:11 +1000
Subject: [PATCH 0871/1056] csv/applications/csv-seek: made existing index and
 ratio tests work.

---
 csv/applications/csv-seek.cpp | 10 +++++-----
 csv/test/csv-seek/expected    | 19 +++++++++++++++++--
 csv/test/csv-seek/input       | 12 +++++-------
 3 files changed, 27 insertions(+), 14 deletions(-)

diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
index 0ef3518b2..f9a63fb4f 100644
--- a/csv/applications/csv-seek.cpp
+++ b/csv/applications/csv-seek.cpp
@@ -31,13 +31,13 @@ csv options
       csv-paste 'line-number;binary=ui' --head 100 > data.bin
 
       Sample the records at 50% and 10% through the data:
-      ( echo 0.5; echo 0.1 ) | csv-seek --fields=ratio \"data.bin;binary=f\" | csv-from-bin f
+      ( echo 0.5; echo 0.1 ) | csv-seek --fields=ratio "data.bin;binary=f" | csv-from-bin f
 
       Sample the 10th record
-      echo 10 | csv-seek \"data.bin;binary=12f\" | csv-from-bin f
+      echo 10 | csv-seek "data.bin;binary=12f" | csv-from-bin f
 
       Scrub through a point cloud (note this example requires snark):
-      csv-sliders \"percentage;min=0;max=1\" --on-change --frequency 100 | csv-seek --fields=ratio --flush \"data.bin;binary=ui\" | csv-from-bin ui --flush
+      csv-sliders "percentage;min=0;max=1" --on-change --frequency 100 | csv-seek --fields=ratio --flush "data.bin;binary=ui" | csv-from-bin ui --flush
 )";
     }
     else
@@ -60,7 +60,7 @@ struct input_t
     std::uint32_t index{0};
     std::uint32_t block{0}; // todo in some vague future
 
-    std::uint32_t get_index( std::size_t size, bool use_ratio ) const { return use_ratio ? static_cast<std::uint32_t>(size * ratio) : index; }
+    std::uint32_t get_index( std::size_t filesize, std::size_t record_size, bool use_ratio ) const { return use_ratio ? static_cast<std::uint32_t>(filesize * ratio) : index*record_size; }
 };
 
 }} // namespace comma { namespace csv {
@@ -132,7 +132,7 @@ int main( int ac, char** av )
             const comma::csv::input_t* p = istream.read();
             if( !p ) { break; }
 
-            std::uint32_t index = p->get_index( file_size, csv.has_field( "ratio" ) );
+            std::uint32_t index = p->get_index( file_size, record_size, csv.has_field( "ratio" ) );
             std::streampos target_offset = index;
             std::streampos adjusted_offset = (target_offset / record_size) * record_size;
 
diff --git a/csv/test/csv-seek/expected b/csv/test/csv-seek/expected
index e167096e2..afa1761cc 100644
--- a/csv/test/csv-seek/expected
+++ b/csv/test/csv-seek/expected
@@ -2,5 +2,20 @@ index[0]/output/line[0]="0"
 index[0]/output/line[1]="3"
 index[0]/output/line[2]="5"
 index[0]/output/line[3]="9"
-
-
+index[1]/output/line[0]="0"
+index[1]/output/line[1]="3"
+index[1]/output/line[2]="5"
+index[1]/output/line[3]="9"
+index[2]/output/line[0]="0"
+index[2]/output/line[1]="3"
+index[2]/output/line[2]="5"
+index[3]/output/line[0]="0"
+index[3]/output/line[1]="3"
+index[3]/output/line[2]="5"
+index[4]/output/line[0]="0"
+index[4]/output/line[1]="3"
+index[4]/output/line[2]="5"
+index[4]/output/line[3]="9"
+index[5]/output/line[0]="0"
+index[5]/output/line[1]="3"
+index[5]/output/line[2]="5"
diff --git a/csv/test/csv-seek/input b/csv/test/csv-seek/input
index 226c5480b..4058c6503 100644
--- a/csv/test/csv-seek/input
+++ b/csv/test/csv-seek/input
@@ -1,8 +1,6 @@
-#index[0]="( echo 0; echo 3; echo 5; echo 9 ) | csv-seek \'data.bin;binary=ui\'"
 index[0]="( echo 0; echo 3; echo 5; echo 9 ) | csv-seek 'data.bin;binary=ui' | csv-from-bin ui"
-# index[0]="( echo a,0; echo b,1 ) | csv-join <( echo s,0; echo t,0; echo x,1; echo y,1 )';fields=,block'"
-#index[1]="( echo 0; echo 3; echo 5; echo 9 ) | csv-to-bin ui | csv-seek --binary=ui \'data.bin;binary=ui\'"
-#index[2]="( echo a,0; echo b,3; echo c,5 ) | csv-seek --fields ,index \'data.bin;binary=ui\'"
-#index[3]="( echo 0,0; echo 1,3; echo 2,5 ) | csv-to-bin ui | csv-seek --fields ,index --binary=2ui \'data.bin;binary=ui\'"
-
-# todo! ratio tests
+index[1]="( echo 0; echo 3; echo 5; echo 9 ) | csv-to-bin ui | csv-seek --binary=ui \'data.bin;binary=ui\' | csv-from-bin ui"
+index[2]="( echo a,0; echo b,3; echo c,5 ) | csv-seek --fields ,index 'data.bin;binary=ui' | csv-from-bin ui"
+index[3]="( echo 0,0; echo 1,3; echo 2,5 ) | csv-to-bin 2ui | csv-seek --fields ,index --binary=2ui 'data.bin;binary=ui' | csv-from-bin ui"
+index[4]="( echo 0; echo 0.30; echo 0.5; echo 0.9 ) | csv-seek --fields ratio 'data.bin;binary=ui' | csv-from-bin ui"
+index[5]="( echo 0,0; echo 1,0.3; echo 2,0.5  ) | csv-to-bin ui,f | csv-seek --fields ,ratio --binary=ui,f 'data.bin;binary=ui' | csv-from-bin ui"

From bb387515a5f5acb1ce9039e320133a64cab6927b Mon Sep 17 00:00:00 2001
From: aspen <aspen@aspen>
Date: Thu, 15 Aug 2024 00:54:47 +1000
Subject: [PATCH 0872/1056] csv/application/csv-seek: larger files (such as
 video streams) require int 64

---
 csv/applications/csv-seek.cpp | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
index f9a63fb4f..1482052ca 100644
--- a/csv/applications/csv-seek.cpp
+++ b/csv/applications/csv-seek.cpp
@@ -60,7 +60,7 @@ struct input_t
     std::uint32_t index{0};
     std::uint32_t block{0}; // todo in some vague future
 
-    std::uint32_t get_index( std::size_t filesize, std::size_t record_size, bool use_ratio ) const { return use_ratio ? static_cast<std::uint32_t>(filesize * ratio) : index*record_size; }
+    std::uint64_t get_index( std::size_t filesize, std::size_t record_size, bool use_ratio ) const { return use_ratio ? static_cast<std::uint64_t>(filesize * ratio) : index*record_size; }
 };
 
 }} // namespace comma { namespace csv {
@@ -132,9 +132,9 @@ int main( int ac, char** av )
             const comma::csv::input_t* p = istream.read();
             if( !p ) { break; }
 
-            std::uint32_t index = p->get_index( file_size, record_size, csv.has_field( "ratio" ) );
-            std::streampos target_offset = index;
-            std::streampos adjusted_offset = (target_offset / record_size) * record_size;
+            std::streampos index = p->get_index( file_size, record_size, csv.has_field( "ratio" ) );
+            std::cerr << "seeking to index:" << index << " with file size:" << file_size << " and record size:" << record_size << std::endl;
+            std::streampos adjusted_offset = (index / record_size) * record_size;
 
             if (adjusted_offset >= file_size) { std::cerr << "index out of bounds" << std::endl; continue; }
             std::vector<char> record_data;

From f250e342ae1fb183c7a94b90d0ebb68f31bc9f02 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 15 Aug 2024 15:34:23 +1000
Subject: [PATCH 0873/1056] csv-seek: --help: examples brushed up, colour hue
 example added

---
 csv/applications/csv-seek.cpp | 39 ++++++++++++++++++++++++-----------
 1 file changed, 27 insertions(+), 12 deletions(-)

diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
index 1482052ca..c1159f124 100644
--- a/csv/applications/csv-seek.cpp
+++ b/csv/applications/csv-seek.cpp
@@ -26,18 +26,33 @@ csv options
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
     std::cerr << "examples" << std::endl;
     if( verbose ) { std::cerr << R"(    examples setup
-      The following examples assume you have some data to work on.
-      Run this to create some data to look at!
-      csv-paste 'line-number;binary=ui' --head 100 > data.bin
-
-      Sample the records at 50% and 10% through the data:
-      ( echo 0.5; echo 0.1 ) | csv-seek --fields=ratio "data.bin;binary=f" | csv-from-bin f
-
-      Sample the 10th record
-      echo 10 | csv-seek "data.bin;binary=12f" | csv-from-bin f
-
-      Scrub through a point cloud (note this example requires snark):
-      csv-sliders "percentage;min=0;max=1" --on-change --frequency 100 | csv-seek --fields=ratio --flush "data.bin;binary=ui" | csv-from-bin ui --flush
+        basics
+            make data file
+                csv-paste 'line-number;binary=ui' --head 100 > data.bin
+
+            sample the records at 50% and 10% through the data:
+                ( echo 0.5; echo 0.1 ) | csv-seek --fields=ratio "data.bin;binary=ui" | csv-from-bin ui
+
+            sample the 10th record
+                echo 10 | csv-seek "data.bin;binary=ui" | csv-from-bin ui
+
+        colour hue (you would need snark installed with graphics and imaging enabled)
+            make data file
+                ( csv-paste value=255 value=0 line-number --head 256; \
+                    csv-paste 'line-number;begin=255;step=-1' line-number value=255 --head 256; \
+                    csv-paste value=0 value=255 'line-number;begin=255;step=-1' --head 256; \
+                    csv-paste line-number value=255 value=0 --head 256; \
+                    csv-paste value=255 'line-number;begin=255;step=-1' value=0 --head 256 ) \
+                    | csv-to-bin 3ub \
+                    > colour-wheel.bin
+            sample colour hue
+                csv-sliders 'hue;min=0;max=1;step=0.0001' \
+                            --frequency 10 \
+                            --window-geometry=0,0,400,60 \
+                            --title='examples: hue selection' \
+                    | csv-seek --fields ratio 'colour-wheel.bin;binary=3ub' --flush \
+                    | cv-cat --input 'rows=1;cols=1;no-header;type=3ub' \
+                             'resize=400;view=,examples: hue selection,,0,130;null'
 )";
     }
     else

From 406187172da50fff2cbc2a69ae2092bedcafc53f Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Thu, 15 Aug 2024 17:24:45 +1000
Subject: [PATCH 0874/1056] csv/applications/csv-seek: removed debugging
 prints; added permissive option to allow out-of-bounds input; updated
 tests

---
 csv/applications/csv-seek.cpp | 20 +++++++++++---------
 csv/test/csv-seek/expected    | 18 +++++++++++-------
 csv/test/csv-seek/input       |  6 ++++--
 csv/test/csv-seek/optional    |  0
 4 files changed, 26 insertions(+), 18 deletions(-)
 delete mode 100644 csv/test/csv-seek/optional

diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
index c1159f124..00773f653 100644
--- a/csv/applications/csv-seek.cpp
+++ b/csv/applications/csv-seek.cpp
@@ -14,10 +14,7 @@ static void usage( bool verbose = false )
 seek through a stream to grab selected records
 usage: csv-seek <options> [<stream>]
 options
-    --binary,-b=<format>:  data is packets of fixed size given by <format>
-                           alternatively use --size
-    --fields=[<fields>]:   index(default) - find record by index  
-                           ratio - find record as a proportion of the file size"
+    --permissive,-p:       permissive mode: skip out-of-bounds input records instead of exiting with error
 
     --size,-s=<size>:      [todo] data is packets of fixed size, otherwise data is expected
                            line-wise. Alternatively use --binary" << std::endl
@@ -50,7 +47,7 @@ csv options
                             --frequency 10 \
                             --window-geometry=0,0,400,60 \
                             --title='examples: hue selection' \
-                    | csv-seek --fields ratio 'colour-wheel.bin;binary=3ub' --flush \
+                    | csv-seek --permissive --fields ratio 'colour-wheel.bin;binary=3ub' --flush \
                     | cv-cat --input 'rows=1;cols=1;no-header;type=3ub' \
                              'resize=400;view=,examples: hue selection,,0,130;null'
 )";
@@ -121,11 +118,12 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        std::vector< std::string > unnamed = options.unnamed( "--flush,-v,--verbose,", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--flush,-v,--verbose,--permissive,-p,--size", "-.*" );
         comma::csv::options csv( options, "index" );
+        bool permissive = options.exists( "--permissive,-p" );
         COMMA_ASSERT_BRIEF( csv.has_field( "ratio" ) != csv.has_field( "index" ), "please specify either 'ratio' or 'index' (but not both) in --fields" );
 
-        COMMA_ASSERT_BRIEF( unnamed.size() > 0, "expected file or stream (todo)" );
+        COMMA_ASSERT_BRIEF( unnamed.size() > 0, "expected file (or stream, todo)" );
         COMMA_ASSERT_BRIEF( unnamed.size() < 2, "Does not work on multiple streams (yet (shouuld it?))" );
 
         comma::name_value::parser csv_options_parser( "filename", ';', '=', false );
@@ -148,10 +146,14 @@ int main( int ac, char** av )
             if( !p ) { break; }
 
             std::streampos index = p->get_index( file_size, record_size, csv.has_field( "ratio" ) );
-            std::cerr << "seeking to index:" << index << " with file size:" << file_size << " and record size:" << record_size << std::endl;
             std::streampos adjusted_offset = (index / record_size) * record_size;
 
-            if (adjusted_offset >= file_size) { std::cerr << "index out of bounds" << std::endl; continue; }
+            if (adjusted_offset >= file_size) 
+            { 
+                comma::saymore() <<  "index out of bounds" << std::endl; 
+                if( permissive ) { continue; }
+                return 1;
+            }
             std::vector<char> record_data;
             file.seekg(adjusted_offset);
             record_data.resize(record_size);
diff --git a/csv/test/csv-seek/expected b/csv/test/csv-seek/expected
index afa1761cc..c711b4f31 100644
--- a/csv/test/csv-seek/expected
+++ b/csv/test/csv-seek/expected
@@ -12,10 +12,14 @@ index[2]/output/line[2]="5"
 index[3]/output/line[0]="0"
 index[3]/output/line[1]="3"
 index[3]/output/line[2]="5"
-index[4]/output/line[0]="0"
-index[4]/output/line[1]="3"
-index[4]/output/line[2]="5"
-index[4]/output/line[3]="9"
-index[5]/output/line[0]="0"
-index[5]/output/line[1]="3"
-index[5]/output/line[2]="5"
+index[4]/output=""
+index[4]/status=1
+index[5]/output=""
+index[5]/status=0
+offset[1]/output/line[0]="0"
+offset[1]/output/line[1]="3"
+offset[1]/output/line[2]="5"
+offset[1]/output/line[3]="9"
+offset[2]/output/line[0]="0"
+offset[2]/output/line[1]="3"
+offset[2]/output/line[2]="5"
diff --git a/csv/test/csv-seek/input b/csv/test/csv-seek/input
index 4058c6503..8d3de473e 100644
--- a/csv/test/csv-seek/input
+++ b/csv/test/csv-seek/input
@@ -2,5 +2,7 @@ index[0]="( echo 0; echo 3; echo 5; echo 9 ) | csv-seek 'data.bin;binary=ui' | c
 index[1]="( echo 0; echo 3; echo 5; echo 9 ) | csv-to-bin ui | csv-seek --binary=ui \'data.bin;binary=ui\' | csv-from-bin ui"
 index[2]="( echo a,0; echo b,3; echo c,5 ) | csv-seek --fields ,index 'data.bin;binary=ui' | csv-from-bin ui"
 index[3]="( echo 0,0; echo 1,3; echo 2,5 ) | csv-to-bin 2ui | csv-seek --fields ,index --binary=2ui 'data.bin;binary=ui' | csv-from-bin ui"
-index[4]="( echo 0; echo 0.30; echo 0.5; echo 0.9 ) | csv-seek --fields ratio 'data.bin;binary=ui' | csv-from-bin ui"
-index[5]="( echo 0,0; echo 1,0.3; echo 2,0.5  ) | csv-to-bin ui,f | csv-seek --fields ,ratio --binary=ui,f 'data.bin;binary=ui' | csv-from-bin ui"
+index[4]="( echo 200; ) | csv-seek 'data.bin;binary=ui' >/dev/null"
+index[5]="( echo 200; ) | csv-seek --permissive 'data.bin;binary=ui' >/dev/null"
+offset[1]="( echo 0; echo 0.30; echo 0.5; echo 0.9 ) | csv-seek --fields ratio 'data.bin;binary=ui' | csv-from-bin ui"
+offset[2]="( echo 0,0; echo 1,0.3; echo 2,0.5  ) | csv-to-bin ui,f | csv-seek --fields ,ratio --binary=ui,f 'data.bin;binary=ui' | csv-from-bin ui"
diff --git a/csv/test/csv-seek/optional b/csv/test/csv-seek/optional
deleted file mode 100644
index e69de29bb..000000000

From abffdd2b44d661f9dd99a77ed279797b5e8c77d2 Mon Sep 17 00:00:00 2001
From: Aspen Eyers <aspen.eyers@missionsystems.com.au>
Date: Thu, 15 Aug 2024 17:29:53 +1000
Subject: [PATCH 0875/1056] csv/applications/csv-seek: updated tests with more
 explicit naming

---
 csv/test/csv-seek/expected | 44 ++++++++++++++++++++++----------------
 csv/test/csv-seek/input    | 13 +++++------
 2 files changed, 33 insertions(+), 24 deletions(-)

diff --git a/csv/test/csv-seek/expected b/csv/test/csv-seek/expected
index c711b4f31..f6c826eff 100644
--- a/csv/test/csv-seek/expected
+++ b/csv/test/csv-seek/expected
@@ -1,25 +1,33 @@
-index[0]/output/line[0]="0"
-index[0]/output/line[1]="3"
-index[0]/output/line[2]="5"
-index[0]/output/line[3]="9"
-index[1]/output/line[0]="0"
-index[1]/output/line[1]="3"
-index[1]/output/line[2]="5"
-index[1]/output/line[3]="9"
-index[2]/output/line[0]="0"
-index[2]/output/line[1]="3"
-index[2]/output/line[2]="5"
-index[3]/output/line[0]="0"
-index[3]/output/line[1]="3"
-index[3]/output/line[2]="5"
-index[4]/output=""
-index[4]/status=1
-index[5]/output=""
-index[5]/status=0
+index/in_bounds_single_lookup[0]/output="6"
+index/in_bounds_single_lookup[0]/status=0
+index/in_bounds_multi_lookup[0]/output/line[0]="0"
+index/in_bounds_multi_lookup[0]/output/line[1]="3"
+index/in_bounds_multi_lookup[0]/output/line[2]="5"
+index/in_bounds_multi_lookup[0]/output/line[3]="9"
+index/in_bounds_multi_lookup[0]/status=0
+index/binary_input_stream[1]/output/line[0]="0"
+index/binary_input_stream[1]/output/line[1]="3"
+index/binary_input_stream[1]/output/line[2]="5"
+index/binary_input_stream[1]/output/line[3]="9"
+index/binary_input_stream[1]/status=0
+index/multi_input_stream[2]/output/line[0]="0"
+index/multi_input_stream[2]/output/line[1]="3"
+index/multi_input_stream[2]/output/line[2]="5"
+index/multi_input_stream[2]/status=0
+index/multi_input_stream_binary[3]/output/line[0]="0"
+index/multi_input_stream_binary[3]/output/line[1]="3"
+index/multi_input_stream_binary[3]/output/line[2]="5"
+index/multi_input_stream_binary[3]/status=0
+index/out_of_bounds[4]/output=""
+index/out_of_bounds[4]/status=1
+index/out_of_bounds_permissive[5]/output=""
+index/out_of_bounds_permissive[5]/status=0
 offset[1]/output/line[0]="0"
 offset[1]/output/line[1]="3"
 offset[1]/output/line[2]="5"
 offset[1]/output/line[3]="9"
+offset[1]/status=0
 offset[2]/output/line[0]="0"
 offset[2]/output/line[1]="3"
 offset[2]/output/line[2]="5"
+offset[2]/status=0
diff --git a/csv/test/csv-seek/input b/csv/test/csv-seek/input
index 8d3de473e..f3e93fe6a 100644
--- a/csv/test/csv-seek/input
+++ b/csv/test/csv-seek/input
@@ -1,8 +1,9 @@
-index[0]="( echo 0; echo 3; echo 5; echo 9 ) | csv-seek 'data.bin;binary=ui' | csv-from-bin ui"
-index[1]="( echo 0; echo 3; echo 5; echo 9 ) | csv-to-bin ui | csv-seek --binary=ui \'data.bin;binary=ui\' | csv-from-bin ui"
-index[2]="( echo a,0; echo b,3; echo c,5 ) | csv-seek --fields ,index 'data.bin;binary=ui' | csv-from-bin ui"
-index[3]="( echo 0,0; echo 1,3; echo 2,5 ) | csv-to-bin 2ui | csv-seek --fields ,index --binary=2ui 'data.bin;binary=ui' | csv-from-bin ui"
-index[4]="( echo 200; ) | csv-seek 'data.bin;binary=ui' >/dev/null"
-index[5]="( echo 200; ) | csv-seek --permissive 'data.bin;binary=ui' >/dev/null"
+index/in_bounds_single_lookup[0]="( echo 6 ) | csv-seek 'data.bin;binary=ui' | csv-from-bin ui"
+index/in_bounds_multi_lookup[0]="( echo 0; echo 3; echo 5; echo 9 ) | csv-seek 'data.bin;binary=ui' | csv-from-bin ui"
+index/binary_input_stream[1]="( echo 0; echo 3; echo 5; echo 9 ) | csv-to-bin ui | csv-seek --binary=ui \'data.bin;binary=ui\' | csv-from-bin ui"
+index/multi_input_stream[2]="( echo a,0; echo b,3; echo c,5 ) | csv-seek --fields ,index 'data.bin;binary=ui' | csv-from-bin ui"
+index/multi_input_stream_binary[3]="( echo 0,0; echo 1,3; echo 2,5 ) | csv-to-bin 2ui | csv-seek --fields ,index --binary=2ui 'data.bin;binary=ui' | csv-from-bin ui"
+index/out_of_bounds[4]="( echo 200; ) | csv-seek 'data.bin;binary=ui' >/dev/null"
+index/out_of_bounds_permissive[5]="( echo 200; ) | csv-seek --permissive 'data.bin;binary=ui' >/dev/null"
 offset[1]="( echo 0; echo 0.30; echo 0.5; echo 0.9 ) | csv-seek --fields ratio 'data.bin;binary=ui' | csv-from-bin ui"
 offset[2]="( echo 0,0; echo 1,0.3; echo 2,0.5  ) | csv-to-bin ui,f | csv-seek --fields ,ratio --binary=ui,f 'data.bin;binary=ui' | csv-from-bin ui"

From 51206c351a039faa144ffd20c1c73918270bfa0b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 16 Aug 2024 00:31:24 +1000
Subject: [PATCH 0876/1056] csv-seek: copyright added

---
 csv/applications/csv-seek.cpp | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
index 00773f653..8897785c3 100644
--- a/csv/applications/csv-seek.cpp
+++ b/csv/applications/csv-seek.cpp
@@ -1,3 +1,7 @@
+// Copyright (c) 2024 Mission Systems
+
+/// @author Aspen Eyers
+
 #include <iostream>
 #include <fstream>
 #include "../../application/command_line_options.h"

From cf007cec565c425c790de4abc48dab4414244cee Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 22 Aug 2024 18:56:31 +1000
Subject: [PATCH 0877/1056] udp-client: brushed up in preparation to add a
 built-in publisher

---
 io/applications/udp-client.cpp | 147 +++++++++++++++++----------------
 1 file changed, 78 insertions(+), 69 deletions(-)

diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index f15a61114..a743d2cf3 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #ifndef WIN32
@@ -40,87 +39,97 @@
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/noncopyable.hpp>
 #include "../../application/command_line_options.h"
+#include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../csv/format.h"
+#include "../publisher.h"
 
-void usage()
+static void usage()
 {
-    std::cerr << "simple udp client: receives udp packets and outputs them on stdout" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "rationale: netcat and socat somehow do not work very well with udp" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: udp-client <port> [<options>]" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<options>" << std::endl;
-    std::cerr << "    --ascii: output timestamp as ascii; default: 64-bit binary" << std::endl;
-    std::cerr << "    --binary: output timestamp as 64-bit binary; default" << std::endl;
-    std::cerr << "    --delimiter=<delimiter>: if ascii and --timestamp, use this delimiter; default: ','" << std::endl;
-    std::cerr << "    --size=<size>: hint of maximum buffer size; default 16384" << std::endl;
-    std::cerr << "    --reuse-addr,--reuseaddr: reuse udp address/port" << std::endl;
-    std::cerr << "    --timestamp: output packet timestamp (currently just system time)" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    std::cerr << R"(
+simple udp client: receives udp packets and outputs them on stdout
+
+rationale: netcat and socat somehow do not work very well with udp
+
+usage: udp-client <port> [<options>]
+
+options
+    --ascii: output timestamp as ascii; default: 64-bit binary
+    --binary: output timestamp as 64-bit binary; default
+    --delimiter=<delimiter>: if ascii and --timestamp, use this delimiter; default: ','
+    --size=<size>: hint of maximum buffer size; default 16384
+    --reuse-addr,--reuseaddr: reuse udp address/port
+    --timestamp: output packet timestamp (currently just system time)
+)" << std::endl;
+    exit( 0 );
 }
 
 int main( int argc, char** argv )
 {
-    comma::command_line_options options( argc, argv );
-    if( argc < 2 || options.exists( "--help,-h" ) ) { usage(); }
-    const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--reuse-addr,--reuseaddr,--timestamp", "--delimiter,--size" );
-    if( unnamed.empty() ) { std::cerr << "udp-client: please specify port" << std::endl; return 1; }
-    unsigned short port = boost::lexical_cast< unsigned short >( unnamed[0] );
-    bool timestamped = options.exists( "--timestamp" );
-    bool binary = !options.exists( "--ascii" );
-    char delimiter = options.value( "--delimiter", ',' );
-    std::vector< char > packet( options.value( "--size", 16384 ) );
-#if (BOOST_VERSION >= 106600)
-    boost::asio::io_context service;
-#else
-    boost::asio::io_service service;
-#endif
-    boost::asio::ip::udp::socket socket( service );
-    socket.open( boost::asio::ip::udp::v4() );
-    boost::system::error_code error;
-    socket.set_option( boost::asio::ip::udp::socket::broadcast( true ), error );
-    if( error ) { std::cerr << "udp-client: failed to set broadcast option on port " << port << std::endl; return 1; }
-    if( options.exists( "--reuse-addr,--reuseaddr" ) )
-    {
-        socket.set_option( boost::asio::ip::udp::socket::reuse_address( true ), error );
-        if( error ) { std::cerr << "udp-client: failed to set reuse address option on port " << port << std::endl; return 1; }
-    }
-    socket.bind( boost::asio::ip::udp::endpoint( boost::asio::ip::udp::v4(), port ), error );
-    if( error ) { std::cerr << "udp-client: failed to bind port " << port << std::endl; return 1; }
-
-    #ifdef WIN32
-    if( binary )
+    try
     {
-        _setmode( _fileno( stdout ), _O_BINARY );        
-    }
+        comma::command_line_options options( argc, argv );
+        if( argc < 2 || options.exists( "--help,-h" ) ) { usage(); }
+        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--reuse-addr,--reuseaddr,--timestamp", "--delimiter,--size" );
+        COMMA_ASSERT_BRIEF( !unnamed.empty(), "please specify port" );
+        COMMA_ASSERT_BRIEF( unnamed.size() < 3, "expected not more than two unnamed options; got: " << comma::join( unnamed, ' ' ) );
+        std::string publish_address = unnamed.size() == 2 ? unnamed[1] : "-"; // publish address: optional second unnamed argument; "-" if absent (never index unnamed[1] when only the port is given)
+        COMMA_ASSERT_BRIEF( publish_address == "-", "publish: todo; got: '" << publish_address << "'" );
+        unsigned short port = boost::lexical_cast< unsigned short >( unnamed[0] );
+        bool timestamped = options.exists( "--timestamp" );
+        bool binary = !options.exists( "--ascii" );
+        char delimiter = options.value( "--delimiter", ',' );
+        std::vector< char > packet( options.value( "--size", 16384 ) );
+    #if ( BOOST_VERSION >= 106600 )
+        boost::asio::io_context service;
+    #else
+        boost::asio::io_service service;
     #endif
-    
-    while( std::cout.good() )
-    {
+        boost::asio::ip::udp::socket socket( service );
+        socket.open( boost::asio::ip::udp::v4() );
         boost::system::error_code error;
-        std::size_t size = socket.receive( boost::asio::buffer( packet ), 0, error );
-        if( error || size == 0 ) { break; }
-        if( timestamped )
+        socket.set_option( boost::asio::ip::udp::socket::broadcast( true ), error );
+        COMMA_ASSERT_BRIEF( !bool( error ), "failed to set broadcast option on port " << port );
+        if( options.exists( "--reuse-addr,--reuseaddr" ) )
         {
-            boost::posix_time::ptime timestamp = boost::posix_time::microsec_clock::universal_time();
-            static_assert( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ), "expected time of size 8" );
-            if( binary )
-            { 
-                static char buf[ sizeof( comma::int64 ) ];
-                comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::to_bin( timestamp, buf );
-                std::cout.write( buf, sizeof( comma::int64 ) );
-            }
-            else
+            socket.set_option( boost::asio::ip::udp::socket::reuse_address( true ), error );
+            COMMA_ASSERT_BRIEF( !bool( error ), "failed to set reuse address option on port " << port );
+        }
+        socket.bind( boost::asio::ip::udp::endpoint( boost::asio::ip::udp::v4(), port ), error );
+        COMMA_ASSERT_BRIEF( !bool( error ), "failed to bind port " << port );
+        #ifdef WIN32
+        if( binary )
+        {
+            _setmode( _fileno( stdout ), _O_BINARY );        
+        }
+        #endif
+        static_assert( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ), "expected time of size 8" );
+        // todo: comma::io::publisher publisher( publish_address, binary ? comma::io::mode::binary : comma::io::mode::ascii, false, flush );
+        while( std::cout.good() )
+        {
+            boost::system::error_code error;
+            std::size_t size = socket.receive( boost::asio::buffer( packet ), 0, error );
+            if( error || size == 0 ) { break; }
+            if( timestamped )
             {
-                std::cout << boost::posix_time::to_iso_string( timestamp ) << delimiter;
+                boost::posix_time::ptime timestamp = boost::posix_time::microsec_clock::universal_time();
+                if( binary )
+                { 
+                    static char buf[ sizeof( comma::int64 ) ];
+                    comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::to_bin( timestamp, buf );
+                    std::cout.write( buf, sizeof( comma::int64 ) );
+                }
+                else
+                {
+                    std::cout << boost::posix_time::to_iso_string( timestamp ) << delimiter;
+                }
             }
+            std::cout.write( &packet[0], size );
+            std::cout.flush();
         }
-        std::cout.write( &packet[0], size );
-        std::cout.flush();
-   }
-   return 0;
+        return 0;
+    }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
+    return 1;
 }

From e8a521393c950fb4b46bd5cd74caafdc5b475add Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 23 Aug 2024 12:23:49 +1000
Subject: [PATCH 0878/1056] udp-client: optional publishing: io-publish:
 publish moved out to detail; in progress...

---
 io/applications/CMakeLists.txt     |   6 +-
 io/applications/detail/publish.cpp | 169 +++++++++++++
 io/applications/detail/publish.h   |  83 +++++++
 io/applications/io-publish.cpp     | 380 +++++++----------------------
 4 files changed, 337 insertions(+), 301 deletions(-)
 create mode 100644 io/applications/detail/publish.cpp
 create mode 100644 io/applications/detail/publish.h

diff --git a/io/applications/CMakeLists.txt b/io/applications/CMakeLists.txt
index 83428dc3b..ffde49fd0 100644
--- a/io/applications/CMakeLists.txt
+++ b/io/applications/CMakeLists.txt
@@ -38,7 +38,7 @@ if( NOT WIN32 )
     set_target_properties( io-ls PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-ls RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
-    add_executable( io-publish ${dir}/io-publish.cpp )
+    add_executable( io-publish ${dir}/io-publish.cpp ${dir}/detail/publish.h ${dir}/detail/publish.cpp )
     target_link_libraries( io-publish comma_base comma_io comma_application comma_xpath comma_name_value ) # profiler )
     set_target_properties( io-publish PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-publish RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
@@ -48,8 +48,8 @@ if( NOT WIN32 )
     set_target_properties( io-tee PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-tee RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
-    add_executable( udp-client ${dir}/udp-client.cpp )
-    target_link_libraries( udp-client comma_application comma_io comma_csv comma_base ) # profiler )
+    add_executable( udp-client ${dir}/udp-client.cpp ${dir}/detail/publish.h ${dir}/detail/publish.cpp )
+    target_link_libraries( udp-client comma_application comma_name_value comma_io comma_csv comma_base ) # profiler )
     set_target_properties( udp-client PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS udp-client RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
diff --git a/io/applications/detail/publish.cpp b/io/applications/detail/publish.cpp
new file mode 100644
index 000000000..765ff4b71
--- /dev/null
+++ b/io/applications/detail/publish.cpp
@@ -0,0 +1,169 @@
+// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+
+#include "publish.h"
+
+namespace comma { namespace io { namespace detail {
+
+publish::publish( const std::vector< std::string >& endpoints
+                , unsigned int packet_size
+                , bool discard
+                , bool flush
+                , bool output_number_of_clients
+                , bool update_no_clients
+                , unsigned int cache_size )
+    : discard_( discard )
+    , flush_( flush )
+    , buffer_( packet_size, '\0' )
+    , packet_size_( packet_size )
+    , output_number_of_clients_( output_number_of_clients )
+    , cache_size_( cache_size )
+    , update_no_clients_( update_no_clients )
+    , got_first_client_ever_( false )
+    , sizes_( endpoints.size(), 0 )
+    , num_clients_( 0 )
+    , is_shutdown_( false )
+{
+    bool has_primary_stream = false;
+    for( unsigned int i = 0; i < endpoints.size(); ++i )
+    {
+        comma::name_value::map m( endpoints[i], "address", ';', '=' );
+        bool secondary = !m.exists( "primary" ) && m.exists( "secondary" );
+        endpoints_.push_back( endpoint( m.value< std::string >( "address" ), secondary ) ); // todo? quick and dirty; better usage semantics?
+        if( !secondary ) { has_primary_stream = true; }
+    }
+    if( !has_primary_stream ) { comma::say() << "please specify at least one primary stream" << std::endl; exit( 1 ); }
+    struct sigaction new_action, old_action;
+    new_action.sa_handler = SIG_IGN;
+    sigemptyset( &new_action.sa_mask );
+    sigaction( SIGPIPE, NULL, &old_action );
+    sigaction( SIGPIPE, &new_action, NULL );
+    transaction_t t( publishers_ );
+    t->resize( endpoints.size() );
+    for( std::size_t i = 0; i < endpoints.size(); ++i )
+    {
+        if( !endpoints_[i].secondary ) { ( *t )[i].reset( new comma::io::publisher( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
+    }
+    acceptor_thread_.reset( new boost::thread( boost::bind( &publish::accept_, boost::ref( *this ))));
+}
+        
+publish::~publish()
+{
+    is_shutdown_ = true;
+    acceptor_thread_->join();
+    transaction_t t( publishers_ );
+    for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } }
+}
+        
+void publish::disconnect_all()
+{
+    transaction_t t( publishers_ );
+    for( auto& p: *t ) { if( p ) { p->disconnect_all(); } }
+    handle_sizes_( t ); // quick and dirty
+}
+        
+bool publish::read( std::istream& input )
+{
+    if( is_binary_() )
+    {
+        input.read( &buffer_[0], buffer_.size() );
+        if( input.gcount() < int( buffer_.size() ) || !input.good() ) { return false; }
+    }
+    else
+    {
+        std::getline( input, buffer_ );
+        buffer_ += '\n';
+        if( !input.good() ) { return false; }
+    }
+    transaction_t t( publishers_ );
+    if( cache_size_ > 0 )
+    {
+        cache_.push_back( buffer_ );
+        if( cache_.size() > cache_size_ ) { cache_.pop_front(); }
+    }
+    for( auto& p: *t ) { if( p ) { p->write( &buffer_[0], buffer_.size(), false ); } } // for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
+    return handle_sizes_( t );
+}
+
+bool publish::handle_sizes_( transaction_t& t ) // returns false once the last client has gone (only if update_no_clients_ is set), true otherwise; todo? why pass transaction? it does not seem to go out of scope at the point of call; remove?
+{
+    if( !output_number_of_clients_ && !update_no_clients_ ) { return true; }
+    unsigned int total = 0;
+    bool changed = false;
+    has_primary_clients_ = false;
+    for( unsigned int i = 0; i < t->size(); ++i )
+    {
+        unsigned int size = ( *t )[i] ? ( *t )[i]->size() : 0;
+        total += size;
+        if( !endpoints_[i].secondary && size > 0 ) { has_primary_clients_ = true; }
+        if( sizes_[i] == size ) { continue; }
+        sizes_[i] = size;
+        changed = true;
+    }
+    num_clients_ = total; // assigned after the loop so that it is the sum over all endpoints, not a partial sum up to the last changed endpoint
+    if( !changed ) { return true; }
+    if( output_number_of_clients_ )
+    {
+        std::cout << boost::posix_time::to_iso_string( boost::posix_time::microsec_clock::universal_time() );
+        for( unsigned int i = 0; i < sizes_.size(); ++i ) { std::cout << ',' << sizes_[i]; }
+        std::cout << std::endl;
+    }
+    if( update_no_clients_ )
+    {
+        if( total > 0 ) { got_first_client_ever_ = true; }
+        else if( got_first_client_ever_ ) { comma::verbose << "the last client exited" << std::endl; return false; }
+    }
+    return true;
+}
+
+void publish::accept_()
+{
+    comma::io::select select;
+    {
+        transaction_t t( publishers_ );
+        for( unsigned int i = 0; i < t->size(); ++i )
+        {
+            if( !( *t )[i] ) { continue; }
+            if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
+        }
+    }
+    while( !is_shutdown_ )
+    {
+        select.wait( boost::posix_time::millisec( 100 ) ); // todo? make timeout configurable?
+        transaction_t t( publishers_ );
+        for( unsigned int i = 0; i < t->size(); ++i )
+        {
+            if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) )
+            {
+                const auto& streams = ( *t )[i]->accept();
+                for( auto s: streams )
+                {
+                    for( const auto& c: cache_ ) { ( *s )->write( &c[0], c.size() ); }
+                    if( flush_ ) { ( *s )->flush(); }
+                }
+            }
+        }
+        handle_sizes_( t );
+        if( has_primary_clients_ )
+        {
+            for( unsigned int i = 0; i < t->size(); ++i )
+            {
+                if( !endpoints_[i].secondary || ( *t )[i] ) { continue; }
+                ( *t )[i].reset( new comma::io::publisher( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard_, flush_ ) );
+                if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
+            }
+        }
+        else
+        {
+            for( unsigned int i = 0; i < t->size(); ++i )
+            {
+                if( !endpoints_[i].secondary || !( *t )[i] ) { continue; }
+                select.read().remove( ( *t )[i]->acceptor_file_descriptor() );
+                ( *t )[i].reset();
+            }
+        }
+    }
+}
+
+} } } // namespace comma { namespace io { namespace detail {
diff --git a/io/applications/detail/publish.h b/io/applications/detail/publish.h
new file mode 100644
index 000000000..0071dc133
--- /dev/null
+++ b/io/applications/detail/publish.h
@@ -0,0 +1,83 @@
+// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+
+#pragma once
+
+#include <errno.h>
+#include <signal.h>
+#include <sys/wait.h>
+#include <unistd.h>
+#include <deque>
+#include <memory>
+#include <boost/bind/bind.hpp>
+#include <boost/date_time/posix_time/posix_time.hpp>
+#include <boost/iostreams/device/file_descriptor.hpp>
+#include <boost/iostreams/stream.hpp>
+#include <boost/scoped_ptr.hpp>
+#include <boost/thread.hpp>
+#include "../../../application/command_line_options.h"
+#include "../../../application/signal_flag.h"
+#include "../../../base/last_error.h"
+#include "../../../io/file_descriptor.h"
+#include "../../../io/publisher.h"
+#include "../../../name_value/map.h"
+#include "../../../string/string.h"
+#include "../../../sync/synchronized.h"
+
+namespace comma { namespace io { namespace detail {
+
+class publish // reads records from an input stream and fans them out to a set of comma::io::publisher endpoints; new clients are accepted on a background thread
+{
+    public:
+        typedef comma::synchronized< std::vector< std::unique_ptr< comma::io::publisher > > > publishers_t; // one slot per endpoint; a slot is null while its stream is closed
+        
+        typedef publishers_t::scoped_transaction transaction_t; // scoped access to publishers_ via comma::synchronized
+        
+        struct endpoint // one output stream as given on the command line: <address>[;primary|secondary]
+        {
+            std::string address;
+            bool secondary; // true: stream is only opened while there are clients on a primary stream
+            endpoint( const std::string& address = "", bool secondary = false ): address( address ), secondary( secondary ) {}
+        };
+        
+        publish( const std::vector< std::string >& endpoints // endpoint strings, each parsed into address and primary/secondary option
+               , unsigned int packet_size // record size in bytes; 0 means ascii, line-based records
+               , bool discard // forwarded (negated) to comma::io::publisher
+               , bool flush // flush streams after writing
+               , bool output_number_of_clients // print timestamped per-endpoint client counts to stdout whenever they change
+               , bool update_no_clients // track clients, so that read() can report that the last client has gone
+               , unsigned int cache_size ); // number of most recent records replayed to a newly connected client; 0: no cache
+        
+        ~publish();
+        
+        void disconnect_all();
+        
+        bool read( std::istream& input );
+        
+        unsigned int num_clients() const { return num_clients_; }
+
+    private:
+        std::vector< endpoint > endpoints_; // parsed endpoints, same order and size as publishers_
+        bool discard_;
+        bool flush_;
+        publishers_t publishers_;
+        std::string buffer_; // the record most recently read by read()
+        unsigned int packet_size_;
+        bool output_number_of_clients_;
+        unsigned int cache_size_;
+        bool update_no_clients_;
+        bool got_first_client_ever_; // set once any client has connected; used to tell "no clients yet" from "last client exited"
+        std::vector< unsigned int > sizes_; // last observed number of clients per endpoint
+        bool has_primary_clients_ = false; // default-initialised: accept_() reads it, but the constructor does not set it and handle_sizes_() may return before assigning it
+        unsigned int num_clients_; // total number of clients as of the last observed change
+        boost::scoped_ptr< boost::thread > acceptor_thread_; // runs accept_()
+        bool is_shutdown_; // polled by the accept_() loop; NOTE(review): plain bool shared with the acceptor thread - consider std::atomic< bool >
+        std::deque< std::string > cache_; // up to cache_size_ most recent records, written to each newly accepted stream
+
+        bool is_binary_() const { return packet_size_ > 0; }
+        bool handle_sizes_( transaction_t& t ); // todo? why pass transaction? it does not seem to go out of scope at the point of call; remove?
+        void accept_();
+};
+
+} } } // namespace comma { namespace io { namespace detail {
diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 826b6e3a5..6e209aba2 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -3,297 +3,81 @@
 
 /// @authors cedric wohlleber, vsevolod vlaskine, dave jennings
 
-#include <errno.h>
-#include <signal.h>
-#include <sys/wait.h>
-#include <unistd.h>
-#include <deque>
-#include <memory>
-#include <boost/bind/bind.hpp>
-#include <boost/date_time/posix_time/posix_time.hpp>
-#include <boost/iostreams/device/file_descriptor.hpp>
-#include <boost/iostreams/stream.hpp>
-#include <boost/scoped_ptr.hpp>
-#include <boost/thread.hpp>
-#include "../../application/command_line_options.h"
-#include "../../application/signal_flag.h"
-#include "../../base/last_error.h"
-#include "../../io/file_descriptor.h"
-#include "../../io/publisher.h"
-#include "../../name_value/map.h"
-#include "../../string/string.h"
-#include "../../sync/synchronized.h"
+#include "detail/publish.h"
 
 //#include <google/profiler.h>
 
 static void usage( bool verbose = false )
 {
-    std::cerr << std::endl;
-    std::cerr << "read from standard input and write to given outputs (files, sockets, named pipes):" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "- the data is only written to the outputs that are ready for writing" << std::endl;
-    std::cerr << "- client can connect and disconnect at any time" << std::endl;
-    std::cerr << "- only full packets are written" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: io-publish [<options>] <outputs>" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "general options" << std::endl;
-    std::cerr << "    --help,-h: show this help" << std::endl;
-    std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "stream options" << std::endl;
-    std::cerr << "    --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects, the" << std::endl;
-    std::cerr << "                                         the cached records will be sent to it once connected (todo)" << std::endl;
-    std::cerr << "    --size,-s: binary input; packet size" << std::endl;
-    std::cerr << "    --multiplier,-m: multiplier for packet size, default is 1. The actual packet size will be m * s" << std::endl;
-    std::cerr << "    --no-discard: if present, do blocking write to every open stream" << std::endl;
-    std::cerr << "    --no-flush: if present, do not flush the output stream (use on high bandwidth sources)" << std::endl;
-    std::cerr << "    --exec=[<command>]: read from <command> rather than stdin" << std::endl;
-    std::cerr << "    -- [<command>]: alternate syntax for specifying a command (simplifies quoting)" << std::endl;
-    std::cerr << "    --on-demand: only run <command> when a client is connected" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "client options" << std::endl;
-    std::cerr << "    --exit-on-no-clients,-e: once the last client disconnects, exit" << std::endl;
-    std::cerr << "    --output-number-of-clients,--clients: output to stdout timestamped number of clients whenever it changes" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    attention: in the current implementation, the number of clients will be" << std::endl;
-    std::cerr << "               updated only on attempt to write a new record," << std::endl;
-    std::cerr << "               i.e. output number of clients will not change if there are no new" << std::endl;
-    std::cerr << "               records on stdin, even if the actual number of clients changes" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    known problems: io::ostream or at least boost::asio::ostream does not mark" << std::endl;
-    std::cerr << "               stream as bad, if one tries to write to it first time after" << std::endl;
-    std::cerr << "               stream has been closed; the stream is marked as bad only after" << std::endl;
-    std::cerr << "               writing to it second time." << std::endl;
-    std::cerr << "               This problem is pretty benign: the worst thing that happens is" << std::endl;
-    std::cerr << "               writing to a closed stream, which will not cause grief unless you" << std::endl;
-    std::cerr << "               specifically rely on io-publish exiting on no clients for a" << std::endl;
-    std::cerr << "               rarely sent heartbeat." << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "               io-publish will not be very responsive in counting clients for" << std::endl;
-    std::cerr << "               low bandwidth streams. It immediately recognises new clients" << std::endl;
-    std::cerr << "               but might take a while to notice that a client has gone." << std::endl;
-    std::cerr << "               This affects --output-number-of-clients and --on-demand." << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "output streams: <address>[,<options>]" << std::endl;
-    std::cerr << "    <address>" << std::endl;
-    std::cerr << "        tcp:<port>: e.g. tcp:1234" << std::endl;
-    std::cerr << "        udp:<port>: e.g. udp:1234 (todo)" << std::endl;
-    std::cerr << "        local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket" << std::endl;
-    std::cerr << "        <named pipe name>: named pipe, which will be re-opened, if client reconnects" << std::endl;
-    std::cerr << "        <filename>: a regular file" << std::endl;
-    std::cerr << "        -: stdout" << std::endl;
-    std::cerr << "    <options>" << std::endl;
-    std::cerr << "        primary (default): clients always can connect to the 'primary' stream" << std::endl;
-    std::cerr << "        secondary: clients can connect to the 'secondary' stream, only if there are existing clients on a primary stream" << std::endl;
-    std::cerr << "                   if a client connects to a 'primary' stream, 'secondary' streams will be opened" << std::endl;
-    std::cerr << "                   if last client on a 'primary' stream disconnects, 'secondary' streams will be closed" << std::endl;
-    std::cerr << "                   e.g: io-publish tcp:8888 'tcp:9999;secondary'" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << "    cat data | io-publish tcp:1234 --size 100" << std::endl;
-    std::cerr << "    io-publish tcp:1234 --size 24000 --on-demand --exec \"camera-cat arg1 arg2\"" << std::endl;
-    std::cerr << "    io-publish tcp:1234 --size 24000 --on-demand -- camera-cat arg1 arg2" << std::endl;
-    std::cerr << std::endl;
-    exit( 0 );
-}
+    std::cerr << R"(
+read from standard input and write to given outputs (files, sockets, named pipes):
 
-class publish
-{
-    public:
-        typedef comma::synchronized< std::vector< std::unique_ptr< comma::io::publisher > > > publishers_t;
-        
-        typedef publishers_t::scoped_transaction transaction_t;
-        
-        struct endpoint
-        {
-            std::string address;
-            bool secondary;
-            endpoint( const std::string& address = "", bool secondary = false ): address( address ), secondary( secondary ) {}
-        };
-        
-        publish( const std::vector< std::string >& endpoints
-               , unsigned int packet_size
-               , bool discard
-               , bool flush
-               , bool output_number_of_clients
-               , bool update_no_clients
-               , unsigned int cache_size )
-            : discard_( discard )
-            , flush_( flush )
-            , buffer_( packet_size, '\0' )
-            , packet_size_( packet_size )
-            , output_number_of_clients_( output_number_of_clients )
-            , cache_size_( cache_size )
-            , update_no_clients_( update_no_clients )
-            , got_first_client_ever_( false )
-            , sizes_( endpoints.size(), 0 )
-            , num_clients_( 0 )
-            , is_shutdown_( false )
-        {
-            bool has_primary_stream = false;
-            for( unsigned int i = 0; i < endpoints.size(); ++i )
-            {
-                comma::name_value::map m( endpoints[i], "address", ';', '=' );
-                bool secondary = !m.exists( "primary" ) && m.exists( "secondary" );
-                endpoints_.push_back( endpoint( m.value< std::string >( "address" ), secondary ) ); // todo? quick and dirty; better usage semantics?
-                if( !secondary ) { has_primary_stream = true; }
-            }
-            if( !has_primary_stream ) { std::cerr << "io-publish: please specify at least one primary stream" << std::endl; exit( 1 ); }
-            struct sigaction new_action, old_action;
-            new_action.sa_handler = SIG_IGN;
-            sigemptyset( &new_action.sa_mask );
-            sigaction( SIGPIPE, NULL, &old_action );
-            sigaction( SIGPIPE, &new_action, NULL );
-            transaction_t t( publishers_ );
-            t->resize( endpoints.size() );
-            for( std::size_t i = 0; i < endpoints.size(); ++i )
-            {
-                if( !endpoints_[i].secondary ) { ( *t )[i].reset( new comma::io::publisher( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
-            }
-            acceptor_thread_.reset( new boost::thread( boost::bind( &publish::accept_, boost::ref( *this ))));
-        }
-        
-        ~publish()
-        {
-            is_shutdown_ = true;
-            acceptor_thread_->join();
-            transaction_t t( publishers_ );
-            for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } }
-        }
-        
-        void disconnect_all()
-        {
-            transaction_t t( publishers_ );
-            for( auto& p: *t ) { if( p ) { p->disconnect_all(); } }
-            handle_sizes_( t ); // quick and dirty
-        }
-        
-        bool read( std::istream& input )
-        {
-            if( is_binary_() )
-            {
-                input.read( &buffer_[0], buffer_.size() );
-                if( input.gcount() < int( buffer_.size() ) || !input.good() ) { return false; }
-            }
-            else
-            {
-                std::getline( input, buffer_ );
-                buffer_ += '\n';
-                if( !input.good() ) { return false; }
-            }
-            transaction_t t( publishers_ );
-            if( cache_size_ > 0 )
-            {
-                cache_.push_back( buffer_ );
-                if( cache_.size() > cache_size_ ) { cache_.pop_front(); }
-            }
-            for( auto& p: *t ) { if( p ) { p->write( &buffer_[0], buffer_.size(), false ); } } // for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
-            return handle_sizes_( t );
-        }
-        
-        unsigned int num_clients() const { return num_clients_; }
+- the data is only written to the outputs that are ready for writing
+- client can connect and disconnect at any time
+- only full packets are written
 
-    private:
-        bool is_binary_() const { return packet_size_ > 0; }
-        
-        bool handle_sizes_( transaction_t& t ) // todo? why pass transaction? it doen not seem going out of scope at the point of call; remove?
-        {
-            if( !output_number_of_clients_ && !update_no_clients_ ) { return true; }
-            unsigned int total = 0;
-            bool changed = false;
-            has_primary_clients_ = false;
-            for( unsigned int i = 0; i < t->size(); ++i )
-            {
-                unsigned int size = ( *t )[i] ? ( *t )[i]->size() : 0;
-                total += size;
-                if( !endpoints_[i].secondary && size > 0 ) { has_primary_clients_ = true; }
-                if( sizes_[i] == size ) { continue; }
-                sizes_[i] = size;
-                changed = true;
-                num_clients_ = total;
-            }
-            if( !changed ) { return true; }
-            if( output_number_of_clients_ )
-            {
-                std::cout << boost::posix_time::to_iso_string( boost::posix_time::microsec_clock::universal_time() );
-                for( unsigned int i = 0; i < sizes_.size(); ++i ) { std::cout << ',' << sizes_[i]; }
-                std::cout << std::endl;
-            }
-            if( update_no_clients_ )
-            {
-                if( total > 0 ) { got_first_client_ever_ = true; }
-                else if( got_first_client_ever_ ) { comma::verbose << "the last client exited" << std::endl; return false; }
-            }
-            return true;
-        }
-        
-        void accept_()
-        {
-            comma::io::select select;
-            {
-                transaction_t t( publishers_ );
-                for( unsigned int i = 0; i < t->size(); ++i )
-                {
-                    if( !( *t )[i] ) { continue; }
-                    if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
-                }
-            }
-            while( !is_shutdown_ )
-            {
-                select.wait( boost::posix_time::millisec( 100 ) ); // todo? make timeout configurable?
-                transaction_t t( publishers_ );
-                for( unsigned int i = 0; i < t->size(); ++i )
-                {
-                    if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) )
-                    {
-                        const auto& streams = ( *t )[i]->accept();
-                        for( auto s: streams )
-                        {
-                            for( const auto& c: cache_ ) { ( *s )->write( &c[0], c.size() ); }
-                            if( flush_ ) { ( *s )->flush(); }
-                        }
-                    }
-                }
-                handle_sizes_( t );
-                if( has_primary_clients_ )
-                {
-                    for( unsigned int i = 0; i < t->size(); ++i )
-                    {
-                        if( !endpoints_[i].secondary || ( *t )[i] ) { continue; }
-                        ( *t )[i].reset( new comma::io::publisher( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard_, flush_ ) );
-                        if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
-                    }
-                }
-                else
-                {
-                    for( unsigned int i = 0; i < t->size(); ++i )
-                    {
-                        if( !endpoints_[i].secondary || !( *t )[i] ) { continue; }
-                        select.read().remove( ( *t )[i]->acceptor_file_descriptor() );
-                        ( *t )[i].reset();
-                    }
-                }
-            }
-        }
-        
-        std::vector< endpoint > endpoints_;
-        bool discard_;
-        bool flush_;
-        publishers_t publishers_;
-        std::string buffer_;
-        unsigned int packet_size_;
-        bool output_number_of_clients_;
-        unsigned int cache_size_;
-        bool update_no_clients_;
-        bool got_first_client_ever_;
-        std::vector< unsigned int > sizes_;
-        bool has_primary_clients_;
-        unsigned int num_clients_;
-        boost::scoped_ptr< boost::thread > acceptor_thread_;
-        bool is_shutdown_;
-        std::deque< std::string > cache_;
-};
+usage: io-publish [<options>] <outputs>
+
+general options
+    --help,-h: show this help
+    --verbose,-v: more output to stderr
+
+stream options
+    --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects, the
+                                         the cached records will be sent to it once connected (todo)
+    --size,-s: binary input; packet size
+    --multiplier,-m: multiplier for packet size, default is 1. The actual packet size will be m * s
+    --no-discard: if present, do blocking write to every open stream
+    --no-flush: if present, do not flush the output stream (use on high bandwidth sources)
+    --exec=[<command>]: read from <command> rather than stdin
+    -- [<command>]: alternate syntax for specifying a command (simplifies quoting)
+    --on-demand: only run <command> when a client is connected
+
+client options
+    --exit-on-no-clients,-e: once the last client disconnects, exit
+    --output-number-of-clients,--clients: output to stdout timestamped number of clients whenever it changes
+
+    attention: in the current implementation, the number of clients will be
+               updated only on attempt to write a new record,
+               i.e. output number of clients will not change if there are no new
+               records on stdin, even if the actual number of clients changes
+
+    known problems: io::ostream or at least boost::asio::ostream does not mark
+               stream as bad, if one tries to write to it first time after
+               stream has been closed; the stream is marked as bad only after
+               writing to it second time.
+               This problem is pretty benign: the worst thing that happens is
+               writing to a closed stream, which will not cause grief unless you
+               specifically rely on io-publish exiting on no clients for a
+               rarely sent heartbeat.
+
+               io-publish will not be very responsive in counting clients for
+               low bandwidth streams. It immediately recognises new clients
+               but might take a while to notice that a client has gone.
+               This affects --output-number-of-clients and --on-demand.
+
+output streams: <address>[,<options>]
+    <address>
+        tcp:<port>: e.g. tcp:1234
+        udp:<port>: e.g. udp:1234 (todo)
+        local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket
+        <named pipe name>: named pipe, which will be re-opened, if client reconnects
+        <filename>: a regular file
+        -: stdout
+    <options>
+        primary (default): clients always can connect to the 'primary' stream
+        secondary: clients can connect to the 'secondary' stream, only if there are existing clients on a primary stream
+                   if a client connects to a 'primary' stream, 'secondary' streams will be opened
+                   if last client on a 'primary' stream disconnects, 'secondary' streams will be closed
+                   e.g: io-publish tcp:8888 'tcp:9999;secondary'
+
+examples
+    cat data | io-publish tcp:1234 --size 100
+    io-publish tcp:1234 --size 24000 --on-demand --exec "camera-cat arg1 arg2"
+    io-publish tcp:1234 --size 24000 --on-demand -- camera-cat arg1 arg2
+)";
+    exit( 0 );
+}
 
 class command
 {
@@ -313,7 +97,7 @@ class command
                 ::close( fd[1] );     // no longer need fd[1], now that it's duped
                 ::close( fd[0] );     // don't need pipe output in the child
                 ::execlp( "bash", "bash", "-c", &command_[0], NULL );
-                std::cerr << "io-publish: failed to exec child: errno " << comma::last_error::value() << " - " << comma::last_error::to_string() << std::endl;
+                comma::say() << "failed to exec child: errno " << comma::last_error::value() << " - " << comma::last_error::to_string() << std::endl;
                 exit( 1 );
             }
             child_pid_ = pid;
@@ -351,29 +135,29 @@ int main( int ac, char** av )
         for( int i = head.size() + 1; i < ac; ++i ) { tail.push_back( av[i] ); }
         comma::command_line_options options( head, usage );
         const std::vector< std::string >& names = options.unnamed( "--no-discard,--verbose,-v,--no-flush,--output-number-of-clients,--clients,--exit-on-no-clients,-e,--on-demand", "-.+" );
-        if( names.empty() ) { std::cerr << "io-publish: please specify at least one stream; use '-' for stdout" << std::endl; return 1; }
+        if( names.empty() ) { comma::say() << "please specify at least one stream; use '-' for stdout" << std::endl; return 1; }
         options.assert_mutually_exclusive( "--cache-size,--cache", "--on-demand" );
         const boost::array< comma::signal_flag::signals, 2 > signals = { { comma::signal_flag::sigint, comma::signal_flag::sigterm } };
         comma::signal_flag is_shutdown( signals );
         bool on_demand = options.exists( "--on-demand" );
         bool exit_on_no_clients = options.exists( "--exit-on-no-clients,-e" );
-        publish p( names
-                 , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
-                 , !options.exists( "--no-discard" )
-                 , !options.exists( "--no-flush" )
-                 , options.exists( "--output-number-of-clients,--clients" )
-                 , exit_on_no_clients || on_demand
-                 , options.value( "--cache-size,--cache", 0 ) );
+        comma::io::detail::publish p( names
+                                    , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
+                                    , !options.exists( "--no-discard" )
+                                    , !options.exists( "--no-flush" )
+                                    , options.exists( "--output-number-of-clients,--clients" )
+                                    , exit_on_no_clients || on_demand
+                                    , options.value( "--cache-size,--cache", 0 ) );
         std::string exec_command = options.value< std::string >( "--exec", "" );
         if( !tail.empty() )
         {
-            if( !exec_command.empty() ) { std::cerr << "io-publish: expected either --exec or --, got both" << std::endl; return 1; }
+            if( !exec_command.empty() ) { comma::say() << "expected either --exec or --, got both" << std::endl; return 1; }
             exec_command = comma::join( tail, ' ' );
         }
         //ProfilerStart( "io-publish.prof" ); {
         if( exec_command.empty() )
         {
-            if( on_demand ) { std::cerr << "io-publish: got --on-demand; please specify --exec <command> or -- <command>, or remove --on-demand" << std::endl; return 1; }
+            if( on_demand ) { comma::say() << "got --on-demand; please specify --exec <command> or -- <command>, or remove --on-demand" << std::endl; return 1; }
             while( std::cin.good() && !is_shutdown ) { if( !p.read( std::cin ) && exit_on_no_clients ) { break; } }
         }
         else
@@ -394,18 +178,18 @@ int main( int ac, char** av )
             }
         }
         //ProfilerStop(); }
-        if( is_shutdown ) { std::cerr << "io-publish: interrupted by signal" << std::endl; }
+        if( is_shutdown ) { comma::say() << "interrupted by signal" << std::endl; }
         return 0;
     }
     catch( std::exception& ex )
     {
         if( comma::last_error::value() == EINTR || comma::last_error::value() == EBADF ) { return 0; }
-        std::cerr << "io-publish: " << ex.what() << std::endl;
+        comma::say() << "" << ex.what() << std::endl;
     }
     catch( ... )
     {
         if( comma::last_error::value() == EINTR || comma::last_error::value() == EBADF ) { return 0; }
-        std::cerr << "io-publish: unknown exception" << std::endl;
+        comma::say() << "unknown exception" << std::endl;
     }
     return 1;
 }

From ee7473bbab5fbddf0d8c637da9ae5abab27d87b9 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 23 Aug 2024 13:45:35 +1000
Subject: [PATCH 0879/1056] udp-client: republishing implemented
 (debugging...), --flush added

---
 io/applications/detail/publish.cpp | 34 +++++++++++------
 io/applications/detail/publish.h   |  6 ++-
 io/applications/io-publish.cpp     |  4 +-
 io/applications/udp-client.cpp     | 60 ++++++++++++++++++++----------
 4 files changed, 70 insertions(+), 34 deletions(-)

diff --git a/io/applications/detail/publish.cpp b/io/applications/detail/publish.cpp
index 765ff4b71..c13884bc3 100644
--- a/io/applications/detail/publish.cpp
+++ b/io/applications/detail/publish.cpp
@@ -1,5 +1,5 @@
 // Copyright (c) 2011 The University of Sydney
-// Copyright (c) 2024 Vsevolod Vlaskine
+// Copyright (c) 2020 Vsevolod Vlaskine
 // All rights reserved.
 
 #include "publish.h"
@@ -33,7 +33,7 @@ publish::publish( const std::vector< std::string >& endpoints
         endpoints_.push_back( endpoint( m.value< std::string >( "address" ), secondary ) ); // todo? quick and dirty; better usage semantics?
         if( !secondary ) { has_primary_stream = true; }
     }
-    if( !has_primary_stream ) { comma::say() << "please specify at least one primary stream" << std::endl; exit( 1 ); }
+    COMMA_ASSERT_BRIEF( has_primary_stream, "please specify at least one primary stream" );
     struct sigaction new_action, old_action;
     new_action.sa_handler = SIG_IGN;
     sigemptyset( &new_action.sa_mask );
@@ -62,7 +62,24 @@ void publish::disconnect_all()
     for( auto& p: *t ) { if( p ) { p->disconnect_all(); } }
     handle_sizes_( t ); // quick and dirty
 }
-        
+
+bool publish::write( const std::string& s )
+{
+    transaction_t t( publishers_ );
+    if( cache_size_ > 0 )
+    {
+        cache_.push_back( s );
+        if( cache_.size() > cache_size_ ) { cache_.pop_front(); }
+    }
+    for( auto& p: *t ) { if( p ) { p->write( &s[0], s.size(), false ); } } // for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
+    return handle_sizes_( t );
+}
+
+bool publish::write( const char* buf, unsigned int size )
+{
+    return write( std::string( buf, size ) ); // todo: quick and dirty, watch performance
+}
+
 bool publish::read( std::istream& input )
 {
     if( is_binary_() )
@@ -76,14 +93,7 @@ bool publish::read( std::istream& input )
         buffer_ += '\n';
         if( !input.good() ) { return false; }
     }
-    transaction_t t( publishers_ );
-    if( cache_size_ > 0 )
-    {
-        cache_.push_back( buffer_ );
-        if( cache_.size() > cache_size_ ) { cache_.pop_front(); }
-    }
-    for( auto& p: *t ) { if( p ) { p->write( &buffer_[0], buffer_.size(), false ); } } // for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
-    return handle_sizes_( t );
+    return write( buffer_ );
 }
 
 bool publish::handle_sizes_( transaction_t& t ) // todo? why pass transaction? it doen not seem going out of scope at the point of call; remove?
@@ -112,7 +122,7 @@ bool publish::handle_sizes_( transaction_t& t ) // todo? why pass transaction? i
     if( update_no_clients_ )
     {
         if( total > 0 ) { got_first_client_ever_ = true; }
-        else if( got_first_client_ever_ ) { comma::verbose << "the last client exited" << std::endl; return false; }
+        else if( got_first_client_ever_ ) { comma::saymore() << "the last client exited" << std::endl; return false; }
     }
     return true;
 }
diff --git a/io/applications/detail/publish.h b/io/applications/detail/publish.h
index 0071dc133..b13d90539 100644
--- a/io/applications/detail/publish.h
+++ b/io/applications/detail/publish.h
@@ -1,5 +1,5 @@
 // Copyright (c) 2011 The University of Sydney
-// Copyright (c) 2024 Vsevolod Vlaskine
+// Copyright (c) 2020 Vsevolod Vlaskine
 // All rights reserved.
 
 #pragma once
@@ -54,6 +54,10 @@ class publish
         void disconnect_all();
         
         bool read( std::istream& input );
+
+        bool write( const std::string& s );
+
+        bool write( const char* buf, unsigned int size );
         
         unsigned int num_clients() const { return num_clients_; }
 
diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 6e209aba2..6b95ceb60 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -24,7 +24,7 @@ general options
 
 stream options
     --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects, the
-                                         the cached records will be sent to it once connected (todo)
+                                         the cached records will be sent to it once connected
     --size,-s: binary input; packet size
     --multiplier,-m: multiplier for packet size, default is 1. The actual packet size will be m * s
     --no-discard: if present, do blocking write to every open stream
@@ -56,7 +56,7 @@ client options
                but might take a while to notice that a client has gone.
                This affects --output-number-of-clients and --on-demand.
 
-output streams: <address>[,<options>]
+output streams: <address>[;<options>]
     <address>
         tcp:<port>: e.g. tcp:1234
         udp:<port>: e.g. udp:1234 (todo)
diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index a743d2cf3..1af2ad4bf 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -42,24 +42,41 @@
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../csv/format.h"
-#include "../publisher.h"
+#include "detail/publish.h"
 
 static void usage()
 {
     std::cerr << R"(
-simple udp client: receives udp packets and outputs them on stdout
+simple udp client: receive udp packets and outputs them on stdout (default)
+                   or to given output streams
 
 rationale: netcat and socat somehow do not work very well with udp
 
-usage: udp-client <port> [<options>]
+usage: udp-client <port> [<output-streams>] [<options>]
 
 options
-    --ascii: output timestamp as ascii; default: 64-bit binary
-    --binary: output timestamp as 64-bit binary; default
+    --ascii; output timestamp as ascii; default: 64-bit binary
+    --binary; output timestamp as 64-bit binary; default
+    --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects, the
+                                         the cached records will be sent to it once connected
     --delimiter=<delimiter>: if ascii and --timestamp, use this delimiter; default: ','
-    --size=<size>: hint of maximum buffer size; default 16384
+    --flush; flush stdout after each packet
+    --no-discard: if present, do blocking write to every open output stream
+    --size=<size>; hint of maximum buffer size; default 16384
     --reuse-addr,--reuseaddr: reuse udp address/port
     --timestamp: output packet timestamp (currently just system time)
+
+output streams: <address>
+    <address>
+        tcp:<port>: e.g. tcp:1234
+        udp:<port>: e.g. udp:1234 (todo)
+        local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket
+        <named pipe name>: named pipe, which will be re-opened, if client reconnects
+        <filename>: a regular file
+        -: stdout
+
+examples
+    todo
 )" << std::endl;
     exit( 0 );
 }
@@ -70,21 +87,23 @@ int main( int argc, char** argv )
     {
         comma::command_line_options options( argc, argv );
         if( argc < 2 || options.exists( "--help,-h" ) ) { usage(); }
-        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--reuse-addr,--reuseaddr,--timestamp", "--delimiter,--size" );
+        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--no-discar,--reuse-addr,--reuseaddr,--timestamp", "--delimiter,--size" );
         COMMA_ASSERT_BRIEF( !unnamed.empty(), "please specify port" );
-        COMMA_ASSERT_BRIEF( unnamed.size() < 3, "expected not more than two unnamed options; got: " << comma::join( unnamed, ' ' ) );
         std::string publish_address = unnamed.size() == 2 ? "-" : unnamed[1];
         COMMA_ASSERT_BRIEF( publish_address == "-", "publish: todo; got: '" << publish_address << "'" );
+        std::vector< std::string > output_streams( unnamed.size() > 1 ? unnamed.size() - 1 : 1 );
+        if( unnamed.size() == 1 ) { output_streams[0] = "-"; }
+        else { std::copy( unnamed.begin() + 1, unnamed.end(), output_streams.begin() ); }
         unsigned short port = boost::lexical_cast< unsigned short >( unnamed[0] );
         bool timestamped = options.exists( "--timestamp" );
         bool binary = !options.exists( "--ascii" );
         char delimiter = options.value( "--delimiter", ',' );
         std::vector< char > packet( options.value( "--size", 16384 ) );
-    #if ( BOOST_VERSION >= 106600 )
-        boost::asio::io_context service;
-    #else
-        boost::asio::io_service service;
-    #endif
+        #if ( BOOST_VERSION >= 106600 )
+            boost::asio::io_context service;
+        #else
+            boost::asio::io_service service;
+        #endif
         boost::asio::ip::udp::socket socket( service );
         socket.open( boost::asio::ip::udp::v4() );
         boost::system::error_code error;
@@ -98,13 +117,17 @@ int main( int argc, char** argv )
         socket.bind( boost::asio::ip::udp::endpoint( boost::asio::ip::udp::v4(), port ), error );
         COMMA_ASSERT_BRIEF( !bool( error ), "failed to bind port " << port );
         #ifdef WIN32
-        if( binary )
-        {
-            _setmode( _fileno( stdout ), _O_BINARY );        
-        }
+        if( binary ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
         static_assert( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ), "expected time of size 8" );
         // todo: comma::io::publisher publisher( publish_address, binary ? comma::io::mode::binary : comma::io::mode::ascii, false, flush );
+        comma::io::detail::publish p( output_streams
+                                    , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
+                                    , !options.exists( "--no-discard" )
+                                    , options.exists( "--flush" )
+                                    , false
+                                    , false
+                                    , options.value( "--cache-size,--cache", 0 ) );
         while( std::cout.good() )
         {
             boost::system::error_code error;
@@ -124,8 +147,7 @@ int main( int argc, char** argv )
                     std::cout << boost::posix_time::to_iso_string( timestamp ) << delimiter;
                 }
             }
-            std::cout.write( &packet[0], size );
-            std::cout.flush();
+            p.write( &packet[0], size );
         }
         return 0;
     }

From 25a6fbd1841f8ab69b1a0c59328a9c58715810b7 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 23 Aug 2024 13:48:47 +1000
Subject: [PATCH 0880/1056] udp-client: default flush behaviour restored for
 now

---
 io/applications/udp-client.cpp | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index 1af2ad4bf..2d37200cc 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -62,6 +62,8 @@ options
     --delimiter=<delimiter>: if ascii and --timestamp, use this delimiter; default: ','
     --flush; flush stdout after each packet
     --no-discard: if present, do blocking write to every open output stream
+    --no-flush; if not present flush stdout after each packet (--no-flush logic to preserve
+                backward-compatible default behaviour)
     --size=<size>; hint of maximum buffer size; default 16384
     --reuse-addr,--reuseaddr: reuse udp address/port
     --timestamp: output packet timestamp (currently just system time)
@@ -98,6 +100,7 @@ int main( int argc, char** argv )
         bool timestamped = options.exists( "--timestamp" );
         bool binary = !options.exists( "--ascii" );
         char delimiter = options.value( "--delimiter", ',' );
+        options.assert_mutually_exclusive( "--flush", "--no-flush" );
         std::vector< char > packet( options.value( "--size", 16384 ) );
         #if ( BOOST_VERSION >= 106600 )
             boost::asio::io_context service;
@@ -124,7 +127,7 @@ int main( int argc, char** argv )
         comma::io::detail::publish p( output_streams
                                     , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
                                     , !options.exists( "--no-discard" )
-                                    , options.exists( "--flush" )
+                                    , options.exists( "--flush" ) || !options.exists( "--no-flush" )
                                     , false
                                     , false
                                     , options.value( "--cache-size,--cache", 0 ) );

From 5d05353ad6ef7b617667dfdbb58be593fff22d35 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 23 Aug 2024 20:13:33 +1000
Subject: [PATCH 0881/1056] udp-client: --flush added; default behaviour
 changed to non-flushing

---
 io/applications/udp-client.cpp | 8 ++------
 1 file changed, 2 insertions(+), 6 deletions(-)

diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index 2d37200cc..64420ea1b 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -62,8 +62,6 @@ options
     --delimiter=<delimiter>: if ascii and --timestamp, use this delimiter; default: ','
     --flush; flush stdout after each packet
     --no-discard: if present, do blocking write to every open output stream
-    --no-flush; if not present flush stdout after each packet (--no-flush logic to preserve
-                backward-compatible default behaviour)
     --size=<size>; hint of maximum buffer size; default 16384
     --reuse-addr,--reuseaddr: reuse udp address/port
     --timestamp: output packet timestamp (currently just system time)
@@ -89,7 +87,7 @@ int main( int argc, char** argv )
     {
         comma::command_line_options options( argc, argv );
         if( argc < 2 || options.exists( "--help,-h" ) ) { usage(); }
-        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--no-discar,--reuse-addr,--reuseaddr,--timestamp", "--delimiter,--size" );
+        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--flush,--no-discard,--reuse-addr,--reuseaddr,--timestamp", "--delimiter,--size" );
         COMMA_ASSERT_BRIEF( !unnamed.empty(), "please specify port" );
         std::string publish_address = unnamed.size() == 2 ? "-" : unnamed[1];
         COMMA_ASSERT_BRIEF( publish_address == "-", "publish: todo; got: '" << publish_address << "'" );
@@ -100,7 +98,6 @@ int main( int argc, char** argv )
         bool timestamped = options.exists( "--timestamp" );
         bool binary = !options.exists( "--ascii" );
         char delimiter = options.value( "--delimiter", ',' );
-        options.assert_mutually_exclusive( "--flush", "--no-flush" );
         std::vector< char > packet( options.value( "--size", 16384 ) );
         #if ( BOOST_VERSION >= 106600 )
             boost::asio::io_context service;
@@ -123,11 +120,10 @@ int main( int argc, char** argv )
         if( binary ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
         static_assert( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ), "expected time of size 8" );
-        // todo: comma::io::publisher publisher( publish_address, binary ? comma::io::mode::binary : comma::io::mode::ascii, false, flush );
         comma::io::detail::publish p( output_streams
                                     , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
                                     , !options.exists( "--no-discard" )
-                                    , options.exists( "--flush" ) || !options.exists( "--no-flush" )
+                                    , options.exists( "--flush" )
                                     , false
                                     , false
                                     , options.value( "--cache-size,--cache", 0 ) );

From ab20e7efcc9e3a6de4b32e0c7ba756139e9b98e3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 26 Aug 2024 10:38:01 +1000
Subject: [PATCH 0882/1056] udp-client: --timestamp: deprecated; --fields:
 plugging in...

---
 io/applications/CMakeLists.txt |  2 +-
 io/applications/udp-client.cpp | 29 ++++++++++++++++++++++-------
 2 files changed, 23 insertions(+), 8 deletions(-)

diff --git a/io/applications/CMakeLists.txt b/io/applications/CMakeLists.txt
index ffde49fd0..811b4c6e6 100644
--- a/io/applications/CMakeLists.txt
+++ b/io/applications/CMakeLists.txt
@@ -49,7 +49,7 @@ if( NOT WIN32 )
     install( TARGETS io-tee RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
     add_executable( udp-client ${dir}/udp-client.cpp ${dir}/detail/publish.h ${dir}/detail/publish.cpp )
-    target_link_libraries( udp-client comma_application comma_name_value comma_io comma_csv comma_base ) # profiler )
+    target_link_libraries( udp-client comma_application comma_name_value comma_io comma_csv comma_base comma_string ) # profiler )
     set_target_properties( udp-client PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS udp-client RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index 64420ea1b..22ded578b 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -42,6 +42,8 @@
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../csv/format.h"
+#include "../../csv/options.h"
+#include "../../string/string.h"
 #include "detail/publish.h"
 
 static void usage()
@@ -60,11 +62,16 @@ options
     --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects, the
                                          the cached records will be sent to it once connected
     --delimiter=<delimiter>: if ascii and --timestamp, use this delimiter; default: ','
+    --fields=<fields>; default=data
+        <fields>
+            t: utc timestamp, same as --timestamp
+            size: data size in bytes
+            data: udp packet data
     --flush; flush stdout after each packet
     --no-discard: if present, do blocking write to every open output stream
     --size=<size>; hint of maximum buffer size; default 16384
     --reuse-addr,--reuseaddr: reuse udp address/port
-    --timestamp: output packet timestamp (currently just system time)
+    --timestamp: output packet timestamp; currently just system time as UTC, little endian
 
 output streams: <address>
     <address>
@@ -76,7 +83,13 @@ output streams: <address>
         -: stdout
 
 examples
-    todo
+    basics
+        udp-client 12435 > raw.bin
+        udp-client 12435 --timestamp > timestamped.bin
+    re-publishing
+        udp-client 12435 tcp::4567 
+        udp-client 12435 tcp::4567 tcp::7890 
+        udp-client 12435 tcp::4567 - > log.bin
 )" << std::endl;
     exit( 0 );
 }
@@ -87,7 +100,7 @@ int main( int argc, char** argv )
     {
         comma::command_line_options options( argc, argv );
         if( argc < 2 || options.exists( "--help,-h" ) ) { usage(); }
-        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--flush,--no-discard,--reuse-addr,--reuseaddr,--timestamp", "--delimiter,--size" );
+        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--flush,--no-discard,--reuse-addr,--reuseaddr,--timestamp", "-.?.*" );
         COMMA_ASSERT_BRIEF( !unnamed.empty(), "please specify port" );
         std::string publish_address = unnamed.size() == 2 ? "-" : unnamed[1];
         COMMA_ASSERT_BRIEF( publish_address == "-", "publish: todo; got: '" << publish_address << "'" );
@@ -95,11 +108,13 @@ int main( int argc, char** argv )
         if( unnamed.size() == 1 ) { output_streams[0] = "-"; }
         else { std::copy( unnamed.begin() + 1, unnamed.end(), output_streams.begin() ); }
         unsigned short port = boost::lexical_cast< unsigned short >( unnamed[0] );
+        options.assert_mutually_exclusive( "--timestamp", "--fields" );
         bool timestamped = options.exists( "--timestamp" );
+        if( timestamped ) { comma::say() << "--timestamped: deprecated (will be maintained for now); use --fields=t,data" << std::endl; }
         bool binary = !options.exists( "--ascii" );
-        char delimiter = options.value( "--delimiter", ',' );
+        comma::csv::options csv( options );
         std::vector< char > packet( options.value( "--size", 16384 ) );
-        #if ( BOOST_VERSION >= 106600 )
+        #if BOOST_VERSION >= 106600
             boost::asio::io_context service;
         #else
             boost::asio::io_service service;
@@ -130,7 +145,7 @@ int main( int argc, char** argv )
         while( std::cout.good() )
         {
             boost::system::error_code error;
-            std::size_t size = socket.receive( boost::asio::buffer( packet ), 0, error );
+            std::size_t size = socket.receive( boost::asio::buffer( &packet[0], packet.size() ), 0, error );
             if( error || size == 0 ) { break; }
             if( timestamped )
             {
@@ -143,7 +158,7 @@ int main( int argc, char** argv )
                 }
                 else
                 {
-                    std::cout << boost::posix_time::to_iso_string( timestamp ) << delimiter;
+                    std::cout << boost::posix_time::to_iso_string( timestamp ) << csv.delimiter;
                 }
             }
             p.write( &packet[0], size );

From e675b2d85ad7c678ad065e790d2a23f60182fdf7 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 26 Aug 2024 13:31:07 +1000
Subject: [PATCH 0883/1056] io-publish: bug fixed: if non-accepting output
 streams, exit accept thread straightaway (otherwise, it took 100% of cpu)
 udp-client: --fields: implemented; publishing to multiple output streams:
 implemented

---
 io/applications/detail/publish.cpp |  1 +
 io/applications/udp-client.cpp     | 83 +++++++++++++++++++-----------
 2 files changed, 55 insertions(+), 29 deletions(-)

diff --git a/io/applications/detail/publish.cpp b/io/applications/detail/publish.cpp
index c13884bc3..d92073334 100644
--- a/io/applications/detail/publish.cpp
+++ b/io/applications/detail/publish.cpp
@@ -138,6 +138,7 @@ void publish::accept_()
             if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
         }
     }
+    if( select.read()().empty() ) { return; }
     while( !is_shutdown_ )
     {
         select.wait( boost::posix_time::millisec( 100 ) ); // todo? make timeout configurable?
diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index 22ded578b..419dc09eb 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -33,12 +34,14 @@
 #include <stdlib.h>
 #endif
 #include <iostream>
+#include <sstream>
 #include <type_traits>
 #include <boost/array.hpp>
 #include <boost/asio/ip/udp.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/noncopyable.hpp>
 #include "../../application/command_line_options.h"
+#include "../../application/signal_flag.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../csv/format.h"
@@ -58,20 +61,22 @@ usage: udp-client <port> [<output-streams>] [<options>]
 
 options
     --ascii; output timestamp as ascii; default: 64-bit binary
-    --binary; output timestamp as 64-bit binary; default
     --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects, the
                                          the cached records will be sent to it once connected
     --delimiter=<delimiter>: if ascii and --timestamp, use this delimiter; default: ','
-    --fields=<fields>; default=data
+    --discard: not present, do blocking write to every open output stream
+    --endl; if --ascii, output '\n' after data
+    --fields=<fields>; default=data; choices (for now): 'data', 't,data', 't,size,data', 'size,data'
+                                                        't', 't,size', 'size' 
         <fields>
             t: utc timestamp, same as --timestamp
             size: data size in bytes
             data: udp packet data
     --flush; flush stdout after each packet
-    --no-discard: if present, do blocking write to every open output stream
-    --size=<size>; hint of maximum buffer size; default 16384
     --reuse-addr,--reuseaddr: reuse udp address/port
-    --timestamp: output packet timestamp; currently just system time as UTC, little endian
+    --size=<size>; hint of maximum buffer size; default 16384
+    --timestamp: deprecated, use --fields; output packet timestamp; currently just system
+                 time as UTC; if binary, little endian uint64
 
 output streams: <address>
     <address>
@@ -100,10 +105,8 @@ int main( int argc, char** argv )
     {
         comma::command_line_options options( argc, argv );
         if( argc < 2 || options.exists( "--help,-h" ) ) { usage(); }
-        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--flush,--no-discard,--reuse-addr,--reuseaddr,--timestamp", "-.?.*" );
+        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--discard,--endl,--flush,--reuse-addr,--reuseaddr,--timestamp", "-.+" );
         COMMA_ASSERT_BRIEF( !unnamed.empty(), "please specify port" );
-        std::string publish_address = unnamed.size() == 2 ? "-" : unnamed[1];
-        COMMA_ASSERT_BRIEF( publish_address == "-", "publish: todo; got: '" << publish_address << "'" );
         std::vector< std::string > output_streams( unnamed.size() > 1 ? unnamed.size() - 1 : 1 );
         if( unnamed.size() == 1 ) { output_streams[0] = "-"; }
         else { std::copy( unnamed.begin() + 1, unnamed.end(), output_streams.begin() ); }
@@ -111,9 +114,24 @@ int main( int argc, char** argv )
         options.assert_mutually_exclusive( "--timestamp", "--fields" );
         bool timestamped = options.exists( "--timestamp" );
         if( timestamped ) { comma::say() << "--timestamped: deprecated (will be maintained for now); use --fields=t,data" << std::endl; }
+        if( options.exists( "--binary" ) ) { comma::say() << "--binary: deprecated, please remove; data deemed binary anyway unless --ascii specified" << std::endl; }
         bool binary = !options.exists( "--ascii" );
-        comma::csv::options csv( options );
-        std::vector< char > packet( options.value( "--size", 16384 ) );
+        bool endl = options.exists( "--endl" );
+        comma::csv::options csv( options, timestamped ? "t,data" : "data" );
+        COMMA_ASSERT_BRIEF(    csv.fields == "data"
+                            || csv.fields == "t,data"
+                            || csv.fields == "t,size,data"
+                            || csv.fields == "size,data"
+                            || csv.fields == "t"
+                            || csv.fields == "t,size"
+                            || csv.fields == "size"
+                          , "unsupported fields: '" << csv.fields << "'" ); // uber-quick and dirty, shameful
+        bool has_time = csv.has_field( "t" ) || timestamped;
+        bool has_size = csv.has_field( "size" );
+        bool has_data = csv.has_field( "data" );
+        static_assert( sizeof( boost::posix_time::ptime ) == 8 ); // quick and dirty
+        unsigned max_size = options.value( "--size", 16384 );
+        std::vector< char > buffer( max_size + 12 ); // quick and dirty
         #if BOOST_VERSION >= 106600
             boost::asio::io_context service;
         #else
@@ -137,31 +155,38 @@ int main( int argc, char** argv )
         static_assert( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ), "expected time of size 8" );
         comma::io::detail::publish p( output_streams
                                     , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
-                                    , !options.exists( "--no-discard" )
-                                    , options.exists( "--flush" )
+                                    , options.exists( "--discard" )
+                                    , options.exists( "--flush" ) || !binary
                                     , false
                                     , false
                                     , options.value( "--cache-size,--cache", 0 ) );
-        while( std::cout.good() )
+        comma::signal_flag is_shutdown;
+        if( binary )
+        {
+            unsigned int offset = ( has_time ? 8 : 0 ) + ( has_size ? 4 : 0 ); // hyper-quick and dirty for now
+            while( !is_shutdown )
+            {
+                std::uint32_t size = socket.receive( boost::asio::buffer( &buffer[offset], max_size ), 0, error );
+                if( error || size == 0 ) { break; } // todo? throw on error?
+                if( has_time ) { comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::to_bin( boost::posix_time::microsec_clock::universal_time(), &buffer[0] ); }
+                if( has_size ) { ::memcpy( &buffer[ has_time ? 8 : 0 ], reinterpret_cast< const char* >( &size ), 4 ); }
+                p.write( &buffer[0], offset + ( has_data ? size : 0 ) );
+            }
+        }
+        else
         {
-            boost::system::error_code error;
-            std::size_t size = socket.receive( boost::asio::buffer( &packet[0], packet.size() ), 0, error );
-            if( error || size == 0 ) { break; }
-            if( timestamped )
+            std::string delimiter;
+            while( !is_shutdown )
             {
-                boost::posix_time::ptime timestamp = boost::posix_time::microsec_clock::universal_time();
-                if( binary )
-                { 
-                    static char buf[ sizeof( comma::int64 ) ];
-                    comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::to_bin( timestamp, buf );
-                    std::cout.write( buf, sizeof( comma::int64 ) );
-                }
-                else
-                {
-                    std::cout << boost::posix_time::to_iso_string( timestamp ) << csv.delimiter;
-                }
+                std::size_t size = socket.receive( boost::asio::buffer( &buffer[0], max_size ), 0, error );
+                if( error || size == 0 ) { break; } // todo? throw on error?
+                std::ostringstream oss;
+                if( has_time ) { oss << boost::posix_time::to_iso_string( boost::posix_time::microsec_clock::universal_time() ); delimiter = csv.delimiter; }
+                if( has_size ) { oss << delimiter << size; delimiter = csv.delimiter; }
+                if( has_data ) { oss << delimiter; oss.write( &buffer[0], size ); if( endl ) { oss << std::endl; } }
+                const std::string& s = oss.str();
+                p.write( &s[0], s.size() );
             }
-            p.write( &packet[0], size );
         }
         return 0;
     }

From c9108693e89606ff7622fe0273049797d532d03e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 26 Aug 2024 14:05:54 +1000
Subject: [PATCH 0884/1056] udp-client: --help: notes on reading multiple udp
 packets on a single receive added

---
 io/applications/udp-client.cpp | 15 ++++++++++++++-
 1 file changed, 14 insertions(+), 1 deletion(-)

diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index 419dc09eb..5394fd2c3 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -59,6 +59,17 @@ rationale: netcat and socat somehow do not work very well with udp
 
 usage: udp-client <port> [<output-streams>] [<options>]
 
+attention! it is possible to receive several packets udp packets in a single
+           read from the udp socket; the way to deal with it:
+               - if fixed-width data is published on the UDP socket, use:
+                 udp-client ... --size=<expected-fixed-size>
+               - if variable-size data is published on the UDP socket, the data
+                 receiver will have to parse the packets depending on communication
+                 protocol or nature of the data
+               - if using udp-client --fields=size,data or --fields=t,size,data,
+                 size field will have the total size in bytes for all UDP packets
+                 read from the UDP socket in a single receive call
+
 options
     --ascii; output timestamp as ascii; default: 64-bit binary
     --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects, the
@@ -74,7 +85,9 @@ options
             data: udp packet data
     --flush; flush stdout after each packet
     --reuse-addr,--reuseaddr: reuse udp address/port
-    --size=<size>; hint of maximum buffer size; default 16384
+    --size=<size>; default=16384; hint of maximum buffer size in bytes, if using timestamped
+                                  fixed-width data, use --size=<fixed-width-size>, otherwise
+                                  multiple packets may be read from the UDP socket at once
     --timestamp: deprecated, use --fields; output packet timestamp; currently just system
                  time as UTC; if binary, little endian uint64
 

From 58a1aa9dc3bdff532024dfae40c0a23646939928 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 26 Aug 2024 14:10:03 +1000
Subject: [PATCH 0885/1056] udp-client: --help: examples updated

---
 io/applications/udp-client.cpp | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index 5394fd2c3..95f5a5630 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -101,9 +101,13 @@ output streams: <address>
         -: stdout
 
 examples
+    publishing on udp
+        ( echo a; echo b; echo c ) | socat - udp:localhost::12345
     basics
         udp-client 12435 > raw.bin
-        udp-client 12435 --timestamp > timestamped.bin
+        udp-client 12435 --fields=t,data > timestamped.bin
+        udp-client 12435 --fields=t,size,data > timestamp.size.bin
+        udp-client 12435 --fields=t,size,data --ascii > timestamp.size.csv
     re-publishing
         udp-client 12435 tcp::4567 
         udp-client 12435 tcp::4567 tcp::7890 

From 0581bce276106c9060d363ae604e6d15e4446a7f Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 28 Aug 2024 12:28:01 +1000
Subject: [PATCH 0886/1056] csv-random: sample, shuffle: a couple of bugs
 fixed; make: pseudo-random alias added

---
 csv/applications/csv-random.cpp | 57 ++++++++++++++++++++++-----------
 1 file changed, 39 insertions(+), 18 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 68c492caa..7c03933f6 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -16,6 +16,21 @@
 #include "../../csv/stream.h"
 #include "../../string/string.h"
 
+// todo
+// - seed=true-random
+// - true-random
+//   - --type=f: fix types (should work, but they don't)
+//   - --type=ui,ui: fix types (should work, but they don't)
+// - make, true-random: --head=<n>
+// - sample, shuffle
+//   - examples
+// - regression test!
+// - --help vs --help --verbose
+// ? wiki: tutorials
+//   - csv-random
+//   - csv-repeat: --pace etc
+//   - make tutorials searchable
+
 static void usage( bool verbose )
 {
     std::cerr << "\nrandom operations on input stream";
@@ -23,16 +38,18 @@ static void usage( bool verbose )
     std::cerr << "\nusage: csv-random <operation> [<options>]";
     std::cerr << "\n";
     std::cerr << "\n    where <operation> is one of:";
-    std::cerr << "\n        make: output pseudo-random numbers";
+    std::cerr << "\n        pseudo-random, make: output pseudo-random numbers";
     std::cerr << "\n        true-random: output non-deterministic uniformly distributed numbers";
     std::cerr << "\n        sample: output a uniformly distributed sample of input records";
     std::cerr << "\n        shuffle: output input records in pseudo-random order";
     std::cerr << '\n';
     std::cerr << "\noptions";
-    std::cerr << "\n    --seed=[<unsigned int>]; random seed";
+    std::cerr << "\n    --seed=[<unsigned int>]; random seed:";
+    std::cerr << "\n        <n>: integer seed for pseudo-random generator";
+    std::cerr << "\n        'true-random': todo: true random number to use as seed";
     std::cerr << '\n';
     std::cerr << "\noperations";
-    std::cerr << "\n    make: output pseudo-random numbers";
+    std::cerr << "\n    pseudo-random, make: output pseudo-random numbers";
     std::cerr << '\n';
     std::cerr << "\n        usage: csv-random make [<options>] > random.csv";
     std::cerr << "\n               cat input.csv | csv-random make --append [<options>]";
@@ -71,6 +88,7 @@ static void usage( bool verbose )
     std::cerr << "\n                    specify --binary=<format> for stdin input";
     std::cerr << "\n            --type=<type>; default=ui; todo: supported values: ui;";
     std::cerr << "\n                    e.g: --type=3ui; --type=ui,ui,ui; etc";
+    std::cerr << "\n                    todo! support other types, just ask";
     std::cerr << '\n';
     std::cerr << "\n        example";
     std::cerr << "\n            > csv-random make --seed=$( csv-random true-random --once )";
@@ -88,7 +106,7 @@ static void usage( bool verbose )
     std::cerr << "\n                where <engine> is one of: minstd_rand0, minstd_rand, mt19937,";
     std::cerr << "\n                    mt19937_64 (default), ranlux24_base, ranlux48_base,";
     std::cerr << "\n                    ranlux24, ranlux48, knuth_b, default_random_engine";
-    std::cerr << "\n            --fields=[<fields>]; if 'block' field present sample each block,";
+    std::cerr << "\n            --fields=[<fields>]; if 'block' field present, sample each block,";
     std::cerr << "\n                    otherwise read whole input and then sample";
     std::cerr << "\n            --ratio=[<ratio>]; portion of each block to output,";
     std::cerr << "\n                    if block is too small, nothing will be output for it";
@@ -136,8 +154,7 @@ namespace comma { namespace applications { namespace random { namespace shuffle
 
 struct input
 {
-    comma::uint32 block;
-    input() : block( 0 ) {}
+    comma::uint32 block{0};
 };
 
 } } } } // namespace comma { namespace applications { namespace random { namespace shuffle {
@@ -344,21 +361,25 @@ template < typename Engine > static int run_impl( const comma::command_line_opti
     if( sliding_window ) { std::cerr << "csv-random shuffle: --sliding-window: todo" << std::endl; return 1; }
     if( sliding_window ) { std::cerr << "csv-random shuffle: expected either block field or --sliding-window; got both" << std::endl; return 1; }
     comma::csv::input_stream< input > is( std::cin, ::csv );
-    comma::uint32 block = 0;
+    bool has_block = ::csv.has_field( "block" );
+    comma::uint32 block{0};
     while( is.ready() || std::cin.good() )
     {
         const input* p = is.read();
-        if( !p || p->block != block )
+        if( !p || ( has_block && p->block != block ) )
         {
-            std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
-            indices.resize( records.size() ); // quick and dirty
-            for( unsigned int i = 0; i < indices.size(); ++i ) { indices[i] = i; }
-            std::random_shuffle( indices.begin(), indices.end(), [&]( int ) -> int { return distribution( engine ); } ); // quick and dirty, watch performance
-            unsigned int s = sample ? ( ratio ? int( records.size() * *ratio ) : size ) : records.size();
-            if( sample ) { std::sort( indices.begin(), indices.begin() + s ); } // quick and dirty
-            for( unsigned int i = 0; i < s; ++i ) { std::cout.write( &records[indices[i]][0], records[indices[i]].size() ); }
-            records.clear();
-            if( ::csv.flush ) { std::cout.flush(); }
+            if( !records.empty() )
+            {
+                // std::shuffle draws from engine directly and yields a uniform permutation; the generator formerly passed to std::random_shuffle ignored its bound argument
+                indices.resize( records.size() ); // quick and dirty
+                for( unsigned int i = 0; i < indices.size(); ++i ) { indices[i] = i; }
+                std::shuffle( indices.begin(), indices.end(), engine ); // quick and dirty, watch performance
+                unsigned int s = sample ? ( ratio ? int( records.size() * *ratio ) : size ) : records.size();
+                if( sample ) { std::sort( indices.begin(), indices.begin() + s ); } // quick and dirty
+                for( unsigned int i = 0; i < s; ++i ) { std::cout.write( &records[indices[i]][0], records[indices[i]].size() ); }
+                records.clear();
+                if( ::csv.flush ) { std::cout.flush(); }
+            }
             if( p ) { block = p->block; }
         }
         if( !p ) { break; }
@@ -487,7 +508,7 @@ int main( int ac, char** av )
         ::seed = options.optional< comma::uint32 >( "--seed" );
         ::verbose = options.exists( "--verbose,-v" );
         std::string operation = unnamed[0];
-        if( operation == "make" ) { return comma::applications::random::make::run( options ); }
+        if( operation == "make" || operation == "pseudo-random" ) { return comma::applications::random::make::run( options ); }
         if( operation == "sample" ) { return comma::applications::random::sample::run( options ); }
         if( operation == "shuffle" ) { return comma::applications::random::shuffle::run( options ); }
         if( operation == "true-random" ) { return comma::applications::random::true_random::run( options ); }

From 0c47e081385bee80286adb8b81e970a404fba75f Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 28 Aug 2024 12:55:01 +1000
Subject: [PATCH 0887/1056] csv-random: true-random: --range implemented

---
 csv/applications/csv-random.cpp | 23 ++++++++++++++++-------
 1 file changed, 16 insertions(+), 7 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 7c03933f6..2d6aeb476 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -12,15 +12,13 @@
 
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
+#include "../../base/none.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../string/string.h"
 
 // todo
 // - seed=true-random
-// - true-random
-//   - --type=f: fix types (should work, but they don't)
-//   - --type=ui,ui: fix types (should work, but they don't)
 // - make, true-random: --head=<n>
 // - sample, shuffle
 //   - examples
@@ -85,10 +83,12 @@ static void usage( bool verbose )
     std::cerr << "\n            --append; append random number to stdin input";
     std::cerr << "\n            --once; output random number only once";
     std::cerr << "\n            --output-binary; output random numbers as binary";
-    std::cerr << "\n                    specify --binary=<format> for stdin input";
+    std::cerr << "\n                specify --binary=<format> for stdin input";
+    std::cerr << "\n            --range=[<min>,<max>]; desired value range";
+    std::cerr << "\n                if multiple output values, e.g: --type=f,ui,ub";
+    std::cerr << "\n                --range will be applied to all output values";
     std::cerr << "\n            --type=<type>; default=ui; todo: supported values: ui;";
-    std::cerr << "\n                    e.g: --type=3ui; --type=ui,ui,ui; etc";
-    std::cerr << "\n                    todo! support other types, just ask";
+    std::cerr << "\n                e.g: --type=3ui; --type=ui,ui,ui; etc";
     std::cerr << '\n';
     std::cerr << "\n        example";
     std::cerr << "\n            > csv-random make --seed=$( csv-random true-random --once )";
@@ -430,11 +430,20 @@ static int run_impl( const comma::command_line_options& options, std::size_t cou
     std::random_device rd;
     const bool binary = options.exists( "--output-binary" ) || ::csv.binary();
     const bool flush = options.exists( "--flush" ) || ::csv.flush;
+    typedef std::pair< double, double > pair_t;
+    boost::optional< pair_t > range = comma::silent_none< pair_t >();
+    double factor{1};
+    if( options.exists( "--range" ) )
+    {
+        range = comma::csv::ascii< pair_t >().get( options.value< std::string >( "--range" ) );
+        factor = ( range->second - range->first ) / ( rd.max() - rd.min() );
+    }
     auto output_line_to_stdout = [&]( std::string&& initial_delimiter )
     {
         for( std::size_t i = 0; i < count; ++i )
         {
-            const T r = rd();
+            const auto raw = rd(); // keep the device value at full width: scaling to --range must happen before narrowing to T
+            T r = range ? static_cast< T >( range->first + ( raw - rd.min() ) * factor ) : static_cast< T >( raw );
             if( binary ) { std::cout.write( reinterpret_cast< const char* >( &r ), sizeof( T ) ); }
             else { std::cout << initial_delimiter << type_traits< T >::cast( r ); initial_delimiter = ::csv.delimiter; }
         }

From 17c20c5669389fc10c47d90236233c998a90d25b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Aug 2024 10:54:46 +1000
Subject: [PATCH 0888/1056] csv-split: --help brushed up

---
 csv/applications/csv-split.cpp | 163 +++++++++++++++++----------------
 1 file changed, 82 insertions(+), 81 deletions(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index aeb731248..1512a6063 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -15,7 +15,7 @@
 //
 // NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
 // GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED
 // WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
 // MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 // DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
@@ -103,85 +103,86 @@ int main( int argc, char** argv )
         boost::program_options::notify( vm );
         if ( vm.count( "help" ) || vm.count( "long-help" ) )
         {
-            std::cerr << "\n";
-            std::cerr << "read from stdin by packet or by line and split into files\n";
-            std::cerr << "files are named by field value or time (if split by time)\n";
-            std::cerr << "if splitting by id, input can also be split into streams\n";
-            std::cerr << "\n";
-            std::cerr << "usage: csv-split [options] [outputs]*\n";
-            std::cerr << "\n";
+            std::cerr << R"(
+read from stdin by packet or by line and split into files
+files are named by field value or time (if split by time)
+if splitting by id, input can also be split into streams
+
+usage: csv-split [options] [outputs]*
+)";
             std::cerr << description;
-            std::cerr << "\n";
-            std::cerr << "data is split by one of the following fields (listed in descending precedence)\n";
-            std::cerr << "    block: split on the block number change\n";
-            std::cerr << "    id:    split by id (same as block, except does not have to be contiguous\n";
-            std::cerr << "                        with the price of worse performance)\n";
-            std::cerr << "    t:     if present, use timestamp from the packet; if absent, use system time\n";
-            std::cerr << "\n";
-            std::cerr << "examples:\n";
-            std::cerr << "    --- split by block field, output to files ---\n";
-            std::cerr << "    output records for each block to a separate file\n";
-            std::cerr << "    on change of block, open a new file, e.g. 0.csv, 1.csv, etc\n";
-            std::cerr << "\n";
-            std::cerr << "    with default filenames:\n";
-            std::cerr << "    ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block\n";
-            std::cerr << "\n";
-            std::cerr << "    with specified filenames:\n";
-            std::cerr << "    ( echo 0; echo 1; echo 2 ) \\\n";
-            std::cerr << "        | csv-split --fields block --files <( echo a; echo b; echo c )\n";
-            std::cerr << "\n";
-            std::cerr << "    with filenames mapped to block ids:\n";
-            std::cerr << "    ( echo 0; echo 1; echo 2 ) \\\n";
-            std::cerr << "        | csv-split --fields block \\\n";
-            std::cerr << "              --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'\n";
-            std::cerr << "\n";
-            std::cerr << "    --- split by id field, output to files ---\n";
-            std::cerr << "    for each id value, output records with this id to a separate file,\n";
-            std::cerr << "    e.g. 0.csv, 1.csv, etc\n";
-            std::cerr << "\n";
-            std::cerr << "    with default filenames:\n";
-            std::cerr << "    ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields id\n";
-            std::cerr << "\n";
-            std::cerr << "    with specified filenames:\n";
-            std::cerr << "    ( echo 0; echo 1; echo 2 ) \\\n";
-            std::cerr << "        | csv-split --fields id --files <( echo a; echo b; echo c )\n";
-            std::cerr << "\n";
-            std::cerr << "    with filenames mapped to block ids:\n";
-            std::cerr << "    ( echo 0; echo 1; echo 2 ) \\\n";
-            std::cerr << "        | csv-split --fields id \\\n";
-            std::cerr << "              --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'\n";
-            std::cerr << "\n";
-            std::cerr << "    --- split by t field, output to files ---\n";
-            std::cerr << "    separate records into different time periods, outputting in separate files\n";
-            std::cerr << "    ( echo 20170101T000001,a; echo 20170101T000003,b; echo 20170101T000007,c ) \\\n";
-            std::cerr << "        | csv-split --fields=t --period=4\n";
-            std::cerr << "\n";
-            std::cerr << "    --- split by id field, output to streams ---\n";
-            std::cerr << "    if output streams (see example below) are present on the command line and \n";
-            std::cerr << "    id field present in --fields output records with the given ids to the\n";
-            std::cerr << "    corresponding streams, while outputing the rest into files\n";
-            std::cerr << "\n";
-            std::cerr << "    records with ids for which output stream is not specified will be discarded,\n";
-            std::cerr << "    unless ... stream is specified:\n";
-            std::cerr << "\n";
-            std::cerr << "    outputs: <keys>;<stream>; send records with given set of ids to this stream\n";
-            std::cerr << "        keys:\n";
-            std::cerr << "            <id>[,<id>]*: comma-separated list of ids, e.g: '5' or '2,5,7', etc\n";
-            std::cerr << "            ... (three dots): send to this stream all the records with ids\n";
-            std::cerr << "                for which no other stream is specified (see example below)\n";
-            std::cerr << "        stream:\n";
-            std::cerr << "            tcp:<port>: e.g. tcp:1234\n";
-            std::cerr << "            udp:<port>: e.g. udp:1234 (todo)\n";
-            std::cerr << "            local:<name>: linux/unix local server socket\n";
-            std::cerr << "                          e.g. local:./tmp/my_socket\n";
-            std::cerr << "            <named pipe name>: named pipe, re-opened if client reconnects\n";
-            std::cerr << "            <filename>: a regular file\n";
-            std::cerr << "\n";
-            std::cerr << "        ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) \\\n";
-            std::cerr << "            | csv-split --fields id \"0,1;tcp:5999\" \"...;local:/tmp/named_fifo\"\n";
-            std::cerr << "        ( echo 0,a; echo 1,b ) | csv-split --fields id --files \\\n";
-            std::cerr << "                  <( echo '1,one.csv'; echo '0,zero.csv' )';fields=id,filename'\n";
-            std::cerr << std::endl;
+            std::cerr << R"(
+data is split by one of the following fields (listed in descending precedence)
+    block: split on the block number change
+    id:    split by id (same as block, except does not have to be contiguous
+                        with the price of worse performance)
+    t:     if present, use timestamp from the packet; if absent, use system time
+
+examples:
+    --- split by block field, output to files ---
+    output records for each block to a separate file
+    on change of block, open a new file, e.g. 0.csv, 1.csv, etc
+
+    with default filenames:
+    ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block
+
+    with specified filenames:
+    ( echo 0; echo 1; echo 2 ) \
+        | csv-split --fields block --files <( echo a; echo b; echo c )
+
+    with filenames mapped to block ids:
+    ( echo 0; echo 1; echo 2 ) \
+        | csv-split --fields block \
+              --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'
+
+    --- split by id field, output to files ---
+    for each id value, output records with this id to a separate file,
+    e.g. 0.csv, 1.csv, etc
+
+    with default filenames:
+    ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields id
+
+    with specified filenames:
+    ( echo 0; echo 1; echo 2 ) \
+        | csv-split --fields id --files <( echo a; echo b; echo c )
+
+    with filenames mapped to block ids:
+    ( echo 0; echo 1; echo 2 ) \
+        | csv-split --fields id \
+              --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'
+
+    --- split by t field, output to files ---
+    separate records into different time periods, outputting in separate files
+    ( echo 20170101T000001,a; echo 20170101T000003,b; echo 20170101T000007,c ) \
+        | csv-split --fields=t --period=4
+
+    --- split by id field, output to streams ---
+    if output streams (see example below) are present on the command line and 
+    id field present in --fields output records with the given ids to the
+    corresponding streams, while outputing the rest into files
+
+    records with ids for which output stream is not specified will be discarded,
+    unless ... stream is specified:
+
+    outputs: <keys>;<stream>; send records with given set of ids to this stream
+        keys:
+            <id>[,<id>]*: comma-separated list of ids, e.g: '5' or '2,5,7', etc
+            ... (three dots): send to this stream all the records with ids
+                for which no other stream is specified (see example below)
+        stream:
+            tcp:<port>: e.g. tcp:1234
+            udp:<port>: e.g. udp:1234 (todo)
+            local:<name>: linux/unix local server socket
+                          e.g. local:./tmp/my_socket
+            <named pipe name>: named pipe, re-opened if client reconnects
+            <filename>: a regular file
+
+        ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) \
+            | csv-split --fields id "0,1;tcp:5999" "...;local:/tmp/named_fifo"
+        ( echo 0,a; echo 1,b ) | csv-split --fields id --files \
+                  <( echo '1,one.csv'; echo '0,zero.csv' )';fields=id,filename'
+
+)";
             return 0;
         }
         csv = comma::csv::program_options::get( vm );
@@ -202,7 +203,7 @@ int main( int argc, char** argv )
         else { run< comma::uint32 >(); }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << argv[0] << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << argv[0] << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }

From 6b1249e30042113a68fb3dbe51b01559ac117c49 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Aug 2024 11:00:46 +1000
Subject: [PATCH 0889/1056] csv-split: brushed up

---
 csv/applications/csv-split.cpp | 36 ++++++++++++++++------------------
 1 file changed, 17 insertions(+), 19 deletions(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index 1512a6063..fe8863bfd 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -51,7 +51,7 @@ static std::string files;
 static std::string default_filename;
 static std::string timestamps;
 
-template < typename T > static void run()
+template < typename T > static int run()
 {
     comma::csv::applications::split< T > split( duration, suffix, csv, streams, passthrough, files, default_filename, timestamps );
     if( size == 0 )
@@ -63,19 +63,18 @@ template < typename T > static void run()
             if( line.empty() ) { break; }
             split.write( line );
         }
+        return 0;
     }
-    else
+    #ifdef WIN32
+        _setmode( _fileno( stdin ), _O_BINARY );
+    #endif
+    std::vector< char > packet( size );
+    while( std::cin.good() && !std::cin.eof() )
     {
-        #ifdef WIN32
-            _setmode( _fileno( stdin ), _O_BINARY );
-        #endif
-        std::vector< char > packet( size );
-        while( std::cin.good() && !std::cin.eof() )
-        {
-            std::cin.read( &packet[0], size );
-            if( std::cin.gcount() > 0 ) { split.write( &packet[0], size ); }
-        }
+        std::cin.read( &packet[0], size );
+        if( std::cin.gcount() > 0 ) { split.write( &packet[0], size ); }
     }
+    return 0;
 }
 
 int main( int argc, char** argv )
@@ -186,22 +185,21 @@ data is split by one of the following fields (listed in descending precedence)
             return 0;
         }
         csv = comma::csv::program_options::get( vm );
-        if( vm.count( "period" ) && vm.count( "timestamps" ) ) { std::cerr << "csv-split: --period and --timestamps are mutually exclusive (todo? combine them? just ask)" << std::endl; return 1; }
-        if( !default_filename.empty() ) { std::cerr << "csv-split: --default-filename: todo, just ask" << std::endl; }
+        COMMA_ASSERT_BRIEF( !vm.count( "period" ) || !vm.count( "timestamps" ), "csv-split: --period and --timestamps are mutually exclusive (todo? combine them? just ask)" );
+        COMMA_ASSERT_BRIEF( default_filename.empty(), "csv-split: --default-filename: todo, just ask" )
         if( csv.binary() ) { size = csv.format().size(); }
         bool id_is_string = vm.count( "string" );
         bool id_is_time = vm.count( "time" );
         passthrough = vm.count("passthrough");
-        if( id_is_string && id_is_time ) { std::cerr << "csv-split: --string and --time are mutually exclusive" << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( !id_is_string || !id_is_time, "csv-split: --string and --time are mutually exclusive" );
         if( period > 0 ) { duration = boost::posix_time::microseconds( static_cast< unsigned int >( period * 1e6 )); }
         if( extension.empty() ) { suffix = csv.binary() || size > 0 ? ".bin" : ".csv"; }
         else { suffix += "."; suffix += extension; }
         streams = boost::program_options::collect_unrecognized( parsed.options, boost::program_options::include_positional );
-        if( !streams.empty() && ( csv.has_field( "block" ) || id_is_time ) ) { std::cerr << "publisher streams are not compatible with splitting by block or timestamp." << std::endl; return 1; }
-        if( id_is_string ) { run< std::string >(); }
-        else if( id_is_time ) { run< boost::posix_time::ptime >(); }
-        else { run< comma::uint32 >(); }
-        return 0;
+        COMMA_ASSERT_BRIEF( !( !streams.empty() && ( csv.has_field( "block" ) || id_is_time ) ), "publisher streams are not compatible with splitting by block or timestamp." );
+        if( id_is_string ) { return run< std::string >(); }
+        if( id_is_time ) { return run< boost::posix_time::ptime >(); }
+        return run< comma::uint32 >();
     }
     catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
     catch( ... ) { comma::say() << "unknown exception" << std::endl; }

From 8e5868b316d5a74da372120c1029b4427e0e8d9a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Aug 2024 11:15:28 +1000
Subject: [PATCH 0890/1056] csv-split: further brush-up

---
 csv/applications/split/split.cpp | 27 +++++++++------------------
 csv/traits.h                     |  5 +----
 2 files changed, 10 insertions(+), 22 deletions(-)

diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 69acfdb43..413eaad16 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -255,8 +255,7 @@ bool split< T >::published_on_stream( const char* data, unsigned int size )
     return true;
 }
 
-template < typename T >
-void split< T >::write( const char* data, unsigned int size )
+template < typename T > void split< T >::write( const char* data, unsigned int size )
 {
     mode_ = std::ofstream::out | std::ofstream::binary;
     if( binary_ ) { binary_->get( current_, data ); }
@@ -273,8 +272,7 @@ void split< T >::write( const char* data, unsigned int size )
     if ( pass_ ) { std::cout.write( data, size ); std::cout.flush(); }
 }
 
-template < typename T >
-void split< T >::write( std::string line )
+template < typename T > void split< T >::write( std::string line )
 {
     mode_ = std::ofstream::out; // quick and dirty
     if( ascii_ ) { ascii_->get( current_, line ); }
@@ -293,8 +291,7 @@ void split< T >::write( std::string line )
     if ( pass_ ) { std::cout.write( &line[0], line.size() ); /*std::cout.put('\n');*/ std::cout.flush(); }
 }
 
-template < typename T >
-std::ofstream* split< T >::ofstream_by_time_()
+template < typename T > std::ofstream* split< T >::ofstream_by_time_()
 {
     bool changed = period_ ? !last_ || current_.timestamp > last_->timestamp + *period_ : timestamps_stream_seek_( current_.timestamp );
     if( !last_ || changed )
@@ -308,8 +305,7 @@ std::ofstream* split< T >::ofstream_by_time_()
     return &file_;
 }
 
-template < typename T >
-std::ofstream* split< T >::ofstream_by_block_()
+template < typename T > std::ofstream* split< T >::ofstream_by_block_()
 {
     static comma::uint32 id = 0;
     if( !last_ || last_->block != current_.block )
@@ -322,11 +318,11 @@ std::ofstream* split< T >::ofstream_by_block_()
             if( it == filenames_.end() ) { return nullptr; }
             filename = it->second;
             const auto& dirname = comma::filesystem::path( filename ).parent_path();
-            if( !( dirname.empty() || comma::filesystem::is_directory( dirname ) || comma::filesystem::create_directories( dirname ) ) ) { COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << filename << "'" ); }
+            COMMA_ASSERT( dirname.empty() || comma::filesystem::is_directory( dirname ) || comma::filesystem::create_directories( dirname ), "failed to create directory '" << dirname << "' for file: '" << filename << "'" )
         }
         if( filename.empty() ) { filename = boost::lexical_cast< std::string >( current_.block ) + suffix_; }
         file_.open( &filename[0], mode_ );
-        if( !file_.is_open() ) { COMMA_THROW( comma::exception, "failed to open '" << filename << "'" ); }
+        COMMA_ASSERT( file_.is_open(), "failed to open '" << filename << "'" );
         last_ = current_;
         ++id;
     }
@@ -345,11 +341,9 @@ template <> std::string find_< comma::uint32, std::unordered_map< comma::uint32,
     return it == m.end() ? std::string() : it->second;
 }
 
-template < typename T >
-std::string split< T >::filename_from_id_( const T& id ) { return filenames_.empty() ? to_string( id ) + suffix_ : find_( filenames_, id ); }
+template < typename T > std::string split< T >::filename_from_id_( const T& id ) { return filenames_.empty() ? to_string( id ) + suffix_ : find_( filenames_, id ); }
 
-template < typename T >
-std::ofstream* split< T >::ofstream_by_id_()
+template < typename T > std::ofstream* split< T >::ofstream_by_id_()
 {
     typename Files::iterator it = files_.find( current_.id );
     if( it == files_.end() )
@@ -369,10 +363,7 @@ std::ofstream* split< T >::ofstream_by_id_()
         std::string name = filename_from_id_( current_.id );
         if( name.empty() ) { return nullptr; }
         const auto& dirname = comma::filesystem::path( name ).parent_path();
-        if( !( dirname.empty() || comma::filesystem::is_directory( dirname ) || comma::filesystem::create_directories( dirname ) ) )
-        {
-            COMMA_THROW( comma::exception, "failed to create directory '" << dirname << "' for file: '" << name << "'" );
-        }
+        COMMA_ASSERT( dirname.empty() || comma::filesystem::is_directory( dirname ) || comma::filesystem::create_directories( dirname ), "failed to create directory '" << dirname << "' for file: '" << name << "'" );
         std::shared_ptr< std::ofstream > stmp( new std::ofstream( &name[0], mode ) );
         it = files_.insert( std::make_pair( current_.id, stmp ) ).first;
     }
diff --git a/csv/traits.h b/csv/traits.h
index 2f444a01e..35cc0ce40 100644
--- a/csv/traits.h
+++ b/csv/traits.h
@@ -2,8 +2,7 @@
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_TRAITS_H_
-#define COMMA_CSV_TRAITS_H_
+#pragma once
 
 #include "../csv/options.h"
 #include "../visiting/traits.h"
@@ -48,5 +47,3 @@ template <> struct traits< comma::csv::options >
 };
 
 } } // namespace comma { namespace visiting {
-
-#endif // COMMA_CSV_TRAITS_H_

From 4c76648b46397d356d361675743bbb9cc8b86f93 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Aug 2024 12:13:04 +1000
Subject: [PATCH 0891/1056] csv-split: --fields=,,size,, implemented;
 rudimental test added

---
 csv/applications/csv-split.cpp   | 52 +++++++++++++++++++++++---------
 csv/applications/split/split.cpp | 19 +++++-------
 csv/applications/split/split.h   |  5 ++-
 csv/test/csv-split/size/expected |  8 +++++
 csv/test/csv-split/size/input    |  2 ++
 5 files changed, 59 insertions(+), 27 deletions(-)
 create mode 100644 csv/test/csv-split/size/expected
 create mode 100644 csv/test/csv-split/size/input

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index fe8863bfd..9284dc048 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -37,6 +37,7 @@
 
 #include <boost/optional.hpp>
 #include <boost/program_options.hpp>
+#include "../../application/command_line_options.h"
 #include "../../csv/impl/program_options.h"
 #include "../../csv/traits.h"
 #include "split/split.h"
@@ -68,16 +69,31 @@ template < typename T > static int run()
     #ifdef WIN32
         _setmode( _fileno( stdin ), _O_BINARY );
     #endif
-    std::vector< char > packet( size );
+    bool has_size = csv.has_field( "size" );
+    std::vector< char > buffer( size > 32768 ? size : 32768 ); // quick and dirty; never smaller than one fixed-width record, which is read into buffer before any resize
+    typedef comma::csv::applications::input< T > input_t;
+    comma::csv::binary< input_t > binary( csv );
+    input_t header;
     while( std::cin.good() && !std::cin.eof() )
     {
-        std::cin.read( &packet[0], size );
-        if( std::cin.gcount() > 0 ) { split.write( &packet[0], size ); }
+        std::cin.read( &buffer[0], size ); // fixed-width part of the record
+        if( std::cin.gcount() == 0 ) { break; } // clean end of input
+        COMMA_ASSERT_BRIEF( std::cin.gcount() == int( size ), "expected " << size << " bytes; got: " << std::cin.gcount() );
+        unsigned int total_size = size;
+        if( has_size )
+        {
+            binary.get( header, &buffer[0] ); // size field gives the length of the payload following the fixed-width part
+            total_size += header.size;
+            if( buffer.size() < total_size ) { buffer.resize( total_size ); }
+            std::cin.read( buffer.data() + size, header.size ); // pointer arithmetic: valid even if payload is empty and buffer is exactly size bytes
+            COMMA_ASSERT_BRIEF( std::cin.gcount() == int( header.size ), "expected " << header.size << " bytes; got: " << std::cin.gcount() );
+        }
+        split.write( &buffer[0], total_size );
     }
     return 0;
 }
 
-int main( int argc, char** argv )
+int main( int ac, char** av )
 {
     try
     {
@@ -97,8 +113,8 @@ int main( int argc, char** argv )
             ( "timestamps", boost::program_options::value< std::string >( &timestamps ), "<filename>[;<csv options>]: split by timestamps (assuming both input and timestamps are in ascending order)" );
         description.add( comma::csv::program_options::description() );
         boost::program_options::variables_map vm;
-        boost::program_options::store( boost::program_options::parse_command_line( argc, argv, description), vm );
-        boost::program_options::parsed_options parsed = boost::program_options::command_line_parser( argc, argv ).options( description ).allow_unregistered().run();
+        boost::program_options::store( boost::program_options::parse_command_line( ac, av, description ), vm );
+        boost::program_options::parsed_options parsed = boost::program_options::command_line_parser( ac, av ).options( description ).allow_unregistered().run();
         boost::program_options::notify( vm );
         if ( vm.count( "help" ) || vm.count( "long-help" ) )
         {
@@ -111,11 +127,18 @@ usage: csv-split [options] [outputs]*
 )";
             std::cerr << description;
             std::cerr << R"(
-data is split by one of the following fields (listed in descending precedence)
-    block: split on the block number change
-    id:    split by id (same as block, except does not have to be contiguous
-                        with the price of worse performance)
-    t:     if present, use timestamp from the packet; if absent, use system time
+
+--fields=<fields>; <fields>: t,block,id,size
+    data is split by one of the following fields (listed in descending precedence)
+        block: split on the block number change
+        id   : split by id (same as block, except does not have to be contiguous
+                           with the price of worse performance)
+        t    : if present, use timestamp from the packet; if absent, use system time
+    size: if present, assume that fixed-width data is followed by <n> bytes
+          where <n> is the value of the size field; used only in binary mode
+          e.g: for the command: csv-split --fields t,,,size --binary=t,3ui,2f
+          the record has a fixed part (header) with format t,3ui,2f followed
+          by variable payload of size read from 'size' field (which can be 0 as well)
 
 examples:
     --- split by block field, output to files ---
@@ -128,7 +151,7 @@ data is split by one of the following fields (listed in descending precedence)
     with specified filenames:
     ( echo 0; echo 1; echo 2 ) \
         | csv-split --fields block --files <( echo a; echo b; echo c )
-
+
     with filenames mapped to block ids:
     ( echo 0; echo 1; echo 2 ) \
         | csv-split --fields block \
@@ -163,7 +186,7 @@ data is split by one of the following fields (listed in descending precedence)
     records with ids for which output stream is not specified will be discarded,
     unless ... stream is specified:
 
-    outputs: <keys>;<stream>; send records with given set of ids to this stream
+    outputs: <keys>;<stream>; send records with given set of ids to this stream
         keys:
             <id>[,<id>]*: comma-separated list of ids, e.g: '5' or '2,5,7', etc
             ... (three dots): send to this stream all the records with ids
@@ -184,7 +207,8 @@ data is split by one of the following fields (listed in descending precedence)
 )";
             return 0;
         }
-        csv = comma::csv::program_options::get( vm );
+        comma::command_line_options options( ac, av );
+        csv = comma::csv::options( options );
         COMMA_ASSERT_BRIEF( !vm.count( "period" ) || !vm.count( "timestamps" ), "csv-split: --period and --timestamps are mutually exclusive (todo? combine them? just ask)" );
         COMMA_ASSERT_BRIEF( default_filename.empty(), "csv-split: --default-filename: todo, just ask" )
         if( csv.binary() ) { size = csv.format().size(); }
diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 413eaad16..e38aba81e 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -123,8 +123,7 @@ void split< T >::timestamps_stream_make_( const std::string& timestamps )
     //std::cerr << "--> a: interval: " << boost::posix_time::to_iso_string( timestamps_last_.first ) << " - " << boost::posix_time::to_iso_string( timestamps_last_.second ) << std::endl;
 }
 
-template < typename T >
-bool split< T >::timestamps_stream_seek_( boost::posix_time::ptime t )
+template < typename T > bool split< T >::timestamps_stream_seek_( boost::posix_time::ptime t )
 {
     bool changed = false;
     while( t >= timestamps_last_.second && !timestamps_last_.second.is_pos_infinity() )
@@ -212,8 +211,7 @@ split< T >::split( const boost::optional< boost::posix_time::time_duration >& pe
     acceptor_thread_ = std::thread( std::bind( &split< T >::accept_, std::ref( *this )));
 }
 
-template < typename T >
-split< T >::~split()
+template < typename T > split< T >::~split()
 {
     is_shutdown_ = true;
     if( acceptor_thread_.joinable() )
@@ -224,8 +222,7 @@ split< T >::~split()
     }
 }
 
-template < typename T >
-void split< T >::accept_()
+template < typename T > void split< T >::accept_()
 {
     comma::io::select select;
     {
@@ -242,9 +239,7 @@ void split< T >::accept_()
     }
 }
 
-
-template < typename T >
-bool split< T >::published_on_stream( const char* data, unsigned int size )
+template < typename T > bool split< T >::published_on_stream( const char* data, unsigned int size )
 {
     transaction t( publishers_ );
     if( t->empty() && !default_publisher_ ) { return false; }
@@ -269,7 +264,7 @@ template < typename T > void split< T >::write( const char* data, unsigned int s
             if( flush_ ) { ofs->flush(); }
         }
     }
-    if ( pass_ ) { std::cout.write( data, size ); std::cout.flush(); }
+    if( pass_ ) { std::cout.write( data, size ); std::cout.flush(); }
 }
 
 template < typename T > void split< T >::write( std::string line )
@@ -288,7 +283,7 @@ template < typename T > void split< T >::write( std::string line )
             if( flush_ ) { ofs->flush(); }
         }
     }
-    if ( pass_ ) { std::cout.write( &line[0], line.size() ); /*std::cout.put('\n');*/ std::cout.flush(); }
+    if( pass_ ) { std::cout.write( &line[0], line.size() ); /*std::cout.put('\n');*/ std::cout.flush(); }
 }
 
 template < typename T > std::ofstream* split< T >::ofstream_by_time_()
@@ -353,7 +348,7 @@ template < typename T > std::ofstream* split< T >::ofstream_by_id_()
         #else
         static struct rlimit r;
         static int q = getrlimit( RLIMIT_NOFILE, &r );
-        if( q != 0 ) { COMMA_THROW( comma::exception, "getrlimit() failed" ); }
+        if( q != 0 ) { COMMA_THROW( comma::exception, "getting resource limit (getrlimit()) for number of open files failed" ); }
         static unsigned int max_number_of_open_files = static_cast< unsigned int >( r.rlim_cur );
         #endif
         if( files_.size() + 10 > max_number_of_open_files ) { files_.clear(); } // quick and dirty, may be too drastic...
diff --git a/csv/applications/split/split.h b/csv/applications/split/split.h
index 5705b04e0..5e1d4bfa4 100644
--- a/csv/applications/split/split.h
+++ b/csv/applications/split/split.h
@@ -56,7 +56,8 @@ namespace comma { namespace csv { namespace applications {
 template < typename T > struct input // quick and dirty
 {
     boost::posix_time::ptime timestamp;
-    comma::uint32 block;
+    comma::uint32 block{0};
+    comma::uint32 size{0};
     T id;
 };
 
@@ -72,6 +73,7 @@ template < typename T > struct traits< comma::csv::applications::input< T > >
     {
         v.apply( "t", p.timestamp );
         v.apply( "block", p.block );
+        v.apply( "size", p.size );
         v.apply( "id", p.id );
     }
 
@@ -79,6 +81,7 @@ template < typename T > struct traits< comma::csv::applications::input< T > >
     {
         v.apply( "t", p.timestamp );
         v.apply( "block", p.block );
+        v.apply( "size", p.size );
         v.apply( "id", p.id );
     }
 };
diff --git a/csv/test/csv-split/size/expected b/csv/test/csv-split/size/expected
new file mode 100644
index 000000000..37d4bebf8
--- /dev/null
+++ b/csv/test/csv-split/size/expected
@@ -0,0 +1,8 @@
+fixed[0]/output/line[0]="8"
+fixed[0]/output/line[1]="8"
+fixed[0]/output/line[2]="8"
+fixed[0]/status=0
+
+variable[0]/output/line[0]="8"
+variable[0]/output/line[1]="16"
+variable[0]/status=0
diff --git a/csv/test/csv-split/size/input b/csv/test/csv-split/size/input
new file mode 100644
index 000000000..cc6a0066a
--- /dev/null
+++ b/csv/test/csv-split/size/input
@@ -0,0 +1,2 @@
+fixed[0]="( echo 111,0; echo 222,1; echo 333,2 ) | csv-to-bin 2ui | ( mkdir -p output && cd output && csv-split --fields ,id --binary 2ui && wc -c < 0.bin && wc -c < 1.bin && wc -c < 2.bin )"
+variable[0]="( echo 0,0 | csv-to-bin 2ui; echo 1,8,3,4 | csv-to-bin 4ui ) | ( mkdir -p output && cd output && csv-split --fields id,size --binary 2ui && wc -c < 0.bin && wc -c < 1.bin )"
\ No newline at end of file

From bc3772f4cc629b3ee14f2038b8a72bd91ac1aabf Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Aug 2024 12:48:19 +1000
Subject: [PATCH 0892/1056] io-topics: log: header_fields added

---
 io/applications/io-topics | 41 +++++++++++++++------------------------
 1 file changed, 16 insertions(+), 25 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index c845e8ba5..8db594db2 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -14,10 +14,7 @@ source $( type -p comma-process-util ) || { echo "io-topics: could not source 'c
 function bash_completion()
 {
     echo "cat list log publish"
-    {
-        common_options
-        log_options
-    } | comma_options_to_bash_completion
+    { common_options; log_options; } | comma_options_to_bash_completion
 }
 
 function common_options()
@@ -177,10 +174,7 @@ function list_topic_fields() { :; }
 
 # todo: flush field? flush is default behaviour in io-publish, which is inconsistent with
 # log and cat operations and thus introducing flush in publish might be confusing
-function publish_topic_fields()
-{
-    publish_topic_fields_help | grep -v '^ ' | cut -f1 -d';'
-}
+function publish_topic_fields() { publish_topic_fields_help | grep -v '^ ' | cut -f1 -d';'; }
 
 function publish_topic_fields_help()
 {
@@ -201,10 +195,7 @@ size;              for binary data, size of the binary record
 eof
 }
 
-function cat_topic_fields()
-{
-    cat_topic_fields_help | grep -v '^ ' | cut -f1 -d';'
-}
+function cat_topic_fields() { cat_topic_fields_help | grep -v '^ ' | cut -f1 -d';'; }
 
 function cat_topic_fields_help()
 {
@@ -221,10 +212,7 @@ size;             if data is binary, size of the binary record
 eof
 }
 
-function log_topic_fields()
-{
-    log_topic_fields_help | grep -v '^ ' | cut -f1 -d';'
-}
+function log_topic_fields() { log_topic_fields_help | grep -v '^ ' | cut -f1 -d';'; }
 
 function log_topic_fields_help()
 {
@@ -235,6 +223,8 @@ command;          optional command for logger to run instead of default logger
 connect_attempts; number of connect attempts
 connect_period;   time in seconds between connect attempts
 flush;            flush output on each record, default: buffer output
+header_fields;    if binary and has 'size' field, variable payload of size field
+                  value after the fixed-width data part is expected
 host;             tcp host for publishing, unless address field is present
 index;            optional command to generate index file, default: fixed-width
                   binary index for each binary record, ascii: no index file
@@ -282,9 +272,10 @@ function set_topic_variables()
     eval "$( ${operation}_topic_fields | comma_path_mangle | sed 's#^#unset topic_#' )" # todo: quick and dirty, watch performance
     eval "$( grep $topic <<< "$config" | grep -v "^$topic/command" | sed "s#^$topic/#topic/#" | comma_path_value_mangle )"
     topic_command="$( grep ^$topic/command <<< "$master_config" | cut -d= -f1 --complement | sed -e 's#^"##' -e 's#"$##'  )" # quick and dirty
-    if [[ -n "$topic_binary" ]]; then size_option="--size $( echo $topic_binary | csv-format size )"
-    elif [[ -n "$topic_size" ]]; then size_option="--size $topic_size"
-    else unset size_option; fi
+    if [[ -n "$topic_binary" ]]; then size_option="--size=$( echo $topic_binary | csv-format size )"; binary_option="--binary=$topic_binary"
+    elif [[ -n "$topic_size" ]]; then size_option="--size=$topic_size"
+    else unset size_option; unset binary_option; fi
+    if [[ -n "$topic_header_fields" ]]; then fields_option="--fields=$topic_header_fields"; else unset fields_option; fi
 }
 
 function publish_command()
@@ -333,12 +324,12 @@ function log_command()
         local flush_option suffix_option
         (( topic_flush )) && flush_option="--flush"
         [[ -z "$topic_suffix" ]] || suffix_option="--suffix=$topic_suffix"
-        local period=$options_period
-        [[ -z "$topic_period" ]] || period=$topic_period
-        if [[ -n "$topic_connect_attempts" ]]; then connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
-        if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
-        if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
-        cmd="io-cat $topic_address $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_index | csv-split -t $period $size_option $suffix_option $flush_option"
+        if [[ -n "$topic_period" ]]; then local period=$topic_period; else local period=$options_period; fi
+        if [[ -n "$topic_connect_attempts" ]]; then local connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
+        if [[ -n "$topic_connect_period" ]]; then local connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
+        if [[ -n "$options_verbose" ]]; then local verbose_option="--verbose"; else unset verbose_option; fi
+        if [[ -n "$binary_option" ]]; then local format_option=$binary_option; else local format_option=$size_option; fi
+        cmd="io-cat $topic_address $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_index | csv-split -t $period $fields_option $format_option $suffix_option $flush_option"
     fi
     local path
     [[ -z "$topic_path" ]] || path+="$topic_path/"

From dd264ddda901511dcb928e7b7208a3cdb0003b24 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Aug 2024 13:07:23 +1000
Subject: [PATCH 0893/1056] io-topics: log: header_fields renamed to
 header/fields; header/binary added

---
 io/applications/io-topics | 11 ++++++++---
 1 file changed, 8 insertions(+), 3 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 8db594db2..74a34bf8d 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -223,7 +223,8 @@ command;          optional command for logger to run instead of default logger
 connect_attempts; number of connect attempts
 connect_period;   time in seconds between connect attempts
 flush;            flush output on each record, default: buffer output
-header_fields;    if binary and has 'size' field, variable payload of size field
+header/fields;    if binary and has 'size' field, variable payload of size field
+header/binary;    only required for variable payload size
                   value after the fixed-width data part is expected
 host;             tcp host for publishing, unless address field is present
 index;            optional command to generate index file, default: fixed-width
@@ -271,11 +272,15 @@ function set_topic_variables()
     local topic="$2"
     eval "$( ${operation}_topic_fields | comma_path_mangle | sed 's#^#unset topic_#' )" # todo: quick and dirty, watch performance
     eval "$( grep $topic <<< "$config" | grep -v "^$topic/command" | sed "s#^$topic/#topic/#" | comma_path_value_mangle )"
+    [[ -z "$topic_header_binary" || -z "$topic_binary" ]] || die "expected either header/binary or binary; got both"
+    [[ -z "$topic_header_binary" || -z "$topic_size" ]] || die "expected either header/binary or size; got both"
+    [[ -z "$topic_header_fields" || -n "$topic_header_binary" ]] || die "header/fields specified, but header/binary is not"
     topic_command="$( grep ^$topic/command <<< "$master_config" | cut -d= -f1 --complement | sed -e 's#^"##' -e 's#"$##'  )" # quick and dirty
+    unset size_option binary_option fields_option
     if [[ -n "$topic_binary" ]]; then size_option="--size=$( echo $topic_binary | csv-format size )"; binary_option="--binary=$topic_binary"
-    elif [[ -n "$topic_size" ]]; then size_option="--size=$topic_size"
-    else unset size_option; unset binary_option; fi
+    elif [[ -n "$topic_size" ]]; then size_option="--size=$topic_size"; fi
     if [[ -n "$topic_header_fields" ]]; then fields_option="--fields=$topic_header_fields"; else unset fields_option; fi
+    if [[ -n "$topic_header_binary" ]]; then binary_option="--binary=$topic_header_binary"; fi
 }
 
 function publish_command()

From 36010322e1aac9d5e0d83eebefc1b77b1a580271 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 29 Aug 2024 13:08:33 +1000
Subject: [PATCH 0894/1056] io-topics: log: field list made alphabetic

---
 io/applications/io-topics | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 74a34bf8d..c60d524b3 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -223,9 +223,9 @@ command;          optional command for logger to run instead of default logger
 connect_attempts; number of connect attempts
 connect_period;   time in seconds between connect attempts
 flush;            flush output on each record, default: buffer output
-header/fields;    if binary and has 'size' field, variable payload of size field
 header/binary;    only required for variable payload size
                   value after the fixed-width data part is expected
+header/fields;    if binary and has 'size' field, variable payload of size field
 host;             tcp host for publishing, unless address field is present
 index;            optional command to generate index file, default: fixed-width
                   binary index for each binary record, ascii: no index file

From a1c42ecb3424250265819a446ddfcf44fa323e4d Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 30 Aug 2024 16:06:19 +1000
Subject: [PATCH 0895/1056] io-topics: header/fields, header/binary: excluded
 from topics list

---
 io/applications/io-topics | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index c60d524b3..01ecbfe98 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -354,7 +354,7 @@ function cat_config()
 
 function topics_from_config() # quick and dirty
 {
-    local expression="/address=|/host=|/port=|/command=|/secondary/address=|/secondary/host|/secondary/port="
+    local expression="/address=|/host=|/port=|/command=|/secondary/address=|/secondary/host|/secondary/port=|/header/fields=|/header/binary="
     function grep_by_topic_config_fields() { egrep -e "$expression" | cut -d= -f1 | sed -e 's#/secondary/address$##' -e 's#/secondary/host$##' -e 's#/secondary/port$##' -e 's#/address$##' -e 's#/host$##' -e 's#/port$##' -e 's#/command$##'; }
     [[ -z "$options_topics_from_all_configs" ]] || { grep_by_topic_config_fields <<< "$config" | sort --unique; return; }
     {

From ebcec9d9a705e67e56d767ba498955f112dc84d3 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 30 Aug 2024 19:22:59 +1000
Subject: [PATCH 0896/1056] comma-test-run: --tags, --tags-excluded: in
 progress...

---
 util/applications/comma-test-run | 37 ++++++++++++++++++++++++++++++--
 1 file changed, 35 insertions(+), 2 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index dacf9a0b8..d36b3c36e 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -64,6 +64,8 @@ function description_test_selection()
 --run-disabled; run disabled tests
 --run-optional,--optional; run tests having file called "optional" (same logic as for --run-disabled)
 --stdin; read paths from stdin e.g. run test in hello/world: echo hello/world | comma-test-run --stdin
+--tags=[<tags>]; |-separated tags, run only tests with given tags (see below), todo: support regex
+--tags-excluded=[<tags>]; |-separated tags, do not run tests with given tags (see below), todo: support regex
 --to=[<dir>]; run tests up to a given test, the latter included, where test directories are ordered lexicographically
 --until-first-failure; exit after the first failure (works only when tests run serially)
 --white-list=[<file>]; only run these tests mentioned in the <file>, applied first before black list;
@@ -674,6 +676,24 @@ function get_test_timeout()
 }
 export -f get_test_timeout
 
+function get_tags()
+{
+    local config tags dc dt tt tc
+    config=$( closest_file_in_path "." "config" )
+    tags=$( closest_file_in_path "." "tags" )
+    [[ -f "$tags" || -f "$config" ]] || return
+    if [[ -f "$config" ]]; then tc="$( name-value-get tags < "$config" )"; fi
+    if [[ -f "$tags" ]]; then tt="$( cat "$tags" | grep -v '^#' | grep -v '^$' )"; fi
+    if [[ -n "$tc" && -n "$tt" ]]; then
+        dc="$( dirname "$config" )"
+        dt="$( dirname "$tags" )"
+        if (( "${#dc}" < "${#dt}" )); then echo "$tc"; else echo "$tt"; fi
+    elif [[ -n "$tc" ]]; then echo "$tc"
+    elif [[ -n "$tt" ]]; then echo "$tt"
+    fi
+}
+export -f get_tags
+
 # helper to terminate comma-top safely
 function terminate_comma_top()
 {
@@ -1068,6 +1088,20 @@ function apply_black_list() { if [[ -n "$options_black_list" ]] ; then grep -vE
 
 function apply_white_black_list() { apply_white_list | apply_black_list ; }
 
+function apply_tags()
+{
+    [[ -n "$options_tags" || -n "$options_tags_excluded" ]] || { cat; return; }
+    while read d; do
+        tags="$( cd $d && get_tags | tr ',' '\n' )"
+        if [[ -n "$tags" ]]; then
+            if [[ -n "$options_tags_excluded" ]]; then if egrep -e "^($options_tags_excluded)" <<< "$tags" --quiet; then continue; fi; fi
+            csv-paste <( echo "$tags" ) value="$d"; else echo ",$d"
+        fi
+    done \
+        | if [[ -n "$options_tags" ]]; then egrep -e "^($options_tags),"; else cat; fi \
+        | cut -d, -f2
+}
+
 # to run, search for directories containing either "test", "input" or "expected";
 # if "test" is absent, use the "test" in the closest parent directory
 function test_directories()
@@ -1080,11 +1114,10 @@ function test_directories()
         message_ "$name: applying black list from file '$options_black_list'"
         options_black_list="^(\./)?($( sed 's#\./##' <$options_black_list | grep -v ^# | grep -v ^$ | tr \\n '|' | sed 's/|$//' ))";
     fi
-
     local followsymlinks followmounts="-mount"
     (( ! options_followsymlinks )) || followsymlinks="-L"
     (( ! options_followmounts )) || followmounts=
-    test_script_dirs_all=( $( exclude_generic_tests $( get_dirnames $( find $followsymlinks . $followmounts -name "test" -or -name "input" -or -name "expected" | grep -v "/\." ) 2>/dev/null | sort -u ) | apply_white_black_list ) )
+    test_script_dirs_all=( $( exclude_generic_tests $( get_dirnames $( find $followsymlinks . $followmounts -name "test" -or -name "input" -or -name "expected" | grep -v "/\." ) 2>/dev/null | sort -u ) | apply_white_black_list | apply_tags ) )
     [[ -n "$options_from" || -n "$options_to" || -n "$options_end" ]] || { echo ${test_script_dirs_all[@]} ; return ; }
     [[ -z "$options_from" ]] || { local from="${options_from#\.\/}" ; }
     [[ -z "$options_to" ]] || { local to="${options_to#\.\/}" ; }

From c98bb0eb1c50750e9bb480f03829b0e50dd6395f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 30 Aug 2024 20:24:15 +1000
Subject: [PATCH 0897/1056] comma-test-run: --help: --tags, --tags-excluded:
 documented

---
 util/applications/comma-test-run | 19 +++++++++++++++----
 1 file changed, 15 insertions(+), 4 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index d36b3c36e..bad2d8f25 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -58,14 +58,14 @@ function description_test_selection()
 --black-list=[<file>]; do not run these tests mentioned in <file>, e.g. a lists of sub-directories in white list
   to be excluded; see '--white-list' below for file format.
 --end=[<dir>]; run tests up to a given test, the latter excluded, where test directories are ordered lexicographically
---followsymlinks,-L; follow symlinks when looking for test directories, same as find -L
+--followsymlinks,-L; folapply_tagslow symlinks when looking for test directories, same as find -L
 --followmounts; search mounted filesystems when looking for test directories, same as find without -mount
 --from,--begin=[<dir>]; run tests starting from a given test, where test directories are ordered lexicographically
 --run-disabled; run disabled tests
 --run-optional,--optional; run tests having file called "optional" (same logic as for --run-disabled)
 --stdin; read paths from stdin e.g. run test in hello/world: echo hello/world | comma-test-run --stdin
---tags=[<tags>]; |-separated tags, run only tests with given tags (see below), todo: support regex
---tags-excluded=[<tags>]; |-separated tags, do not run tests with given tags (see below), todo: support regex
+--tags=[<tags>]; |-separated tags or regular expressions, run only tests with given tags (see below)
+--tags-excluded=[<tags>]; |-separated tags or regular expressions, do not run tests with given tags (see below)
 --to=[<dir>]; run tests up to a given test, the latter included, where test directories are ordered lexicographically
 --until-first-failure; exit after the first failure (works only when tests run serially)
 --white-list=[<file>]; only run these tests mentioned in the <file>, applied first before black list;
@@ -215,7 +215,7 @@ ${brown}Running tests in parallel${none}
         as are available on the system. This is ${red}not recommended${none} for resource-heavy tests
         unless additional configuration files are provided as explained below.
 
-${brown}Config files${none}
+${brown}config files${none}
     The way a test is run can be controlled using a file named ${brown}config${none} in the test directory,
     which may contain the following parameters:
 
@@ -241,6 +241,12 @@ ${brown}Config files${none}
     run/max_time=<seconds>
         Test will be terminated and fail if it has not completed in the specified time (seconds).
         Overrides option '--max-run-time'.
+    
+    tags=<tags>
+        <tags>: comma-separated list of tags applied to the current directory and subdirectories
+                that do not have their own config containing 'tags' entry or a file named 'tags'
+                containing comma-separated list of arbitrary key words (tags); tests can be filtered
+                by tags using --tags and/or --tags-excluded command line options
 
     Example config:
         resources/cpus=4
@@ -248,6 +254,11 @@ ${brown}Config files${none}
         resources/serial=\"true\"
         run/max_time=600
 
+${brown}tags files${none}
+    If a file named 'tags' is present in the current directory or in one of its parent directories,
+    this file is expected to contain a comma-separated list of arbitrary key words (tags); tests can be
+    filtered by tags using --tags and/or --tags-excluded command line options
+
 ${brown}White(and black)-listing tests${none}
     The test names in the white/black list file shall match ${brown}exactly${none} the corresponding
     names in '--dry-run' output, e.g.

From c5478af4388a1104f1c594f87bcb71ae7bda2960 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 2 Sep 2024 11:00:44 +1000
Subject: [PATCH 0898/1056] comma-test-run --tags-list implemented

---
 util/applications/comma-test-run | 51 ++++++++++++++++++--------------
 1 file changed, 29 insertions(+), 22 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index bad2d8f25..ea92fece4 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -58,7 +58,7 @@ function description_test_selection()
 --black-list=[<file>]; do not run these tests mentioned in <file>, e.g. a lists of sub-directories in white list
   to be excluded; see '--white-list' below for file format.
 --end=[<dir>]; run tests up to a given test, the latter excluded, where test directories are ordered lexicographically
---followsymlinks,-L; folapply_tagslow symlinks when looking for test directories, same as find -L
+--followsymlinks,-L; follow symlinks when looking for test directories, same as find -L
 --followmounts; search mounted filesystems when looking for test directories, same as find without -mount
 --from,--begin=[<dir>]; run tests starting from a given test, where test directories are ordered lexicographically
 --run-disabled; run disabled tests
@@ -66,6 +66,7 @@ function description_test_selection()
 --stdin; read paths from stdin e.g. run test in hello/world: echo hello/world | comma-test-run --stdin
 --tags=[<tags>]; |-separated tags or regular expressions, run only tests with given tags (see below)
 --tags-excluded=[<tags>]; |-separated tags or regular expressions, do not run tests with given tags (see below)
+--tags-list; list tags for all subdirectories as <dir>,<tags>
 --to=[<dir>]; run tests up to a given test, the latter included, where test directories are ordered lexicographically
 --until-first-failure; exit after the first failure (works only when tests run serially)
 --white-list=[<file>]; only run these tests mentioned in the <file>, applied first before black list;
@@ -687,24 +688,6 @@ function get_test_timeout()
 }
 export -f get_test_timeout
 
-function get_tags()
-{
-    local config tags dc dt tt tc
-    config=$( closest_file_in_path "." "config" )
-    tags=$( closest_file_in_path "." "tags" )
-    [[ -f "$tags" || -f "$config" ]] || return
-    if [[ -f "$config" ]]; then tc="$( name-value-get tags < "$config" )"; fi
-    if [[ -f "$tags" ]]; then tt="$( cat "$tags" | grep -v '^#' | grep -v '^$' )"; fi
-    if [[ -n "$tc" && -n "$tt" ]]; then
-        dc="$( dirname "$config" )"
-        dt="$( dirname "$tags" )"
-        if (( "${#dc}" < "${#dt}" )); then echo "$tc"; else echo "$tt"; fi
-    elif [[ -n "$tc" ]]; then echo "$tc"
-    elif [[ -n "$tt" ]]; then echo "$tt"
-    fi
-}
-export -f get_tags
-
 # helper to terminate comma-top safely
 function terminate_comma_top()
 {
@@ -1099,11 +1082,29 @@ function apply_black_list() { if [[ -n "$options_black_list" ]] ; then grep -vE
 
 function apply_white_black_list() { apply_white_list | apply_black_list ; }
 
-function apply_tags()
+function tags-get()
+{
+    local config tags dc dt tt tc
+    config=$( closest_file_in_path "." "config" )
+    tags=$( closest_file_in_path "." "tags" )
+    [[ -f "$tags" || -f "$config" ]] || return
+    if [[ -f "$config" ]]; then tc="$( name-value-get tags < "$config" )"; fi
+    if [[ -f "$tags" ]]; then tt="$( cat "$tags" | grep -v '^#' | grep -v '^$' )"; fi
+    if [[ -n "$tc" && -n "$tt" ]]; then
+        dc="$( dirname "$config" )"
+        dt="$( dirname "$tags" )"
+        if (( "${#dc}" < "${#dt}" )); then echo "$tc"; else echo "$tt"; fi
+    elif [[ -n "$tc" ]]; then echo "$tc"
+    elif [[ -n "$tt" ]]; then echo "$tt"
+    fi
+}
+export -f tags-get
+
+function tags-apply() # todo! getting tags for each subdirectory is very slow; get tags for the root, then list all tags, then join matching/not-matching
 {
     [[ -n "$options_tags" || -n "$options_tags_excluded" ]] || { cat; return; }
     while read d; do
-        tags="$( cd $d && get_tags | tr ',' '\n' )"
+        tags="$( cd $d && tags-get | tr ',' '\n' )"
         if [[ -n "$tags" ]]; then
             if [[ -n "$options_tags_excluded" ]]; then if egrep -e "^($options_tags_excluded)" <<< "$tags" --quiet; then continue; fi; fi
             csv-paste <( echo "$tags" ) value="$d"; else echo ",$d"
@@ -1113,6 +1114,11 @@ function apply_tags()
         | cut -d, -f2
 }
 
+function tags-list()
+{
+    while read d; do echo "$d,$( cd $d && tags-get | tr ',' '\n' )"; done
+}
+
 # to run, search for directories containing either "test", "input" or "expected";
 # if "test" is absent, use the "test" in the closest parent directory
 function test_directories()
@@ -1128,7 +1134,7 @@ function test_directories()
     local followsymlinks followmounts="-mount"
     (( ! options_followsymlinks )) || followsymlinks="-L"
     (( ! options_followmounts )) || followmounts=
-    test_script_dirs_all=( $( exclude_generic_tests $( get_dirnames $( find $followsymlinks . $followmounts -name "test" -or -name "input" -or -name "expected" | grep -v "/\." ) 2>/dev/null | sort -u ) | apply_white_black_list | apply_tags ) )
+    test_script_dirs_all=( $( exclude_generic_tests $( get_dirnames $( find $followsymlinks . $followmounts -name "test" -or -name "input" -or -name "expected" | grep -v "/\." ) 2>/dev/null | sort -u ) | apply_white_black_list | tags-apply ) )
     [[ -n "$options_from" || -n "$options_to" || -n "$options_end" ]] || { echo ${test_script_dirs_all[@]} ; return ; }
     [[ -z "$options_from" ]] || { local from="${options_from#\.\/}" ; }
     [[ -z "$options_to" ]] || { local to="${options_to#\.\/}" ; }
@@ -1152,6 +1158,7 @@ else
     done
 fi
 [[ -z "$options_output_directories" ]] || { echo ${test_script_dirs[@]} | tr ' ' '\n' ; exit 0 ; }
+[[ -z "$options_tags_list" ]] || { echo ${test_script_dirs[@]} | tr ' ' '\n' | tags-list ; exit 0 ; }
 [[ -z "$options_document" ]] || { for d in ${test_script_dirs[@]} ; do document_test $d ; done ; exit 0 ; }
 export test_scripts_count=${#test_script_dirs[@]}
 

From 0a89b81b75e7604a1d005d0ea47272be23bf7220 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 4 Sep 2024 14:25:09 +1000
Subject: [PATCH 0899/1056] io-topics: added support for templated commands

---
 io/applications/io-topics                     | 19 ++++++++++++++++++-
 .../io-topics/command-template/config.json    |  6 ++++++
 io/test/io-topics/command-template/expected   |  4 ++++
 io/test/io-topics/command-template/input      |  2 ++
 io/test/io-topics/command-template/test       |  5 +++++
 5 files changed, 35 insertions(+), 1 deletion(-)
 create mode 100644 io/test/io-topics/command-template/config.json
 create mode 100644 io/test/io-topics/command-template/expected
 create mode 100644 io/test/io-topics/command-template/input
 create mode 100755 io/test/io-topics/command-template/test

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 01ecbfe98..f17a9f38e 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -157,6 +157,11 @@ EOF
                   echo 'b/command=socat tcp:localhost:12346 - > log.csv' )
             $ ls -al my-log/a
             $ head my-log/b/log.csv
+
+        trigger logging on a remote machine with templated command
+            $ io-topics log --dir my-log --config <(
+                  echo "a/command=curl 'http://remote:7000/log=start&name=${log_dir}'" )
+
 eof
     else
         echo "use \"$scriptname --help --verbose\" for examples"
@@ -318,12 +323,24 @@ function cat_command()
     echo "$cmd"
 }
 
+# allow placeholders in the command string
+function expanded_command()
+{
+    local cmd="$1"
+    eval "$( grep "=" <<< "$options" | comma_path_value_mangle | sed 's#^#local #' )"
+    eval "echo \"${cmd}\""
+}
+
 function log_command()
 {
     [[ -n "$options_log_dir" ]] || die "please specify --log-dir"
     local topic=$1
     local cmd="$topic_command"
-    if [[ -z "$cmd" ]]; then
+    if [[ "$cmd" ]]; then
+        verbose "got $cmd"
+        cmd=$( expanded_command "$cmd" )
+        verbose "expanded to $cmd"
+    else
         set_topic_address
         [[ -n "$topic_index" ]] || topic_index="cat"
         local flush_option suffix_option
diff --git a/io/test/io-topics/command-template/config.json b/io/test/io-topics/command-template/config.json
new file mode 100644
index 000000000..29347c0f3
--- /dev/null
+++ b/io/test/io-topics/command-template/config.json
@@ -0,0 +1,6 @@
+{
+    "topic1":
+    {
+        "command": "echo ${log_dir}"
+    }
+}
diff --git a/io/test/io-topics/command-template/expected b/io/test/io-topics/command-template/expected
new file mode 100644
index 000000000..c38a614eb
--- /dev/null
+++ b/io/test/io-topics/command-template/expected
@@ -0,0 +1,4 @@
+log/dir/output="my-dir"
+log/dir/status=0
+log/log_dir/output="my-log-dir"
+log/log_dir/status=0
diff --git a/io/test/io-topics/command-template/input b/io/test/io-topics/command-template/input
new file mode 100644
index 000000000..174169cc2
--- /dev/null
+++ b/io/test/io-topics/command-template/input
@@ -0,0 +1,2 @@
+log/dir="io-topics log --config config.json --dir my-dir"
+log/log_dir="io-topics log --config config.json --log-dir my-log-dir"
diff --git a/io/test/io-topics/command-template/test b/io/test/io-topics/command-template/test
new file mode 100755
index 000000000..152895e63
--- /dev/null
+++ b/io/test/io-topics/command-template/test
@@ -0,0 +1,5 @@
+#!/bin/bash
+
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands

From 8fa62cd3bdc26164add05ef962391183d0f88c60 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 4 Sep 2024 14:25:55 +1000
Subject: [PATCH 0900/1056] io-topics: added support for actions on exit

---
 io/applications/io-topics | 16 ++++++++++++++++
 1 file changed, 16 insertions(+)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index f17a9f38e..a3d10ec1a 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -191,6 +191,7 @@ command;           command for the publisher to run
 input;             input topic for publish command to read on stdin
 multiplier;        passed to io-publish
 on_demand;         same meaning as io-publish --on-demand
+on_exit;           command to run when publisher stops
 port;              tcp port for publishing, unless address field is present
 secondary/address; passed verbatim to io-publish as '<address>;secondary',
                    in this case port attribute ignored
@@ -212,6 +213,7 @@ connect_attempts; number of connect attempts
 connect_period;   time in seconds between connect attempts
 flush;            flush output on each record, default: buffer output
 host;             tcp host for publishing, unless address field is present
+on_exit;          command to run when output stops
 port;             tcp port for publishing, unless address field is present
 size;             if data is binary, size of the binary record
 eof
@@ -234,6 +236,7 @@ header/fields;    if binary and has 'size' field, variable payload of size field
 host;             tcp host for publishing, unless address field is present
 index;            optional command to generate index file, default: fixed-width
                   binary index for each binary record, ascii: no index file
+on_exit;          command to run when logger stops
 path;             prefix path for log directory (to split logs across drives)
 period;           split log files at given number of seconds, overrides --period
 port;             tcp port for publishing, unless address field is present
@@ -404,6 +407,13 @@ if (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )); t
     usage $verbose
 fi
 
+on_exit_commands=()
+
+function on_exit()
+{
+    comma_execute_and_wait --group "${on_exit_commands[@]}"
+}
+
 operation=$1
 [[ $( type -t ${operation}_topic_fields ) == "function" ]] || die "expected operation, got '$operation'" # quick and dirty
 (( $( comma_options_has --topic-fields "$@" ) )) && { ${operation}_topic_fields; exit 0; }
@@ -419,8 +429,14 @@ for topic in ${topics[@]}; do
     set_topic_variables "$operation" "$topic"
     cmd="$( ${operation}_command $topic )" || die "topic '$topic': making command failed"
     commands+=( "$cmd" )
+    [[ $topic_on_exit ]] && on_exit_commands+=( "$topic_on_exit" )
 done
 say "will run 'comma_execute_and_wait --group' with commands:"
 for cmd in "${commands[@]}"; do say "    $cmd"; done
+if (( ${#on_exit_commands[@]} > 0 )); then
+    say "on exit will run:"
+    for cmd in "${on_exit_commands[@]}"; do say "    $cmd"; done
+    trap on_exit EXIT
+fi
 [[ -z "$options_dry_run" ]] || exit
 comma_execute_and_wait --group "${commands[@]}"

From 95fd55458830b8c24cd6f5cb43a4ed38ef79a79b Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Fri, 6 Sep 2024 13:17:14 +1000
Subject: [PATCH 0901/1056] io-topics: --dry-run fixed and help improved

---
 io/applications/io-topics | 17 ++++++++++++++---
 1 file changed, 14 insertions(+), 3 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index a3d10ec1a..0db580955 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -55,6 +55,13 @@ operations
     play:    play back logs, counterpart to log operation (todo)
     publish: start all the publishers listed on command line or config file
 
+variable substitution in commands
+    options can be passed to commands via variable substitution. for example:
+    command="save-to-dir ${log_dir}"
+    all options are available,
+    e.g. --config -> ${config}; --log-dir -> ${log_dir}
+    see examples below for more detail
+
 common options
 $( common_options | sed 's/^/    /g' )
 
@@ -330,8 +337,10 @@ function cat_command()
 function expanded_command()
 {
     local cmd="$1"
-    eval "$( grep "=" <<< "$options" | comma_path_value_mangle | sed 's#^#local #' )"
-    eval "echo \"${cmd}\""
+    {
+        grep "=" <<< "$options" | comma_path_value_mangle
+        echo "cmd=\"$( sed -e 's#"#\\\"#g' -e "s#'#\\'#g" <<< "$cmd" )\""
+    } | env -i $BASH -c 'eval "$( cat )"; echo "$cmd"'
 }
 
 function log_command()
@@ -411,6 +420,8 @@ on_exit_commands=()
 
 function on_exit()
 {
+    say "running commands on exit:"
+    for cmd in "${on_exit_commands[@]}"; do say "    $cmd"; done
     comma_execute_and_wait --group "${on_exit_commands[@]}"
 }
 
@@ -436,7 +447,7 @@ for cmd in "${commands[@]}"; do say "    $cmd"; done
 if (( ${#on_exit_commands[@]} > 0 )); then
     say "on exit will run:"
     for cmd in "${on_exit_commands[@]}"; do say "    $cmd"; done
-    trap on_exit EXIT
+    [[ $options_dry_run ]] || trap on_exit EXIT
 fi
 [[ -z "$options_dry_run" ]] || exit
 comma_execute_and_wait --group "${commands[@]}"

From 0b9edb8fe1ee0f5a8d5be84b35e68c7efe699ab2 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 6 Sep 2024 16:54:45 +1000
Subject: [PATCH 0902/1056] io: publish.* move from applications/detail to impl
 to expose to the outside world; name_value library: dependency on application
 library removed

---
 io/CMakeLists.txt                            |  2 +-
 io/applications/CMakeLists.txt               |  4 ++--
 io/applications/io-publish.cpp               | 24 +++++++++++++-------
 io/applications/udp-client.cpp               | 16 ++++++-------
 io/{applications/detail => impl}/publish.cpp |  7 +++---
 io/{applications/detail => impl}/publish.h   | 16 +++++--------
 name_value/CMakeLists.txt                    |  2 +-
 7 files changed, 38 insertions(+), 33 deletions(-)
 rename io/{applications/detail => impl}/publish.cpp (95%)
 rename io/{applications/detail => impl}/publish.h (84%)

diff --git a/io/CMakeLists.txt b/io/CMakeLists.txt
index 19497c98f..a7ddc3c63 100644
--- a/io/CMakeLists.txt
+++ b/io/CMakeLists.txt
@@ -17,7 +17,7 @@ ELSE( comma_BUILD_ZEROMQ )
 ENDIF( comma_BUILD_ZEROMQ )
 
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_string )
+target_link_libraries( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_name_value comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
diff --git a/io/applications/CMakeLists.txt b/io/applications/CMakeLists.txt
index 811b4c6e6..336357f5f 100644
--- a/io/applications/CMakeLists.txt
+++ b/io/applications/CMakeLists.txt
@@ -38,7 +38,7 @@ if( NOT WIN32 )
     set_target_properties( io-ls PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-ls RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
-    add_executable( io-publish ${dir}/io-publish.cpp ${dir}/detail/publish.h ${dir}/detail/publish.cpp )
+    add_executable( io-publish ${dir}/io-publish.cpp )
     target_link_libraries( io-publish comma_base comma_io comma_application comma_xpath comma_name_value ) # profiler )
     set_target_properties( io-publish PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-publish RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
@@ -48,7 +48,7 @@ if( NOT WIN32 )
     set_target_properties( io-tee PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-tee RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
-    add_executable( udp-client ${dir}/udp-client.cpp ${dir}/detail/publish.h ${dir}/detail/publish.cpp )
+    add_executable( udp-client ${dir}/udp-client.cpp )
     target_link_libraries( udp-client comma_application comma_name_value comma_io comma_csv comma_base comma_string ) # profiler )
     set_target_properties( udp-client PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS udp-client RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 6b95ceb60..c0c0a4236 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -3,7 +3,15 @@
 
 /// @authors cedric wohlleber, vsevolod vlaskine, dave jennings
 
-#include "detail/publish.h"
+#include "../../application/command_line_options.h"
+#include "../../application/signal_flag.h"
+#include "../../base/last_error.h"
+#include "../../io/file_descriptor.h"
+#include "../../io/publisher.h"
+#include "../../io/impl/publish.h"
+#include "../../name_value/map.h"
+#include "../../string/string.h"
+#include "../../sync/synchronized.h"
 
 //#include <google/profiler.h>
 
@@ -141,13 +149,13 @@ int main( int ac, char** av )
         comma::signal_flag is_shutdown( signals );
         bool on_demand = options.exists( "--on-demand" );
         bool exit_on_no_clients = options.exists( "--exit-on-no-clients,-e" );
-        comma::io::detail::publish p( names
-                                    , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
-                                    , !options.exists( "--no-discard" )
-                                    , !options.exists( "--no-flush" )
-                                    , options.exists( "--output-number-of-clients,--clients" )
-                                    , exit_on_no_clients || on_demand
-                                    , options.value( "--cache-size,--cache", 0 ) );
+        comma::io::impl::publish p( names
+                                  , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
+                                  , !options.exists( "--no-discard" )
+                                  , !options.exists( "--no-flush" )
+                                  , options.exists( "--output-number-of-clients,--clients" )
+                                  , exit_on_no_clients || on_demand
+                                  , options.value( "--cache-size,--cache", 0 ) );
         std::string exec_command = options.value< std::string >( "--exec", "" );
         if( !tail.empty() )
         {
diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index 95f5a5630..c523a93ee 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -47,7 +47,7 @@
 #include "../../csv/format.h"
 #include "../../csv/options.h"
 #include "../../string/string.h"
-#include "detail/publish.h"
+#include "../../io/impl/publish.h"
 
 static void usage()
 {
@@ -170,13 +170,13 @@ int main( int argc, char** argv )
         if( binary ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
         static_assert( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ), "expected time of size 8" );
-        comma::io::detail::publish p( output_streams
-                                    , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
-                                    , options.exists( "--discard" )
-                                    , options.exists( "--flush" ) || !binary
-                                    , false
-                                    , false
-                                    , options.value( "--cache-size,--cache", 0 ) );
+        comma::io::impl::publish p( output_streams
+                                  , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
+                                  , options.exists( "--discard" )
+                                  , options.exists( "--flush" ) || !binary
+                                  , false
+                                  , false
+                                  , options.value( "--cache-size,--cache", 0 ) );
         comma::signal_flag is_shutdown;
         if( binary )
         {
diff --git a/io/applications/detail/publish.cpp b/io/impl/publish.cpp
similarity index 95%
rename from io/applications/detail/publish.cpp
rename to io/impl/publish.cpp
index d92073334..b25bde260 100644
--- a/io/applications/detail/publish.cpp
+++ b/io/impl/publish.cpp
@@ -2,9 +2,10 @@
 // Copyright (c) 2020 Vsevolod Vlaskine
 // All rights reserved.
 
+#include "../../name_value/map.h"
 #include "publish.h"
 
-namespace comma { namespace io { namespace detail {
+namespace comma { namespace io { namespace impl {
 
 publish::publish( const std::vector< std::string >& endpoints
                 , unsigned int packet_size
@@ -122,7 +123,7 @@ bool publish::handle_sizes_( transaction_t& t ) // todo? why pass transaction? i
     if( update_no_clients_ )
     {
         if( total > 0 ) { got_first_client_ever_ = true; }
-        else if( got_first_client_ever_ ) { comma::saymore() << "the last client exited" << std::endl; return false; }
+        else if( got_first_client_ever_ ) { return false; } // { comma::saymore() << "the last client exited" << std::endl; return false; }
     }
     return true;
 }
@@ -177,4 +178,4 @@ void publish::accept_()
     }
 }
 
-} } } // namespace comma { namespace io { namespace detail {
+} } } // namespace comma { namespace io { namespace impl {
diff --git a/io/applications/detail/publish.h b/io/impl/publish.h
similarity index 84%
rename from io/applications/detail/publish.h
rename to io/impl/publish.h
index b13d90539..98349494d 100644
--- a/io/applications/detail/publish.h
+++ b/io/impl/publish.h
@@ -16,16 +16,12 @@
 #include <boost/iostreams/stream.hpp>
 #include <boost/scoped_ptr.hpp>
 #include <boost/thread.hpp>
-#include "../../../application/command_line_options.h"
-#include "../../../application/signal_flag.h"
-#include "../../../base/last_error.h"
-#include "../../../io/file_descriptor.h"
-#include "../../../io/publisher.h"
-#include "../../../name_value/map.h"
-#include "../../../string/string.h"
-#include "../../../sync/synchronized.h"
+#include "../../io/file_descriptor.h"
+#include "../../io/publisher.h"
+#include "../../string/string.h"
+#include "../../sync/synchronized.h"
 
-namespace comma { namespace io { namespace detail {
+namespace comma { namespace io { namespace impl {
 
 class publish
 {
@@ -84,4 +80,4 @@ class publish
         void accept_();
 };
 
-} } } // namespace comma { namespace io { namespace detail {
+} } } // namespace comma { namespace io { namespace impl {
diff --git a/name_value/CMakeLists.txt b/name_value/CMakeLists.txt
index b1b30b945..615d5009f 100644
--- a/name_value/CMakeLists.txt
+++ b/name_value/CMakeLists.txt
@@ -12,7 +12,7 @@ INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJE
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
+TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} ) # comma_application
 INSTALL(
     TARGETS ${TARGET_NAME}
     RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll

From 615ffa1a8f5fa1f6028bf68f3f9abaf3cba30b9b Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 6 Sep 2024 16:54:45 +1000
Subject: [PATCH 0903/1056] io: publish.* move from applications/detail to impl
 to expose to the outside world; name_value library: dependency on application
 library removed

---
 io/CMakeLists.txt                            |  2 +-
 io/applications/CMakeLists.txt               |  4 ++--
 io/applications/io-publish.cpp               | 24 +++++++++++++-------
 io/applications/udp-client.cpp               | 16 ++++++-------
 io/{applications/detail => impl}/publish.cpp |  7 +++---
 io/{applications/detail => impl}/publish.h   | 16 +++++--------
 name_value/CMakeLists.txt                    |  2 +-
 7 files changed, 38 insertions(+), 33 deletions(-)
 rename io/{applications/detail => impl}/publish.cpp (95%)
 rename io/{applications/detail => impl}/publish.h (84%)

diff --git a/io/CMakeLists.txt b/io/CMakeLists.txt
index 19497c98f..a7ddc3c63 100644
--- a/io/CMakeLists.txt
+++ b/io/CMakeLists.txt
@@ -17,7 +17,7 @@ ELSE( comma_BUILD_ZEROMQ )
 ENDIF( comma_BUILD_ZEROMQ )
 
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_string )
+target_link_libraries( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_name_value comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
diff --git a/io/applications/CMakeLists.txt b/io/applications/CMakeLists.txt
index 811b4c6e6..336357f5f 100644
--- a/io/applications/CMakeLists.txt
+++ b/io/applications/CMakeLists.txt
@@ -38,7 +38,7 @@ if( NOT WIN32 )
     set_target_properties( io-ls PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-ls RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
-    add_executable( io-publish ${dir}/io-publish.cpp ${dir}/detail/publish.h ${dir}/detail/publish.cpp )
+    add_executable( io-publish ${dir}/io-publish.cpp )
     target_link_libraries( io-publish comma_base comma_io comma_application comma_xpath comma_name_value ) # profiler )
     set_target_properties( io-publish PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-publish RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
@@ -48,7 +48,7 @@ if( NOT WIN32 )
     set_target_properties( io-tee PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-tee RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
-    add_executable( udp-client ${dir}/udp-client.cpp ${dir}/detail/publish.h ${dir}/detail/publish.cpp )
+    add_executable( udp-client ${dir}/udp-client.cpp )
     target_link_libraries( udp-client comma_application comma_name_value comma_io comma_csv comma_base comma_string ) # profiler )
     set_target_properties( udp-client PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS udp-client RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 6b95ceb60..c0c0a4236 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -3,7 +3,15 @@
 
 /// @authors cedric wohlleber, vsevolod vlaskine, dave jennings
 
-#include "detail/publish.h"
+#include "../../application/command_line_options.h"
+#include "../../application/signal_flag.h"
+#include "../../base/last_error.h"
+#include "../../io/file_descriptor.h"
+#include "../../io/publisher.h"
+#include "../../io/impl/publish.h"
+#include "../../name_value/map.h"
+#include "../../string/string.h"
+#include "../../sync/synchronized.h"
 
 //#include <google/profiler.h>
 
@@ -141,13 +149,13 @@ int main( int ac, char** av )
         comma::signal_flag is_shutdown( signals );
         bool on_demand = options.exists( "--on-demand" );
         bool exit_on_no_clients = options.exists( "--exit-on-no-clients,-e" );
-        comma::io::detail::publish p( names
-                                    , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
-                                    , !options.exists( "--no-discard" )
-                                    , !options.exists( "--no-flush" )
-                                    , options.exists( "--output-number-of-clients,--clients" )
-                                    , exit_on_no_clients || on_demand
-                                    , options.value( "--cache-size,--cache", 0 ) );
+        comma::io::impl::publish p( names
+                                  , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
+                                  , !options.exists( "--no-discard" )
+                                  , !options.exists( "--no-flush" )
+                                  , options.exists( "--output-number-of-clients,--clients" )
+                                  , exit_on_no_clients || on_demand
+                                  , options.value( "--cache-size,--cache", 0 ) );
         std::string exec_command = options.value< std::string >( "--exec", "" );
         if( !tail.empty() )
         {
diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index 95f5a5630..c523a93ee 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -47,7 +47,7 @@
 #include "../../csv/format.h"
 #include "../../csv/options.h"
 #include "../../string/string.h"
-#include "detail/publish.h"
+#include "../../io/impl/publish.h"
 
 static void usage()
 {
@@ -170,13 +170,13 @@ int main( int argc, char** argv )
         if( binary ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
         static_assert( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ), "expected time of size 8" );
-        comma::io::detail::publish p( output_streams
-                                    , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
-                                    , options.exists( "--discard" )
-                                    , options.exists( "--flush" ) || !binary
-                                    , false
-                                    , false
-                                    , options.value( "--cache-size,--cache", 0 ) );
+        comma::io::impl::publish p( output_streams
+                                  , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
+                                  , options.exists( "--discard" )
+                                  , options.exists( "--flush" ) || !binary
+                                  , false
+                                  , false
+                                  , options.value( "--cache-size,--cache", 0 ) );
         comma::signal_flag is_shutdown;
         if( binary )
         {
diff --git a/io/applications/detail/publish.cpp b/io/impl/publish.cpp
similarity index 95%
rename from io/applications/detail/publish.cpp
rename to io/impl/publish.cpp
index d92073334..b25bde260 100644
--- a/io/applications/detail/publish.cpp
+++ b/io/impl/publish.cpp
@@ -2,9 +2,10 @@
 // Copyright (c) 2020 Vsevolod Vlaskine
 // All rights reserved.
 
+#include "../../name_value/map.h"
 #include "publish.h"
 
-namespace comma { namespace io { namespace detail {
+namespace comma { namespace io { namespace impl {
 
 publish::publish( const std::vector< std::string >& endpoints
                 , unsigned int packet_size
@@ -122,7 +123,7 @@ bool publish::handle_sizes_( transaction_t& t ) // todo? why pass transaction? i
     if( update_no_clients_ )
     {
         if( total > 0 ) { got_first_client_ever_ = true; }
-        else if( got_first_client_ever_ ) { comma::saymore() << "the last client exited" << std::endl; return false; }
+        else if( got_first_client_ever_ ) { return false; } // { comma::saymore() << "the last client exited" << std::endl; return false; }
     }
     return true;
 }
@@ -177,4 +178,4 @@ void publish::accept_()
     }
 }
 
-} } } // namespace comma { namespace io { namespace detail {
+} } } // namespace comma { namespace io { namespace impl {
diff --git a/io/applications/detail/publish.h b/io/impl/publish.h
similarity index 84%
rename from io/applications/detail/publish.h
rename to io/impl/publish.h
index b13d90539..98349494d 100644
--- a/io/applications/detail/publish.h
+++ b/io/impl/publish.h
@@ -16,16 +16,12 @@
 #include <boost/iostreams/stream.hpp>
 #include <boost/scoped_ptr.hpp>
 #include <boost/thread.hpp>
-#include "../../../application/command_line_options.h"
-#include "../../../application/signal_flag.h"
-#include "../../../base/last_error.h"
-#include "../../../io/file_descriptor.h"
-#include "../../../io/publisher.h"
-#include "../../../name_value/map.h"
-#include "../../../string/string.h"
-#include "../../../sync/synchronized.h"
+#include "../../io/file_descriptor.h"
+#include "../../io/publisher.h"
+#include "../../string/string.h"
+#include "../../sync/synchronized.h"
 
-namespace comma { namespace io { namespace detail {
+namespace comma { namespace io { namespace impl {
 
 class publish
 {
@@ -84,4 +80,4 @@ class publish
         void accept_();
 };
 
-} } } // namespace comma { namespace io { namespace detail {
+} } } // namespace comma { namespace io { namespace impl {
diff --git a/name_value/CMakeLists.txt b/name_value/CMakeLists.txt
index b1b30b945..615d5009f 100644
--- a/name_value/CMakeLists.txt
+++ b/name_value/CMakeLists.txt
@@ -12,7 +12,7 @@ INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJE
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
+TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} ) # comma_application
 INSTALL(
     TARGETS ${TARGET_NAME}
     RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll

From 7f4f390e2e23ca70d5b020b3e485b5e820e1b99f Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Fri, 6 Sep 2024 13:33:09 +1000
Subject: [PATCH 0904/1056] io-topics: added templated command support to
 publish and cat operations

---
 io/applications/io-topics | 27 ++++++++++++++-------------
 1 file changed, 14 insertions(+), 13 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 0db580955..70f863e78 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -298,6 +298,16 @@ function set_topic_variables()
     if [[ -n "$topic_header_binary" ]]; then binary_option="--binary=$topic_header_binary"; fi
 }
 
+# allow placeholders in the command string
+function expanded_command()
+{
+    local cmd="$1"
+    {
+        grep "=" <<< "$options" | comma_path_value_mangle
+        echo "cmd=\"$( sed -e 's#"#\\\"#g' -e "s#'#\\'#g" <<< "$cmd" )\""
+    } | env -i $BASH -c 'eval "$( cat )"; echo "$cmd"'
+}
+
 function publish_command()
 {
     [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
@@ -309,8 +319,9 @@ function publish_command()
     if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     if [[ -n "$topic_cache_size" ]]; then cache_size="--cache-size=$topic_cache_size"; else unset cache_size; fi
     local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand $cache_size -- "
-    if [[ -z "$topic_input" ]]; then cmd+="$topic_command"
-    else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
+    local expanded_topic_command=$( expanded_command $topic_command )
+    if [[ -z "$topic_input" ]]; then cmd+="$expanded_topic_command"
+    else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $expanded_topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
     verbose "$cmd"
     echo "$cmd"
 }
@@ -328,21 +339,11 @@ function cat_command()
     if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
     if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
     if (( ignore_command )); then local cmd="io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option"
-    else local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_command"; fi # todo? comma_execute_and_wait?
+    else local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $( expanded_command $topic_command )"; fi # todo? comma_execute_and_wait?
     verbose "$cmd"
     echo "$cmd"
 }
 
-# allow placeholders in the command string
-function expanded_command()
-{
-    local cmd="$1"
-    {
-        grep "=" <<< "$options" | comma_path_value_mangle
-        echo "cmd=\"$( sed -e 's#"#\\\"#g' -e "s#'#\\'#g" <<< "$cmd" )\""
-    } | env -i $BASH -c 'eval "$( cat )"; echo "$cmd"'
-}
-
 function log_command()
 {
     [[ -n "$options_log_dir" ]] || die "please specify --log-dir"

From ad9384d76bfc0b162a9c4cdb14075a15e9496500 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Fri, 6 Sep 2024 18:18:44 +1000
Subject: [PATCH 0905/1056] io-topics: disabled command expansion

---
 io/applications/io-topics                   | 29 +++++++++++++++++++--
 io/test/io-topics/command-template/disabled |  1 +
 2 files changed, 28 insertions(+), 2 deletions(-)
 create mode 100644 io/test/io-topics/command-template/disabled

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 70f863e78..77414c6c2 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -300,6 +300,24 @@ function set_topic_variables()
 
 # allow placeholders in the command string
 function expanded_command()
+{
+    local cmd="$1"
+    echo "$cmd"
+    return
+
+    local token
+    echo $cmd | sed 's/\${/\n${/;s/}/}\n/' \
+        | while IFS='' read token; do \
+              if [[ $token =~ ^\$\{[a-zA-Z_][a-zA-Z0-9_]*\}$ ]]; then
+                  local variable_name="options_${token:2:-1}"
+                  echo "${!variable_name}"
+              else
+                  echo "$token"
+              fi
+          done | tr -d '\n'
+}
+
+function expanded_command_old()
 {
     local cmd="$1"
     {
@@ -319,7 +337,9 @@ function publish_command()
     if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     if [[ -n "$topic_cache_size" ]]; then cache_size="--cache-size=$topic_cache_size"; else unset cache_size; fi
     local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand $cache_size -- "
-    local expanded_topic_command=$( expanded_command $topic_command )
+    verbose "publish topic_command: $topic_command"
+    local expanded_topic_command=$( expanded_command "$topic_command" )
+    verbose "publish expanded_topic_command: $expanded_topic_command"
     if [[ -z "$topic_input" ]]; then cmd+="$expanded_topic_command"
     else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $expanded_topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
     verbose "$cmd"
@@ -339,7 +359,12 @@ function cat_command()
     if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
     if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
     if (( ignore_command )); then local cmd="io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option"
-    else local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $( expanded_command $topic_command )"; fi # todo? comma_execute_and_wait?
+    else
+        verbose "cat topic_command: $topic_command"
+        local expanded_topic_command=$( expanded_command "$topic_command" )
+        verbose "cat expanded_topic_command: $expanded_topic_command"
+        local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $expanded_topic_command"
+    fi # todo? comma_execute_and_wait?
     verbose "$cmd"
     echo "$cmd"
 }
diff --git a/io/test/io-topics/command-template/disabled b/io/test/io-topics/command-template/disabled
new file mode 100644
index 000000000..9111fd4a0
--- /dev/null
+++ b/io/test/io-topics/command-template/disabled
@@ -0,0 +1 @@
+disabled pending feature completion

From 6ed799d27ba9735921d5c786bfa34d9a3664e3b3 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 4 Sep 2024 14:25:09 +1000
Subject: [PATCH 0906/1056] io-topics: added support for templated commands

---
 io/applications/io-topics                     | 19 ++++++++++++++++++-
 .../io-topics/command-template/config.json    |  6 ++++++
 io/test/io-topics/command-template/expected   |  4 ++++
 io/test/io-topics/command-template/input      |  2 ++
 io/test/io-topics/command-template/test       |  5 +++++
 5 files changed, 35 insertions(+), 1 deletion(-)
 create mode 100644 io/test/io-topics/command-template/config.json
 create mode 100644 io/test/io-topics/command-template/expected
 create mode 100644 io/test/io-topics/command-template/input
 create mode 100755 io/test/io-topics/command-template/test

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 01ecbfe98..f17a9f38e 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -157,6 +157,11 @@ EOF
                   echo 'b/command=socat tcp:localhost:12346 - > log.csv' )
             $ ls -al my-log/a
             $ head my-log/b/log.csv
+
+        trigger logging on a remote machine with templated command
+            $ io-topics log --dir my-log --config <(
+                  echo "a/command=curl 'http://remote:7000/log=start&name=${log_dir}'" )
+
 eof
     else
         echo "use \"$scriptname --help --verbose\" for examples"
@@ -318,12 +323,24 @@ function cat_command()
     echo "$cmd"
 }
 
+# allow placeholders in the command string
+function expanded_command()
+{
+    local cmd="$1"
+    eval "$( grep "=" <<< "$options" | comma_path_value_mangle | sed 's#^#local #' )"
+    eval "echo \"${cmd}\""
+}
+
 function log_command()
 {
     [[ -n "$options_log_dir" ]] || die "please specify --log-dir"
     local topic=$1
     local cmd="$topic_command"
-    if [[ -z "$cmd" ]]; then
+    if [[ "$cmd" ]]; then
+        verbose "got $cmd"
+        cmd=$( expanded_command "$cmd" )
+        verbose "expanded to $cmd"
+    else
         set_topic_address
         [[ -n "$topic_index" ]] || topic_index="cat"
         local flush_option suffix_option
diff --git a/io/test/io-topics/command-template/config.json b/io/test/io-topics/command-template/config.json
new file mode 100644
index 000000000..29347c0f3
--- /dev/null
+++ b/io/test/io-topics/command-template/config.json
@@ -0,0 +1,6 @@
+{
+    "topic1":
+    {
+        "command": "echo ${log_dir}"
+    }
+}
diff --git a/io/test/io-topics/command-template/expected b/io/test/io-topics/command-template/expected
new file mode 100644
index 000000000..c38a614eb
--- /dev/null
+++ b/io/test/io-topics/command-template/expected
@@ -0,0 +1,4 @@
+log/dir/output="my-dir"
+log/dir/status=0
+log/log_dir/output="my-log-dir"
+log/log_dir/status=0
diff --git a/io/test/io-topics/command-template/input b/io/test/io-topics/command-template/input
new file mode 100644
index 000000000..174169cc2
--- /dev/null
+++ b/io/test/io-topics/command-template/input
@@ -0,0 +1,2 @@
+log/dir="io-topics log --config config.json --dir my-dir"
+log/log_dir="io-topics log --config config.json --log-dir my-log-dir"
diff --git a/io/test/io-topics/command-template/test b/io/test/io-topics/command-template/test
new file mode 100755
index 000000000..152895e63
--- /dev/null
+++ b/io/test/io-topics/command-template/test
@@ -0,0 +1,5 @@
+#!/bin/bash
+
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands

From 23504e6273624013f42213270707b1b69bbb4ab0 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Wed, 4 Sep 2024 14:25:55 +1000
Subject: [PATCH 0907/1056] io-topics: added support for actions on exit

---
 io/applications/io-topics | 16 ++++++++++++++++
 1 file changed, 16 insertions(+)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index f17a9f38e..a3d10ec1a 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -191,6 +191,7 @@ command;           command for the publisher to run
 input;             input topic for publish command to read on stdin
 multiplier;        passed to io-publish
 on_demand;         same meaning as io-publish --on-demand
+on_exit;           command to run when publisher stops
 port;              tcp port for publishing, unless address field is present
 secondary/address; passed verbatim to io-publish as '<address>;secondary',
                    in this case port attribute ignored
@@ -212,6 +213,7 @@ connect_attempts; number of connect attempts
 connect_period;   time in seconds between connect attempts
 flush;            flush output on each record, default: buffer output
 host;             tcp host for publishing, unless address field is present
+on_exit;          command to run when output stops
 port;             tcp port for publishing, unless address field is present
 size;             if data is binary, size of the binary record
 eof
@@ -234,6 +236,7 @@ header/fields;    if binary and has 'size' field, variable payload of size field
 host;             tcp host for publishing, unless address field is present
 index;            optional command to generate index file, default: fixed-width
                   binary index for each binary record, ascii: no index file
+on_exit;          command to run when logger stops
 path;             prefix path for log directory (to split logs across drives)
 period;           split log files at given number of seconds, overrides --period
 port;             tcp port for publishing, unless address field is present
@@ -404,6 +407,13 @@ if (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )); t
     usage $verbose
 fi
 
+on_exit_commands=()
+
+function on_exit()
+{
+    comma_execute_and_wait --group "${on_exit_commands[@]}"
+}
+
 operation=$1
 [[ $( type -t ${operation}_topic_fields ) == "function" ]] || die "expected operation, got '$operation'" # quick and dirty
 (( $( comma_options_has --topic-fields "$@" ) )) && { ${operation}_topic_fields; exit 0; }
@@ -419,8 +429,14 @@ for topic in ${topics[@]}; do
     set_topic_variables "$operation" "$topic"
     cmd="$( ${operation}_command $topic )" || die "topic '$topic': making command failed"
     commands+=( "$cmd" )
+    [[ $topic_on_exit ]] && on_exit_commands+=( "$topic_on_exit" )
 done
 say "will run 'comma_execute_and_wait --group' with commands:"
 for cmd in "${commands[@]}"; do say "    $cmd"; done
+if (( ${#on_exit_commands[@]} > 0 )); then
+    say "on exit will run:"
+    for cmd in "${on_exit_commands[@]}"; do say "    $cmd"; done
+    trap on_exit EXIT
+fi
 [[ -z "$options_dry_run" ]] || exit
 comma_execute_and_wait --group "${commands[@]}"

From ef2f93452441f7f439f513506defa14b7e1b069f Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Fri, 6 Sep 2024 13:17:14 +1000
Subject: [PATCH 0908/1056] io-topics: --dry-run fixed and help improved

---
 io/applications/io-topics | 17 ++++++++++++++---
 1 file changed, 14 insertions(+), 3 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index a3d10ec1a..0db580955 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -55,6 +55,13 @@ operations
     play:    play back logs, counterpart to log operation (todo)
     publish: start all the publishers listed on command line or config file
 
+variable substitution in commands
+    options can be passed to commands via variable substitution. for example:
+    command="save-to-dir ${log_dir}"
+    all options are available,
+    e.g. --config -> ${config}; --log-dir -> ${log_dir}
+    see examples below for more detail
+
 common options
 $( common_options | sed 's/^/    /g' )
 
@@ -330,8 +337,10 @@ function cat_command()
 function expanded_command()
 {
     local cmd="$1"
-    eval "$( grep "=" <<< "$options" | comma_path_value_mangle | sed 's#^#local #' )"
-    eval "echo \"${cmd}\""
+    {
+        grep "=" <<< "$options" | comma_path_value_mangle
+        echo "cmd=\"$( sed -e 's#"#\\\"#g' -e "s#'#\\'#g" <<< "$cmd" )\""
+    } | env -i $BASH -c 'eval "$( cat )"; echo "$cmd"'
 }
 
 function log_command()
@@ -411,6 +420,8 @@ on_exit_commands=()
 
 function on_exit()
 {
+    say "running commands on exit:"
+    for cmd in "${on_exit_commands[@]}"; do say "    $cmd"; done
     comma_execute_and_wait --group "${on_exit_commands[@]}"
 }
 
@@ -436,7 +447,7 @@ for cmd in "${commands[@]}"; do say "    $cmd"; done
 if (( ${#on_exit_commands[@]} > 0 )); then
     say "on exit will run:"
     for cmd in "${on_exit_commands[@]}"; do say "    $cmd"; done
-    trap on_exit EXIT
+    [[ $options_dry_run ]] || trap on_exit EXIT
 fi
 [[ -z "$options_dry_run" ]] || exit
 comma_execute_and_wait --group "${commands[@]}"

From 0d68878eea69a2ef8636d216bdfc864aa80d8bea Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Fri, 6 Sep 2024 13:33:09 +1000
Subject: [PATCH 0909/1056] io-topics: added templated command support to
 publish and cat operations

---
 io/applications/io-topics | 27 ++++++++++++++-------------
 1 file changed, 14 insertions(+), 13 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 0db580955..70f863e78 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -298,6 +298,16 @@ function set_topic_variables()
     if [[ -n "$topic_header_binary" ]]; then binary_option="--binary=$topic_header_binary"; fi
 }
 
+# allow placeholders in the command string
+function expanded_command()
+{
+    local cmd="$1"
+    {
+        grep "=" <<< "$options" | comma_path_value_mangle
+        echo "cmd=\"$( sed -e 's#"#\\\"#g' -e "s#'#\\'#g" <<< "$cmd" )\""
+    } | env -i $BASH -c 'eval "$( cat )"; echo "$cmd"'
+}
+
 function publish_command()
 {
     [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
@@ -309,8 +319,9 @@ function publish_command()
     if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     if [[ -n "$topic_cache_size" ]]; then cache_size="--cache-size=$topic_cache_size"; else unset cache_size; fi
     local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand $cache_size -- "
-    if [[ -z "$topic_input" ]]; then cmd+="$topic_command"
-    else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
+    local expanded_topic_command=$( expanded_command $topic_command )
+    if [[ -z "$topic_input" ]]; then cmd+="$expanded_topic_command"
+    else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $expanded_topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
     verbose "$cmd"
     echo "$cmd"
 }
@@ -328,21 +339,11 @@ function cat_command()
     if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
     if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
     if (( ignore_command )); then local cmd="io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option"
-    else local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_command"; fi # todo? comma_execute_and_wait?
+    else local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $( expanded_command $topic_command )"; fi # todo? comma_execute_and_wait?
     verbose "$cmd"
     echo "$cmd"
 }
 
-# allow placeholders in the command string
-function expanded_command()
-{
-    local cmd="$1"
-    {
-        grep "=" <<< "$options" | comma_path_value_mangle
-        echo "cmd=\"$( sed -e 's#"#\\\"#g' -e "s#'#\\'#g" <<< "$cmd" )\""
-    } | env -i $BASH -c 'eval "$( cat )"; echo "$cmd"'
-}
-
 function log_command()
 {
     [[ -n "$options_log_dir" ]] || die "please specify --log-dir"

From 68686738a9a2538a1df3fcb5a122333178959110 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Fri, 6 Sep 2024 18:18:44 +1000
Subject: [PATCH 0910/1056] io-topics: disabled command expansion

---
 io/applications/io-topics                   | 29 +++++++++++++++++++--
 io/test/io-topics/command-template/disabled |  1 +
 2 files changed, 28 insertions(+), 2 deletions(-)
 create mode 100644 io/test/io-topics/command-template/disabled

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 70f863e78..77414c6c2 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -300,6 +300,24 @@ function set_topic_variables()
 
 # allow placeholders in the command string
 function expanded_command()
+{
+    local cmd="$1"
+    echo "$cmd"
+    return
+
+    local token
+    echo $cmd | sed 's/\${/\n${/;s/}/}\n/' \
+        | while IFS='' read token; do \
+              if [[ $token =~ ^\$\{[a-zA-Z_][a-zA-Z0-9_]*\}$ ]]; then
+                  local variable_name="options_${token:2:-1}"
+                  echo "${!variable_name}"
+              else
+                  echo "$token"
+              fi
+          done | tr -d '\n'
+}
+
+function expanded_command_old()
 {
     local cmd="$1"
     {
@@ -319,7 +337,9 @@ function publish_command()
     if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
     if [[ -n "$topic_cache_size" ]]; then cache_size="--cache-size=$topic_cache_size"; else unset cache_size; fi
     local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand $cache_size -- "
-    local expanded_topic_command=$( expanded_command $topic_command )
+    verbose "publish topic_command: $topic_command"
+    local expanded_topic_command=$( expanded_command "$topic_command" )
+    verbose "publish expanded_topic_command: $expanded_topic_command"
     if [[ -z "$topic_input" ]]; then cmd+="$expanded_topic_command"
     else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $expanded_topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
     verbose "$cmd"
@@ -339,7 +359,12 @@ function cat_command()
     if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
     if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
     if (( ignore_command )); then local cmd="io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option"
-    else local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $( expanded_command $topic_command )"; fi # todo? comma_execute_and_wait?
+    else
+        verbose "cat topic_command: $topic_command"
+        local expanded_topic_command=$( expanded_command "$topic_command" )
+        verbose "cat expanded_topic_command: $expanded_topic_command"
+        local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $expanded_topic_command"
+    fi # todo? comma_execute_and_wait?
     verbose "$cmd"
     echo "$cmd"
 }
diff --git a/io/test/io-topics/command-template/disabled b/io/test/io-topics/command-template/disabled
new file mode 100644
index 000000000..9111fd4a0
--- /dev/null
+++ b/io/test/io-topics/command-template/disabled
@@ -0,0 +1 @@
+disabled pending feature completion

From 4aba3c3c26e845646e676a7c19e2ab236afbe00f Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 6 Sep 2024 18:48:39 +1000
Subject: [PATCH 0911/1056] io-topics: command substitution: in progress

---
 io/applications/io-topics                     | 41 ++++++++++---------
 .../substitution}/config.json                 |  0
 .../substitution}/disabled                    |  0
 .../substitution}/expected                    |  0
 .../substitution}/input                       |  0
 .../substitution}/test                        |  0
 6 files changed, 21 insertions(+), 20 deletions(-)
 rename io/test/io-topics/{command-template => commands/substitution}/config.json (100%)
 rename io/test/io-topics/{command-template => commands/substitution}/disabled (100%)
 rename io/test/io-topics/{command-template => commands/substitution}/expected (100%)
 rename io/test/io-topics/{command-template => commands/substitution}/input (100%)
 rename io/test/io-topics/{command-template => commands/substitution}/test (100%)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 77414c6c2..3bf7e1b98 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -299,31 +299,32 @@ function set_topic_variables()
 }
 
 # allow placeholders in the command string
-function expanded_command()
-{
-    local cmd="$1"
-    echo "$cmd"
-    return
-
-    local token
-    echo $cmd | sed 's/\${/\n${/;s/}/}\n/' \
-        | while IFS='' read token; do \
-              if [[ $token =~ ^\$\{[a-zA-Z_][a-zA-Z0-9_]*\}$ ]]; then
-                  local variable_name="options_${token:2:-1}"
-                  echo "${!variable_name}"
-              else
-                  echo "$token"
-              fi
-          done | tr -d '\n'
-}
+# function expanded_command()
+# {
+#     local cmd="$1"
+#     echo "$cmd"
+#     return
+
+#     local token
+#     echo $cmd | sed 's/\${/\n${/;s/}/}\n/' \
+#         | while IFS='' read token; do \
+#               if [[ $token =~ ^\$\{[a-zA-Z_][a-zA-Z0-9_]*\}$ ]]; then
+#                   local variable_name="options_${token:2:-1}"
+#                   echo "${!variable_name}"
+#               else
+#                   echo "$token"
+#               fi
+#           done | tr -d '\n'
+# }
 
-function expanded_command_old()
+function expanded_command()
 {
     local cmd="$1"
     {
         grep "=" <<< "$options" | comma_path_value_mangle
-        echo "cmd=\"$( sed -e 's#"#\\\"#g' -e "s#'#\\'#g" <<< "$cmd" )\""
-    } | env -i $BASH -c 'eval "$( cat )"; echo "$cmd"'
+        echo "cmd="
+        sed -e 's#\${#\n\$\{#g' -e 's#}#}\n#g' <<< "$cmd" | sed -e 's#^#cmd+="#' -e 's#$#"#'
+    } | env -i $BASH -c 'eval "$( cat )"; echo "$cmd"' | tr -d '\n'
 }
 
 function publish_command()
diff --git a/io/test/io-topics/command-template/config.json b/io/test/io-topics/commands/substitution/config.json
similarity index 100%
rename from io/test/io-topics/command-template/config.json
rename to io/test/io-topics/commands/substitution/config.json
diff --git a/io/test/io-topics/command-template/disabled b/io/test/io-topics/commands/substitution/disabled
similarity index 100%
rename from io/test/io-topics/command-template/disabled
rename to io/test/io-topics/commands/substitution/disabled
diff --git a/io/test/io-topics/command-template/expected b/io/test/io-topics/commands/substitution/expected
similarity index 100%
rename from io/test/io-topics/command-template/expected
rename to io/test/io-topics/commands/substitution/expected
diff --git a/io/test/io-topics/command-template/input b/io/test/io-topics/commands/substitution/input
similarity index 100%
rename from io/test/io-topics/command-template/input
rename to io/test/io-topics/commands/substitution/input
diff --git a/io/test/io-topics/command-template/test b/io/test/io-topics/commands/substitution/test
similarity index 100%
rename from io/test/io-topics/command-template/test
rename to io/test/io-topics/commands/substitution/test

From db059d42abd96a7b7e1590f214d4b020d5d2eec1 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 6 Sep 2024 19:59:38 +1000
Subject: [PATCH 0912/1056] io-topics: expanded command implemented

---
 io/applications/io-topics                     | 34 ++++++-------------
 .../io-topics/commands/substitution/disabled  |  1 -
 2 files changed, 11 insertions(+), 24 deletions(-)
 delete mode 100644 io/test/io-topics/commands/substitution/disabled

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 3bf7e1b98..b1581ef28 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -298,33 +298,21 @@ function set_topic_variables()
     if [[ -n "$topic_header_binary" ]]; then binary_option="--binary=$topic_header_binary"; fi
 }
 
-# allow placeholders in the command string
-# function expanded_command()
-# {
-#     local cmd="$1"
-#     echo "$cmd"
-#     return
-
-#     local token
-#     echo $cmd | sed 's/\${/\n${/;s/}/}\n/' \
-#         | while IFS='' read token; do \
-#               if [[ $token =~ ^\$\{[a-zA-Z_][a-zA-Z0-9_]*\}$ ]]; then
-#                   local variable_name="options_${token:2:-1}"
-#                   echo "${!variable_name}"
-#               else
-#                   echo "$token"
-#               fi
-#           done | tr -d '\n'
-# }
-
-function expanded_command()
+function expanded_command() # quick and dirty
 {
     local cmd="$1"
     {
         grep "=" <<< "$options" | comma_path_value_mangle
-        echo "cmd="
-        sed -e 's#\${#\n\$\{#g' -e 's#}#}\n#g' <<< "$cmd" | sed -e 's#^#cmd+="#' -e 's#$#"#'
-    } | env -i $BASH -c 'eval "$( cat )"; echo "$cmd"' | tr -d '\n'
+        echo "${cmd// /__whitespace__}"
+    } \
+        | env -i $BASH -c 'input=$( cat )
+                           eval "$( head -n-1 <<< "$input" )"
+                           cmd=""
+                           while read line; do
+                               echo -n "$line" >> 1.txt
+                               if [[ $line =~ ^\$\{[a-zA-Z_][a-zA-Z0-9_]*\}$ ]]; then var="${line:2:-1}"; cmd+="${!var}"; else cmd+="$line"; fi
+                           done < <( tail -n1 <<< "$input" | sed -e "s#\${#\n\$\{#g" -e "s#}#}\n#g" )
+                           echo "${cmd//__whitespace__/ }"'
 }
 
 function publish_command()
diff --git a/io/test/io-topics/commands/substitution/disabled b/io/test/io-topics/commands/substitution/disabled
deleted file mode 100644
index 9111fd4a0..000000000
--- a/io/test/io-topics/commands/substitution/disabled
+++ /dev/null
@@ -1 +0,0 @@
-disabled pending feature completion

From f9fe3ca55b51201d06e09d0cbb7681567f36f640 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 6 Sep 2024 20:03:46 +1000
Subject: [PATCH 0913/1056] io/test/io-topics/command-template: moved to
 commands/substitution

---
 io/test/io-topics/command-template/config.json | 6 ------
 io/test/io-topics/command-template/disabled    | 1 -
 io/test/io-topics/command-template/expected    | 4 ----
 io/test/io-topics/command-template/input       | 2 --
 io/test/io-topics/command-template/test        | 5 -----
 5 files changed, 18 deletions(-)
 delete mode 100644 io/test/io-topics/command-template/config.json
 delete mode 100644 io/test/io-topics/command-template/disabled
 delete mode 100644 io/test/io-topics/command-template/expected
 delete mode 100644 io/test/io-topics/command-template/input
 delete mode 100755 io/test/io-topics/command-template/test

diff --git a/io/test/io-topics/command-template/config.json b/io/test/io-topics/command-template/config.json
deleted file mode 100644
index 29347c0f3..000000000
--- a/io/test/io-topics/command-template/config.json
+++ /dev/null
@@ -1,6 +0,0 @@
-{
-    "topic1":
-    {
-        "command": "echo ${log_dir}"
-    }
-}
diff --git a/io/test/io-topics/command-template/disabled b/io/test/io-topics/command-template/disabled
deleted file mode 100644
index 9111fd4a0..000000000
--- a/io/test/io-topics/command-template/disabled
+++ /dev/null
@@ -1 +0,0 @@
-disabled pending feature completion
diff --git a/io/test/io-topics/command-template/expected b/io/test/io-topics/command-template/expected
deleted file mode 100644
index c38a614eb..000000000
--- a/io/test/io-topics/command-template/expected
+++ /dev/null
@@ -1,4 +0,0 @@
-log/dir/output="my-dir"
-log/dir/status=0
-log/log_dir/output="my-log-dir"
-log/log_dir/status=0
diff --git a/io/test/io-topics/command-template/input b/io/test/io-topics/command-template/input
deleted file mode 100644
index 174169cc2..000000000
--- a/io/test/io-topics/command-template/input
+++ /dev/null
@@ -1,2 +0,0 @@
-log/dir="io-topics log --config config.json --dir my-dir"
-log/log_dir="io-topics log --config config.json --log-dir my-log-dir"
diff --git a/io/test/io-topics/command-template/test b/io/test/io-topics/command-template/test
deleted file mode 100755
index 152895e63..000000000
--- a/io/test/io-topics/command-template/test
+++ /dev/null
@@ -1,5 +0,0 @@
-#!/bin/bash
-
-source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
-
-comma_test_commands

From 9f13bb3ddef7fd00d6a279082c16bca534fa525b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 7 Sep 2024 13:00:17 +1000
Subject: [PATCH 0914/1056] io-topics: command substitution simplified

---
 io/applications/io-topics | 7 +++----
 1 file changed, 3 insertions(+), 4 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index b1581ef28..5189cdd10 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -303,16 +303,15 @@ function expanded_command() # quick and dirty
     local cmd="$1"
     {
         grep "=" <<< "$options" | comma_path_value_mangle
-        echo "${cmd// /__whitespace__}"
+        echo "$cmd"
     } \
         | env -i $BASH -c 'input=$( cat )
                            eval "$( head -n-1 <<< "$input" )"
                            cmd=""
-                           while read line; do
-                               echo -n "$line" >> 1.txt
+                           while IFS="" read line; do
                                if [[ $line =~ ^\$\{[a-zA-Z_][a-zA-Z0-9_]*\}$ ]]; then var="${line:2:-1}"; cmd+="${!var}"; else cmd+="$line"; fi
                            done < <( tail -n1 <<< "$input" | sed -e "s#\${#\n\$\{#g" -e "s#}#}\n#g" )
-                           echo "${cmd//__whitespace__/ }"'
+                           echo "$cmd"'
 }
 
 function publish_command()

From a95e6075f22b97c01dd844529c9a3d50e63fab78 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 7 Sep 2024 13:27:44 +1000
Subject: [PATCH 0915/1056] io-topics: --env: first cut implemented, basic test
 added

---
 io/applications/io-topics                     | 41 +++++++++++--------
 .../commands/substitution/config.json         |  2 +-
 .../io-topics/commands/substitution/expected  |  2 +
 io/test/io-topics/commands/substitution/input |  5 ++-
 .../commands/{substitution => }/test          |  0
 5 files changed, 31 insertions(+), 19 deletions(-)
 rename io/test/io-topics/commands/{substitution => }/test (100%)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 5189cdd10..993109845 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -20,19 +20,23 @@ function bash_completion()
 function common_options()
 {
     cat <<EOF
---help,-h;           display help and exit
---config=[<config>]; <config>: <dir>[:<path>], where <dir> is path to a
-                     json or path-value file specifying topic attributes,
-                     <path>: path inside config, multiple --config options
-                     allowed, configs will be applied in the reverse order
-                     of --config options on command line (see examples)
---dry-run,--dry;     print final command and exit
+--help,-h;            display help and exit
+--config=[<config>];  <config>: <dir>[:<path>], where <dir> is path to a
+                      json or path-value file specifying topic attributes,
+                      <path>: path inside config, multiple --config options
+                      allowed, configs will be applied in the reverse order
+                      of --config options on command line (see examples)
+--dry-run,--dry;      print final command and exit
+--env=[<defintions>]; <definitions>: bash-style variable definitions that 
+                      will be used only for \${some-var} variable substitution
+                      in commands, see variable substition in commands below
+                      e.g. --env="my_var=123;another_var='hello;world'"
 --topics-from-all-configs,--all; take topics from all configs and topic
-                     command values, default: take topics and topic command
-                     values only from the first config ("master config")
---topic-fields;      output topic config fields and exit
---topic-fields-help; output topic config fields help and exit
---verbose,-v;        print verbose information
+                      command values, default: take topics and topic command
+                      values only from the first config ("master config")
+--topic-fields;       output topic config fields and exit
+--topic-fields-help;  output topic config fields help and exit
+--verbose,-v;         print verbose information
 EOF
 }
 
@@ -56,10 +60,14 @@ operations
     publish: start all the publishers listed on command line or config file
 
 variable substition in commands
-    options can be passed to commands via variable substition. for example:
-    command="save-to-dir ${log_dir}"
-    all options are available,
-    e.g. --config -> ${config}; --log-dir -> ${log_dir}
+    options can be passed to commands via variable substition
+    example:
+        command="save-to-dir \${log_dir}"
+    all command line options and values defined in --env are available
+        e.g:
+            --config -> \${config}
+            --log-dir -> \${log_dir}
+            --env="my_var=5" -> \${my_var}
     see examples below for more detail
 
 common options
@@ -303,6 +311,7 @@ function expanded_command() # quick and dirty
     local cmd="$1"
     {
         grep "=" <<< "$options" | comma_path_value_mangle
+        echo "$options_env"
         echo "$cmd"
     } \
         | env -i $BASH -c 'input=$( cat )
diff --git a/io/test/io-topics/commands/substitution/config.json b/io/test/io-topics/commands/substitution/config.json
index 29347c0f3..c6f043da4 100644
--- a/io/test/io-topics/commands/substitution/config.json
+++ b/io/test/io-topics/commands/substitution/config.json
@@ -1,6 +1,6 @@
 {
     "topic1":
     {
-        "command": "echo ${log_dir}"
+        "command": "echo ${log_dir} ${my_var} ${another_var}"
     }
 }
diff --git a/io/test/io-topics/commands/substitution/expected b/io/test/io-topics/commands/substitution/expected
index c38a614eb..10c101a24 100644
--- a/io/test/io-topics/commands/substitution/expected
+++ b/io/test/io-topics/commands/substitution/expected
@@ -2,3 +2,5 @@ log/dir/output="my-dir"
 log/dir/status=0
 log/log_dir/output="my-log-dir"
 log/log_dir/status=0
+log/evn/output="my-dir hello world"
+log/evn/status=0
diff --git a/io/test/io-topics/commands/substitution/input b/io/test/io-topics/commands/substitution/input
index 174169cc2..d48192f35 100644
--- a/io/test/io-topics/commands/substitution/input
+++ b/io/test/io-topics/commands/substitution/input
@@ -1,2 +1,3 @@
-log/dir="io-topics log --config config.json --dir my-dir"
-log/log_dir="io-topics log --config config.json --log-dir my-log-dir"
+log/dir="io-topics log --config config.json --dir my-dir --verbose"
+log/log_dir="io-topics log --config config.json --log-dir my-log-dir --verbose"
+log/evn="io-topics log --config config.json --dir my-dir --env 'my_var=hello;another_var=world' --verbose"
diff --git a/io/test/io-topics/commands/substitution/test b/io/test/io-topics/commands/test
similarity index 100%
rename from io/test/io-topics/commands/substitution/test
rename to io/test/io-topics/commands/test

From ebb2073235addd6558093b75a2d02a3a3770ac53 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 7 Sep 2024 13:34:19 +1000
Subject: [PATCH 0916/1056] io-topics: variable substitution: plugged into
 on_exit, basic test added

---
 io/applications/io-topics                           | 2 +-
 io/test/io-topics/commands/substitution/config.json | 3 ++-
 io/test/io-topics/commands/substitution/expected    | 9 ++++++---
 3 files changed, 9 insertions(+), 5 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 993109845..473d5dcd1 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -463,7 +463,7 @@ for topic in ${topics[@]}; do
     set_topic_variables "$operation" "$topic"
     cmd="$( ${operation}_command $topic )" || die "topic '$topic': making command failed"
     commands+=( "$cmd" )
-    [[ $topic_on_exit ]] && on_exit_commands+=( "$topic_on_exit" )
+    [[ $topic_on_exit ]] && on_exit_commands+=( "$( expanded_command "$topic_on_exit" )" )
 done
 say "will run 'comma_execute_and_wait --group' with commands:"
 for cmd in "${commands[@]}"; do say "    $cmd"; done
diff --git a/io/test/io-topics/commands/substitution/config.json b/io/test/io-topics/commands/substitution/config.json
index c6f043da4..106acde84 100644
--- a/io/test/io-topics/commands/substitution/config.json
+++ b/io/test/io-topics/commands/substitution/config.json
@@ -1,6 +1,7 @@
 {
     "topic1":
     {
-        "command": "echo ${log_dir} ${my_var} ${another_var}"
+        "command": "echo command: echo ${log_dir} ${my_var} ${another_var}",
+        "on_exit": "echo on_exit: echo ${log_dir}"
     }
 }
diff --git a/io/test/io-topics/commands/substitution/expected b/io/test/io-topics/commands/substitution/expected
index 10c101a24..d80b50e68 100644
--- a/io/test/io-topics/commands/substitution/expected
+++ b/io/test/io-topics/commands/substitution/expected
@@ -1,6 +1,9 @@
-log/dir/output="my-dir"
+log/dir/output/line[0]="command: echo my-dir"
+log/dir/output/line[1]="on_exit: echo my-dir"
 log/dir/status=0
-log/log_dir/output="my-log-dir"
+log/log_dir/output/line[0]="command: echo my-log-dir"
+log/log_dir/output/line[1]="on_exit: echo my-log-dir"
 log/log_dir/status=0
-log/evn/output="my-dir hello world"
+log/evn/output/line[0]="command: echo my-dir hello world"
+log/evn/output/line[1]="on_exit: echo my-dir"
 log/evn/status=0

From ac7dd964d54c8266ac41c281196b3eefec3f93e1 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 7 Sep 2024 18:27:05 +1000
Subject: [PATCH 0917/1056] io-topics: --help: variable substitution: more
 examples added

---
 io/applications/io-topics | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/io/applications/io-topics b/io/applications/io-topics
index 473d5dcd1..0dd42e1fa 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -60,9 +60,10 @@ operations
     publish: start all the publishers listed on command line or config file
 
 variable substition in commands
-    options can be passed to commands via variable substition
-    example:
-        command="save-to-dir \${log_dir}"
+    options can be passed to command and on_exit fields via variable substition
+    examples
+        "command": "log-some-sensor \${log_dir}"
+        "on_exit": "save-to-dir \${log_dir}"
     all command line options and values defined in --env are available
         e.g:
             --config -> \${config}

From 8e660a22bb826d8e2ae0413049fe43fb017ce679 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 Sep 2024 01:22:58 +1000
Subject: [PATCH 0918/1056] missing headers included

---
 csv/applications/csv-seek.cpp  | 1 +
 csv/applications/csv-shape.cpp | 1 +
 io/load.h                      | 4 ++--
 io/stream.h                    | 1 +
 name_value/ptree.h             | 1 +
 5 files changed, 6 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
index 8897785c3..881c95932 100644
--- a/csv/applications/csv-seek.cpp
+++ b/csv/applications/csv-seek.cpp
@@ -2,6 +2,7 @@
 
 /// @author Aspen Eyers
 
+#include <cstdint>
 #include <iostream>
 #include <fstream>
 #include "../../application/command_line_options.h"
diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index 74d65d009..46fc29289 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -3,6 +3,7 @@
 
 /// @author dewey nguyen
 
+#include <cstdint>
 #include <deque>
 #include <iostream>
 #include <vector>
diff --git a/io/load.h b/io/load.h
index 44fc8f598..b6e2599a1 100644
--- a/io/load.h
+++ b/io/load.h
@@ -22,7 +22,7 @@ template < typename T, template < typename S, typename A > class C = std::vector
 C< T, A > load_array( const std::string& path );
 
 
-template < typename T, template < typename S, typename A > class C = std::vector, typename A >
+template < typename T, template < typename S, typename A > class C, typename A >
 inline C< T, A >& load_array( C< T, A >& a, const std::string& path )
 {
     std::ifstream ifs( path );
@@ -33,7 +33,7 @@ inline C< T, A >& load_array( C< T, A >& a, const std::string& path )
     return a;
 }
 
-template < typename T, template < typename S, typename A > class C = std::vector, typename A >
+template < typename T, template < typename S, typename A > class C, typename A >
 inline C< T, A > load_array( const std::string& path )
 {
     C< T, A > a;
diff --git a/io/stream.h b/io/stream.h
index 70e3ff013..a86ac2e58 100644
--- a/io/stream.h
+++ b/io/stream.h
@@ -5,6 +5,7 @@
 
 #pragma once
 
+#include <cstdint>
 #include <iostream>
 #include <memory>
 #include <string>
diff --git a/name_value/ptree.h b/name_value/ptree.h
index d80996b99..32710fd47 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -19,6 +19,7 @@
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
+#include <boost/type_traits.hpp>
 #include <boost/unordered_set.hpp>
 #include <boost/version.hpp>
 #include "../base/exception.h"

From baae2a8df7c8250c8a514e59cff3923a7b061d0a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 Sep 2024 12:44:16 +1000
Subject: [PATCH 0919/1056] test/io-cat/single_feed/test: check of netstat
 installed added

---
 io/test/io-cat/single_feed/test | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/io/test/io-cat/single_feed/test b/io/test/io-cat/single_feed/test
index 52799eab8..31cc8fdb8 100755
--- a/io/test/io-cat/single_feed/test
+++ b/io/test/io-cat/single_feed/test
@@ -6,6 +6,8 @@ prefix=io-cat
 declare -A pids
 declare -A files
 
+type -p netstat >/dev/null || { echo "$0: netstat not found; to install run: sudo apt install net-tools"; exit 1; }
+
 function bye
 {
     trap '' INT TERM HUP  # ignore signals

From 6be1bf86bba9350cf37bdb1c9d1248abc2b9445b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sat, 14 Sep 2024 12:59:54 +1000
Subject: [PATCH 0920/1056] python/comma/dictionary/test/test: pytest
 installation check added

---
 io/test/io-cat/single_feed/test   | 2 +-
 python/comma/dictionary/test/test | 1 +
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/io/test/io-cat/single_feed/test b/io/test/io-cat/single_feed/test
index 31cc8fdb8..f08a94b25 100755
--- a/io/test/io-cat/single_feed/test
+++ b/io/test/io-cat/single_feed/test
@@ -6,7 +6,7 @@ prefix=io-cat
 declare -A pids
 declare -A files
 
-type -p netstat >/dev/null || { echo "$0: netstat not found; to install run: sudo apt install net-tools"; exit 1; }
+type -p netstat >/dev/null || { echo "$0: netstat not found; to install run: sudo apt install net-tools" >&2; exit 1; }
 
 function bye
 {
diff --git a/python/comma/dictionary/test/test b/python/comma/dictionary/test/test
index dd2083842..e61bd77fb 100755
--- a/python/comma/dictionary/test/test
+++ b/python/comma/dictionary/test/test
@@ -1,4 +1,5 @@
 #!/bin/bash
 
 name=$( basename $0 )
+type -p pytest >/dev/null || { echo "$0: pytest not found; to install run: sudo apt install python3-pytest" >&2; exit 1; }
 pytest 1>&2 && echo "$name: succeeded" >&2 || { echo "$name: failed" >&2; exit 1; }

From e1b5f3dcc2ef390944aa414b1cb0301ff6a112bd Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 Sep 2024 11:27:38 +1000
Subject: [PATCH 0921/1056] csv-intervals: initialization warnings fixed

---
 csv/applications/csv-intervals.cpp | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/csv/applications/csv-intervals.cpp b/csv/applications/csv-intervals.cpp
index 01e02c6de..0042e47c9 100644
--- a/csv/applications/csv-intervals.cpp
+++ b/csv/applications/csv-intervals.cpp
@@ -270,9 +270,14 @@ struct interval_t
     to_t< To > to;
 };
 
+
+template < typename T > struct scalar_traits { static T zero() { return 0; } };
+template <> struct scalar_traits< boost::posix_time::ptime > { static boost::posix_time::ptime zero() { return boost::posix_time::ptime(); } };
+template <> struct scalar_traits< std::string > { static std::string zero() { return ""; } };
+
 template < typename T > struct scalar_t
 { 
-    T scalar;
+    T scalar{ scalar_traits< T >::zero() };
     scalar_t() {}
     scalar_t( const T& t ): scalar( t ) {}
 };

From e9322d1a7eafc35845f6d9fee04833aefa04332b Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 Sep 2024 12:11:56 +1000
Subject: [PATCH 0922/1056] csv/impl/unstructured, csv-enumerate: compile
 warning fixed

---
 csv/applications/csv-enumerate.cpp | 56 +++++++++++++++---------------
 csv/impl/unstructured.h            |  8 ++---
 2 files changed, 32 insertions(+), 32 deletions(-)

diff --git a/csv/applications/csv-enumerate.cpp b/csv/applications/csv-enumerate.cpp
index 459c40719..10b15b6c7 100644
--- a/csv/applications/csv-enumerate.cpp
+++ b/csv/applications/csv-enumerate.cpp
@@ -29,7 +29,7 @@
 
 /// @author vsevolod vlaskine
 
-#include <boost/unordered_map.hpp>
+#include <unordered_map>
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
@@ -39,26 +39,27 @@
 
 static void usage( bool verbose )
 {
-    std::cerr << std::endl;
-    std::cerr << "append unique id to csv records with the same values; support integer, time, and string fields" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: cat data.csv | csv-enumerate <options>" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "todo: support floating point values as input keys" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --fields,-f=<fields>; fields of interest, actual field names do not matter; e.g: --fields ,,,a,,b,,,c" << std::endl;
-    std::cerr << "    --format=<binary format>; if input is ascii and deducing data types may be ambiguous, define field types explicitly, value as in --binary" << std::endl;
-    std::cerr << "    --output-map,--map: do not output input records, only an unsorted list of keys" << std::endl;
-    std::cerr << "                        output fields" << std::endl;
-    std::cerr << "                            - list of input key values; in same binary as input" << std::endl;
-    std::cerr << "                            - corresponding enumeration index as ui" << std::endl;
-    std::cerr << "                            - number of values for this enumeration index as ui" << std::endl;
-    std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "csv options" << std::endl;
+    std::cerr << R"(
+append unique id to csv records with the same values; support integer, time, and string fields
+
+usage: cat data.csv | csv-enumerate <options>
+
+todo: support floating point values as input keys
+
+options
+    --fields,-f=<fields>; fields of interest, actual field names do not matter
+                          e.g: --fields ,,,a,,b,,,c
+    --format=<binary format>; if input is ascii and deducing data types may be ambiguous,
+                              define field types explicitly, value as in --binary
+    --output-map,--map: do not output input records, only an unsorted list of keys
+                        output fields
+                            - list of input key values; in same binary as input
+                            - corresponding enumeration index as ui
+                            - number of values for this enumeration index as ui
+    --verbose,-v: more output to stderr
+)" << std::endl;
+std::cerr << "csv options" << std::endl;
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
-    std::cerr << std::endl;
     exit( 0 );
 }
 
@@ -81,16 +82,15 @@ template <> struct traits< output >
 int main( int ac, char** av )
 {
     typedef comma::csv::impl::unstructured input_t;
-    typedef boost::unordered_map< comma::csv::impl::unstructured, std::pair< comma::uint32, comma::uint32 >, comma::csv::impl::unstructured::hash >  map_t;
+    typedef std::unordered_map< comma::csv::impl::unstructured, std::pair< comma::uint32, comma::uint32 >, comma::csv::impl::unstructured::hash >  map_t;
     try
     {
         comma::command_line_options options( ac, av, usage );
-        bool verbose = options.exists( "--verbose,-v" );
         bool output_map = options.exists( "--output-map,--map" );
         comma::csv::options csv( options );
         bool has_non_empty_field = false;
         for( const auto& f: comma::split( csv.fields, ',' ) ) { if( !f.empty() ) { has_non_empty_field = true; break; } }
-        if( !has_non_empty_field ) { std::cerr << "csv-enumerate: please specify at least one key in fields" << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( has_non_empty_field, "please specify at least one key in fields" );
         std::string first_line;
         comma::csv::format f;
         if( csv.binary() ) { f = csv.format(); }
@@ -100,7 +100,7 @@ int main( int ac, char** av )
             while( std::cin.good() && first_line.empty() ) { std::getline( std::cin, first_line ); }
             if( first_line.empty() ) { return 0; }
             f = comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter );
-            if( verbose ) { std::cerr << "csv-enumerate: guessed format: " << f.string() << std::endl; }
+            comma::saymore() << "guessed format: " << f.string() << std::endl;
         }
         input_t default_input;
         std::vector< std::string > v = comma::split( csv.fields, ',' );
@@ -114,7 +114,7 @@ int main( int ac, char** av )
             if( csv.binary() ) { s.push_back( format[i] ); }
         }
         std::string map_output_binary_format = comma::join( s, ',' );
-        if( verbose ) { std::cerr << "csv-enumerate: fields " << csv.fields << " interpreted as: " << comma::join( v, ',' ) << std::endl; }
+        comma::saymore() << "fields " << csv.fields << " interpreted as: " << comma::join( v, ',' ) << std::endl;
         csv.fields = comma::join( v, ',' );
         static map_t map;
         comma::uint32 id = 0;
@@ -148,13 +148,13 @@ int main( int ac, char** av )
         if( csv.binary() )
         { 
             output_map_csv.format( map_output_binary_format + ",2ui" ); //output_map_csv.format( comma::csv::format::value< input_t >( default_input ) + ",2ui" );
-            std::cerr << "csv-enumerate: binary output format for map: \"" << output_map_csv.format().string() << "\"" << std::endl;
+            comma::say() << "binary output format for map: '" << output_map_csv.format().string() << "'" << std::endl;
         }
         comma::csv::output_stream< map_t::value_type > omstream( std::cout, output_map_csv, std::make_pair( default_input, std::make_pair( 0, 0 ) ) );
         for( map_t::const_iterator it = map.begin(); it != map.end(); ++it ) { omstream.write( *it ); }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << "csv-enumerate: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-enumerate: unknown exception" << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/impl/unstructured.h b/csv/impl/unstructured.h
index c724d7122..6f4e653e6 100644
--- a/csv/impl/unstructured.h
+++ b/csv/impl/unstructured.h
@@ -27,11 +27,11 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #pragma once
 
+#include <functional>
 #include <string>
 #include <type_traits>
 #include <vector>
@@ -67,9 +67,9 @@ struct unstructured
                 return true;
             }
             
-            struct hash : public std::unary_function< values, std::size_t >
+            struct hash // no base class: std::unary_function< values, std::size_t > was deprecated in c++11 and removed in c++17
             {
-                std::size_t operator()( values const& p ) const
+                std::size_t operator()( const values& p ) const
                 {
                     std::size_t seed = 0;
                     for( std::size_t i = 0; i < p.size(); ++i ) { hash_combine_impl_( seed, p[i] ); }
@@ -212,7 +212,7 @@ struct unstructured
     
     template < typename T > const values< T >& get() const;
         
-    struct hash : public std::unary_function< unstructured, std::size_t >
+    struct hash // no base class: std::unary_function< unstructured, std::size_t > was deprecated in c++11 and removed in c++17
     {
         std::size_t operator()( unstructured const& p ) const
         {

From f0b36c1f34b37a6f328a8b50c2c3f5fcd45b1791 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 Sep 2024 12:16:35 +1000
Subject: [PATCH 0923/1056] csv/impl/unstructured.h: unused include removed

---
 csv/impl/unstructured.h | 11 ++---------
 1 file changed, 2 insertions(+), 9 deletions(-)

diff --git a/csv/impl/unstructured.h b/csv/impl/unstructured.h
index 6f4e653e6..617f77b19 100644
--- a/csv/impl/unstructured.h
+++ b/csv/impl/unstructured.h
@@ -31,7 +31,6 @@
 
 #pragma once
 
-#include <functional>
 #include <string>
 #include <type_traits>
 #include <vector>
@@ -198,15 +197,9 @@ struct unstructured
         return f;
     }
     
-    bool operator==( const unstructured& rhs ) const
-    {
-        return longs == rhs.longs && doubles == rhs.doubles && time == rhs.time && strings == rhs.strings;        
-    }
+    bool operator==( const unstructured& rhs ) const { return longs == rhs.longs && doubles == rhs.doubles && time == rhs.time && strings == rhs.strings; }
     
-    bool operator<( const unstructured& rhs ) const
-    {
-        return doubles < rhs.doubles && time < rhs.time && strings < rhs.strings;        
-    }
+    bool operator<( const unstructured& rhs ) const { return doubles < rhs.doubles && time < rhs.time && strings < rhs.strings; }
     
     template < typename T > values< T >& get();
     

From 34d571331099e8ff6f83fb9e37163b120180eb77 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 Sep 2024 12:33:48 +1000
Subject: [PATCH 0924/1056] bash/test/comma_name_value_to_options: failing test
 fixed

---
 bash/test/comma_name_value_to_options/expected | 14 ++++++++++----
 bash/test/comma_name_value_to_options/test     | 16 +++++++++-------
 2 files changed, 19 insertions(+), 11 deletions(-)

diff --git a/bash/test/comma_name_value_to_options/expected b/bash/test/comma_name_value_to_options/expected
index 28464c9e2..b45350421 100644
--- a/bash/test/comma_name_value_to_options/expected
+++ b/bash/test/comma_name_value_to_options/expected
@@ -6,10 +6,16 @@ basic[4]/text=""
 basic[5]/text=""
 basic[6]/text="----hello_world=1 "
 multi[0]/text="--hello_world=1 --hello=world --hello=world ----hello_world=1 "
-co_to_nv[0]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
-co_to_nv[1]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
-co_to_nv[2]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
-co_to_nv[3]/text="debug=|1|@directory=|\|/tmp\||@verbose=|1|@"
+
+#co_to_nv[0]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
+#co_to_nv[1]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
+#co_to_nv[2]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
+#co_to_nv[3]/text="debug=|1|@directory=|\|/tmp\||@verbose=|1|@"
+co_to_nv[0]/text="debug=__quote__1__quote__&directory=__quote__/tmp__quote__&verbose=__quote__1__quote__&"
+co_to_nv[1]/text="debug=__quote__1__quote__&directory=__quote__/tmp__quote__&verbose=__quote__1__quote__&"
+co_to_nv[2]/text="debug=__quote__1__quote__&directory=__quote__/tmp__quote__&verbose=__quote__1__quote__&"
+co_to_nv[3]/text="debug=__quote__1__quote__&directory=__quote____backslash__quote__/tmp__backslash__quote____quote__&verbose=__quote__1__quote__&"
+
 cnv_to_o[0]/text="--debug=1 --directory=/tmp --verbose=1 "
 cnv_to_o[1]/text="--debug=1 --directory=/tmp --verbose=1 "
 cnv_to_o[2]/text="--debug=1 --directory=/tmp --verbose=1 "
diff --git a/bash/test/comma_name_value_to_options/test b/bash/test/comma_name_value_to_options/test
index e8c1f5369..7e549281c 100755
--- a/bash/test/comma_name_value_to_options/test
+++ b/bash/test/comma_name_value_to_options/test
@@ -58,6 +58,8 @@ echo '--debug; much more debug output
 --verbose,-v; more output'
 }
 
+function escape() { sed -e 's#"#__quote__#g' -e 's#\\#__backslash#g' | tr '\n' '&'; }
+
 echo "basic[0]/text=\"$( comma_name_value_to_options <<< 'hello world' )\""
 echo "basic[1]/text=\"$( comma_name_value_to_options <<< 'hello_world=1' )\""
 echo "basic[2]/text=\"$( comma_name_value_to_options <<< 'hello=world' )\""
@@ -73,14 +75,14 @@ hello="world"
 hello_world
 --hello_world=1' | tr '\n' '@' )\""
 
-echo "co_to_nv[0]/text=\"$( command_description | comma-options-to-name-value --directory "/tmp" --debug --verbose | tr '\n' '@' | tr '"' '|' )\""
-echo "co_to_nv[1]/text=\"$( command_description | comma-options-to-name-value --directory="/tmp" --debug --verbose | tr '\n' '@' | tr '"' '|' )\""
-echo "co_to_nv[2]/text=\"$( command_description | comma-options-to-name-value "--directory=/tmp" --debug --verbose | tr '\n' '@' | tr '"' '|' )\""
-echo "co_to_nv[3]/text=\"$( command_description | comma-options-to-name-value '--directory="/tmp"' --debug --verbose | tr '\n' '@' | tr '"' '|' )\""
+echo "co_to_nv[0]/text=\"$( command_description | comma-options-to-name-value --directory "/tmp"   --debug --verbose | escape )\""
+echo "co_to_nv[1]/text=\"$( command_description | comma-options-to-name-value --directory="/tmp"   --debug --verbose | escape )\""
+echo "co_to_nv[2]/text=\"$( command_description | comma-options-to-name-value "--directory=/tmp"   --debug --verbose | escape )\""
+echo "co_to_nv[3]/text=\"$( command_description | comma-options-to-name-value '--directory="/tmp"' --debug --verbose | escape )\""
 
-echo "cnv_to_o[0]/text=\"$( command_description | comma-options-to-name-value --directory "/tmp" --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
-echo "cnv_to_o[1]/text=\"$( command_description | comma-options-to-name-value --directory="/tmp" --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
-echo "cnv_to_o[2]/text=\"$( command_description | comma-options-to-name-value "--directory=/tmp" --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
+echo "cnv_to_o[0]/text=\"$( command_description | comma-options-to-name-value --directory "/tmp"   --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
+echo "cnv_to_o[1]/text=\"$( command_description | comma-options-to-name-value --directory="/tmp"   --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
+echo "cnv_to_o[2]/text=\"$( command_description | comma-options-to-name-value "--directory=/tmp"   --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
 
 comma_name_value_to_options <<< 'directory=/tmp
 verbose="1"

From 48f5e72843e3ccd62cd929e41e25571383242b55 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 Sep 2024 12:51:24 +1000
Subject: [PATCH 0925/1056] io/test/io-tee/simple: backslash escaped in output
 and expected

---
 io/test/io-tee/simple/expected | 2 +-
 io/test/io-tee/simple/test     | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/io/test/io-tee/simple/expected b/io/test/io-tee/simple/expected
index 36ad9793b..6e9d6d841 100644
--- a/io/test/io-tee/simple/expected
+++ b/io/test/io-tee/simple/expected
@@ -14,5 +14,5 @@ pipeline/stdout/matches="true"
 
 basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
 unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
-pipeline/command="bash -c (SQUOTE)grep (SQUOTE)\(SQUOTE)(SQUOTE)^t(SQUOTE)\(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+pipeline/command="bash -c (SQUOTE)grep (SQUOTE)(BSLASH)(SQUOTE)(SQUOTE)^t(SQUOTE)(BSLASH)(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
 
diff --git a/io/test/io-tee/simple/test b/io/test/io-tee/simple/test
index 21d6e0513..2b1cadefe 100755
--- a/io/test/io-tee/simple/test
+++ b/io/test/io-tee/simple/test
@@ -41,7 +41,7 @@ function run_test()
     local -r expected_file="$test_name.expected"
     if [[ -z "$expected" ]]; then > $expected_file; else echo -e "$expected" > $expected_file; fi
     echo "test: $test_name: command is: $@" >&2
-    echo "$test_name/command=\"$( io-tee --dry $options out -- "$@" | sed 's/"/(DQUOTE)/g'"; s/'/(SQUOTE)/g" )\""
+    echo "$test_name/command=\"$( io-tee --dry $options out -- "$@" | sed -e 's/"/(DQUOTE)/g' -e "s/'/(SQUOTE)/g" -e 's/\\/(BSLASH)/g' )\""
     cat $input | io-tee $options $tee_file $dashdash "$@" > $stdout_file
     if [[ $? != 0 ]]; then
         echo "test: io-tee call failed" >&2

From 9243d874187c5cd1eaa673d02bdb4627145ba5a6 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 16 Sep 2024 12:56:00 +1000
Subject: [PATCH 0926/1056] io/test/io-tee/comma_tee_function: backslash
 escaped in output and expected

---
 io/test/io-tee/comma_tee_function/expected | 2 +-
 io/test/io-tee/comma_tee_function/test     | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/io/test/io-tee/comma_tee_function/expected b/io/test/io-tee/comma_tee_function/expected
index 79d21019b..59c671aae 100644
--- a/io/test/io-tee/comma_tee_function/expected
+++ b/io/test/io-tee/comma_tee_function/expected
@@ -24,5 +24,5 @@ basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(D
 function_call_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
 unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
 unbuffered_fn_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
-pipeline/command="bash -c (SQUOTE)grep (SQUOTE)\(SQUOTE)(SQUOTE)^t(SQUOTE)\(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+pipeline/command="bash -c (SQUOTE)grep (SQUOTE)(BSLASH)(SQUOTE)(SQUOTE)^t(SQUOTE)(BSLASH)(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
 
diff --git a/io/test/io-tee/comma_tee_function/test b/io/test/io-tee/comma_tee_function/test
index 510f80da4..954ac65c1 100755
--- a/io/test/io-tee/comma_tee_function/test
+++ b/io/test/io-tee/comma_tee_function/test
@@ -41,7 +41,7 @@ function run_test()
     local -r expected_file="$test_name.expected"
     if [[ -z "$expected" ]]; then > $expected_file; else echo -e "$expected" > $expected_file; fi
     echo "test: $test_name: command is: $@" >&2
-    echo "$test_name/command=\"$( io-tee --dry $options out -- "$@" | sed 's/"/(DQUOTE)/g'"; s/'/(SQUOTE)/g" )\""
+    echo "$test_name/command=\"$( io-tee --dry $options out -- "$@" | sed -e 's/"/(DQUOTE)/g' -e "s/'/(SQUOTE)/g" -e 's/\\/(BSLASH)/g' )\""
     cat $input | comma_tee_function $options $tee_file $dashdash "$@" > $stdout_file
     if [[ $? != 0 ]]; then
         echo "test: io-tee call failed" >&2

From 31b3c139773dbaa87d856bb0beda7fe45c8b4f3f Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 17 Sep 2024 11:19:56 +1000
Subject: [PATCH 0927/1056] python/CMakeLists.txt: change setup.py generated
 directories to be owned by user

---
 python/CMakeLists.txt | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/python/CMakeLists.txt b/python/CMakeLists.txt
index 94d059f5d..9dc0f284c 100644
--- a/python/CMakeLists.txt
+++ b/python/CMakeLists.txt
@@ -85,6 +85,14 @@ INSTALL( CODE "EXECUTE_PROCESS(
                     COMMAND ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE} install ${INSTALL_PREFIX_OPTION} --force
                     WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
 
+# setup.py creates a couple of working directories in the current directory: comma_py.egg-info and dist
+# Because it's run in the install stage, and therefore typically as root, these
+# directories are owned by root, which is a bit annoying as they are in the
+# source tree. So set them to being owned by the user.
+INSTALL( CODE "EXECUTE_PROCESS(
+                    COMMAND chown -R $ENV{USER} comma_py.egg-info dist
+                    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
+
 #install( CODE "EXECUTE_PROCESS(
 #                    COMMAND ${PYTHON} -m pip install ${CMAKE_CURRENT_SOURCE_DIR} --ignore-installed
 #                    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )

From 3c78011a2f1cc9369fbc9881af9ef9980e9d6a62 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 17 Sep 2024 13:47:22 +1000
Subject: [PATCH 0928/1056] packed: constexpr used for size instead of enum

---
 packed/field.h  | 2 +-
 packed/struct.h | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/packed/field.h b/packed/field.h
index 4d703e630..ac888832d 100644
--- a/packed/field.h
+++ b/packed/field.h
@@ -15,7 +15,7 @@ template < typename Derived, typename T, size_t S >
 class field
 {
     public:
-        enum { size = S };
+        static constexpr unsigned int size = S;
 
         static_assert( size > 0, "expected positive size" );
 
diff --git a/packed/struct.h b/packed/struct.h
index 3ac27ecc7..4fe5718be 100644
--- a/packed/struct.h
+++ b/packed/struct.h
@@ -14,7 +14,7 @@ namespace comma { namespace packed {
 template < class Derived, size_t S >
 struct packed_struct
 {
-    enum { size = S };
+    static constexpr unsigned int size = S;
 
     packed_struct() throw() { static_assert( sizeof( Derived ) == size, "expected derived of provided size" ); }
 

From 63ee7a3e0b03b7b8697c95d53b9abf78fb94429f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 17 Sep 2024 22:09:31 +1000
Subject: [PATCH 0929/1056] csv-sort: using std::shuffle() instead of
 std::random_shuffle()

---
 csv/applications/csv-sort.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index b4157c346..727f29de5 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -563,7 +563,7 @@ static int random( const comma::command_line_options& options )
             if( !p || block != *p )
             {
                 std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
-                std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( generator ); } ); // quick and dirty, watch performance
+                std::shuffle( records.begin(), records.end(), generator ); // std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( generator ); } ); // quick and dirty, watch performance
                 for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
                 if( csv.flush ) { std::cout.flush(); }
                 records.clear();
@@ -609,7 +609,7 @@ static int random( const comma::command_line_options& options )
             }
         }
         std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
-        std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( generator ); } ); // quick and dirty, watch performance
+        std::shuffle( records.begin(), records.end(), generator ); // std::random_shuffle( records.begin(), records.end(), [&]( int ) -> int { return distribution( generator ); } ); // quick and dirty, watch performance
         for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
     }
     return 0;

From 8355a6c3a1de3e5b3366be3e5bd0b862eee72c8d Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 26 Sep 2024 17:16:04 +1000
Subject: [PATCH 0930/1056] csv-shuffle: --help brushed up

---
 csv/applications/csv-shuffle.cpp | 69 ++++++++++++++++----------------
 1 file changed, 35 insertions(+), 34 deletions(-)

diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index aaf9d0d77..5589ab800 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -17,33 +17,34 @@
 
 static void usage( bool verbose )
 {
-    std::cerr << "perform operations on csv columns" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: cat data.csv | csv-shuffle <options> > shuffled.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
-    std::cerr << "    --drop-empty,-e; e.g. csv-shuffle --fields a,b,,,c --drop-empty is equivalent to" << std::endl;
-    std::cerr << "                          csv-shuffle --fields a,b,,,c --output-fields a,b,c" << std::endl;
-    std::cerr << "    --fields,-f,--input-fields=<fields>; input fields" << std::endl;
-    std::cerr << "    --output-fields,--output,-o=<fields>; output fields, if not specified, will be set" << std::endl;
-    std::cerr << "                                          to --input-fields, which would chop off trailing input fields" << std::endl;
-    std::cerr << "                                          see also --drop-empty" << std::endl;
-    std::cerr << "    --verbose,-v: more output" << std::endl;
-    if( verbose ) { std::cerr << std::endl << comma::csv::options::usage() << std::endl; }
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << "    operations (for now): append, remove, swap" << std::endl;
-    std::cerr << "    semantics:" << std::endl;
-    std::cerr << "        remove:" << std::endl;
-    std::cerr << "            echo 0,1,2 | csv-shuffle --fields=x,y,z" << std::endl;
-    std::cerr << "        append:" << std::endl;
-    std::cerr << "            echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=x,y,z,x" << std::endl;
-    std::cerr << "        swap:" << std::endl;
-    std::cerr << "            echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=y,z,x" << std::endl;
-    std::cerr << "        remove x, swap y,z, append z two times:" << std::endl;
-    std::cerr << "            echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=z,y,z,z" << std::endl;
-    std::cerr << std::endl;
+    std::cerr << R"(
+swap, remove, or duplicate csv fields
+
+usage: cat data.csv | csv-shuffle <options> > shuffled.csv
+
+options
+    --drop-empty,-e; e.g. two following commands are equivalent
+                     csv-shuffle --fields a,b,,,c --drop-empty
+                     csv-shuffle --fields a,b,,,c --output-fields a,b,c
+    --fields,-f,--input-fields=<fields>; input fields
+    --output-fields,--output,-o=<fields>; output fields, if not specified,
+                                          will be set to --input-fields,
+                                          which would chop off trailing
+                                          input fields see also --drop-empty
+    --verbose,-v: more verbose output
+)" << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+std::cerr << R"(examples
+    remove
+        echo 0,1,2 | csv-shuffle --fields=x,y,z
+    append
+        echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=x,y,z,x
+    swap
+        echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=y,z,x
+    remove x, swap y,z, append z two times
+        echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=z,y,z,z
+)" << std::endl;
     exit( 0 );
 }
 
@@ -61,11 +62,11 @@ int main( int ac, char** av )
             for( auto s: output_fields ) { if( !s.empty() ) { v.push_back( s ); } }
             output_fields = v;
         }
-        if( output_fields.empty() ) { std::cerr << "csv-shuffle: please specify --output-fields or --drop-empty" << std::endl; return 1; }
-        if( output_fields.back() == "..." ) { std::cerr << "csv-shuffle: support for trailing fields has been removed for now; please specify input/output fields explicitly" << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( !output_fields.empty(), "please specify --output-fields or --drop-empty" );
+        COMMA_ASSERT_BRIEF( output_fields.back() != "...", "support for trailing fields has been removed for now; please specify input/output fields explicitly" );
         auto find_ = [&]( const std::string& n )->unsigned int
         {
-            if( n.empty() ) { COMMA_THROW( comma::exception, "got empty fields in output fields '" << comma::join( output_fields, ',' ) << "'; you may need to use --drop-empty" ); }
+            COMMA_ASSERT_BRIEF( !n.empty(), "got empty fields in output fields '" << comma::join( output_fields, ',' ) << "'; you may need to use --drop-empty" );
             unsigned int j = 0;
             for( ; j < input_fields.size(); ++j ) { if( input_fields[j] == n ) { return j; } }
             COMMA_THROW( comma::exception, "output field '" << n << "' not found in input fields '" << csv.fields << "'" );
@@ -89,7 +90,7 @@ int main( int ac, char** av )
             {
                 std::cin.read( &buf[0], csv.format().size() );
                 if( std::cin.gcount() == 0 ) { continue; }
-                if( std::cin.gcount() < int( csv.format().size() ) ) { std::cerr << "csv-shuffle: expected " << csv.format().size() << " bytes, got only " << std::cin.gcount() << std::endl; return 1; }
+                COMMA_ASSERT_BRIEF( std::cin.gcount() >= int( csv.format().size() ), "expected " << csv.format().size() << " bytes, got only " << std::cin.gcount() );
                 for( const auto& offset: offsets ) { std::cout.write( &buf[ offset.first ], offset.second ); }
                 if( csv.flush ) { std::cout.flush(); }
             }
@@ -104,14 +105,14 @@ int main( int ac, char** av )
             if( !line.empty() && *line.rbegin() == '\r' ) { line = line.substr( 0, line.length() - 1 ); } // windows... sigh...
             if( line.empty() ) { continue; }
             const auto& v = comma::split( line, csv.delimiter );
-            if( v.size() < input_fields.size() ) { std::cerr << "csv-shuffle: expected at least " << input_fields.size() << " fields, got only " << v.size() << " in record \"" << line << "\"" << std::endl; return 1; }
+            COMMA_ASSERT_BRIEF( v.size() >= input_fields.size(), "expected at least " << input_fields.size() << " fields, got only " << v.size() << " in record \"" << line << "\"" );
             std::string delimiter;
             for( auto index: indices ) { std::cout << delimiter << v[index]; delimiter = csv.delimiter; }
             std::cout << std::endl;
         }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << "csv-shuffle: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-shuffle: unknown exception" << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }

From a1c8577e920ab999521bf22074ccfeeef680beed Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 27 Sep 2024 13:44:23 +1000
Subject: [PATCH 0931/1056] io-cat: --help brushed up

---
 io/applications/io-cat.cpp | 200 ++++++++++++++++++-------------------
 1 file changed, 100 insertions(+), 100 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index f12534c88..b9356ae14 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -49,99 +50,98 @@
 
 void usage( bool verbose = false )
 {
-    std::cerr << std::endl;
-    std::cerr << "read from one or a few sources, merge, and output to stdout" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: io-cat <address> [<address>] ... [<options>]" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<address>" << std::endl;
-    std::cerr << "    local:<path>: local socket" << std::endl;
-    std::cerr << "    tcp:<host>:<port>: tcp socket" << std::endl;
-    std::cerr << "    udp:<port>: udp socket" << std::endl;
-    std::cerr << "    zmp-<protocol>:<address>: zmq (todo)" << std::endl;
-    std::cerr << "    <filename>: file" << std::endl;
-    std::cerr << "    <fifo>: named pipe" << std::endl;
-    std::cerr << "    -: stdin" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --exit-on-first-closed,-e: exit, if one of the streams finishes" << std::endl;
-    std::cerr << "    --flush,--unbuffered,-u: flush output" << std::endl;
-    std::cerr << "    --verbose,-v: more output" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "output order options" << std::endl;
-    std::cerr << "    --blocking: blocking read on each source in order sources appear on command line" << std::endl;
-    std::cerr << "                output modes" << std::endl;
-    std::cerr << "                    default:     output all records from the first source, then all" << std::endl;
-    std::cerr << "                                 records from the seconds source, etc" << std::endl;
-    std::cerr << "                    round robin: output <n> records from the first source, then <n>" << std::endl;
-    std::cerr << "                                 records from the seconds source, etc; note that if" << std::endl;
-    std::cerr << "                                 the number of records in a source is not divisible by <n>" << std::endl;
-    std::cerr << "                                 then the last records groups may contain fewer than <n>" << std::endl;
-    std::cerr << "                                 records" << std::endl;
-    std::cerr << "                attention: if you want full control over record ordering, use --blocking" << std::endl;
-    std::cerr << "                           when using subshells or sockets as io-cat inputs " << std::endl;
+    std::cerr << R"(
+read from one or a few sources, merge, and output to stdout
+
+usage: io-cat <address> [<address>] ... [<options>]
+
+<address>
+    local:<path>: local socket
+    tcp:<host>:<port>: tcp socket
+    udp:<port>: udp socket
+    zmq-<protocol>:<address>: zmq (todo)
+    <filename>: file
+    <fifo>: named pipe
+    -: stdin
+
+options
+    --exit-on-first-closed,-e: exit, if one of the streams finishes
+    --flush,--unbuffered,-u: flush output
+    --verbose,-v: more output
+
+output order options
+    --blocking: blocking read on each source in order sources appear on command line
+                output modes
+                    default:     output all records from the first source, then all
+                                 records from the second source, etc
+                    round robin: output <n> records from the first source, then <n>
+                                 records from the second source, etc; note that if
+                                 the number of records in a source is not divisible by <n>
+                                 then the last records groups may contain fewer than <n>
+                                 records
+                attention: if you want full control over record ordering, use --blocking
+                           when using subshells or sockets as io-cat inputs)" << std::endl;
     if( verbose )
     {
-        std::cerr << "                           io-cat will open such inputs, but they may not be immediately" << std::endl;
-        std::cerr << "                           ready for reading, which may lead to records being read from sources" << std::endl;
-        std::cerr << "                           out of order;  use --blocking to avoid this problem" << std::endl;
-        std::cerr << "                           e.g. in the following command without --blocking one subshell may" << std::endl;
-        std::cerr << "                           start slightly earlier than the other and thus likely to output" << std::endl;
-        std::cerr << "                           not what you expect or want - add --blocking to fix that:" << std::endl;
-        std::cerr << "                               io-cat --round-robin=1 \\" << std::endl;
-        std::cerr << "                                      <( csv-paste line-number value=a | head -n100 ) \\" << std::endl;
-        std::cerr << "                                      <( csv-paste line-number value=b | head -n100 )" << std::endl;
+        std::cerr << R"(                           io-cat will open such inputs, but they may not be immediately
+                           ready for reading, which may lead to records being read from sources
+                           out of order;  use --blocking to avoid this problem
+                           e.g. in the following command without --blocking one subshell may
+                           start slightly earlier than the other and thus likely to output
+                           not what you expect or want - add --blocking to fix that:
+                               io-cat --round-robin=1 \
+                                      <( csv-paste line-number value=a | head -n100 ) \
+                                      <( csv-paste line-number value=b | head -n100 ))" << std::endl; // raw string: backslashes are literal, hence a single '\' per shell line continuation
     }
     else
     {
-        std::cerr << "                           run io-cat --help --verbose for more details" << std::endl;
+        std::cerr << "                           run io-cat --help --verbose for more details..." << std::endl;
     }
-    std::cerr << "    --head=[<n>]; output first <n> records and exit without waiting for record n+1" << std::endl;
-    std::cerr << "                  a workaround for sparse input fed into: io-cat ... | head -n10, which" << std::endl;
-    std::cerr << "                  not exit until io-cat receives record 11" << std::endl;
-    std::cerr << "                  instead run: io-cat ... --head=10 (use --flush if you don't want buffering" << std::endl;
-    std::cerr << "    --repeat=[<n>]; read each stream, output <n> times" << std::endl;
-    std::cerr << "                  e.g: run: io-cat my-file-1 my-file-2 --repeat=3" << std::endl;
-    std::cerr << "                       instead of: cat my-file-1 my-file-2 my-file-1 my-file-2 my-file-1 my-file-2" << std::endl;
-    std::cerr << "                  when using for large source, be aware that the sources get stored in memory first" << std::endl;
-    std::cerr << "    --repeat-forever,--forever; same as --repeat, but forever" << std::endl;
-    std::cerr << "    --round-robin=[<number of packets>]: only for multiple inputs: read not more" << std::endl;
-    std::cerr << "                                         than <number of packets> from an input at once," << std::endl;
-    std::cerr << "                                         before checking other inputs" << std::endl;
-    std::cerr << "                                         if not specified, read from each input" << std::endl;
-    std::cerr << "                                         all available data" << std::endl;
-    std::cerr << "                                         ignored for udp streams, where one full udp" << std::endl;
-    std::cerr << "                                         packet at a time is always read" << std::endl;
-    std::cerr << "    --size=[<bytes>]; on fixed-width binary records, size of the record in bytes, for --round-robin or --head" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "connect options" << std::endl;
-    std::cerr << "    --connect-max-attempts,--connect-attempts,--attempts,--max-attempts=<n>; default=1; number of attempts to reconnect or 'unlimited'" << std::endl;
-    std::cerr << "    --connect-period=<seconds>; default=1; how long to wait before the next connect attempt" << std::endl;
-    std::cerr << "    --permissive; run even if connection to some sources fails" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "supported address types: tcp, udp, local (unix) sockets, named pipes, files, zmq (todo)" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    single stream" << std::endl;
-    std::cerr << "        io-cat tcp:localhost:12345" << std::endl;
-    std::cerr << "        io-cat udp:12345" << std::endl;
-    std::cerr << "        io-cat local:/tmp/socket" << std::endl;
-    std::cerr << "        io-cat some/pipe" << std::endl;
-    std::cerr << "        io-cat some/file" << std::endl;
-    std::cerr << "        io-cat zmq-local:/tmp/socket (not implemented)" << std::endl;
-    std::cerr << "        io-cat zmq-tcp:localhost:12345 (not implemented)" << std::endl;
-    std::cerr << "        echo hello | io-cat -" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    multiple streams" << std::endl;
-    std::cerr << "        merge line-based input" << std::endl;
-    std::cerr << "            io-cat tcp:localhost:55555 tcp:localhost:88888" << std::endl;
-    std::cerr << "        merge binary input with packet size 100 bytes" << std::endl;
-    std::cerr << "            io-cat tcp:localhost:55555 tcp:localhost:88888 --size 100" << std::endl;
-    std::cerr << "        merge line-based input with stdin" << std::endl;
-    std::cerr << "            echo hello | io-cat tcp:localhost:55555 -" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << std::endl;
+    std::cerr << R"(    --head=[<n>]; output first <n> records and exit without waiting for record n+1
+                  a workaround for sparse input fed into: io-cat ... | head -n10, which
+                  not exit until io-cat receives record 11
+                  instead run: io-cat ... --head=10 (use --flush if you don't want buffering
+    --repeat=[<n>]; read each stream, output <n> times
+                  e.g: run: io-cat my-file-1 my-file-2 --repeat=3
+                       instead of: cat my-file-1 my-file-2 my-file-1 my-file-2 my-file-1 my-file-2
+                  when using for large source, be aware that the sources get stored in memory first
+    --repeat-forever,--forever; same as --repeat, but forever
+    --round-robin=[<number of packets>]: only for multiple inputs: read not more
+                                         than <number of packets> from an input at once,
+                                         before checking other inputs
+                                         if not specified, read from each input
+                                         all available data
+                                         ignored for udp streams, where one full udp
+                                         packet at a time is always read
+    --size=[<bytes>]; on fixed-width binary records, size of the record in bytes, for --round-robin or --head
+    
+connect options
+    --connect-max-attempts,--connect-attempts,--attempts,--max-attempts=<n>; default=1; number of attempts to reconnect or 'unlimited'
+    --connect-period=<seconds>; default=1; how long to wait before the next connect attempt
+    --permissive; run even if connection to some sources fails
+    
+supported address types: tcp, udp, local (unix) sockets, named pipes, files, zmq (todo)
+    
+examples
+    
+    single stream
+        io-cat tcp:localhost:12345
+        io-cat udp:12345
+        io-cat local:/tmp/socket
+        io-cat some/pipe
+        io-cat some/file
+        io-cat zmq-local:/tmp/socket (not implemented)
+        io-cat zmq-tcp:localhost:12345 (not implemented)
+        echo hello | io-cat -
+    
+    multiple streams
+        merge line-based input
+            io-cat tcp:localhost:55555 tcp:localhost:88888
+        merge binary input with packet size 100 bytes
+            io-cat tcp:localhost:55555 tcp:localhost:88888 --size 100
+        merge line-based input with stdin
+            echo hello | io-cat tcp:localhost:55555 -
+)" << std::endl;
     exit( 0 );
 }
 
@@ -288,7 +288,7 @@ static stream* make_stream( const std::string& address, unsigned int size, bool
 {
     const std::vector< std::string >& v = comma::split( address, ':' );
     if( v[0] == "udp" ) { return new udp_stream( address ); }
-    if( v[0] == "zmq-local" || v[0] == "zero-local" || v[0] == "zmq-tcp" || v[0] == "zero-tcp" ) { COMMA_THROW( comma::exception, "io-cat: zmq support not implemented" ); }
+    COMMA_ASSERT_BRIEF( v[0] != "zmq-local" && v[0] != "zero-local" && v[0] != "zmq-tcp" && v[0] != "zero-tcp", "zmq support not implemented" );
     return new any_stream( address, size, binary );
 }
 
@@ -330,22 +330,22 @@ static bool try_connect( boost::ptr_vector< stream >& streams, comma::io::select
         if( streams[i].connected() ) { continue; }
         try
         {
-            if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): connecting, attempt " << ( attempts + 1 ) << " of " << ( connect_max_attempts == 0 ? std::string( "unlimited" ) : boost::lexical_cast< std::string >( connect_max_attempts ) ) << "..." << std::endl; }
+            comma::saymore() << "stream " << i << " (" << streams[i].address() << "): connecting, attempt " << ( attempts + 1 ) << " of " << ( connect_max_attempts == 0 ? std::string( "unlimited" ) : boost::lexical_cast< std::string >( connect_max_attempts ) ) << "..." << std::endl;
             streams[i].connect();
-            if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): connected" << std::endl; }
+            comma::saymore() << "stream " << i << " (" << streams[i].address() << "): connected" << std::endl;
             select.read().add( streams[i] );
             --unconnected_count;
             continue;
         }
         catch( std::exception& ex ) { what = ex.what(); }
         catch( ... ) { what = "unknown exception"; }
-        if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): failed to connect" << std::endl; }
+        comma::saymore() << "stream " << i << " (" << streams[i].address() << "): failed to connect" << std::endl;
     }
     ++attempts;
     connected_all_we_could = unconnected_count == 0 || ( permissive && connect_max_attempts > 0 && attempts >= connect_max_attempts );
     if( connected_all_we_could ) { return connected_all_we_could; }
     if( connect_max_attempts == 0 || attempts < connect_max_attempts ) { return connected_all_we_could; }
-    std::cerr << "io-cat: fatal: after " << attempts << " attempt(s): " << what << std::endl;
+    comma::say() << "fatal: after " << attempts << " attempt(s): " << what << std::endl;
     exit( 1 );
 }
 
@@ -354,6 +354,7 @@ struct output_t
     unsigned int size{0};
     bool forever{false};
     std::vector< std::vector< char > > buffers; // todo: quick and dirty, watch performance on push back of large inputs
+
     operator bool() const { return !buffers.empty(); }
 
     output_t() = default;
@@ -409,10 +410,9 @@ static bool _write( unsigned int i, const comma::command_line_options& options,
 int main( int argc, char** argv )
 {
     #ifdef WIN32
-    std::cerr << "io-cat: not implemented on windows" << std::endl;
+    comma::say() << "not implemented on windows" << std::endl;
     return 1;
     #endif
-    
     try
     {
         if( argc < 2 ) { usage(); }
@@ -436,7 +436,7 @@ int main( int argc, char** argv )
         if( size || ( unnamed.size() == 1 && !has_head ) ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         //if( size ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
-        if( unnamed.empty() ) { std::cerr << "io-cat: please specify at least one source" << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( !unnamed.empty(), "please specify at least one source" );
         output = output_t( options, unnamed.size() );
         boost::ptr_vector< stream > streams;
         comma::io::select select;
@@ -447,7 +447,7 @@ int main( int argc, char** argv )
         unsigned int round_robin_count = unnamed.size() > 1 ? options.value( "--round-robin", 0 ) : 0;
         for( bool done = false; !done; )
         {
-            if( is_shutdown ) { if( verbose ) { std::cerr << "io-cat: received signal" << std::endl; }; break; }
+            if( is_shutdown ) { comma::saymore() << "received signal" << std::endl; break; }
             bool connected_all_we_could = try_connect( streams, select );
             if( !ready( streams, select, connected_all_we_could, blocking ) ) { continue; }
             done = true;
@@ -459,7 +459,7 @@ int main( int argc, char** argv )
                 bool empty = streams[i].empty();
                 if( empty && ( ready || streams[i].eof() ) )
                 { 
-                    if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << unnamed[i] << "): closed" << std::endl; }
+                    comma::saymore() << "stream " << i << " (" << unnamed[i] << "): closed" << std::endl;
                     select.read().remove( streams[i].fd() );
                     streams[i].close();
                     if( exit_on_first_closed || ( connected_all_we_could && select.read()().empty() ) ) { done = true; break; }
@@ -472,7 +472,7 @@ int main( int argc, char** argv )
                     unsigned int bytes_read = streams[i].read_available( buffer, countdown ? countdown : max_count, blocking );
                     if( bytes_read == 0 ) { break; }
                     done = false;
-                    if( size && bytes_read % size != 0 ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): expected " << size << " byte(s), got only " << ( bytes_read % size ) << std::endl; return 1; }
+                    COMMA_ASSERT_BRIEF( !( size && bytes_read % size != 0 ), "stream " << i << " (" << streams[i].address() << "): expected " << size << " byte(s), got only " << ( bytes_read % size ) );
                     if( !_write( i, options, buffer, bytes_read ) ) { done = true; break; }
                     if( !std::cout.good() ) { done = true; break; }
                     if( unbuffered ) { std::cout.flush(); }
@@ -487,7 +487,7 @@ int main( int argc, char** argv )
         output.finalise( is_shutdown );
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << "io-cat: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "io-cat: unknown exception" << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }

From 73ea6c7b9a486c75b69c7b2eb4a91a92836b0f84 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 27 Sep 2024 14:00:34 +1000
Subject: [PATCH 0932/1056] io::server class added

---
 io/applications/io-cat.cpp            |  6 +--
 io/impl/{publisher.cpp => server.cpp} | 16 +++---
 io/impl/server.h                      | 78 +++++++++++++++++++++++++++
 io/publisher.cpp                      | 48 +----------------
 io/publisher.h                        | 60 ++-------------------
 io/server.cpp                         | 53 ++++++++++++++++++
 io/server.h                           | 68 +++++++++++++++++++++++
 7 files changed, 214 insertions(+), 115 deletions(-)
 rename io/impl/{publisher.cpp => server.cpp} (91%)
 create mode 100644 io/impl/server.h
 create mode 100644 io/server.cpp
 create mode 100644 io/server.h

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index b9356ae14..f74631af7 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -215,10 +215,10 @@ class udp_stream : public stream
         mutable boost::scoped_ptr< boost::asio::ip::udp::socket > socket_; // boost::asio::ip::udp::socket::fd() is non-const for some reason
 };
 
-class any_stream : public stream
+class client_stream : public stream
 {
     public:
-        any_stream( const std::string& address, unsigned int size, bool binary ): stream( address ), size_( size ), binary_( binary ), closed_( false ) {}
+        client_stream( const std::string& address, unsigned int size, bool binary ): stream( address ), size_( size ), binary_( binary ), closed_( false ) {}
         
         comma::io::file_descriptor fd() const { return ( *istream_ ).fd(); }
         
@@ -289,7 +289,7 @@ static stream* make_stream( const std::string& address, unsigned int size, bool
     const std::vector< std::string >& v = comma::split( address, ':' );
     if( v[0] == "udp" ) { return new udp_stream( address ); }
     COMMA_ASSERT_BRIEF( v[0] != "zmq-local" && v[0] != "zero-local" && v[0] != "zmq-tcp" && v[0] != "zero-tcp", "zmq support not implemented" );
-    return new any_stream( address, size, binary );
+    return new client_stream( address, size, binary );
 }
 
 static bool verbose;
diff --git a/io/impl/publisher.cpp b/io/impl/server.cpp
similarity index 91%
rename from io/impl/publisher.cpp
rename to io/impl/server.cpp
index 66d14d531..e7400166e 100644
--- a/io/impl/publisher.cpp
+++ b/io/impl/server.cpp
@@ -17,7 +17,7 @@
 #include "../../base/exception.h"
 #include "../../io/file_descriptor.h"
 #include "../../string/string.h"
-#include "publisher.h"
+#include "server.h"
 
 namespace comma { namespace io { namespace impl {
 
@@ -181,7 +181,7 @@ class zero_acceptor_ : public acceptor
         bool accepted_;
 };
 
-publisher::publisher( const std::string& name, io::mode::value mode, bool blocking, bool flush )
+server::server( const std::string& name, io::mode::value mode, bool blocking, bool flush )
     : blocking_( blocking ),
       flush_( flush )
 {
@@ -228,7 +228,7 @@ publisher::publisher( const std::string& name, io::mode::value mode, bool blocki
     }
 }
 
-unsigned int publisher::write( const char* buf, std::size_t size, bool do_accept )
+unsigned int server::write( const char* buf, std::size_t size, bool do_accept )
 {
     if( do_accept ) { accept(); }
     if( !blocking_ ) { select_.check(); } // todo: if slow, put all the files in one select
@@ -245,15 +245,15 @@ unsigned int publisher::write( const char* buf, std::size_t size, bool do_accept
     return count;
 }
 
-void publisher::close()
+void server::close()
 {
     if( acceptor_ ) { acceptor_->close(); }
     disconnect_all();
 }
 
-void publisher::disconnect_all() { while( streams_.begin() != streams_.end() ) { remove_( streams_.begin() ); } }
+void server::disconnect_all() { while( streams_.begin() != streams_.end() ) { remove_( streams_.begin() ); } }
 
-std::vector< io::ostream* > publisher::accept()
+std::vector< io::ostream* > server::accept()
 {
     std::vector< io::ostream* > streams;
     if( !acceptor_ ) { return streams; }
@@ -267,7 +267,7 @@ std::vector< io::ostream* > publisher::accept()
     }
 }
 
-void publisher::remove_( streams::iterator it )
+void server::remove_( streams::iterator it )
 {
     select_.write().remove( **it );
     ( *it )->close();
@@ -275,6 +275,6 @@ void publisher::remove_( streams::iterator it )
     streams_.erase( it );
 }
 
-std::size_t publisher::size() const { return streams_.size(); }
+std::size_t server::size() const { return streams_.size(); }
 
 } } } // namespace comma { namespace io { namespace impl {
diff --git a/io/impl/server.h b/io/impl/server.h
new file mode 100644
index 000000000..929aa8d70
--- /dev/null
+++ b/io/impl/server.h
@@ -0,0 +1,78 @@
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+
+/// @author cedric wohlleber
+
+#pragma once
+
+#include <set>
+#include <boost/scoped_ptr.hpp>
+#include <boost/shared_ptr.hpp>
+#include "../file_descriptor.h"
+#include "../select.h"
+#include "../stream.h"
+
+namespace comma { namespace io {
+    
+class server;
+
+} } // namespace comma { namespace io {
+
+namespace comma { namespace io { namespace impl {
+
+struct acceptor
+{
+    virtual ~acceptor() {}
+    virtual io::file_descriptor fd() const = 0;
+    virtual io::ostream* accept( boost::posix_time::time_duration timeout = boost::posix_time::seconds( 0 ) ) = 0;
+    virtual void notify_closed() {} // quick and dirty
+    virtual void close() {}
+};
+    
+class server
+{
+    public:
+        server( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
+
+        unsigned int write( const char* buf, std::size_t size, bool do_accept = true );
+
+        template < typename T >
+        impl::server& operator<<( const T& lhs ) // quick and dirty, inefficient, but then ascii is meant to be slow...
+        {
+            accept();
+            select_.check();
+            unsigned int count = 0;
+            for( streams::iterator i = streams_.begin(); i != streams_.end(); )
+            {
+                streams::iterator it = i++;
+                if( !blocking_ && !select_.write().ready( **it ) ) { continue; }
+                ( ***it ) << lhs;
+                if( flush_ ) { ( **it )->flush(); }
+                if( ( **it )->good() ) { ++count; }
+                else { remove_( it ); }
+            }
+            return *this;
+        }
+
+        void close();
+        
+        void disconnect_all();
+
+        std::size_t size() const;
+
+        std::vector< io::ostream* > accept();
+        
+        const io::impl::acceptor& acceptor() const { return *acceptor_; }
+
+    private:
+        friend class comma::io::server;
+        bool blocking_;
+        bool flush_;
+        boost::scoped_ptr< io::impl::acceptor > acceptor_;
+        typedef std::set< boost::shared_ptr< io::ostream > > streams;
+        streams streams_;
+        io::select select_;
+        void remove_( streams::iterator it );
+};
+
+} } } // namespace comma { namespace io { namespace impl {
diff --git a/io/publisher.cpp b/io/publisher.cpp
index 3ce8a265b..2790dde79 100644
--- a/io/publisher.cpp
+++ b/io/publisher.cpp
@@ -1,53 +1,7 @@
 // This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2024 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
 #include "publisher.h"
 
-namespace comma { namespace io {
-
-publisher::publisher( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) : pimpl_( new impl::publisher( name, mode, blocking, flush ) ) {}
-
-publisher::~publisher() { delete pimpl_; }
-
-std::size_t publisher::write( const char* buf, std::size_t size, bool do_accept ) { return pimpl_->write( buf, size, do_accept ); }
-
-std::vector< io::ostream* > publisher::accept() { return pimpl_->accept(); }
-
-void publisher::close() { pimpl_->close(); }
-
-void publisher::disconnect_all() { pimpl_->disconnect_all(); }
-
-std::size_t publisher::size() const { return pimpl_->size(); }
-
-file_descriptor publisher::acceptor_file_descriptor() const { return pimpl_->acceptor_ ? pimpl_->acceptor().fd() : comma::io::invalid_file_descriptor; }
-
-} } // namespace comma { namespace io {
diff --git a/io/publisher.h b/io/publisher.h
index caa536f8a..23bed1060 100644
--- a/io/publisher.h
+++ b/io/publisher.h
@@ -1,68 +1,14 @@
-// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
 // All rights reserved.
 
 /// @author vsevolod vlaskine
 
 #pragma once
 
-#include <stdlib.h>
-#include <string>
-#include <boost/noncopyable.hpp>
-#include "stream.h"
-#include "impl/publisher.h"
+#include "server.h"
 
 namespace comma { namespace io {
 
-/// a simple publisher that opens and writes to using services (e.g. tcp, udp, etc)
-class publisher : public boost::noncopyable
-{
-    public:
-        /// constructor
-        /// @param name ::= tcp:<port> | udp:<port> | <filename>
-        ///     if tcp:<port>, create tcp server
-        ///     @todo if udp:<port>, broadcast on udp
-        ///     if <filename> is a regular file, just write to it
-        ///     @todo if <filename> is named pipe, keep reopening it, if closed
-        ///     if <filename> is Linux domain socket, create Linux domain socket server
-        /// @param mode ascii or binary, a hint for Windows
-        /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
-        publisher( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
-
-        /// destructor
-        ~publisher();
-
-        /// publish to all existing connections (blocking), return number of clients with successful write
-        std::size_t write( const char* buf, std::size_t size, bool do_accept = true );
-
-        /// publish to all existing connections (blocking)
-        /// @note data integrity is the user's responsibility
-        ///       i.e. if someone writes:
-        ///           publisher p( "tcp:localhost:1234" );
-        ///           p << 1 << "," << 2 << std::endl;
-        ///       and a client connects after "1" already
-        ///       has been output, this client will receive
-        ///       ",2", which most likely was not intended
-        template < typename T >
-        publisher& operator<<( const T& rhs ) { pimpl_->operator<<( rhs ); return *this; }
-
-        /// close
-        void close();
-        
-        /// disconnect all existing clients
-        void disconnect_all();
-
-        /// return current number of connected clients
-        std::size_t size() const;
-
-        /// accept waiting clients, non-blocking
-        /// @return number of clients accepted
-        std::vector< io::ostream* > accept();
-        
-        /// return acceptor file descriptor
-        file_descriptor acceptor_file_descriptor() const;
-        
-    private:
-        impl::publisher* pimpl_;
-};
+typedef server publisher; // quick and dirty for backward compatibility
 
 } } // namespace comma { namespace io {
diff --git a/io/server.cpp b/io/server.cpp
new file mode 100644
index 000000000..49c4b5117
--- /dev/null
+++ b/io/server.cpp
@@ -0,0 +1,53 @@
+// This file is part of comma, a generic and flexible library
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+
+/// @author vsevolod vlaskine
+
+#include "server.h"
+
+namespace comma { namespace io {
+
+server::server( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) : pimpl_( new impl::server( name, mode, blocking, flush ) ) {}
+
+server::~server() { delete pimpl_; }
+
+std::size_t server::write( const char* buf, std::size_t size, bool do_accept ) { return pimpl_->write( buf, size, do_accept ); }
+
+std::vector< io::ostream* > server::accept() { return pimpl_->accept(); }
+
+void server::close() { pimpl_->close(); }
+
+void server::disconnect_all() { pimpl_->disconnect_all(); }
+
+std::size_t server::size() const { return pimpl_->size(); }
+
+file_descriptor server::acceptor_file_descriptor() const { return pimpl_->acceptor_ ? pimpl_->acceptor().fd() : comma::io::invalid_file_descriptor; }
+
+} } // namespace comma { namespace io {
diff --git a/io/server.h b/io/server.h
new file mode 100644
index 000000000..980e47e85
--- /dev/null
+++ b/io/server.h
@@ -0,0 +1,68 @@
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <stdlib.h>
+#include <string>
+#include <boost/noncopyable.hpp>
+#include "stream.h"
+#include "impl/server.h"
+
+namespace comma { namespace io {
+
+/// a simple publisher that opens and writes to using services (e.g. tcp, udp, etc)
+class server : public boost::noncopyable
+{
+    public:
+        /// constructor
+        /// @param name ::= tcp:<port> | udp:<port> | <filename>
+        ///     if tcp:<port>, create tcp server
+        ///     @todo if udp:<port>, broadcast on udp
+        ///     if <filename> is a regular file, just write to it
+        ///     @todo if <filename> is named pipe, keep reopening it, if closed
+        ///     if <filename> is Linux domain socket, create Linux domain socket server
+        /// @param mode ascii or binary, a hint for Windows
+        /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
+        server( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
+
+        /// destructor
+        ~server();
+
+        /// publish to all existing connections (blocking), return number of clients with successful write
+        std::size_t write( const char* buf, std::size_t size, bool do_accept = true );
+
+        /// publish to all existing connections (blocking)
+        /// @note data integrity is the user's responsibility
+        ///       i.e. if someone writes:
+        ///           server p( "tcp:localhost:1234" );
+        ///           p << 1 << "," << 2 << std::endl;
+        ///       and a client connects after "1" already
+        ///       has been output, this client will receive
+        ///       ",2", which most likely was not intended
+        template < typename T >
+        server& operator<<( const T& rhs ) { pimpl_->operator<<( rhs ); return *this; }
+
+        /// close
+        void close();
+        
+        /// disconnect all existing clients
+        void disconnect_all();
+
+        /// return current number of connected clients
+        std::size_t size() const;
+
+        /// accept waiting clients, non-blocking
+        /// @return number of clients accepted
+        std::vector< io::ostream* > accept();
+        
+        /// return acceptor file descriptor
+        file_descriptor acceptor_file_descriptor() const;
+        
+    private:
+        impl::server* pimpl_;
+};
+
+} } // namespace comma { namespace io {

From 3c307f41f78de0ae8e7f4bc436c78f29e99e6746 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 29 Sep 2024 20:04:30 +1000
Subject: [PATCH 0933/1056] io::server: refactored to implement io::iserver;
 io::oserver: replacement of publisher

---
 io/applications/io-publish.cpp |   4 +-
 io/impl/publish.cpp            |  13 +--
 io/impl/publish.h              |   4 +-
 io/impl/publisher.h            |  78 ----------------
 io/impl/server.cpp             | 160 +++++++++++++++++----------------
 io/impl/server.h               |  36 +++++---
 io/publisher.cpp               |   7 --
 io/publisher.h                 |   2 +-
 io/server.cpp                  |  21 +++--
 io/server.h                    |  69 +++++++++-----
 io/stream.cpp                  |  14 +--
 io/test/CMakeLists.txt         |  11 ++-
 io/test/io-publish/stdin/input |   4 +-
 io/test/io-publish/test        |  14 ++-
 14 files changed, 196 insertions(+), 241 deletions(-)
 delete mode 100644 io/impl/publisher.h
 delete mode 100644 io/publisher.cpp

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index c0c0a4236..6c22a873c 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -159,13 +159,13 @@ int main( int ac, char** av )
         std::string exec_command = options.value< std::string >( "--exec", "" );
         if( !tail.empty() )
         {
-            if( !exec_command.empty() ) { comma::say() << "expected either --exec or --, got both" << std::endl; return 1; }
+            COMMA_ASSERT_BRIEF( exec_command.empty(), "expected either --exec or --, got both" );
             exec_command = comma::join( tail, ' ' );
         }
         //ProfilerStart( "io-publish.prof" ); {
         if( exec_command.empty() )
         {
-            if( on_demand ) { comma::say() << "got --on-demand; please specify --exec <command> or -- <command>, or remove --on-demand" << std::endl; return 1; }
+            COMMA_ASSERT_BRIEF( !on_demand, "got --on-demand; please specify --exec <command> or -- <command>, or remove --on-demand" );
             while( std::cin.good() && !is_shutdown ) { if( !p.read( std::cin ) && exit_on_no_clients ) { break; } }
         }
         else
diff --git a/io/impl/publish.cpp b/io/impl/publish.cpp
index b25bde260..0a91ff4fc 100644
--- a/io/impl/publish.cpp
+++ b/io/impl/publish.cpp
@@ -44,7 +44,7 @@ publish::publish( const std::vector< std::string >& endpoints
     t->resize( endpoints.size() );
     for( std::size_t i = 0; i < endpoints.size(); ++i )
     {
-        if( !endpoints_[i].secondary ) { ( *t )[i].reset( new comma::io::publisher( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
+        if( !endpoints_[i].secondary ) { ( *t )[i].reset( new comma::io::oserver( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
     }
     acceptor_thread_.reset( new boost::thread( boost::bind( &publish::accept_, boost::ref( *this ))));
 }
@@ -149,10 +149,13 @@ void publish::accept_()
             if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) )
             {
                 const auto& streams = ( *t )[i]->accept();
-                for( auto s: streams )
+                if( !cache_.empty() )
                 {
-                    for( const auto& c: cache_ ) { ( *s )->write( &c[0], c.size() ); }
-                    if( flush_ ) { ( *s )->flush(); }
+                    for( auto& s: streams )
+                    {
+                        for( const auto& c: cache_ ) { ( *s )->write( &c[0], c.size() ); }
+                        if( flush_ ) { ( *s )->flush(); }
+                    }
                 }
             }
         }
@@ -162,7 +165,7 @@ void publish::accept_()
             for( unsigned int i = 0; i < t->size(); ++i )
             {
                 if( !endpoints_[i].secondary || ( *t )[i] ) { continue; }
-                ( *t )[i].reset( new comma::io::publisher( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard_, flush_ ) );
+                ( *t )[i].reset( new comma::io::oserver( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard_, flush_ ) );
                 if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
             }
         }
diff --git a/io/impl/publish.h b/io/impl/publish.h
index 98349494d..e71a5382e 100644
--- a/io/impl/publish.h
+++ b/io/impl/publish.h
@@ -17,7 +17,7 @@
 #include <boost/scoped_ptr.hpp>
 #include <boost/thread.hpp>
 #include "../../io/file_descriptor.h"
-#include "../../io/publisher.h"
+#include "../../io/server.h"
 #include "../../string/string.h"
 #include "../../sync/synchronized.h"
 
@@ -26,7 +26,7 @@ namespace comma { namespace io { namespace impl {
 class publish
 {
     public:
-        typedef comma::synchronized< std::vector< std::unique_ptr< comma::io::publisher > > > publishers_t;
+        typedef comma::synchronized< std::vector< std::unique_ptr< comma::io::oserver > > > publishers_t;
         
         typedef publishers_t::scoped_transaction transaction_t;
         
diff --git a/io/impl/publisher.h b/io/impl/publisher.h
deleted file mode 100644
index 7a16f0a02..000000000
--- a/io/impl/publisher.h
+++ /dev/null
@@ -1,78 +0,0 @@
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-
-/// @author cedric wohlleber
-
-#pragma once
-
-#include <set>
-#include <boost/scoped_ptr.hpp>
-#include <boost/shared_ptr.hpp>
-#include "../file_descriptor.h"
-#include "../select.h"
-#include "../stream.h"
-
-namespace comma { namespace io {
-    
-class publisher;
-
-} } // namespace comma { namespace io {
-
-namespace comma { namespace io { namespace impl {
-
-struct acceptor
-{
-    virtual ~acceptor() {}
-    virtual io::file_descriptor fd() const = 0;
-    virtual io::ostream* accept( boost::posix_time::time_duration timeout = boost::posix_time::seconds( 0 ) ) = 0;
-    virtual void notify_closed() {} // quick and dirty
-    virtual void close() {}
-};
-    
-class publisher
-{
-    public:
-        publisher( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
-
-        unsigned int write( const char* buf, std::size_t size, bool do_accept = true );
-
-        template < typename T >
-        impl::publisher& operator<<( const T& lhs ) // quick and dirty, inefficient, but then ascii is meant to be slow...
-        {
-            accept();
-            select_.check();
-            unsigned int count = 0;
-            for( streams::iterator i = streams_.begin(); i != streams_.end(); )
-            {
-                streams::iterator it = i++;
-                if( !blocking_ && !select_.write().ready( **it ) ) { continue; }
-                ( ***it ) << lhs;
-                if( flush_ ) { ( **it )->flush(); }
-                if( ( **it )->good() ) { ++count; }
-                else { remove_( it ); }
-            }
-            return *this;
-        }
-
-        void close();
-        
-        void disconnect_all();
-
-        std::size_t size() const;
-
-        std::vector< io::ostream* > accept();
-        
-        const io::impl::acceptor& acceptor() const { return *acceptor_; }
-
-    private:
-        friend class comma::io::publisher;
-        bool blocking_;
-        bool flush_;
-        boost::scoped_ptr< io::impl::acceptor > acceptor_;
-        typedef std::set< boost::shared_ptr< io::ostream > > streams;
-        streams streams_;
-        io::select select_;
-        void remove_( streams::iterator it );
-};
-
-} } } // namespace comma { namespace io { namespace impl {
diff --git a/io/impl/server.cpp b/io/impl/server.cpp
index e7400166e..87a40445b 100644
--- a/io/impl/server.cpp
+++ b/io/impl/server.cpp
@@ -21,7 +21,7 @@
 
 namespace comma { namespace io { namespace impl {
 
-class file_acceptor : public acceptor
+template < typename Stream > class file_acceptor : public acceptor< Stream >
 {
     public:
         file_acceptor( const std::string& name, io::mode::value mode ): name_( name ), mode_( mode ), closed_( true ), fd_( io::invalid_file_descriptor ) {}
@@ -35,7 +35,7 @@ class file_acceptor : public acceptor
 #endif
         }
 
-        io::ostream* accept( boost::posix_time::time_duration )
+        Stream* accept( boost::posix_time::time_duration )
         {
             if( !closed_ ) { return NULL; }
 #ifndef WIN32
@@ -43,9 +43,9 @@ class file_acceptor : public acceptor
 #else
             fd_ = _open( &name_[0], O_WRONLY | _O_CREAT, _S_IWRITE );
 #endif
-            if( fd_ == io::invalid_file_descriptor ) { return NULL; }
+            if( fd_ == io::invalid_file_descriptor ) { return nullptr; }
             closed_ = false;
-            return new io::ostream( name_, mode_, io::mode::non_blocking ); // quick and dirty
+            return new Stream( name_, mode_, io::mode::non_blocking ); // quick and dirty
         }
 
         void notify_closed() { closed_ = true; ::close( fd_ ); }
@@ -55,8 +55,8 @@ class file_acceptor : public acceptor
     private:
         const std::string name_;
         const io::mode::value mode_;
-        bool closed_;
-        io::file_descriptor fd_; // todo: make io::ostream non-throwing on construction
+        bool closed_{false};
+        io::file_descriptor fd_{0}; // todo: make io::istream, io::ostream non-throwing on construction
 };
 
 struct Tcp {};
@@ -83,91 +83,87 @@ template <> struct socket_traits< local >
 };
 #endif
 
-template < typename S >
-class socket_acceptor : public acceptor
+template < typename Stream, typename S > class socket_acceptor : public acceptor< Stream >
 {
     public:
         socket_acceptor( const typename socket_traits< S >::name_type& name, io::mode::value mode )
             : mode_( mode )
-            , acceptor_( m_service, socket_traits< S >::endpoint( name ) )
+            , _acceptor( m_service, socket_traits< S >::endpoint( name ) )
         {
 #ifndef WIN32
 #if (BOOST_VERSION >= 106600)
-            select_.read().add( acceptor_.native_handle() );
+            select_.read().add( _acceptor.native_handle() );
 #else
-            select_.read().add( acceptor_.native() );
+            select_.read().add( _acceptor.native() );
 #endif
 #else
 #if (BOOST_VERSION >= 106600)
-            SOCKET socket = acceptor_.native_handle();
+            SOCKET socket = _acceptor.native_handle();
 #else
-            SOCKET socket = acceptor_.native();
+            SOCKET socket = _acceptor.native();
 #endif
             select_.read().add( socket );
 #endif
         }
 
-        io::ostream* accept( boost::posix_time::time_duration timeout )
+        Stream* accept( boost::posix_time::time_duration timeout )
         {
             select_.wait( timeout );
 #ifndef WIN32
 #if (BOOST_VERSION >= 106600)
-            if( !select_.read().ready( acceptor_.native_handle() ) ) { return NULL; }
+            if( !select_.read().ready( _acceptor.native_handle() ) ) { return nullptr; }
 #else
-            if( !select_.read().ready( acceptor_.native() ) ) { return NULL; }
+            if( !select_.read().ready( _acceptor.native() ) ) { return nullptr; }
 #endif
 #else
 #if (BOOST_VERSION >= 106600)
-            SOCKET socket = acceptor_.native_handle();
+            SOCKET socket = _acceptor.native_handle();
 #else
-            SOCKET socket = acceptor_.native();
+            SOCKET socket = _acceptor.native();
 #endif
-            if( !select_.read().ready( socket ) ) { return NULL; }
+            if( !select_.read().ready( socket ) ) { return nullptr; }
 #endif
             typename socket_traits< S >::iostream* stream = new typename socket_traits< S >::iostream;
-            acceptor_.accept( *( stream->rdbuf() ) );
+            _acceptor.accept( *( stream->rdbuf() ) );
 #if (BOOST_VERSION >= 106600)
-            return new io::ostream( stream, stream->rdbuf()->native_handle(), mode_, boost::bind( &socket_traits< S >::iostream::close, stream ) );
+            return new Stream( stream, stream->rdbuf()->native_handle(), mode_, boost::bind( &socket_traits< S >::iostream::close, stream ) );
 #else
-            return new io::ostream( stream, stream->rdbuf()->native(), mode_, boost::bind( &socket_traits< S >::iostream::close, stream ) );
+            return new Stream( stream, stream->rdbuf()->native(), mode_, boost::bind( &socket_traits< S >::iostream::close, stream ) );
 #endif
         }
 
-        void close() { acceptor_.close(); }
+        void close() { _acceptor.close(); }
 
 #ifndef WIN32
 #if (BOOST_VERSION >= 106600)
-        io::file_descriptor fd() const { return const_cast< typename socket_traits< S >::acceptor& >( acceptor_ ).native_handle(); }
+        io::file_descriptor fd() const { return const_cast< typename socket_traits< S >::acceptor& >( _acceptor ).native_handle(); }
 #else
-        io::file_descriptor fd() const { return const_cast< typename socket_traits< S >::acceptor& >( acceptor_ ).native(); }
+        io::file_descriptor fd() const { return const_cast< typename socket_traits< S >::acceptor& >( _acceptor ).native(); }
 #endif
 #else
         io::file_descriptor fd() const { return io::invalid_file_descriptor; }
 #endif
 
     private:
-        io::mode::value mode_;
+        io::mode::value mode_{io::mode::binary};
         io::select select_;
 #if (BOOST_VERSION >= 106600)
         boost::asio::io_context m_service;
 #else
         boost::asio::io_service m_service;
 #endif
-        typename socket_traits< S >::acceptor acceptor_;
+        typename socket_traits< S >::acceptor _acceptor;
 };
 
-class zero_acceptor_ : public acceptor
+template < typename Stream >
+class zero_acceptor_ : public acceptor< Stream >
 {
     public:
-        zero_acceptor_( const std::string& name, io::mode::value mode ):
-            stream_( new io::ostream( name, mode ) ),
-            accepted_( false )
-        {
-        }
+        zero_acceptor_( const std::string& name, io::mode::value mode ): stream_( new Stream( name, mode ) ), accepted_( false ) {}
 
-        io::ostream* accept( boost::posix_time::time_duration )
+        Stream* accept( boost::posix_time::time_duration )
         {
-            if( accepted_ ) { return NULL; }
+            if( accepted_ ) { return nullptr; }
             accepted_ = true;
             return stream_;
         }
@@ -177,11 +173,11 @@ class zero_acceptor_ : public acceptor
         io::file_descriptor fd() const { return io::invalid_file_descriptor; } // quick and dirty
 
     private:
-        io::ostream* stream_;
-        bool accepted_;
+        Stream* stream_{nullptr};
+        bool accepted_{false};
 };
 
-server::server( const std::string& name, io::mode::value mode, bool blocking, bool flush )
+template < typename Stream > server< Stream >::server( const std::string& name, io::mode::value mode, bool blocking, bool flush )
     : blocking_( blocking ),
       flush_( flush )
 {
@@ -189,7 +185,7 @@ server::server( const std::string& name, io::mode::value mode, bool blocking, bo
     if( v[0] == "tcp" )
     {
         if( v.size() != 2 ) { COMMA_THROW( comma::exception, "expected tcp server endpoint, got " << name ); }
-        acceptor_.reset( new socket_acceptor< Tcp >( boost::lexical_cast< unsigned short >( v[1] ), mode ) );
+        _acceptor.reset( new socket_acceptor< Stream, Tcp >( boost::lexical_cast< unsigned short >( v[1] ), mode ) );
     }
     else if( v[0] == "udp" )
     {
@@ -199,82 +195,92 @@ server::server( const std::string& name, io::mode::value mode, bool blocking, bo
     {
 #ifndef WIN32
         if( v.size() != 2 ) { COMMA_THROW( comma::exception, "expected local socket, got " << name ); }
-        acceptor_.reset( new socket_acceptor< local >( v[1], mode ) );
+        _acceptor.reset( new socket_acceptor< Stream, local >( v[1], mode ) );
 #endif
     }
     else if( v[0].substr( 0, 4 ) == "zero" )
     {
-        acceptor_.reset( new zero_acceptor_( name, mode ) );
+        _acceptor.reset( new zero_acceptor_< Stream >( name, mode ) );
     }
     else
     {
         if( name == "-" )
         {
-            streams_.insert( boost::shared_ptr< io::ostream >( new io::ostream( name, mode ) ) );
+            streams_.insert( std::unique_ptr< Stream >( new Stream( name, mode ) ) );
 #ifndef WIN32
-            select_.write().add( 1 );
+            select_.write().add( 1 ); // todo: traits: read/write
 #endif
         }
         else
         {
-            acceptor_.reset( new file_acceptor( name, mode ) );
-            io::ostream* s = acceptor_->accept( boost::posix_time::time_duration() );
-            streams_.insert( boost::shared_ptr< io::ostream >( s ) ); // todo: should we simply abolish file_acceptor and do it in the same way as for stdout?
+            _acceptor.reset( new file_acceptor< Stream >( name, mode ) );
+            Stream* s = _acceptor->accept( boost::posix_time::time_duration() );
+            streams_.insert( std::unique_ptr< Stream >( s ) ); // todo: should we simply abolish file_acceptor and do it in the same way as for stdout?
             if( s->fd() == comma::io::invalid_file_descriptor ) { COMMA_THROW( comma::exception, "failed to open '" << name << "'" ); }
 #ifndef WIN32
-            select_.write().add( s->fd() );
+            select_.write().add( s->fd() ); // todo: traits: read/write
 #endif
         }
     }
 }
 
-unsigned int server::write( const char* buf, std::size_t size, bool do_accept )
+template < typename Stream > void server< Stream >::close()
 {
-    if( do_accept ) { accept(); }
-    if( !blocking_ ) { select_.check(); } // todo: if slow, put all the files in one select
-    unsigned int count = 0;
-    for( streams::iterator i = streams_.begin(); i != streams_.end(); )
-    {
-        streams::iterator it = i++;
-        if( !blocking_ && !select_.write().ready( **it ) ) { continue; }
-        ( **it )->write( buf, size );
-        if( flush_ ) { ( **it )->flush(); }
-        if( ( **it )->good() ) { ++count; }
-        else { remove_( it ); }
-    }
-    return count;
+    if( _acceptor ) { _acceptor->close(); }
+    disconnect_all();
 }
 
-void server::close()
+template < typename Stream > void server< Stream >::disconnect_all()
 {
-    if( acceptor_ ) { acceptor_->close(); }
-    disconnect_all();
+    while( streams_.begin() != streams_.end() ) { remove_( streams_.begin() ); }
 }
 
-void server::disconnect_all() { while( streams_.begin() != streams_.end() ) { remove_( streams_.begin() ); } }
-
-std::vector< io::ostream* > server::accept()
+template < typename Stream > std::vector< Stream* > server< Stream >::accept()
 {
-    std::vector< io::ostream* > streams;
-    if( !acceptor_ ) { return streams; }
+    std::vector< Stream* > streams;
+    if( !_acceptor ) { return streams; }
     while( true ) // while( streams_.size() < maxSize ?
     {
-        io::ostream* s = acceptor_->accept();
-        if( s == NULL ) { return streams; }
-        streams.push_back( s );
-        streams_.insert( boost::shared_ptr< io::ostream >( s ) );
-        select_.write().add( *s );
+        Stream* s = _acceptor->accept();
+        if( s == nullptr ) { return streams; }
+        streams.emplace_back( s );
+        streams_.insert( std::unique_ptr< Stream >( s ) );
+        select_.write().add( s->fd() ); // todo! istream/ostream traits
     }
 }
 
-void server::remove_( streams::iterator it )
+template < typename Stream > void server< Stream >::remove_( typename _streams_type::iterator it )
 {
     select_.write().remove( **it );
     ( *it )->close();
-    if( acceptor_ ) { acceptor_->notify_closed(); }
+    if( _acceptor ) { _acceptor->notify_closed(); }
     streams_.erase( it );
 }
 
-std::size_t server::size() const { return streams_.size(); }
+template < typename Stream > std::size_t server< Stream >::size() const { return streams_.size(); }
+
+template < typename Stream > unsigned int server< Stream >::write( const char* buf, std::size_t size, bool do_accept )
+{
+    if( do_accept ) { accept(); }
+    if( !blocking_ ) { select_.check(); } // todo: if slow, put all the files in one select
+    unsigned int count = 0;
+    for( typename _streams_type::iterator i = streams_.begin(); i != streams_.end(); )
+    {
+        typename _streams_type::iterator it = i++;
+        if( !blocking_ && !select_.write().ready( **it ) ) { continue; }
+        ( **it )->write( buf, size );
+        if( flush_ ) { ( **it )->flush(); }
+        if( ( **it )->good() ) { ++count; }
+        else { remove_( it ); }
+    }
+    return count;
+}
+
+// template struct acceptor< io::istream >;
+template struct acceptor< io::ostream >;
+// template struct acceptor< io::iostream >;
+// todo: template struct server< io::istream >;
+template struct server< io::ostream >;
+// todo: template struct server< io::iostream >;
 
 } } } // namespace comma { namespace io { namespace impl {
diff --git a/io/impl/server.h b/io/impl/server.h
index 929aa8d70..a30852496 100644
--- a/io/impl/server.h
+++ b/io/impl/server.h
@@ -13,38 +13,46 @@
 #include "../stream.h"
 
 namespace comma { namespace io {
-    
-class server;
+
+template < typename Stream > class server;
 
 } } // namespace comma { namespace io {
 
 namespace comma { namespace io { namespace impl {
 
+template < typename Stream >
 struct acceptor
 {
+    typedef Stream stream_type;
+
     virtual ~acceptor() {}
     virtual io::file_descriptor fd() const = 0;
-    virtual io::ostream* accept( boost::posix_time::time_duration timeout = boost::posix_time::seconds( 0 ) ) = 0;
+    virtual Stream* accept( boost::posix_time::time_duration timeout = boost::posix_time::seconds( 0 ) ) = 0;
     virtual void notify_closed() {} // quick and dirty
     virtual void close() {}
 };
-    
+
+template < typename Stream >
 class server
 {
     public:
+        typedef Stream stream_type;
+
         server( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
 
+        // todo!
         unsigned int write( const char* buf, std::size_t size, bool do_accept = true );
 
+        // todo!
         template < typename T >
-        impl::server& operator<<( const T& lhs ) // quick and dirty, inefficient, but then ascii is meant to be slow...
+        impl::server< Stream >& operator<<( const T& lhs ) // quick and dirty, inefficient, but then ascii is meant to be slow...
         {
             accept();
             select_.check();
             unsigned int count = 0;
-            for( streams::iterator i = streams_.begin(); i != streams_.end(); )
+            for( typename _streams_type::iterator i = streams_.begin(); i != streams_.end(); )
             {
-                streams::iterator it = i++;
+                typename _streams_type::iterator it = i++;
                 if( !blocking_ && !select_.write().ready( **it ) ) { continue; }
                 ( ***it ) << lhs;
                 if( flush_ ) { ( **it )->flush(); }
@@ -60,19 +68,19 @@ class server
 
         std::size_t size() const;
 
-        std::vector< io::ostream* > accept();
+        std::vector< Stream* > accept(); // quick and dirty; return naked pointers for now
         
-        const io::impl::acceptor& acceptor() const { return *acceptor_; }
+        const io::impl::acceptor< Stream >& acceptor() const { return *_acceptor; }
 
     private:
-        friend class comma::io::server;
+        template < typename > friend class comma::io::server;
         bool blocking_;
         bool flush_;
-        boost::scoped_ptr< io::impl::acceptor > acceptor_;
-        typedef std::set< boost::shared_ptr< io::ostream > > streams;
-        streams streams_;
+        boost::scoped_ptr< io::impl::acceptor< Stream > > _acceptor;
+        typedef std::set< std::unique_ptr< stream_type > > _streams_type;
+        _streams_type streams_;
         io::select select_;
-        void remove_( streams::iterator it );
+        void remove_( typename _streams_type::iterator it );
 };
 
 } } } // namespace comma { namespace io { namespace impl {
diff --git a/io/publisher.cpp b/io/publisher.cpp
deleted file mode 100644
index 2790dde79..000000000
--- a/io/publisher.cpp
+++ /dev/null
@@ -1,7 +0,0 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2024 Vsevolod Vlaskine
-
-/// @author vsevolod vlaskine
-
-#include "publisher.h"
-
diff --git a/io/publisher.h b/io/publisher.h
index 23bed1060..ed18d842d 100644
--- a/io/publisher.h
+++ b/io/publisher.h
@@ -9,6 +9,6 @@
 
 namespace comma { namespace io {
 
-typedef server publisher; // quick and dirty for backward compatibility
+typedef oserver publisher; // quick and dirty for backward compatibility
 
 } } // namespace comma { namespace io {
diff --git a/io/server.cpp b/io/server.cpp
index 49c4b5117..581c7d2f9 100644
--- a/io/server.cpp
+++ b/io/server.cpp
@@ -27,27 +27,30 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #include "server.h"
 
 namespace comma { namespace io {
 
-server::server( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) : pimpl_( new impl::server( name, mode, blocking, flush ) ) {}
+template < typename Stream > server< Stream >::server( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) : pimpl_( new impl::server< Stream >( name, mode, blocking, flush ) ) {}
+
+template < typename Stream > server< Stream >::~server() { delete pimpl_; }
 
-server::~server() { delete pimpl_; }
+template < typename Stream > std::vector< Stream* > server< Stream >::accept() { return pimpl_->accept(); }
 
-std::size_t server::write( const char* buf, std::size_t size, bool do_accept ) { return pimpl_->write( buf, size, do_accept ); }
+template < typename Stream > void server< Stream >::close() { pimpl_->close(); }
 
-std::vector< io::ostream* > server::accept() { return pimpl_->accept(); }
+template < typename Stream > void server< Stream >::disconnect_all() { pimpl_->disconnect_all(); }
 
-void server::close() { pimpl_->close(); }
+template < typename Stream > std::size_t server< Stream >::size() const { return pimpl_->size(); }
 
-void server::disconnect_all() { pimpl_->disconnect_all(); }
+template < typename Stream > file_descriptor server< Stream >::acceptor_file_descriptor() const { return pimpl_->_acceptor ? pimpl_->acceptor().fd() : comma::io::invalid_file_descriptor; }
 
-std::size_t server::size() const { return pimpl_->size(); }
+std::size_t oserver::write( const char* buf, std::size_t size, bool do_accept ) { return pimpl_->write( buf, size, do_accept ); }
 
-file_descriptor server::acceptor_file_descriptor() const { return pimpl_->acceptor_ ? pimpl_->acceptor().fd() : comma::io::invalid_file_descriptor; }
+//template class server< io::istream >;
+template class server< io::ostream >;
+//template class server< io::iostream >;
 
 } } // namespace comma { namespace io {
diff --git a/io/server.h b/io/server.h
index 980e47e85..9e3ebc878 100644
--- a/io/server.h
+++ b/io/server.h
@@ -1,4 +1,5 @@
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
 // All rights reserved.
 
 /// @author vsevolod vlaskine
@@ -6,15 +7,16 @@
 #pragma once
 
 #include <stdlib.h>
+#include <memory>
 #include <string>
-#include <boost/noncopyable.hpp>
 #include "stream.h"
 #include "impl/server.h"
 
 namespace comma { namespace io {
 
-/// a simple publisher that opens and writes to using services (e.g. tcp, udp, etc)
-class server : public boost::noncopyable
+/// a simple server base class that opens and reads from or writes to streams using services (e.g. tcp, udp, etc)
+template < typename Stream >
+class server
 {
     public:
         /// constructor
@@ -31,20 +33,6 @@ class server : public boost::noncopyable
         /// destructor
         ~server();
 
-        /// publish to all existing connections (blocking), return number of clients with successful write
-        std::size_t write( const char* buf, std::size_t size, bool do_accept = true );
-
-        /// publish to all existing connections (blocking)
-        /// @note data integrity is the user's responsibility
-        ///       i.e. if someone writes:
-        ///           server p( "tcp:localhost:1234" );
-        ///           p << 1 << "," << 2 << std::endl;
-        ///       and a client connects after "1" already
-        ///       has been output, this client will receive
-        ///       ",2", which most likely was not intended
-        template < typename T >
-        server& operator<<( const T& rhs ) { pimpl_->operator<<( rhs ); return *this; }
-
         /// close
         void close();
         
@@ -54,15 +42,50 @@ class server : public boost::noncopyable
         /// return current number of connected clients
         std::size_t size() const;
 
-        /// accept waiting clients, non-blocking
-        /// @return number of clients accepted
-        std::vector< io::ostream* > accept();
-        
         /// return acceptor file descriptor
         file_descriptor acceptor_file_descriptor() const;
+
+        /// publish to all existing connections (blocking)
+        /// @note data integrity is the user's responsibility
+        ///       i.e. if someone writes:
+        ///           server p( "tcp:localhost:1234" );
+        ///           p << 1 << "," << 2 << std::endl;
+        ///       and a client connects after "1" already
+        ///       has been output, this client will receive
+        ///       ",2", which most likely was not intended
+        std::vector< Stream* > accept(); // quick and dirty, use nacked pointers for now
         
-    private:
-        impl::server* pimpl_;
+    protected:
+        server( const server& );
+        server& operator=( const server& );
+        impl::server< Stream >* pimpl_;
+};
+
+struct oserver: public io::server< io::ostream >
+{
+    /// @param name ::= tcp:<port> | udp:<port> | <filename>
+    ///     if tcp:<port>, create tcp server
+    ///     @todo if udp:<port>, broadcast on udp
+    ///     if <filename> is a regular file, just write to it
+    ///     @todo if <filename> is named pipe, keep reopening it, if closed
+    ///     if <filename> is Linux domain socket, create Linux domain socket server
+    /// @param mode ascii or binary, a hint for Windows
+    /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
+    oserver( const std::string& name, comma::io::mode::value mode, bool blocking = false, bool flush = true ): server< io::ostream >( name, mode, blocking, flush ) {}
+
+    /// publish to all existing connections (blocking), return number of clients with successful write
+    std::size_t write( const char* buf, std::size_t size, bool do_accept = true );
+
+    /// publish to all existing connections (blocking)
+    /// @note data integrity is the user's responsibility
+    ///       i.e. if someone writes:
+    ///           server p( "tcp:localhost:1234" );
+    ///           p << 1 << "," << 2 << std::endl;
+    ///       and a client connects after "1" already
+    ///       has been output, this client will receive
+    ///       ",2", which most likely was not intended
+    template < typename T >
+    oserver& operator<<( const T& rhs ) { pimpl_->operator<<( rhs ); return *this; }
 };
 
 } } // namespace comma { namespace io {
diff --git a/io/stream.cpp b/io/stream.cpp
index 92ea7bdc0..8a4d3de2f 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -104,7 +104,7 @@ template <> struct traits < std::iostream >
 {
     typedef std::fstream file_stream; // quick and dirty, does not matter for now
     static bool is_standard( const std::iostream* ) { return false; }
-    static std::iostream* standard( comma::io::mode::value mode ) { (void) mode; return NULL; }
+    static std::iostream* standard( comma::io::mode::value mode ) { (void) mode; return nullptr; }
     static comma::io::file_descriptor standard_fd() { return comma::io::invalid_file_descriptor; }
     #ifdef WIN32
         static io::file_descriptor open( const std::string& name ) { return io::invalid_file_descriptor; }
@@ -127,24 +127,24 @@ template < typename S > void close_file_stream( typename traits< S >::file_strea
 
 template < typename S > stream< S >::~stream()
 {
-    if( stream_ == NULL || impl::traits< S >::is_standard( stream_ ) ) { return; }
+    if( stream_ == nullptr || impl::traits< S >::is_standard( stream_ ) ) { return; }
     delete stream_;
-    stream_ = NULL;
+    stream_ = nullptr;
     close_ = NULL;
 }
 
 template < typename S > S* stream< S >::lazily_make_stream_()
 {
     #ifndef WIN32
-    if( stream_ == NULL ) // quick and dirty: if fstream, cannot open on construction, as pipe might block
+    if( stream_ == nullptr ) // quick and dirty: if fstream, cannot open on construction, as pipe might block
     {
         if( !comma::filesystem::is_regular_file( name_ ) && !blocking_ ) // quick and dirty
         {
             io::select select;
             select.read().add( fd_ ); // todo: express via traits
             select.write().add( fd_ ); // todo: express via traits
-            select.check(); //if( !select.check() ) { return NULL; }
-            if( !select.read().ready( fd_ ) && !select.write().ready( fd_ ) ) { return NULL; }
+            select.check(); //if( !select.check() ) { return nullptr; }
+            if( !select.read().ready( fd_ ) && !select.write().ready( fd_ ) ) { return nullptr; }
         }
         typename impl::traits< S >::file_stream* s = new typename impl::traits< S >::file_stream( name_.c_str(), static_cast< std::ios::openmode >( mode_ ) );
         if( s->bad() ) { COMMA_THROW( comma::exception, "failed to open " << name_ ); }
@@ -209,7 +209,7 @@ template < typename S > const std::string& stream< S >::name() const { return na
 template < typename S > stream< S >::stream( const std::string& name, mode::value m, mode::blocking_value blocking )
     : name_( name )
     , mode_( m )
-    , stream_( NULL )
+    , stream_( nullptr )
     , fd_( comma::io::invalid_file_descriptor )
     , close_d( false )
     , blocking_( blocking )
diff --git a/io/test/CMakeLists.txt b/io/test/CMakeLists.txt
index c14125cbd..bf72a07db 100644
--- a/io/test/CMakeLists.txt
+++ b/io/test/CMakeLists.txt
@@ -1,13 +1,12 @@
-set( KIT io )
-file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
-set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/io/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_io )
 add_executable( ${test_name} ${source} )
-target_link_libraries( ${test_name} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
-add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+target_link_libraries( ${test_name} comma_io ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_io WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
 if( INSTALL_TESTS )
     install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
     #INSTALL (
-    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_io
     #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
     #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
 endif( INSTALL_TESTS )
diff --git a/io/test/io-publish/stdin/input b/io/test/io-publish/stdin/input
index 34d7c54f6..9e388eec8 100644
--- a/io/test/io-publish/stdin/input
+++ b/io/test/io-publish/stdin/input
@@ -1,12 +1,12 @@
 port=42641
 
 function stdin_cmd()
-{
+{ 
     yes
 }
 export -f stdin_cmd
 
 function client_cmd()
 {
-    socat tcp:localhost:$port - | head -10 > client.out
+    socat tcp:localhost:$port - | head -n10 > client.out
 }
diff --git a/io/test/io-publish/test b/io/test/io-publish/test
index 42987104b..29b6582b6 100755
--- a/io/test/io-publish/test
+++ b/io/test/io-publish/test
@@ -28,9 +28,9 @@ cd output
 [[ $( type -t exec_cmd ) == "function" ]] && options+=" --exec exec_cmd"
 
 if [[ $( type -t stdin_cmd ) == "function" ]]; then
-    stdin_cmd | io-publish tcp:$port $options &
+    stdin_cmd | io-publish tcp:$port $options --verbose &
 else
-    io-publish tcp:$port $options &
+    io-publish tcp:$port $options --verbose &
 fi
 io_publish_pid=$!
 echo "test: io_publish_pid: $io_publish_pid port: $port" >&2
@@ -40,11 +40,11 @@ if [[ $( type -t client_cmd ) == "function" ]]; then
     echo "test: running client command..." >&2
     client_cmd > /dev/null &
     client_cmd_pid=$!
-    echo "client_cmd_pid=$client_cmd_pid" >&2
+    echo "test: client_cmd_pid=$client_cmd_pid" >&2
 fi
 
-[[ $test_duration ]] || test_duration=10
-[[ $report_interval ]] || report_interval=1
+[[ -n "$test_duration" ]] || test_duration=10
+[[ -n "$report_interval" ]] || report_interval=1
 
 loops=$( echo "$test_duration / $report_interval" | bc -l | sed 's/\.[0-9]*$//' )
 
@@ -58,9 +58,7 @@ done | sed 's/,$//;s/,[^,]* <defunct>//g' | grep -v ",bash$" | uniq \
 # when logging the processes above, we filter out lines with just bash at the
 # end, as they are in transition, with their children having just died
 
-if [[ $client_cmd_pid ]]; then
-    kill_pid_and_children $client_cmd_pid
-fi
+if [[ $client_cmd_pid ]]; then kill_pid_and_children $client_cmd_pid; fi
 echo "test: killing io-publish: $io_publish_pid" >&2
 kill_pid_and_children $io_publish_pid
 

From e39eae91ed9b3bd23d81b418a14e8e4a82c3d23e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Sep 2024 12:41:26 +1000
Subject: [PATCH 0934/1056] io::iserver: in progress...

---
 io/impl/server.cpp | 52 +++++++++++++++++++++++++++++++++-------------
 io/impl/server.h   | 42 ++++++++++++++++++-------------------
 io/server.cpp      |  4 ++--
 io/server.h        | 27 +++++++++++++++++++++---
 4 files changed, 84 insertions(+), 41 deletions(-)

diff --git a/io/impl/server.cpp b/io/impl/server.cpp
index 87a40445b..b0fe14168 100644
--- a/io/impl/server.cpp
+++ b/io/impl/server.cpp
@@ -21,6 +21,26 @@
 
 namespace comma { namespace io { namespace impl {
 
+template < typename Stream > struct stream_traits;
+
+template <> struct stream_traits< io::istream >
+{
+    static constexpr bool is_input_stream{true};
+    static constexpr bool is_output_stream{false};
+};
+
+template <> struct stream_traits< io::ostream >
+{
+    static constexpr bool is_input_stream{false};
+    static constexpr bool is_output_stream{true};
+};
+
+template <> struct stream_traits< io::iostream >
+{
+    static constexpr bool is_input_stream{true};
+    static constexpr bool is_output_stream{true};
+};
+
 template < typename Stream > class file_acceptor : public acceptor< Stream >
 {
     public:
@@ -208,7 +228,8 @@ template < typename Stream > server< Stream >::server( const std::string& name,
         {
             streams_.insert( std::unique_ptr< Stream >( new Stream( name, mode ) ) );
 #ifndef WIN32
-            select_.write().add( 1 ); // todo: traits: read/write
+            if( stream_traits< Stream >::is_input_stream ) { select_.read().add( 0 ); }
+            if( stream_traits< Stream >::is_output_stream ) { select_.write().add( 1 ); }
 #endif
         }
         else
@@ -218,7 +239,8 @@ template < typename Stream > server< Stream >::server( const std::string& name,
             streams_.insert( std::unique_ptr< Stream >( s ) ); // todo: should we simply abolish file_acceptor and do it in the same way as for stdout?
             if( s->fd() == comma::io::invalid_file_descriptor ) { COMMA_THROW( comma::exception, "failed to open '" << name << "'" ); }
 #ifndef WIN32
-            select_.write().add( s->fd() ); // todo: traits: read/write
+            if( stream_traits< Stream >::is_input_stream ) { select_.read().add( s->fd() ); }
+            if( stream_traits< Stream >::is_output_stream ) { select_.write().add( s->fd() ); }
 #endif
         }
     }
@@ -245,13 +267,15 @@ template < typename Stream > std::vector< Stream* > server< Stream >::accept()
         if( s == nullptr ) { return streams; }
         streams.emplace_back( s );
         streams_.insert( std::unique_ptr< Stream >( s ) );
-        select_.write().add( s->fd() ); // todo! istream/ostream traits
+        if( stream_traits< Stream >::is_input_stream ) { select_.read().add( s->fd() ); }
+        if( stream_traits< Stream >::is_output_stream ) { select_.write().add( s->fd() ); }
     }
 }
 
 template < typename Stream > void server< Stream >::remove_( typename _streams_type::iterator it )
 {
-    select_.write().remove( **it );
+    if( stream_traits< Stream >::is_input_stream ) { select_.read().remove( **it ); }
+    if( stream_traits< Stream >::is_output_stream ) { select_.write().remove( **it ); }
     ( *it )->close();
     if( _acceptor ) { _acceptor->notify_closed(); }
     streams_.erase( it );
@@ -259,27 +283,27 @@ template < typename Stream > void server< Stream >::remove_( typename _streams_t
 
 template < typename Stream > std::size_t server< Stream >::size() const { return streams_.size(); }
 
-template < typename Stream > unsigned int server< Stream >::write( const char* buf, std::size_t size, bool do_accept )
+template < typename Stream > unsigned int server< Stream >::write( server< io::ostream >* s, const char* buf, std::size_t size, bool do_accept )
 {
-    if( do_accept ) { accept(); }
-    if( !blocking_ ) { select_.check(); } // todo: if slow, put all the files in one select
+    if( do_accept ) { s->accept(); }
+    if( !s->blocking_ ) { s->select_.check(); } // todo: if slow, put all the files in one select
     unsigned int count = 0;
-    for( typename _streams_type::iterator i = streams_.begin(); i != streams_.end(); )
+    for( auto i = s->streams_.begin(); i != s->streams_.end(); )
     {
-        typename _streams_type::iterator it = i++;
-        if( !blocking_ && !select_.write().ready( **it ) ) { continue; }
+        auto it = i++;
+        if( !s->blocking_ && !s->select_.write().ready( **it ) ) { continue; }
         ( **it )->write( buf, size );
-        if( flush_ ) { ( **it )->flush(); }
+        if( s->flush_ ) { ( **it )->flush(); }
         if( ( **it )->good() ) { ++count; }
-        else { remove_( it ); }
+        else { s->remove_( it ); }
     }
     return count;
 }
 
-// template struct acceptor< io::istream >;
+template struct acceptor< io::istream >;
 template struct acceptor< io::ostream >;
 // template struct acceptor< io::iostream >;
-// todo: template struct server< io::istream >;
+template struct server< io::istream >;
 template struct server< io::ostream >;
 // todo: template struct server< io::iostream >;
 
diff --git a/io/impl/server.h b/io/impl/server.h
index a30852496..d6169c97c 100644
--- a/io/impl/server.h
+++ b/io/impl/server.h
@@ -40,40 +40,38 @@ class server
 
         server( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
 
-        // todo!
-        unsigned int write( const char* buf, std::size_t size, bool do_accept = true );
+        void close();
+        
+        void disconnect_all();
+
+        std::size_t size() const;
+
+        std::vector< Stream* > accept(); // quick and dirty; return naked pointers for now
+        
+        const io::impl::acceptor< Stream >& acceptor() const { return *_acceptor; }
+
+        static unsigned int write( server< io::ostream >* s, const char* buf, std::size_t size, bool do_accept = true );
 
-        // todo!
         template < typename T >
-        impl::server< Stream >& operator<<( const T& lhs ) // quick and dirty, inefficient, but then ascii is meant to be slow...
+        static void write( server< io::ostream >* s, const T& lhs ) // quick and dirty, inefficient, but then ascii is meant to be slow...
         {
-            accept();
-            select_.check();
+            s->accept();
+            s->select_.check();
             unsigned int count = 0;
-            for( typename _streams_type::iterator i = streams_.begin(); i != streams_.end(); )
+            for( typename _streams_type::iterator i = s->streams_.begin(); i != s->streams_.end(); )
             {
                 typename _streams_type::iterator it = i++;
-                if( !blocking_ && !select_.write().ready( **it ) ) { continue; }
+                if( !s->blocking_ && !s->select_.write().ready( **it ) ) { continue; }
                 ( ***it ) << lhs;
-                if( flush_ ) { ( **it )->flush(); }
+                if( s->flush_ ) { ( **it )->flush(); }
                 if( ( **it )->good() ) { ++count; }
-                else { remove_( it ); }
+                else { s->remove_( it ); }
             }
-            return *this;
         }
 
-        void close();
-        
-        void disconnect_all();
-
-        std::size_t size() const;
-
-        std::vector< Stream* > accept(); // quick and dirty; return naked pointers for now
-        
-        const io::impl::acceptor< Stream >& acceptor() const { return *_acceptor; }
-
-    private:
+    protected:
         template < typename > friend class comma::io::server;
+        template < typename > friend class comma::io::impl::server;
         bool blocking_;
         bool flush_;
         boost::scoped_ptr< io::impl::acceptor< Stream > > _acceptor;
diff --git a/io/server.cpp b/io/server.cpp
index 581c7d2f9..73890bb4b 100644
--- a/io/server.cpp
+++ b/io/server.cpp
@@ -47,9 +47,9 @@ template < typename Stream > std::size_t server< Stream >::size() const { return
 
 template < typename Stream > file_descriptor server< Stream >::acceptor_file_descriptor() const { return pimpl_->_acceptor ? pimpl_->acceptor().fd() : comma::io::invalid_file_descriptor; }
 
-std::size_t oserver::write( const char* buf, std::size_t size, bool do_accept ) { return pimpl_->write( buf, size, do_accept ); }
+std::size_t oserver::write( const char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::ostream >::write( pimpl_, buf, size, do_accept ); }
 
-//template class server< io::istream >;
+template class server< io::istream >;
 template class server< io::ostream >;
 //template class server< io::iostream >;
 
diff --git a/io/server.h b/io/server.h
index 9e3ebc878..69a00453c 100644
--- a/io/server.h
+++ b/io/server.h
@@ -33,7 +33,7 @@ class server
         /// destructor
         ~server();
 
-        /// close
+        /// stop accepting clients, disconnect all existing clients
         void close();
         
         /// disconnect all existing clients
@@ -71,7 +71,7 @@ struct oserver: public io::server< io::ostream >
     ///     if <filename> is Linux domain socket, create Linux domain socket server
     /// @param mode ascii or binary, a hint for Windows
     /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
-    oserver( const std::string& name, comma::io::mode::value mode, bool blocking = false, bool flush = true ): server< io::ostream >( name, mode, blocking, flush ) {}
+    oserver( const std::string& name, comma::io::mode::value mode, bool blocking = false, bool flush = true ): io::server< io::ostream >( name, mode, blocking, flush ) {}
 
     /// publish to all existing connections (blocking), return number of clients with successful write
     std::size_t write( const char* buf, std::size_t size, bool do_accept = true );
@@ -85,7 +85,28 @@ struct oserver: public io::server< io::ostream >
     ///       has been output, this client will receive
     ///       ",2", which most likely was not intended
     template < typename T >
-    oserver& operator<<( const T& rhs ) { pimpl_->operator<<( rhs ); return *this; }
+    oserver& operator<<( const T& rhs ) { io::impl::server< io::ostream >::write( pimpl_, rhs ); return *this; }
+};
+
+class iserver: public io::server< io::istream >
+{
+    public:
+        /// @param name ::= tcp:<port> | udp:<port> | <filename>
+        ///     if tcp:<port>, create tcp server
+        ///     @todo if udp:<port>, broadcast on udp
+        ///     if <filename> is a regular file, just write to it
+        ///     @todo if <filename> is named pipe, keep reopening it, if closed
+        ///     if <filename> is Linux domain socket, create Linux domain socket server
+        /// @param mode ascii or binary, a hint for Windows
+        /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
+        iserver( const std::string& name, comma::io::mode::value mode, bool blocking = false ): io::server< io::istream >( name, mode, blocking ) {}
+
+        std::size_t read( const char* buf, std::size_t size, bool do_accept = true );
+
+        std::string readline( bool do_accept = true );
+
+    private:
+        unsigned int _index{0};
 };
 
 } } // namespace comma { namespace io {

From 85780ce8e1092bfbbd2417d8103746755a60db67 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Sep 2024 12:51:50 +1000
Subject: [PATCH 0935/1056] io::iserver: in progress...

---
 io/impl/server.cpp | 12 +++++++++++-
 io/impl/server.h   |  4 ++++
 io/server.cpp      |  7 ++++++-
 io/server.h        | 35 +++++++++++++++++++----------------
 4 files changed, 40 insertions(+), 18 deletions(-)

diff --git a/io/impl/server.cpp b/io/impl/server.cpp
index b0fe14168..0f66082ba 100644
--- a/io/impl/server.cpp
+++ b/io/impl/server.cpp
@@ -300,9 +300,19 @@ template < typename Stream > unsigned int server< Stream >::write( server< io::o
     return count;
 }
 
+template < typename Stream > unsigned int server< Stream >::read( server< io::istream >* s, const char* buf, std::size_t size, bool do_accept )
+{
+    COMMA_THROW( comma::exception, "implementing..." );
+}
+
+template < typename Stream > std::string server< Stream >::readline( server< io::istream >* s, bool do_accept )
+{
+    COMMA_THROW( comma::exception, "implementing..." );
+}
+
 template struct acceptor< io::istream >;
 template struct acceptor< io::ostream >;
-// template struct acceptor< io::iostream >;
+// todo: template struct acceptor< io::iostream >;
 template struct server< io::istream >;
 template struct server< io::ostream >;
 // todo: template struct server< io::iostream >;
diff --git a/io/impl/server.h b/io/impl/server.h
index d6169c97c..b4ac43ed5 100644
--- a/io/impl/server.h
+++ b/io/impl/server.h
@@ -69,6 +69,10 @@ class server
             }
         }
 
+        static unsigned int read( server< io::istream >* s, const char* buf, std::size_t size, bool do_accept = true );
+
+        static std::string readline( server< io::istream >* s, bool do_accept = true );
+
     protected:
         template < typename > friend class comma::io::server;
         template < typename > friend class comma::io::impl::server;
diff --git a/io/server.cpp b/io/server.cpp
index 73890bb4b..955ac07ec 100644
--- a/io/server.cpp
+++ b/io/server.cpp
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -49,8 +50,12 @@ template < typename Stream > file_descriptor server< Stream >::acceptor_file_des
 
 std::size_t oserver::write( const char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::ostream >::write( pimpl_, buf, size, do_accept ); }
 
+std::size_t iserver::read( const char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::istream >::read( pimpl_, buf, size, do_accept ); }
+
+std::string iserver::readline( bool do_accept ) { return io::impl::server< io::istream >::readline( pimpl_, do_accept ); }
+
 template class server< io::istream >;
 template class server< io::ostream >;
-//template class server< io::iostream >;
+// todo: template class server< io::iostream >;
 
 } } // namespace comma { namespace io {
diff --git a/io/server.h b/io/server.h
index 69a00453c..e75cca85f 100644
--- a/io/server.h
+++ b/io/server.h
@@ -88,25 +88,28 @@ struct oserver: public io::server< io::ostream >
     oserver& operator<<( const T& rhs ) { io::impl::server< io::ostream >::write( pimpl_, rhs ); return *this; }
 };
 
-class iserver: public io::server< io::istream >
+struct iserver: public io::server< io::istream >
 {
-    public:
-        /// @param name ::= tcp:<port> | udp:<port> | <filename>
-        ///     if tcp:<port>, create tcp server
-        ///     @todo if udp:<port>, broadcast on udp
-        ///     if <filename> is a regular file, just write to it
-        ///     @todo if <filename> is named pipe, keep reopening it, if closed
-        ///     if <filename> is Linux domain socket, create Linux domain socket server
-        /// @param mode ascii or binary, a hint for Windows
-        /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
-        iserver( const std::string& name, comma::io::mode::value mode, bool blocking = false ): io::server< io::istream >( name, mode, blocking ) {}
-
-        std::size_t read( const char* buf, std::size_t size, bool do_accept = true );
+    /// @param name ::= tcp:<port> | udp:<port> | <filename>
+    ///     if tcp:<port>, create tcp server
+    ///     @todo if udp:<port>, broadcast on udp
+    ///     if <filename> is a regular file, just write to it
+    ///     @todo if <filename> is named pipe, keep reopening it, if closed
+    ///     if <filename> is Linux domain socket, create Linux domain socket server
+    /// @param mode ascii or binary, a hint for Windows
+    /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
+    iserver( const std::string& name, comma::io::mode::value mode, bool blocking = false ): io::server< io::istream >( name, mode, blocking ) {}
 
-        std::string readline( bool do_accept = true );
+    /// @todo usage semantics!
+    std::size_t read( const char* buf, std::size_t size, bool do_accept = true );
 
-    private:
-        unsigned int _index{0};
+    /// @todo usage semantics!
+    std::string readline( bool do_accept = true );
 };
 
+// struct ioserver: public io::server< io::iostream >
+// {
+//     // todo
+// };
+
 } } // namespace comma { namespace io {

From f16adffa0c46963a4ce64000c57d5a5662a1c13f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 30 Sep 2024 14:29:09 +1000
Subject: [PATCH 0936/1056] io::iserver: in progress...

---
 io/impl/server.cpp | 49 ++++++++++++++++++++++++++++++++++++++++------
 io/impl/server.h   | 10 ++++++----
 io/server.cpp      |  2 +-
 io/server.h        | 12 ++++++++----
 4 files changed, 58 insertions(+), 15 deletions(-)

diff --git a/io/impl/server.cpp b/io/impl/server.cpp
index 0f66082ba..0856869a7 100644
--- a/io/impl/server.cpp
+++ b/io/impl/server.cpp
@@ -254,7 +254,7 @@ template < typename Stream > void server< Stream >::close()
 
 template < typename Stream > void server< Stream >::disconnect_all()
 {
-    while( streams_.begin() != streams_.end() ) { remove_( streams_.begin() ); }
+    while( streams_.begin() != streams_.end() ) { _remove( streams_.begin() ); }
 }
 
 template < typename Stream > std::vector< Stream* > server< Stream >::accept()
@@ -272,7 +272,7 @@ template < typename Stream > std::vector< Stream* > server< Stream >::accept()
     }
 }
 
-template < typename Stream > void server< Stream >::remove_( typename _streams_type::iterator it )
+template < typename Stream > void server< Stream >::_remove( typename _streams_type::iterator it )
 {
     if( stream_traits< Stream >::is_input_stream ) { select_.read().remove( **it ); }
     if( stream_traits< Stream >::is_output_stream ) { select_.write().remove( **it ); }
@@ -295,19 +295,56 @@ template < typename Stream > unsigned int server< Stream >::write( server< io::o
         ( **it )->write( buf, size );
         if( s->flush_ ) { ( **it )->flush(); }
         if( ( **it )->good() ) { ++count; }
-        else { s->remove_( it ); }
+        else { s->_remove( it ); }
     }
     return count;
 }
 
-template < typename Stream > unsigned int server< Stream >::read( server< io::istream >* s, const char* buf, std::size_t size, bool do_accept )
+template < typename Stream > void server< Stream >::_remove_bad() // drops (via _remove) every stream whose good() is false
 {
-    COMMA_THROW( comma::exception, "implementing..." );
+    for( auto i = streams_.begin(); i != streams_.end(); ) { auto it = i++; if( !( **it )->good() ) { _remove( it ); } } // step i past the element first: _remove() erases it from streams_
+}
+
+template < typename Stream > unsigned int server< Stream >::read( server< io::istream >* s, char* buf, std::size_t size, bool do_accept )
+{
+    if( do_accept ) { s->accept(); }
+
+
+    // todo: if blocking, read in the loop
+
+
+    if( s->blocking_ ) { s->select_.wait( boost::posix_time::milliseconds( 100 ) ); } else { s->select_.check(); } // todo? pass timeout as a parameter?
+
+    auto j = s->streams_.begin();
+    for( ; j != s->streams_.end() && ( *j )->fd() != s->_last_read; ++j );
+    if( j == s->streams_.end() ) { j = s->streams_.begin(); s->_last_read = io::invalid_file_descriptor; }
+    for( auto i = j; i != s->streams_.end(); )
+    {
+        auto it = i++;
+        if( !s->blocking_ && !s->select_.read().ready( **it ) ) { continue; }
+        ( **it )->read( buf, size );
+        if( ( **it )->gcount() < int( size ) ) { continue; } // quick and dirty
+        s->_remove_bad();
+        s->_last_read = ( *it )->fd();
+        return size;
+    }
+    auto e = j == s->streams_.end() ? j : ++j;
+    for( auto i = s->streams_.begin(); i != e; ) // todo: remove code duplication: combine with the previous loop
+    {
+        auto it = i++;
+        if( !s->blocking_ && !s->select_.read().ready( **it ) ) { continue; }
+        ( **it )->read( buf, size );
+        if( ( **it )->gcount() < int( size ) ) { continue; } // quick and dirty
+        s->_remove_bad();
+        s->_last_read = ( *it )->fd();
+        return size;
+    }
+    return 0;
 }
 
 template < typename Stream > std::string server< Stream >::readline( server< io::istream >* s, bool do_accept )
 {
-    COMMA_THROW( comma::exception, "implementing..." );
+    COMMA_THROW( comma::exception, "todo..." );
 }
 
 template struct acceptor< io::istream >;
diff --git a/io/impl/server.h b/io/impl/server.h
index b4ac43ed5..bbd7aa039 100644
--- a/io/impl/server.h
+++ b/io/impl/server.h
@@ -65,11 +65,11 @@ class server
                 ( ***it ) << lhs;
                 if( s->flush_ ) { ( **it )->flush(); }
                 if( ( **it )->good() ) { ++count; }
-                else { s->remove_( it ); }
+                else { s->_remove( it ); }
             }
         }
 
-        static unsigned int read( server< io::istream >* s, const char* buf, std::size_t size, bool do_accept = true );
+        static unsigned int read( server< io::istream >* s, char* buf, std::size_t size, bool do_accept = true );
 
         static std::string readline( server< io::istream >* s, bool do_accept = true );
 
@@ -79,10 +79,12 @@ class server
         bool blocking_;
         bool flush_;
         boost::scoped_ptr< io::impl::acceptor< Stream > > _acceptor;
-        typedef std::set< std::unique_ptr< stream_type > > _streams_type;
+        typedef std::set< std::unique_ptr< Stream > > _streams_type;
+        io::file_descriptor _last_read{io::invalid_file_descriptor}; // quick and dirty
         _streams_type streams_;
         io::select select_;
-        void remove_( typename _streams_type::iterator it );
+        void _remove( typename _streams_type::iterator it );
+        void _remove_bad();
 };
 
 } } } // namespace comma { namespace io { namespace impl {
diff --git a/io/server.cpp b/io/server.cpp
index 955ac07ec..9d05c7164 100644
--- a/io/server.cpp
+++ b/io/server.cpp
@@ -50,7 +50,7 @@ template < typename Stream > file_descriptor server< Stream >::acceptor_file_des
 
 std::size_t oserver::write( const char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::ostream >::write( pimpl_, buf, size, do_accept ); }
 
-std::size_t iserver::read( const char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::istream >::read( pimpl_, buf, size, do_accept ); }
+std::size_t iserver::read( char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::istream >::read( pimpl_, buf, size, do_accept ); }
 
 std::string iserver::readline( bool do_accept ) { return io::impl::server< io::istream >::readline( pimpl_, do_accept ); }
 
diff --git a/io/server.h b/io/server.h
index e75cca85f..50accc1eb 100644
--- a/io/server.h
+++ b/io/server.h
@@ -100,10 +100,14 @@ struct iserver: public io::server< io::istream >
     /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
     iserver( const std::string& name, comma::io::mode::value mode, bool blocking = false ): io::server< io::istream >( name, mode, blocking ) {}
 
-    /// @todo usage semantics!
-    std::size_t read( const char* buf, std::size_t size, bool do_accept = true );
-
-    /// @todo usage semantics!
+    /// read <size> bytes to <buf> from first available client
+    /// return 0 if no clients have data
+    /// start from the next client on the next read to assure round-robin behaviour
+    std::size_t read( char* buf, std::size_t size, bool do_accept = true );
+
+    /// read eol-terminated string from first available client
+    /// return 0 if no clients have data
+    /// start from the next client on the next read to assure round-robin behaviour
     std::string readline( bool do_accept = true );
 };
 

From a152e386e585347f14ee663fd36fbef3efb90be5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 1 Oct 2024 10:02:04 +1000
Subject: [PATCH 0937/1056] io::iserver: in progress...

---
 io/impl/server.cpp | 83 ++++++++++++++++++++++++----------------------
 io/impl/server.h   | 19 +++++++----
 2 files changed, 55 insertions(+), 47 deletions(-)

diff --git a/io/impl/server.cpp b/io/impl/server.cpp
index 0856869a7..f665a858e 100644
--- a/io/impl/server.cpp
+++ b/io/impl/server.cpp
@@ -44,7 +44,7 @@ template <> struct stream_traits< io::iostream >
 template < typename Stream > class file_acceptor : public acceptor< Stream >
 {
     public:
-        file_acceptor( const std::string& name, io::mode::value mode ): name_( name ), mode_( mode ), closed_( true ), fd_( io::invalid_file_descriptor ) {}
+        file_acceptor( const std::string& name, io::mode::value mode ): name_( name ), mode_( mode ), fd_( io::invalid_file_descriptor ) { this->_closed = true; }
 
         ~file_acceptor()
         {
@@ -57,25 +57,26 @@ template < typename Stream > class file_acceptor : public acceptor< Stream >
 
         Stream* accept( boost::posix_time::time_duration )
         {
-            if( !closed_ ) { return NULL; }
+            if( !this->_closed ) { return nullptr; }
 #ifndef WIN32
             fd_ = ::open( &name_[0], O_WRONLY | O_CREAT | O_NONBLOCK, S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH ); // quick and dirty
 #else
             fd_ = _open( &name_[0], O_WRONLY | _O_CREAT, _S_IWRITE );
 #endif
             if( fd_ == io::invalid_file_descriptor ) { return nullptr; }
-            closed_ = false;
+            this->_closed = false;
             return new Stream( name_, mode_, io::mode::non_blocking ); // quick and dirty
         }
 
-        void notify_closed() { closed_ = true; ::close( fd_ ); }
+        void notify_closed() { this->_closed = true; ::close( fd_ ); }
         
         io::file_descriptor fd() const { return fd_; }
 
+        bool closed() const { COMMA_THROW( comma::exception, "todo" ); }
+
     private:
         const std::string name_;
         const io::mode::value mode_;
-        bool closed_{false};
         io::file_descriptor fd_{0}; // todo: make io::istream, io::ostream non-throwing on construction
 };
 
@@ -152,7 +153,7 @@ template < typename Stream, typename S > class socket_acceptor : public acceptor
 #endif
         }
 
-        void close() { _acceptor.close(); }
+        void close() { this->_closed = true; _acceptor.close(); }
 
 #ifndef WIN32
 #if (BOOST_VERSION >= 106600)
@@ -164,6 +165,8 @@ template < typename Stream, typename S > class socket_acceptor : public acceptor
         io::file_descriptor fd() const { return io::invalid_file_descriptor; }
 #endif
 
+        bool closed() const { COMMA_THROW( comma::exception, "todo" ); }
+
     private:
         io::mode::value mode_{io::mode::binary};
         io::select select_;
@@ -179,21 +182,23 @@ template < typename Stream >
 class zero_acceptor_ : public acceptor< Stream >
 {
     public:
-        zero_acceptor_( const std::string& name, io::mode::value mode ): stream_( new Stream( name, mode ) ), accepted_( false ) {}
+        zero_acceptor_( const std::string& name, io::mode::value mode ): _stream( new Stream( name, mode ) ), accepted_( false ) {}
 
         Stream* accept( boost::posix_time::time_duration )
         {
             if( accepted_ ) { return nullptr; }
             accepted_ = true;
-            return stream_;
+            return _stream;
         }
 
-        void close() { stream_->close(); }
+        void close() { this->_closed = true; _stream->close(); }
         
         io::file_descriptor fd() const { return io::invalid_file_descriptor; } // quick and dirty
 
+        bool closed() const { return this->_closed || _stream.eof(); }
+
     private:
-        Stream* stream_{nullptr};
+        Stream* _stream{nullptr};
         bool accepted_{false};
 };
 
@@ -307,37 +312,35 @@ template < typename Stream > void server< Stream >::_remove_bad()
 
 template < typename Stream > unsigned int server< Stream >::read( server< io::istream >* s, char* buf, std::size_t size, bool do_accept )
 {
-    if( do_accept ) { s->accept(); }
-
-
-    // todo: if blocking, read in the loop
-
-
-    if( s->blocking_ ) { s->select_.wait( boost::posix_time::milliseconds( 100 ) ); } else { s->select_.check(); } // todo? pass timeout as a parameter?
-
-    auto j = s->streams_.begin();
-    for( ; j != s->streams_.end() && ( *j )->fd() != s->_last_read; ++j );
-    if( j == s->streams_.end() ) { j = s->streams_.begin(); s->_last_read = io::invalid_file_descriptor; }
-    for( auto i = j; i != s->streams_.end(); )
+    while( !s->_acceptor->closed() )
     {
-        auto it = i++;
-        if( !s->blocking_ && !s->select_.read().ready( **it ) ) { continue; }
-        ( **it )->read( buf, size );
-        if( ( **it )->gcount() < int( size ) ) { continue; } // quick and dirty
-        s->_remove_bad();
-        s->_last_read = ( *it )->fd();
-        return size;
-    }
-    auto e = j == s->streams_.end() ? j : ++j;
-    for( auto i = s->streams_.begin(); i != e; ) // todo: remove code duplication: combine with the previous loop
-    {
-        auto it = i++;
-        if( !s->blocking_ && !s->select_.read().ready( **it ) ) { continue; }
-        ( **it )->read( buf, size );
-        if( ( **it )->gcount() < int( size ) ) { continue; } // quick and dirty
-        s->_remove_bad();
-        s->_last_read = ( *it )->fd();
-        return size;
+        if( do_accept ) { s->accept(); }
+        if( s->blocking_ ) { s->select_.wait( boost::posix_time::milliseconds( 100 ) ); } // todo? pass timeout as a parameter?
+        auto j = s->streams_.begin();
+        for( ; j != s->streams_.end() && ( *j )->fd() != s->_last_read; ++j );
+        if( j == s->streams_.end() ) { j = s->streams_.begin(); s->_last_read = io::invalid_file_descriptor; }
+        for( auto i = j; i != s->streams_.end(); )
+        {
+            auto it = i++;
+            if( !s->blocking_ && !s->select_.read().ready( **it ) ) { continue; }
+            ( **it )->read( buf, size );
+            if( ( **it )->gcount() < int( size ) ) { continue; } // quick and dirty
+            s->_remove_bad();
+            s->_last_read = ( *it )->fd();
+            return size;
+        }
+        auto e = j == s->streams_.end() ? j : ++j;
+        for( auto i = s->streams_.begin(); i != e; ) // todo: remove code duplication: combine with the previous loop
+        {
+            auto it = i++;
+            if( !s->blocking_ && !s->select_.read().ready( **it ) ) { continue; }
+            ( **it )->read( buf, size );
+            if( ( **it )->gcount() < int( size ) ) { continue; } // quick and dirty
+            s->_remove_bad();
+            s->_last_read = ( *it )->fd();
+            return size;
+        }
+        if( !s->blocking_ ) { return 0; }
     }
     return 0;
 }
diff --git a/io/impl/server.h b/io/impl/server.h
index bbd7aa039..ad845cfb9 100644
--- a/io/impl/server.h
+++ b/io/impl/server.h
@@ -21,15 +21,20 @@ template < typename Stream > class server;
 namespace comma { namespace io { namespace impl {
 
 template < typename Stream >
-struct acceptor
+class acceptor
 {
-    typedef Stream stream_type;
+    public:
+        typedef Stream stream_type;
 
-    virtual ~acceptor() {}
-    virtual io::file_descriptor fd() const = 0;
-    virtual Stream* accept( boost::posix_time::time_duration timeout = boost::posix_time::seconds( 0 ) ) = 0;
-    virtual void notify_closed() {} // quick and dirty
-    virtual void close() {}
+        virtual ~acceptor() {}
+        virtual io::file_descriptor fd() const = 0;
+        virtual Stream* accept( boost::posix_time::time_duration timeout = boost::posix_time::seconds( 0 ) ) = 0;
+        virtual void notify_closed() {} // quick and dirty
+        virtual void close() { _closed = true; }
+        bool closed() const { return _closed; }
+        
+    protected:
+        bool _closed{false};
 };
 
 template < typename Stream >

From 730a6d0c92f8bc434be63d2ce22003b1aca59b23 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 2 Oct 2024 11:01:53 +1000
Subject: [PATCH 0938/1056] io::impl::receive class added

---
 io/impl/publish.cpp | 122 ++++++++++++++++++++++++++++----------------
 io/impl/publish.h   |  63 ++++++++++++++++-------
 2 files changed, 123 insertions(+), 62 deletions(-)

diff --git a/io/impl/publish.cpp b/io/impl/publish.cpp
index 0a91ff4fc..edb54f804 100644
--- a/io/impl/publish.cpp
+++ b/io/impl/publish.cpp
@@ -7,13 +7,13 @@
 
 namespace comma { namespace io { namespace impl {
 
-publish::publish( const std::vector< std::string >& endpoints
-                , unsigned int packet_size
-                , bool discard
-                , bool flush
-                , bool output_number_of_clients
-                , bool update_no_clients
-                , unsigned int cache_size )
+multiserver::multiserver( const std::vector< std::string >& endpoints
+                        , unsigned int packet_size
+                        , bool discard
+                        , bool flush
+                        , bool output_number_of_clients
+                        , bool update_no_clients
+                        , unsigned int cache_size )
     : discard_( discard )
     , flush_( flush )
     , buffer_( packet_size, '\0' )
@@ -49,7 +49,7 @@ publish::publish( const std::vector< std::string >& endpoints
     acceptor_thread_.reset( new boost::thread( boost::bind( &publish::accept_, boost::ref( *this ))));
 }
         
-publish::~publish()
+multiserver::~multiserver()
 {
     is_shutdown_ = true;
     acceptor_thread_->join();
@@ -57,47 +57,14 @@ publish::~publish()
     for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } }
 }
         
-void publish::disconnect_all()
+void multiserver::disconnect_all()
 {
     transaction_t t( publishers_ );
     for( auto& p: *t ) { if( p ) { p->disconnect_all(); } }
     handle_sizes_( t ); // quick and dirty
 }
 
-bool publish::write( const std::string& s )
-{
-    transaction_t t( publishers_ );
-    if( cache_size_ > 0 )
-    {
-        cache_.push_back( s );
-        if( cache_.size() > cache_size_ ) { cache_.pop_front(); }
-    }
-    for( auto& p: *t ) { if( p ) { p->write( &s[0], s.size(), false ); } } // for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
-    return handle_sizes_( t );
-}
-
-bool publish::write( const char* buf, unsigned int size )
-{
-    return write( std::string( buf, size ) ); // todo: quick and dirty, watch performance
-}
-
-bool publish::read( std::istream& input )
-{
-    if( is_binary_() )
-    {
-        input.read( &buffer_[0], buffer_.size() );
-        if( input.gcount() < int( buffer_.size() ) || !input.good() ) { return false; }
-    }
-    else
-    {
-        std::getline( input, buffer_ );
-        buffer_ += '\n';
-        if( !input.good() ) { return false; }
-    }
-    return write( buffer_ );
-}
-
-bool publish::handle_sizes_( transaction_t& t ) // todo? why pass transaction? it doen not seem going out of scope at the point of call; remove?
+bool multiserver::handle_sizes_( transaction_t& t ) // todo? why pass transaction? it doen not seem going out of scope at the point of call; remove?
 {
     if( !output_number_of_clients_ && !update_no_clients_ ) { return true; }
     unsigned int total = 0;
@@ -128,7 +95,7 @@ bool publish::handle_sizes_( transaction_t& t ) // todo? why pass transaction? i
     return true;
 }
 
-void publish::accept_()
+void multiserver::accept_()
 {
     comma::io::select select;
     {
@@ -181,4 +148,71 @@ void publish::accept_()
     }
 }
 
+publish::publish( const std::vector< std::string >& endpoints
+                , unsigned int packet_size
+                , bool discard
+                , bool flush
+                , bool output_number_of_clients
+                , bool update_no_clients
+                , unsigned int cache_size )
+    : multiserver( endpoints
+                , packet_size
+                , discard
+                , flush
+                , output_number_of_clients
+                , update_no_clients
+                , cache_size )
+{
+}
+
+bool publish::write( const std::string& s )
+{
+    transaction_t t( publishers_ );
+    if( cache_size_ > 0 )
+    {
+        cache_.push_back( s );
+        if( cache_.size() > cache_size_ ) { cache_.pop_front(); }
+    }
+    for( auto& p: *t ) { if( p ) { p->write( &s[0], s.size(), false ); } } // for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
+    return handle_sizes_( t );
+}
+
+bool publish::write( const char* buf, unsigned int size )
+{
+    return write( std::string( buf, size ) ); // todo: quick and dirty, watch performance
+}
+
+bool publish::read( std::istream& input )
+{
+    if( is_binary_() )
+    {
+        input.read( &buffer_[0], buffer_.size() );
+        if( input.gcount() < int( buffer_.size() ) || !input.good() ) { return false; }
+    }
+    else
+    {
+        std::getline( input, buffer_ );
+        buffer_ += '\n';
+        if( !input.good() ) { return false; }
+    }
+    return write( buffer_ );
+}
+
+receive::receive( const std::vector< std::string >& endpoints
+                , unsigned int packet_size
+                , bool discard
+                , bool flush
+                , bool output_number_of_clients
+                , bool update_no_clients
+                , unsigned int cache_size )
+    : multiserver( endpoints
+                , packet_size
+                , discard
+                , flush
+                , output_number_of_clients
+                , update_no_clients
+                , cache_size )
+{
+}
+
 } } } // namespace comma { namespace io { namespace impl {
diff --git a/io/impl/publish.h b/io/impl/publish.h
index e71a5382e..193cbb84b 100644
--- a/io/impl/publish.h
+++ b/io/impl/publish.h
@@ -14,7 +14,6 @@
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/iostreams/device/file_descriptor.hpp>
 #include <boost/iostreams/stream.hpp>
-#include <boost/scoped_ptr.hpp>
 #include <boost/thread.hpp>
 #include "../../io/file_descriptor.h"
 #include "../../io/server.h"
@@ -23,7 +22,7 @@
 
 namespace comma { namespace io { namespace impl {
 
-class publish
+class multiserver
 {
     public:
         typedef comma::synchronized< std::vector< std::unique_ptr< comma::io::oserver > > > publishers_t;
@@ -37,27 +36,21 @@ class publish
             endpoint( const std::string& address = "", bool secondary = false ): address( address ), secondary( secondary ) {}
         };
         
-        publish( const std::vector< std::string >& endpoints
-               , unsigned int packet_size
-               , bool discard
-               , bool flush
-               , bool output_number_of_clients
-               , bool update_no_clients
-               , unsigned int cache_size );
+        multiserver( const std::vector< std::string >& endpoints
+                   , unsigned int packet_size
+                   , bool discard
+                   , bool flush
+                   , bool output_number_of_clients
+                   , bool update_no_clients
+                   , unsigned int cache_size );
         
-        ~publish();
+        ~multiserver();
         
         void disconnect_all();
         
-        bool read( std::istream& input );
-
-        bool write( const std::string& s );
-
-        bool write( const char* buf, unsigned int size );
-        
         unsigned int num_clients() const { return num_clients_; }
 
-    private:
+    protected:
         std::vector< endpoint > endpoints_;
         bool discard_;
         bool flush_;
@@ -71,7 +64,7 @@ class publish
         std::vector< unsigned int > sizes_;
         bool has_primary_clients_;
         unsigned int num_clients_;
-        boost::scoped_ptr< boost::thread > acceptor_thread_;
+        std::unique_ptr< boost::thread > acceptor_thread_;
         bool is_shutdown_;
         std::deque< std::string > cache_;
 
@@ -80,4 +73,38 @@ class publish
         void accept_();
 };
 
+struct publish : public multiserver
+{
+    publish( const std::vector< std::string >& endpoints
+            , unsigned int packet_size
+            , bool discard
+            , bool flush
+            , bool output_number_of_clients
+            , bool update_no_clients
+            , unsigned int cache_size );
+    
+    bool read( std::istream& input );
+
+    bool write( const std::string& s );
+
+    bool write( const char* buf, unsigned int size );
+};
+
+struct receive : public multiserver
+{
+    receive( const std::vector< std::string >& endpoints
+            , unsigned int packet_size
+            , bool discard
+            , bool flush
+            , bool output_number_of_clients
+            , bool update_no_clients
+            , unsigned int cache_size );
+    
+    // bool read( std::istream& input );
+
+    // bool write( const std::string& s );
+
+    // bool write( const char* buf, unsigned int size );
+};
+
 } } } // namespace comma { namespace io { namespace impl {

From 1c7ffd1f1eafbccd164ac4ce42569eb1e0b6fe34 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 2 Oct 2024 12:21:59 +1000
Subject: [PATCH 0939/1056] io::impl::receive: in progress...

---
 io/impl/publish.cpp | 124 +++++++++++++++++++++++++++++++-------------
 io/impl/publish.h   |  29 +++++------
 2 files changed, 102 insertions(+), 51 deletions(-)

diff --git a/io/impl/publish.cpp b/io/impl/publish.cpp
index edb54f804..5b1f7cb86 100644
--- a/io/impl/publish.cpp
+++ b/io/impl/publish.cpp
@@ -7,13 +7,30 @@
 
 namespace comma { namespace io { namespace impl {
 
-multiserver::multiserver( const std::vector< std::string >& endpoints
-                        , unsigned int packet_size
-                        , bool discard
-                        , bool flush
-                        , bool output_number_of_clients
-                        , bool update_no_clients
-                        , unsigned int cache_size )
+template < typename S > struct server_traits; // quick and dirty
+
+template <> struct server_traits< io::iserver > // quick and dirty
+{
+    static io::iserver* make( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) { return new io::iserver( name, mode, blocking ); }
+    template < typename T > static void write( T&, const char*, unsigned int ) {} 
+    template < typename T > static void flush( T& ) {}
+};
+
+template <> struct server_traits< io::oserver > // quick and dirty
+{
+    static io::oserver* make( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) { return new io::oserver( name, mode, blocking, flush ); }
+    template < typename T > static void write( T& s, const char* buf, unsigned int size ) { s.write( buf, size ); }
+    template < typename T > static void flush( T& s ) { s.flush(); }
+};
+
+template < typename Server >
+multiserver< Server >::multiserver( const std::vector< std::string >& endpoints
+                                  , unsigned int packet_size
+                                  , bool discard
+                                  , bool flush
+                                  , bool output_number_of_clients
+                                  , bool update_no_clients
+                                  , unsigned int cache_size )
     : discard_( discard )
     , flush_( flush )
     , buffer_( packet_size, '\0' )
@@ -44,27 +61,30 @@ multiserver::multiserver( const std::vector< std::string >& endpoints
     t->resize( endpoints.size() );
     for( std::size_t i = 0; i < endpoints.size(); ++i )
     {
-        if( !endpoints_[i].secondary ) { ( *t )[i].reset( new comma::io::oserver( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
+        if( !endpoints_[i].secondary ) { ( *t )[i].reset( server_traits< Server >::make( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
     }
-    acceptor_thread_.reset( new boost::thread( boost::bind( &publish::accept_, boost::ref( *this ))));
+    acceptor_thread_.reset( new boost::thread( boost::bind( &multiserver< Server >::accept_, boost::ref( *this ))));
 }
-        
-multiserver::~multiserver()
+
+template < typename Server >
+multiserver< Server >::~multiserver()
 {
     is_shutdown_ = true;
     acceptor_thread_->join();
     transaction_t t( publishers_ );
     for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } }
 }
-        
-void multiserver::disconnect_all()
+
+template < typename Server >
+void multiserver< Server >::disconnect_all()
 {
     transaction_t t( publishers_ );
     for( auto& p: *t ) { if( p ) { p->disconnect_all(); } }
     handle_sizes_( t ); // quick and dirty
 }
 
-bool multiserver::handle_sizes_( transaction_t& t ) // todo? why pass transaction? it doen not seem going out of scope at the point of call; remove?
+template < typename Server >
+bool multiserver< Server >::handle_sizes_( typename multiserver< Server >::transaction_t& t ) // todo? why pass transaction? it doen not seem going out of scope at the point of call; remove?
 {
     if( !output_number_of_clients_ && !update_no_clients_ ) { return true; }
     unsigned int total = 0;
@@ -95,7 +115,8 @@ bool multiserver::handle_sizes_( transaction_t& t ) // todo? why pass transactio
     return true;
 }
 
-void multiserver::accept_()
+template < typename Server >
+void multiserver< Server >::accept_()
 {
     comma::io::select select;
     {
@@ -120,8 +141,8 @@ void multiserver::accept_()
                 {
                     for( auto& s: streams )
                     {
-                        for( const auto& c: cache_ ) { ( *s )->write( &c[0], c.size() ); }
-                        if( flush_ ) { ( *s )->flush(); }
+                        for( const auto& c: cache_ ) { server_traits< Server >::write( **s, &c[0], c.size() ); }
+                        if( flush_ ) { server_traits< Server >::flush( **s ); }
                     }
                 }
             }
@@ -132,7 +153,7 @@ void multiserver::accept_()
             for( unsigned int i = 0; i < t->size(); ++i )
             {
                 if( !endpoints_[i].secondary || ( *t )[i] ) { continue; }
-                ( *t )[i].reset( new comma::io::oserver( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard_, flush_ ) );
+                ( *t )[i].reset( server_traits< Server >::make( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard_, flush_ ) );
                 if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
             }
         }
@@ -155,13 +176,13 @@ publish::publish( const std::vector< std::string >& endpoints
                 , bool output_number_of_clients
                 , bool update_no_clients
                 , unsigned int cache_size )
-    : multiserver( endpoints
-                , packet_size
-                , discard
-                , flush
-                , output_number_of_clients
-                , update_no_clients
-                , cache_size )
+    : multiserver< comma::io::oserver >( endpoints
+                                       , packet_size
+                                       , discard
+                                       , flush
+                                       , output_number_of_clients
+                                       , update_no_clients
+                                       , cache_size )
 {
 }
 
@@ -198,21 +219,52 @@ bool publish::read( std::istream& input )
     return write( buffer_ );
 }
 
-receive::receive( const std::vector< std::string >& endpoints
+receive::receive( const std::string& endpoint
                 , unsigned int packet_size
-                , bool discard
                 , bool flush
                 , bool output_number_of_clients
-                , bool update_no_clients
-                , unsigned int cache_size )
-    : multiserver( endpoints
-                , packet_size
-                , discard
-                , flush
-                , output_number_of_clients
-                , update_no_clients
-                , cache_size )
+                , bool update_no_clients )
+    : multiserver< comma::io::iserver >( std::vector< std::string >( 1, endpoint )
+                                       , packet_size
+                                       , false
+                                       , flush
+                                       , output_number_of_clients
+                                       , update_no_clients
+                                       , 0 )
+{
+}
+
+bool receive::read( char* buf, unsigned int size )
+{
+    transaction_t t( publishers_ );
+    auto count = ( *t )[0]->read( buf, size );
+    return handle_sizes_( t ) || count != size;
+}
+
+bool receive::readline( std::string& line ) // quick and dirty
 {
+    transaction_t t( publishers_ );
+    line = ( *t )[0]->readline();
+    return handle_sizes_( t );
 }
 
+bool receive::write( std::ostream& output )
+{
+    if( is_binary_() )
+    {
+        if( read( &buffer_[0], buffer_.size() ) != buffer_.size() ) { return false; }
+    }
+    else
+    {
+        if( !readline( buffer_ ) ) { return false; }
+        buffer_ += '\n';
+    }
+    output.write( &buffer_[0], buffer_.size() );
+    if( flush_ ) { output.flush(); }
+    return output.good();
+}
+
+template class multiserver< io::iserver >;
+template class multiserver< io::oserver >;
+
 } } } // namespace comma { namespace io { namespace impl {
diff --git a/io/impl/publish.h b/io/impl/publish.h
index 193cbb84b..059343b6c 100644
--- a/io/impl/publish.h
+++ b/io/impl/publish.h
@@ -22,12 +22,13 @@
 
 namespace comma { namespace io { namespace impl {
 
+template < typename Server >
 class multiserver
 {
     public:
-        typedef comma::synchronized< std::vector< std::unique_ptr< comma::io::oserver > > > publishers_t;
+        typedef comma::synchronized< std::vector< std::unique_ptr< Server > > > publishers_t;
         
-        typedef publishers_t::scoped_transaction transaction_t;
+        typedef typename publishers_t::scoped_transaction transaction_t;
         
         struct endpoint
         {
@@ -73,7 +74,7 @@ class multiserver
         void accept_();
 };
 
-struct publish : public multiserver
+struct publish : public multiserver< comma::io::oserver >
 {
     publish( const std::vector< std::string >& endpoints
             , unsigned int packet_size
@@ -90,21 +91,19 @@ struct publish : public multiserver
     bool write( const char* buf, unsigned int size );
 };
 
-struct receive : public multiserver
+class receive : public multiserver< comma::io::iserver >
 {
-    receive( const std::vector< std::string >& endpoints
-            , unsigned int packet_size
-            , bool discard
-            , bool flush
-            , bool output_number_of_clients
-            , bool update_no_clients
-            , unsigned int cache_size );
-    
-    // bool read( std::istream& input );
+    receive( const std::string& endpoint
+           , unsigned int packet_size
+           , bool flush
+           , bool output_number_of_clients
+           , bool update_no_clients );
+
+    bool read( char* buf, unsigned int size );
 
-    // bool write( const std::string& s );
+    bool readline( std::string& line );
 
-    // bool write( const char* buf, unsigned int size );
+    bool write( std::ostream& output );
 };
 
 } } } // namespace comma { namespace io { namespace impl {

From 7a9be8c4140169cd44edda75ef61c6d93d0ffb3b Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 2 Oct 2024 12:32:43 +1000
Subject: [PATCH 0940/1056] io-cat: tcp server: in progress...

---
 io/applications/io-cat.cpp | 81 ++++++++++++++++++++++++++++++++++++--
 1 file changed, 78 insertions(+), 3 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index f74631af7..dc9761d02 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -44,8 +44,9 @@
 #include "../../application/signal_flag.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
-#include "../../io/stream.h"
 #include "../../io/select.h"
+#include "../../io/server.h"
+#include "../../io/stream.h"
 #include "../../string/string.h"
 
 void usage( bool verbose = false )
@@ -58,6 +59,7 @@ usage: io-cat <address> [<address>] ... [<options>]
 <address>
     local:<path>: local socket
     tcp:<host>:<port>: tcp socket
+    tcp:<port>: tcp server socket (only partly implemented)
     udp:<port>: udp socket
     zmp-<protocol>:<address>: zmq (todo)
     <filename>: file
@@ -123,7 +125,6 @@ connect options
 supported address types: tcp, udp, local (unix) sockets, named pipes, files, zmq (todo)
     
 examples
-    
     single stream
         io-cat tcp:localhost:12345
         io-cat udp:12345
@@ -133,7 +134,6 @@ examples
         io-cat zmq-local:/tmp/socket (not implemented)
         io-cat zmq-tcp:localhost:12345 (not implemented)
         echo hello | io-cat -
-    
     multiple streams
         merge line-based input
             io-cat tcp:localhost:55555 tcp:localhost:88888
@@ -284,10 +284,85 @@ class client_stream : public stream
         }
 };
 
+class server_stream : public stream
+{
+    public:
+        server_stream( const std::string& address, unsigned int size, bool binary ): stream( address ), size_( size ), binary_( binary ), closed_( false ) {}
+        
+        comma::io::file_descriptor fd() const { return ( *istream_ ).fd(); }
+        
+        unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking )
+        {
+            ( void )buffer, ( void )max_count, ( void )blocking;
+            COMMA_THROW( comma::exception, "todo" );
+
+            // std::size_t available = available_();
+            // if( !blocking && available == 0 ) { return 0; }
+            // if( binary_ )
+            // {
+            //     unsigned int count = size_ ? available / size_ : 0;
+            //     if( max_count && count > max_count ) { count = max_count; }
+            //     if( count == 0 ) { count = 1; } // read at least one packet
+            //     unsigned int size = size_ ? count * size_ : std::min( available, buffer.size() );
+            //     ( *istream_ )->read( &buffer[0], size );
+            //     return ( *istream_ )->gcount() <= 0 ? 0 : ( *istream_ )->gcount();
+            // }
+            // else
+            // {
+            //     std::string line; // quick and dirty, no-one expects ascii to be fast
+            //     std::getline( *( *istream_ ), line );
+            //     if( line.empty() ) { return 0; }
+            //     if( line.size() >= buffer.size() ) { buffer.resize( line.size() + 1 ); }
+            //     ::memcpy( &buffer[0], &line[0], line.size() );
+            //     buffer[ line.size() ] = '\n';
+            //     return line.size() + 1;
+            // }
+        }
+        
+        bool empty() const { COMMA_THROW( comma::exception, "todo" ); } // { return !connected() || closed_ || available_() == 0; }
+        
+        bool eof() const { COMMA_THROW( comma::exception, "todo" ); } // { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
+        
+        void close() { COMMA_THROW( comma::exception, "todo" ); } // { closed_ = true; ( *istream_ ).close(); }
+        
+        bool closed() const { return closed_; }
+        
+        bool connected() const { COMMA_THROW( comma::exception, "todo" ); } // { return bool( istream_ ); }
+        
+        void connect()
+        {
+            { COMMA_THROW( comma::exception, "todo" ); }
+            // if( istream_ ) { return; }
+            // auto blocking_mode = false ? comma::io::mode::non_blocking : comma::io::mode::blocking; // todo? expose on command line?
+            // istream_.reset( new comma::io::istream( address_, comma::io::mode::binary, blocking_mode ) );
+            // if( ( *istream_ )() != &std::cin ) { return; }
+            // std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
+            // std::cin.tie( NULL ); // std::cin is tied to std::cout by default
+        }
+        
+    private:
+        boost::scoped_ptr< comma::io::istream > istream_;
+        unsigned int size_;
+        bool binary_;
+        bool closed_;
+        
+        std::size_t available_() const // seriously quick and dirty
+        {
+            { COMMA_THROW( comma::exception, "todo" ); }
+            // if( ( *istream_ )() == NULL ) { return ( *istream_ ).available_on_file_descriptor(); } // quick and dirty
+            // std::streamsize s = ( *istream_ )->rdbuf()->in_avail();
+            // if( s < 0 ) { return 0; }
+            // // todo: it should be s + available_on_file_descriptor(), but it won't work for std::cin (and potentially for std::ifstream (we have not checked)
+            // //       if performance becomes a problem e.g. for tcp, check whether the stream is not std::cin and use sum instead of max
+            // return std::max( static_cast< std::size_t >( s ), ( *istream_ ).available_on_file_descriptor() );
+        }
+};
+
 static stream* make_stream( const std::string& address, unsigned int size, bool binary )
 {
     const std::vector< std::string >& v = comma::split( address, ':' );
     if( v[0] == "udp" ) { return new udp_stream( address ); }
+    if( v[0] == "tcp" && v.size() == 2 ) { return new server_stream( address, size, binary ); } // todo: quick and dirty for now; a better check if tcp:<port>-like
     COMMA_ASSERT_BRIEF( v[0] != "zmq-local" && v[0] != "zero-local" && v[0] != "zmq-tcp" && v[0] != "zero-tcp", "zmq support not implemented" );
     return new client_stream( address, size, binary );
 }

From d821386bc25d1274b2a8e84e91baa20f3a93a5f5 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 2 Oct 2024 13:21:27 +1000
Subject: [PATCH 0941/1056] io-cat: tcp server: in progress...

---
 io/applications/io-cat.cpp | 36 +++++++++++++++++-------------------
 io/impl/server.cpp         | 12 ++++++++++++
 io/impl/server.h           |  2 ++
 io/server.cpp              |  2 ++
 io/server.h                |  2 ++
 5 files changed, 35 insertions(+), 19 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index dc9761d02..3d557811b 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -287,13 +287,20 @@ class client_stream : public stream
 class server_stream : public stream
 {
     public:
-        server_stream( const std::string& address, unsigned int size, bool binary ): stream( address ), size_( size ), binary_( binary ), closed_( false ) {}
+        server_stream( const std::string& address, unsigned int size, bool binary )
+            : stream( address )
+            , _size( size )
+            , _binary( binary )
+            , _server( address, binary ? comma::io::mode::binary : comma::io::mode::ascii, true ) // todo: always blocking for now
+        {
+        }
         
-        comma::io::file_descriptor fd() const { return ( *istream_ ).fd(); }
+        comma::io::file_descriptor fd() const { COMMA_THROW( comma::exception, "todo" ); }
         
         unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking )
         {
             ( void )buffer, ( void )max_count, ( void )blocking;
+            
             COMMA_THROW( comma::exception, "todo" );
 
             // std::size_t available = available_();
@@ -323,28 +330,19 @@ class server_stream : public stream
         
         bool eof() const { COMMA_THROW( comma::exception, "todo" ); } // { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
         
-        void close() { COMMA_THROW( comma::exception, "todo" ); } // { closed_ = true; ( *istream_ ).close(); }
+        void close() { _closed = true; _server.close(); }
         
-        bool closed() const { return closed_; }
+        bool closed() const { return _closed; }
         
-        bool connected() const { COMMA_THROW( comma::exception, "todo" ); } // { return bool( istream_ ); }
+        bool connected() const { return true; }
         
-        void connect()
-        {
-            { COMMA_THROW( comma::exception, "todo" ); }
-            // if( istream_ ) { return; }
-            // auto blocking_mode = false ? comma::io::mode::non_blocking : comma::io::mode::blocking; // todo? expose on command line?
-            // istream_.reset( new comma::io::istream( address_, comma::io::mode::binary, blocking_mode ) );
-            // if( ( *istream_ )() != &std::cin ) { return; }
-            // std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
-            // std::cin.tie( NULL ); // std::cin is tied to std::cout by default
-        }
+        void connect() {}
         
     private:
-        boost::scoped_ptr< comma::io::istream > istream_;
-        unsigned int size_;
-        bool binary_;
-        bool closed_;
+        unsigned int _size{0};
+        bool _binary{false};
+        bool _closed{false};
+        comma::io::iserver _server;
         
         std::size_t available_() const // seriously quick and dirty
         {
diff --git a/io/impl/server.cpp b/io/impl/server.cpp
index f665a858e..bef4ffc4c 100644
--- a/io/impl/server.cpp
+++ b/io/impl/server.cpp
@@ -350,6 +350,18 @@ template < typename Stream > std::string server< Stream >::readline( server< io:
     COMMA_THROW( comma::exception, "todo..." );
 }
 
+
+template < typename Stream > std::size_t server< Stream >::max_available( const server< io::istream >* s )
+{
+    std::size_t a = 0;
+    for( const auto& t: s->streams_ )
+    {
+        auto n = ( *t )->rdbuf()->in_avail();
+        if( n > int( a ) ) { a = n; }
+    }
+    return a;
+}
+
 template struct acceptor< io::istream >;
 template struct acceptor< io::ostream >;
 // todo: template struct acceptor< io::iostream >;
diff --git a/io/impl/server.h b/io/impl/server.h
index ad845cfb9..e4e4c2f10 100644
--- a/io/impl/server.h
+++ b/io/impl/server.h
@@ -78,6 +78,8 @@ class server
 
         static std::string readline( server< io::istream >* s, bool do_accept = true );
 
+        static std::size_t max_available( const server< io::istream >* s );
+
     protected:
         template < typename > friend class comma::io::server;
         template < typename > friend class comma::io::impl::server;
diff --git a/io/server.cpp b/io/server.cpp
index 9d05c7164..a703e60a4 100644
--- a/io/server.cpp
+++ b/io/server.cpp
@@ -54,6 +54,8 @@ std::size_t iserver::read( char* buf, std::size_t size, bool do_accept ) { retur
 
 std::string iserver::readline( bool do_accept ) { return io::impl::server< io::istream >::readline( pimpl_, do_accept ); }
 
+std::size_t iserver::max_available() const { return io::impl::server< io::istream >::max_available( pimpl_ ); }
+
 template class server< io::istream >;
 template class server< io::ostream >;
 // todo: template class server< io::iostream >;
diff --git a/io/server.h b/io/server.h
index 50accc1eb..c35bc63dc 100644
--- a/io/server.h
+++ b/io/server.h
@@ -109,6 +109,8 @@ struct iserver: public io::server< io::istream >
     /// return 0 if no clients have data
     /// start from the next client on the next read to assure round-robin behaviour
     std::string readline( bool do_accept = true );
+
+    std::size_t max_available() const;
 };
 
 // struct ioserver: public io::server< io::iostream >

From f958380b1e6a4ea8c05d958e35f8d770cb576105 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 2 Oct 2024 17:30:37 +1000
Subject: [PATCH 0942/1056] io-cat: tcp server: in progress...

---
 io/applications/io-cat.cpp | 48 ++++++++++++++++++++------------------
 1 file changed, 25 insertions(+), 23 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 3d557811b..6a5f8cd73 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -299,31 +299,33 @@ class server_stream : public stream
         
         unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking )
         {
-            ( void )buffer, ( void )max_count, ( void )blocking;
-            
-            COMMA_THROW( comma::exception, "todo" );
-
-            // std::size_t available = available_();
-            // if( !blocking && available == 0 ) { return 0; }
-            // if( binary_ )
-            // {
-            //     unsigned int count = size_ ? available / size_ : 0;
-            //     if( max_count && count > max_count ) { count = max_count; }
-            //     if( count == 0 ) { count = 1; } // read at least one packet
-            //     unsigned int size = size_ ? count * size_ : std::min( available, buffer.size() );
-            //     ( *istream_ )->read( &buffer[0], size );
-            //     return ( *istream_ )->gcount() <= 0 ? 0 : ( *istream_ )->gcount();
-            // }
-            // else
+            unsigned int total_count{0};
+            ( void )buffer; ( void )max_count; ( void )blocking; ( void )total_count;
+            // while( true )
             // {
-            //     std::string line; // quick and dirty, no-one expects ascii to be fast
-            //     std::getline( *( *istream_ ), line );
-            //     if( line.empty() ) { return 0; }
-            //     if( line.size() >= buffer.size() ) { buffer.resize( line.size() + 1 ); }
-            //     ::memcpy( &buffer[0], &line[0], line.size() );
-            //     buffer[ line.size() ] = '\n';
-            //     return line.size() + 1;
+            //     std::size_t available = _server.max_available();
+            //     if( !blocking && available == 0 ) { return 0; }
+            //     if( binary_ )
+            //     {
+            //         unsigned int count = size_ ? available / size_ : 0;
+            //         if( max_count && count > max_count ) { count = max_count; }
+            //         if( count == 0 ) { count = 1; } // read at least one packet
+            //         unsigned int size = size_ ? count * size_ : std::min( available, buffer.size() );
+            //         ( *istream_ )->read( &buffer[0], size );
+            //         return ( *istream_ )->gcount() <= 0 ? 0 : ( *istream_ )->gcount();
+            //     }
+            //     else
+            //     {
+            //         std::string line; // quick and dirty, no-one expects ascii to be fast
+            //         std::getline( *( *istream_ ), line );
+            //         if( line.empty() ) { return 0; }
+            //         if( line.size() >= buffer.size() ) { buffer.resize( line.size() + 1 ); }
+            //         ::memcpy( &buffer[0], &line[0], line.size() );
+            //         buffer[ line.size() ] = '\n';
+            //         return line.size() + 1;
+            //     }
             // }
+            return 0;
         }
         
         bool empty() const { COMMA_THROW( comma::exception, "todo" ); } // { return !connected() || closed_ || available_() == 0; }

From 9f98e2c9d93b5a3e87b753f6a211fb22286fb044 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 4 Oct 2024 17:42:23 +1000
Subject: [PATCH 0943/1056] csv-seek: --help: minor brush-up

---
 csv/applications/csv-seek.cpp | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
index 881c95932..916770d35 100644
--- a/csv/applications/csv-seek.cpp
+++ b/csv/applications/csv-seek.cpp
@@ -22,7 +22,7 @@ options
     --permissive:          permissive mode: output empty record on error
 
     --size,-s=<size>:      [todo] data is packets of fixed size, otherwise data is expected
-                           line-wise. Alternatively use --binary" << std::endl
+                           line-wise. Alternatively use --binary
 csv options
 )";
     std::cerr << comma::csv::options::usage( verbose ) << std::endl;
@@ -41,12 +41,12 @@ csv options
         colour hue (you would need snark installed with graphics and imaging enabled)
             make data file
                 ( csv-paste value=255 value=0 line-number --head 256; \
-                    csv-paste 'line-number;begin=255;step=-1' line-number value=255 --head 256; \
-                    csv-paste value=0 value=255 'line-number;begin=255;step=-1' --head 256; \
-                    csv-paste line-number value=255 value=0 --head 256; \
-                    csv-paste value=255 'line-number;begin=255;step=-1' value=0 --head 256 ) \
-                    | csv-to-bin 3ub \
-                    > colour-wheel.bin
+                  csv-paste 'line-number;begin=255;step=-1' line-number value=255 --head 256; \
+                  csv-paste value=0 value=255 'line-number;begin=255;step=-1' --head 256; \
+                  csv-paste line-number value=255 value=0 --head 256; \
+                  csv-paste value=255 'line-number;begin=255;step=-1' value=0 --head 256 ) \
+                      | csv-to-bin 3ub \
+                      > colour-wheel.bin
             sample colour hue
                 csv-sliders 'hue;min=0;max=1;step=0.0001' \
                             --frequency 10 \

From 9129c5ef4ebc7a034e55d0a90dbf51319f2caeb7 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 8 Oct 2024 11:32:05 +1100
Subject: [PATCH 0944/1056] csv::ascii::put(): tests for string-quoting added

---
 csv/test/ascii_test.cpp | 34 ++++++++++++++++++++++++++--------
 1 file changed, 26 insertions(+), 8 deletions(-)

diff --git a/csv/test/ascii_test.cpp b/csv/test/ascii_test.cpp
index cc87283b2..3a2e3e521 100644
--- a/csv/test/ascii_test.cpp
+++ b/csv/test/ascii_test.cpp
@@ -40,25 +40,23 @@ namespace comma { namespace csv { namespace ascii_test {
 
 struct nested
 {
-    int x;
-    int y;
-    nested() : x( 0 ), y( 0 ) {}
+    int x{0};
+    int y{0};
 };
 
 struct simple_struct
 {
-    int a;
-    double b;
-    char c;
+    int a{0};
+    double b{0};
+    char c{0};
     std::string s;
     boost::posix_time::ptime t;
     ascii_test::nested nested;
-    simple_struct() : a( 0 ), b( 0 ), c( 0 ) {}
 };
 
 struct test_struct
 {
-    int a;
+    int a{0};
     boost::optional< int > z;
     boost::optional< ascii_test::nested > nested;
 };
@@ -212,6 +210,26 @@ TEST( csv, ascii_get )
 
 TEST( csv, ascii_put )
 {
+}
+
+TEST( csv, ascii_put_string )
+{
+    typedef comma::csv::ascii_test::simple_struct value_t;
+    typedef comma::csv::ascii< value_t > ascii_t;
+    EXPECT_EQ( ascii_t().put( value_t{} ), "0,0,0,\"\",not-a-date-time,0,0" );
+    EXPECT_EQ( ascii_t().put( value_t{1,2,3,"XXX"} ), "1,2,3,\"XXX\",not-a-date-time,0,0" );
+    {
+        comma::csv::options csv;
+        csv.quote.reset();
+        EXPECT_EQ( ascii_t( csv ).put( value_t{} ), "0,0,0,,not-a-date-time,0,0" );
+        EXPECT_EQ( ascii_t( csv ).put( value_t{1,2,3,"XXX"} ), "1,2,3,XXX,not-a-date-time,0,0" );
+    }
+    {
+        comma::csv::options csv;
+        csv.quote = '#';
+        EXPECT_EQ( ascii_t( csv ).put( value_t{} ), "0,0,0,##,not-a-date-time,0,0" );
+        EXPECT_EQ( ascii_t( csv ).put( value_t{1,2,3,"XXX"} ), "1,2,3,#XXX#,not-a-date-time,0,0" );
+    }
     // todo
 }
 

From 28df9c6ad1b0571957b5f1b6eb3f1b1c720d5449 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 8 Oct 2024 16:04:20 +1100
Subject: [PATCH 0945/1056] io-cat: tcp server as input: plugging in...

---
 io/applications/io-cat.cpp | 64 +++++++++++++++++++-------------------
 io/impl/publish.cpp        |  6 ++--
 io/impl/publish.h          |  2 +-
 io/impl/server.cpp         |  4 +--
 io/impl/server.h           |  4 +--
 io/server.cpp              |  4 +--
 io/server.h                |  4 +--
 7 files changed, 44 insertions(+), 44 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 6a5f8cd73..cd130bdbd 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -287,11 +287,12 @@ class client_stream : public stream
 class server_stream : public stream
 {
     public:
-        server_stream( const std::string& address, unsigned int size, bool binary )
+        server_stream( const std::string& address, unsigned int size, bool binary, bool blocking )
             : stream( address )
             , _size( size )
             , _binary( binary )
-            , _server( address, binary ? comma::io::mode::binary : comma::io::mode::ascii, true ) // todo: always blocking for now
+            , _blocking( blocking )
+            , _server( address, binary ? comma::io::mode::binary : comma::io::mode::ascii, blocking )
         {
         }
         
@@ -299,38 +300,36 @@ class server_stream : public stream
         
         unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking )
         {
-            unsigned int total_count{0};
-            ( void )buffer; ( void )max_count; ( void )blocking; ( void )total_count;
-            // while( true )
-            // {
-            //     std::size_t available = _server.max_available();
-            //     if( !blocking && available == 0 ) { return 0; }
-            //     if( binary_ )
-            //     {
-            //         unsigned int count = size_ ? available / size_ : 0;
-            //         if( max_count && count > max_count ) { count = max_count; }
-            //         if( count == 0 ) { count = 1; } // read at least one packet
-            //         unsigned int size = size_ ? count * size_ : std::min( available, buffer.size() );
-            //         ( *istream_ )->read( &buffer[0], size );
-            //         return ( *istream_ )->gcount() <= 0 ? 0 : ( *istream_ )->gcount();
-            //     }
-            //     else
-            //     {
-            //         std::string line; // quick and dirty, no-one expects ascii to be fast
-            //         std::getline( *( *istream_ ), line );
-            //         if( line.empty() ) { return 0; }
-            //         if( line.size() >= buffer.size() ) { buffer.resize( line.size() + 1 ); }
-            //         ::memcpy( &buffer[0], &line[0], line.size() );
-            //         buffer[ line.size() ] = '\n';
-            //         return line.size() + 1;
-            //     }
-            // }
+            COMMA_ASSERT_BRIEF( blocking == _blocking, "server stream is " << ( _blocking ? "blocking" : "non-blocking" ) << ", but asked to do " << ( blocking ? "blocking" : "non-blocking" ) << " read" );
+            unsigned int count{0};
+            char* p = &buffer[0];
+            while( true )
+            {
+                std::size_t available_at_least = _server.available_at_least();
+                if( !blocking && available_at_least == 0 ) { return 0; }
+                if( _binary )
+                {
+                    if( _server.read( p, _size ) != _size ) { return 0; } // todo? more checks?
+                    ++count;
+                    p += _size;
+                    if( count >= max_count || count * _size >= available_at_least ) { return count * _size; }
+                }
+                else
+                {
+                    std::string line = _server.getline();
+                    if( line.empty() ) { return 0; }
+                    if( line.size() >= buffer.size() ) { buffer.resize( line.size() + 1 ); }
+                    ::memcpy( &buffer[0], &line[0], line.size() );
+                    buffer[ line.size() ] = '\n';
+                    return line.size() + 1;
+                }
+            }
             return 0;
         }
         
         bool empty() const { COMMA_THROW( comma::exception, "todo" ); } // { return !connected() || closed_ || available_() == 0; }
         
-        bool eof() const { COMMA_THROW( comma::exception, "todo" ); } // { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
+        bool eof() const { return !closed(); } // { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
         
         void close() { _closed = true; _server.close(); }
         
@@ -343,6 +342,7 @@ class server_stream : public stream
     private:
         unsigned int _size{0};
         bool _binary{false};
+        bool _blocking{false};
         bool _closed{false};
         comma::io::iserver _server;
         
@@ -358,11 +358,11 @@ class server_stream : public stream
         }
 };
 
-static stream* make_stream( const std::string& address, unsigned int size, bool binary )
+static stream* make_stream( const std::string& address, unsigned int size, bool binary, bool blocking )
 {
     const std::vector< std::string >& v = comma::split( address, ':' );
     if( v[0] == "udp" ) { return new udp_stream( address ); }
-    if( v[0] == "tcp" && v.size() == 2 ) { return new server_stream( address, size, binary ); } // todo: quick and dirty for now; a better check if tcp:<port>-like
+    if( v[0] == "tcp" && v.size() == 2 ) { return new server_stream( address, size, binary, blocking ); } // todo: quick and dirty for now; a better check if tcp:<port>-like
     COMMA_ASSERT_BRIEF( v[0] != "zmq-local" && v[0] != "zero-local" && v[0] != "zmq-tcp" && v[0] != "zero-tcp", "zmq support not implemented" );
     return new client_stream( address, size, binary );
 }
@@ -515,7 +515,7 @@ int main( int argc, char** argv )
         output = output_t( options, unnamed.size() );
         boost::ptr_vector< stream > streams;
         comma::io::select select;
-        for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 || ( unnamed.size() == 1 && !has_head ) ) ); }
+        for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 || ( unnamed.size() == 1 && !has_head ), blocking ) ); }
         //for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 ) ); }
         const unsigned int max_count = size ? ( size > 65536u ? 1 : 65536u / size ) : 0;
         std::vector< char > buffer( size ? size * max_count : 65536u );        
diff --git a/io/impl/publish.cpp b/io/impl/publish.cpp
index 5b1f7cb86..90a17acd7 100644
--- a/io/impl/publish.cpp
+++ b/io/impl/publish.cpp
@@ -241,10 +241,10 @@ bool receive::read( char* buf, unsigned int size )
     return handle_sizes_( t ) || count != size;
 }
 
-bool receive::readline( std::string& line ) // quick and dirty
+bool receive::getline( std::string& line ) // quick and dirty
 {
     transaction_t t( publishers_ );
-    line = ( *t )[0]->readline();
+    line = ( *t )[0]->getline();
     return handle_sizes_( t );
 }
 
@@ -256,7 +256,7 @@ bool receive::write( std::ostream& output )
     }
     else
     {
-        if( !readline( buffer_ ) ) { return false; }
+        if( !getline( buffer_ ) ) { return false; }
         buffer_ += '\n';
     }
     output.write( &buffer_[0], buffer_.size() );
diff --git a/io/impl/publish.h b/io/impl/publish.h
index 059343b6c..f00554f0b 100644
--- a/io/impl/publish.h
+++ b/io/impl/publish.h
@@ -101,7 +101,7 @@ class receive : public multiserver< comma::io::iserver >
 
     bool read( char* buf, unsigned int size );
 
-    bool readline( std::string& line );
+    bool getline( std::string& line );
 
     bool write( std::ostream& output );
 };
diff --git a/io/impl/server.cpp b/io/impl/server.cpp
index bef4ffc4c..d4266c4ed 100644
--- a/io/impl/server.cpp
+++ b/io/impl/server.cpp
@@ -345,13 +345,13 @@ template < typename Stream > unsigned int server< Stream >::read( server< io::is
     return 0;
 }
 
-template < typename Stream > std::string server< Stream >::readline( server< io::istream >* s, bool do_accept )
+template < typename Stream > std::string server< Stream >::getline( server< io::istream >* s, bool do_accept )
 {
     COMMA_THROW( comma::exception, "todo..." );
 }
 
 
-template < typename Stream > std::size_t server< Stream >::max_available( const server< io::istream >* s )
+template < typename Stream > std::size_t server< Stream >::available_at_least( const server< io::istream >* s )
 {
     std::size_t a = 0;
     for( const auto& t: s->streams_ )
diff --git a/io/impl/server.h b/io/impl/server.h
index e4e4c2f10..9d6265015 100644
--- a/io/impl/server.h
+++ b/io/impl/server.h
@@ -76,9 +76,9 @@ class server
 
         static unsigned int read( server< io::istream >* s, char* buf, std::size_t size, bool do_accept = true );
 
-        static std::string readline( server< io::istream >* s, bool do_accept = true );
+        static std::string getline( server< io::istream >* s, bool do_accept = true );
 
-        static std::size_t max_available( const server< io::istream >* s );
+        static std::size_t available_at_least( const server< io::istream >* s );
 
     protected:
         template < typename > friend class comma::io::server;
diff --git a/io/server.cpp b/io/server.cpp
index a703e60a4..a03b59e2c 100644
--- a/io/server.cpp
+++ b/io/server.cpp
@@ -52,9 +52,9 @@ std::size_t oserver::write( const char* buf, std::size_t size, bool do_accept )
 
 std::size_t iserver::read( char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::istream >::read( pimpl_, buf, size, do_accept ); }
 
-std::string iserver::readline( bool do_accept ) { return io::impl::server< io::istream >::readline( pimpl_, do_accept ); }
+std::string iserver::getline( bool do_accept ) { return io::impl::server< io::istream >::getline( pimpl_, do_accept ); }
 
-std::size_t iserver::max_available() const { return io::impl::server< io::istream >::max_available( pimpl_ ); }
+std::size_t iserver::available_at_least() const { return io::impl::server< io::istream >::available_at_least( pimpl_ ); }
 
 template class server< io::istream >;
 template class server< io::ostream >;
diff --git a/io/server.h b/io/server.h
index c35bc63dc..8b06bed7b 100644
--- a/io/server.h
+++ b/io/server.h
@@ -108,9 +108,9 @@ struct iserver: public io::server< io::istream >
     /// read eol-terminated string from first available client
     /// return 0 if no clients have data
     /// start from the next client on the next read to assure round-robin behaviour
-    std::string readline( bool do_accept = true );
+    std::string getline( bool do_accept = true );
 
-    std::size_t max_available() const;
+    std::size_t available_at_least() const;
 };
 
 // struct ioserver: public io::server< io::iostream >

From 1e1d069a6c78e93bd945f8da729c47af676f9555 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 8 Oct 2024 16:18:09 +1100
Subject: [PATCH 0946/1056] io-cat: tcp server as input: plugging in...

---
 io/applications/io-cat.cpp | 7 ++++---
 1 file changed, 4 insertions(+), 3 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index cd130bdbd..a2e44c849 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -327,7 +327,7 @@ class server_stream : public stream
             return 0;
         }
         
-        bool empty() const { COMMA_THROW( comma::exception, "todo" ); } // { return !connected() || closed_ || available_() == 0; }
+        bool empty() const { return _closed || _server.available_at_least() == 0; }
         
         bool eof() const { return !closed(); } // { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
         
@@ -402,13 +402,13 @@ static bool try_connect( boost::ptr_vector< stream >& streams, comma::io::select
     std::string what;
     for( unsigned int i = 0; i < streams.size(); ++i )
     {
-        if( streams[i].connected() ) { continue; }
+        if( streams[i].connected() ) { --unconnected_count; continue; }
         try
         {
             comma::saymore() << "stream " << i << " (" << streams[i].address() << "): connecting, attempt " << ( attempts + 1 ) << " of " << ( connect_max_attempts == 0 ? std::string( "unlimited" ) : boost::lexical_cast< std::string >( connect_max_attempts ) ) << "..." << std::endl;
             streams[i].connect();
             comma::saymore() << "stream " << i << " (" << streams[i].address() << "): connected" << std::endl;
-            select.read().add( streams[i] );
+            select.read().add( streams[i].fd() );
             --unconnected_count;
             continue;
         }
@@ -517,6 +517,7 @@ int main( int argc, char** argv )
         comma::io::select select;
         for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 || ( unnamed.size() == 1 && !has_head ), blocking ) ); }
         //for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 ) ); }
+        comma::saymore() << "created " << unnamed.size() << " stream(s)" << std::endl;
         const unsigned int max_count = size ? ( size > 65536u ? 1 : 65536u / size ) : 0;
         std::vector< char > buffer( size ? size * max_count : 65536u );        
         unsigned int round_robin_count = unnamed.size() > 1 ? options.value( "--round-robin", 0 ) : 0;

From 3f4af7461a112234284f8fdc09ebe1225849d959 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 8 Oct 2024 16:25:38 +1100
Subject: [PATCH 0947/1056] io::server::select() method added

---
 io/server.cpp | 2 ++
 io/server.h   | 3 +++
 2 files changed, 5 insertions(+)

diff --git a/io/server.cpp b/io/server.cpp
index a03b59e2c..5e323b981 100644
--- a/io/server.cpp
+++ b/io/server.cpp
@@ -48,6 +48,8 @@ template < typename Stream > std::size_t server< Stream >::size() const { return
 
 template < typename Stream > file_descriptor server< Stream >::acceptor_file_descriptor() const { return pimpl_->_acceptor ? pimpl_->acceptor().fd() : comma::io::invalid_file_descriptor; }
 
+template < typename Stream > const io::select& server< Stream >::select() const { return pimpl_->select_; }
+
 std::size_t oserver::write( const char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::ostream >::write( pimpl_, buf, size, do_accept ); }
 
 std::size_t iserver::read( char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::istream >::read( pimpl_, buf, size, do_accept ); }
diff --git a/io/server.h b/io/server.h
index 8b06bed7b..2fcf237d5 100644
--- a/io/server.h
+++ b/io/server.h
@@ -54,6 +54,9 @@ class server
         ///       has been output, this client will receive
         ///       ",2", which most likely was not intended
         std::vector< Stream* > accept(); // quick and dirty, use nacked pointers for now
+
+        /// return reference to select on the existing streams
+        const io::select& select() const;
         
     protected:
         server( const server& );

From 331f3f26d7d852a2b9cbea00139bfb1801f1f084 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 8 Oct 2024 18:02:42 +1100
Subject: [PATCH 0948/1056] io-cat: tcp server as input: plugging in...

---
 io/applications/io-cat.cpp | 58 +++++++++++++++++++++++---------------
 1 file changed, 36 insertions(+), 22 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index a2e44c849..687d63747 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -151,13 +151,16 @@ class stream
         stream( const std::string& address ): address_( address ) {}
         virtual ~stream() {}
         virtual unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking ) = 0;
-        virtual comma::io::file_descriptor fd() const = 0;
+        virtual comma::io::file_descriptor fd() const { return comma::io::invalid_file_descriptor; }
         virtual bool eof() const = 0;
         virtual bool empty() const = 0;
         virtual void close() = 0;
         virtual bool closed() const = 0;
         virtual bool connected() const = 0;
         virtual void connect() = 0;
+        virtual void add_to( comma::io::select& select ) const { select.read().add( fd() ); }
+        virtual void remove_from( comma::io::select& select ) const { select.read().remove( fd() ); }
+        virtual bool ready( comma::io::select& select ) const { return select.read().ready( fd() ); }
         const std::string& address() const { return address_; }
         
     protected:
@@ -284,7 +287,7 @@ class client_stream : public stream
         }
 };
 
-class server_stream : public stream
+class server_stream : public stream // todo! super-quick and dirty! get streams from the server instead and add/remove them to/from read methods
 {
     public:
         server_stream( const std::string& address, unsigned int size, bool binary, bool blocking )
@@ -296,8 +299,6 @@ class server_stream : public stream
         {
         }
         
-        comma::io::file_descriptor fd() const { COMMA_THROW( comma::exception, "todo" ); }
-        
         unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking )
         {
             COMMA_ASSERT_BRIEF( blocking == _blocking, "server stream is " << ( _blocking ? "blocking" : "non-blocking" ) << ", but asked to do " << ( blocking ? "blocking" : "non-blocking" ) << " read" );
@@ -329,7 +330,7 @@ class server_stream : public stream
         
         bool empty() const { return _closed || _server.available_at_least() == 0; }
         
-        bool eof() const { return !closed(); } // { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
+        bool eof() const { return closed(); } // { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
         
         void close() { _closed = true; _server.close(); }
         
@@ -338,6 +339,30 @@ class server_stream : public stream
         bool connected() const { return true; }
         
         void connect() {}
+
+        void add_to( comma::io::select& select ) const
+        {
+            for( auto d: _server.select().read()() ) { select.read().add( d ); }
+            select.read().add( _server.acceptor_file_descriptor() ); // uber-quick and dirty
+        }
+
+        void remove_from( comma::io::select& select ) const
+        {
+            for( auto d: _server.select().read()() ) {  select.read().remove( d ); }
+            select.read().add( _server.acceptor_file_descriptor() ); // uber-quick and dirty
+        }
+
+        // todo! void update( comma::io::select& select )
+        // todo! get streams from the server instead and add/remove them to/from read methods
+        // todo! test connecting/disconnecting clients
+        // todo! test multiple clients
+        // todo! examples
+
+        bool ready( comma::io::select& select ) const
+        {
+            for( auto d: _server.select().read()() ) { if( select.read().ready( d ) ) { return true; } }
+            return false;
+        }
         
     private:
         unsigned int _size{0};
@@ -345,17 +370,6 @@ class server_stream : public stream
         bool _blocking{false};
         bool _closed{false};
         comma::io::iserver _server;
-        
-        std::size_t available_() const // seriously quick and dirty
-        {
-            { COMMA_THROW( comma::exception, "todo" ); }
-            // if( ( *istream_ )() == NULL ) { return ( *istream_ ).available_on_file_descriptor(); } // quick and dirty
-            // std::streamsize s = ( *istream_ )->rdbuf()->in_avail();
-            // if( s < 0 ) { return 0; }
-            // // todo: it should be s + available_on_file_descriptor(), but it won't work for std::cin (and potentially for std::ifstream (we have not checked)
-            // //       if performance becomes a problem e.g. for tcp, check whether the stream is not std::cin and use sum instead of max
-            // return std::max( static_cast< std::size_t >( s ), ( *istream_ ).available_on_file_descriptor() );
-        }
 };
 
 static stream* make_stream( const std::string& address, unsigned int size, bool binary, bool blocking )
@@ -378,12 +392,12 @@ static bool ready( const boost::ptr_vector< stream >& streams, comma::io::select
     {
         select.check();
         bool r{connected_all_we_could};
-        for( unsigned int i = 0; i < streams.size() && r; ++i ) { r = streams[i].closed() || select.read().ready( streams[i].fd() ); }
+        for( unsigned int i = 0; i < streams.size() && r; ++i ) { r = streams[i].closed() || streams[i].ready( select ); }
         if( !r ) { boost::this_thread::sleep( boost::posix_time::milliseconds( 10 ) ); } // quick and dirty
         return r;
     }
     for( unsigned int i = 0; i < streams.size(); ++i ) { if( !streams[i].empty() ) { select.check(); return true; } }
-    if( !select.read()().empty() ) { return select.wait( boost::posix_time::seconds( 1 ) ) > 0; }
+    if( !select.read()().empty() ) { return select.wait( boost::posix_time::milliseconds( 100 ) ) > 0; }
     if( connected_all_we_could ) { return true; }
     boost::this_thread::sleep( connect_period );
     return false;
@@ -408,7 +422,7 @@ static bool try_connect( boost::ptr_vector< stream >& streams, comma::io::select
             comma::saymore() << "stream " << i << " (" << streams[i].address() << "): connecting, attempt " << ( attempts + 1 ) << " of " << ( connect_max_attempts == 0 ? std::string( "unlimited" ) : boost::lexical_cast< std::string >( connect_max_attempts ) ) << "..." << std::endl;
             streams[i].connect();
             comma::saymore() << "stream " << i << " (" << streams[i].address() << "): connected" << std::endl;
-            select.read().add( streams[i].fd() );
+            streams[i].add_to( select );
             --unconnected_count;
             continue;
         }
@@ -517,7 +531,7 @@ int main( int argc, char** argv )
         comma::io::select select;
         for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 || ( unnamed.size() == 1 && !has_head ), blocking ) ); }
         //for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 ) ); }
-        comma::saymore() << "created " << unnamed.size() << " stream(s)" << std::endl;
+        comma::saymore() << "created " << unnamed.size() << " stream" << ( unnamed.size() == 1 ? "" : "s" ) << std::endl;
         const unsigned int max_count = size ? ( size > 65536u ? 1 : 65536u / size ) : 0;
         std::vector< char > buffer( size ? size * max_count : 65536u );        
         unsigned int round_robin_count = unnamed.size() > 1 ? options.value( "--round-robin", 0 ) : 0;
@@ -531,12 +545,12 @@ int main( int argc, char** argv )
             {
                 if( !streams[i].connected() ) { done = connected_all_we_could; continue; }
                 if( streams[i].closed() ) { continue; }
-                bool ready = select.read().ready( streams[i].fd() );
+                bool ready = streams[i].ready( select );
                 bool empty = streams[i].empty();
                 if( empty && ( ready || streams[i].eof() ) )
                 { 
                     comma::saymore() << "stream " << i << " (" << unnamed[i] << "): closed" << std::endl;
-                    select.read().remove( streams[i].fd() );
+                    streams[i].remove_from( select );
                     streams[i].close();
                     if( exit_on_first_closed || ( connected_all_we_could && select.read()().empty() ) ) { done = true; break; }
                     continue;

From eb5dc604b3691b1f4565409013b474b8514bc5af Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 8 Oct 2024 18:21:01 +1100
Subject: [PATCH 0949/1056] io::select::descriptors::clear() implemented

---
 io/select.cpp | 7 +++++--
 io/select.h   | 7 +++++--
 2 files changed, 10 insertions(+), 4 deletions(-)

diff --git a/io/select.cpp b/io/select.cpp
index f64de14cb..2ddc1c6ef 100755
--- a/io/select.cpp
+++ b/io/select.cpp
@@ -98,9 +98,12 @@ std::size_t select::wait( boost::posix_time::time_duration timeout )
 
 std::size_t select::check() { return wait( 0 ); }
 
-select::descriptors::descriptors()
+select::descriptors::descriptors() { reset_fds_(); }
+
+void select::descriptors::clear()
 {
-    reset_fds_();
+    FD_ZERO( &fd_set_ );
+    descriptors_.clear();
 }
 
 fd_set* select::descriptors::reset_fds_()
diff --git a/io/select.h b/io/select.h
index 7c9ed9a0a..516e89be0 100755
--- a/io/select.h
+++ b/io/select.h
@@ -94,15 +94,18 @@ class select
                 /// return true, if file descriptor found in descriptor list and ready
                 bool ready( file_descriptor fd ) const;
                 template < typename T > bool ready( const T& t ) const { return ready( t.fd() ); }
+
+                /// remove all descriptors
+                void clear();
                 
                 /// return set of descriptors
                 const std::set< file_descriptor >& operator()() const { return descriptors_; } //const boost::unordered_set< file_descriptor >& operator()() const { return descriptors_; }
 
             private:
                 friend class select;
-                fd_set* reset_fds_();
+                ::fd_set* reset_fds_();
                 std::set< file_descriptor > descriptors_; //boost::unordered_set< file_descriptor > descriptors_;
-                fd_set fd_set_;
+                ::fd_set fd_set_;
         };
 
         /// return read descriptors

From 113352e0049f4cf6b89c886db43e756342dadd7c Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 8 Oct 2024 18:31:46 +1100
Subject: [PATCH 0950/1056] io-cat: tcp server as input: plugging in...

---
 io/applications/io-cat.cpp | 28 ++++++++++++++++++++++++++--
 io/impl/publish.cpp        | 16 ++++++++--------
 io/impl/publish.h          |  6 +++---
 3 files changed, 37 insertions(+), 13 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 687d63747..498030f2b 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -161,6 +161,7 @@ class stream
         virtual void add_to( comma::io::select& select ) const { select.read().add( fd() ); }
         virtual void remove_from( comma::io::select& select ) const { select.read().remove( fd() ); }
         virtual bool ready( comma::io::select& select ) const { return select.read().ready( fd() ); }
+        virtual void update( comma::io::select& select ) const {}
         const std::string& address() const { return address_; }
         
     protected:
@@ -352,10 +353,17 @@ class server_stream : public stream // todo! super-quick and dirty! get streams
             select.read().add( _server.acceptor_file_descriptor() ); // uber-quick and dirty
         }
 
-        // todo! void update( comma::io::select& select )
+        void update( comma::io::select& select ) const
+        {
+            // todo
+        }
+
+        // todo!? use io::impl::receive()?
         // todo! get streams from the server instead and add/remove them to/from read methods
         // todo! test connecting/disconnecting clients
         // todo! test multiple clients
+        // todo! cpu performance when there are no connections
+        // todo? for now, if server, don't allow multiple input streams
         // todo! examples
 
         bool ready( comma::io::select& select ) const
@@ -388,6 +396,7 @@ static bool permissive;
 
 static bool ready( const boost::ptr_vector< stream >& streams, comma::io::select& select, bool connected_all_we_could, bool blocking )
 {
+    for( const auto& s: streams ) { s.update( select ); } // quick and dirty
     if( blocking )
     {
         select.check();
@@ -535,30 +544,42 @@ int main( int argc, char** argv )
         const unsigned int max_count = size ? ( size > 65536u ? 1 : 65536u / size ) : 0;
         std::vector< char > buffer( size ? size * max_count : 65536u );        
         unsigned int round_robin_count = unnamed.size() > 1 ? options.value( "--round-robin", 0 ) : 0;
+        comma::say() << "==> A" << std::endl;
         for( bool done = false; !done; )
         {
+            comma::say() << "==> a" << std::endl;
             if( is_shutdown ) { comma::saymore() << "received signal" << std::endl; break; }
+            comma::say() << "==> b" << std::endl;
             bool connected_all_we_could = try_connect( streams, select );
             if( !ready( streams, select, connected_all_we_could, blocking ) ) { continue; }
             done = true;
+            comma::say() << "==> c: streams.size(): " << streams.size() << std::endl;
             for( unsigned int i = 0; i < streams.size(); ++i )
             {
+                comma::say() << "==> d" << std::endl;
                 if( !streams[i].connected() ) { done = connected_all_we_could; continue; }
+                comma::say() << "==> e" << std::endl;
                 if( streams[i].closed() ) { continue; }
+                comma::say() << "==> f" << std::endl;
                 bool ready = streams[i].ready( select );
+                comma::say() << "==> g: ready: " << ready << std::endl;
                 bool empty = streams[i].empty();
                 if( empty && ( ready || streams[i].eof() ) )
-                { 
+                {
+                    comma::say() << "==> h" << std::endl;
                     comma::saymore() << "stream " << i << " (" << unnamed[i] << "): closed" << std::endl;
                     streams[i].remove_from( select );
                     streams[i].close();
                     if( exit_on_first_closed || ( connected_all_we_could && select.read()().empty() ) ) { done = true; break; }
                     continue;
                 }
+                comma::say() << "==> i" << std::endl;
                 if( !ready && empty ) { done = false; continue; }
+                comma::say() << "==> j" << std::endl;
                 unsigned int countdown = round_robin_count;
                 while( !streams[i].eof() ) // todo? check is_shutdown here as well?
                 {
+                    comma::say() << "==> k" << std::endl;
                     unsigned int bytes_read = streams[i].read_available( buffer, countdown ? countdown : max_count, blocking );
                     if( bytes_read == 0 ) { break; }
                     done = false;
@@ -572,8 +593,11 @@ int main( int argc, char** argv )
                         if( countdown == 0 ) { break; }
                     }
                 }
+                comma::say() << "==> l" << std::endl;
             }
+            comma::say() << "==> m" << std::endl;
         }
+        comma::say() << "==> Z" << std::endl;
         output.finalise( is_shutdown );
         return 0;
     }
diff --git a/io/impl/publish.cpp b/io/impl/publish.cpp
index 90a17acd7..c8b64b49b 100644
--- a/io/impl/publish.cpp
+++ b/io/impl/publish.cpp
@@ -57,7 +57,7 @@ multiserver< Server >::multiserver( const std::vector< std::string >& endpoints
     sigemptyset( &new_action.sa_mask );
     sigaction( SIGPIPE, NULL, &old_action );
     sigaction( SIGPIPE, &new_action, NULL );
-    transaction_t t( publishers_ );
+    transaction_t t( servers_ );
     t->resize( endpoints.size() );
     for( std::size_t i = 0; i < endpoints.size(); ++i )
     {
@@ -71,14 +71,14 @@ multiserver< Server >::~multiserver()
 {
     is_shutdown_ = true;
     acceptor_thread_->join();
-    transaction_t t( publishers_ );
+    transaction_t t( servers_ );
     for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } }
 }
 
 template < typename Server >
 void multiserver< Server >::disconnect_all()
 {
-    transaction_t t( publishers_ );
+    transaction_t t( servers_ );
     for( auto& p: *t ) { if( p ) { p->disconnect_all(); } }
     handle_sizes_( t ); // quick and dirty
 }
@@ -120,7 +120,7 @@ void multiserver< Server >::accept_()
 {
     comma::io::select select;
     {
-        transaction_t t( publishers_ );
+        transaction_t t( servers_ );
         for( unsigned int i = 0; i < t->size(); ++i )
         {
             if( !( *t )[i] ) { continue; }
@@ -131,7 +131,7 @@ void multiserver< Server >::accept_()
     while( !is_shutdown_ )
     {
         select.wait( boost::posix_time::millisec( 100 ) ); // todo? make timeout configurable?
-        transaction_t t( publishers_ );
+        transaction_t t( servers_ );
         for( unsigned int i = 0; i < t->size(); ++i )
         {
             if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) )
@@ -188,7 +188,7 @@ publish::publish( const std::vector< std::string >& endpoints
 
 bool publish::write( const std::string& s )
 {
-    transaction_t t( publishers_ );
+    transaction_t t( servers_ );
     if( cache_size_ > 0 )
     {
         cache_.push_back( s );
@@ -236,14 +236,14 @@ receive::receive( const std::string& endpoint
 
 bool receive::read( char* buf, unsigned int size )
 {
-    transaction_t t( publishers_ );
+    transaction_t t( servers_ );
     auto count = ( *t )[0]->read( buf, size );
     return handle_sizes_( t ) || count != size;
 }
 
 bool receive::getline( std::string& line ) // quick and dirty
 {
-    transaction_t t( publishers_ );
+    transaction_t t( servers_ );
     line = ( *t )[0]->getline();
     return handle_sizes_( t );
 }
diff --git a/io/impl/publish.h b/io/impl/publish.h
index f00554f0b..c245bb4bf 100644
--- a/io/impl/publish.h
+++ b/io/impl/publish.h
@@ -26,9 +26,9 @@ template < typename Server >
 class multiserver
 {
     public:
-        typedef comma::synchronized< std::vector< std::unique_ptr< Server > > > publishers_t;
+        typedef comma::synchronized< std::vector< std::unique_ptr< Server > > > servers_t;
         
-        typedef typename publishers_t::scoped_transaction transaction_t;
+        typedef typename servers_t::scoped_transaction transaction_t;
         
         struct endpoint
         {
@@ -55,7 +55,7 @@ class multiserver
         std::vector< endpoint > endpoints_;
         bool discard_;
         bool flush_;
-        publishers_t publishers_;
+        servers_t servers_;
         std::string buffer_;
         unsigned int packet_size_;
         bool output_number_of_clients_;

From 5fe88d5f25ee2e51825ee51a5ec6d727cafb1a1d Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Wed, 9 Oct 2024 16:40:35 +1100
Subject: [PATCH 0951/1056] io-cat: connecting streams: bug fixed: spurious
 connected stream count update removed

---
 io/applications/io-cat.cpp | 24 +++++-------------------
 1 file changed, 5 insertions(+), 19 deletions(-)

diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 498030f2b..42064a87a 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -425,7 +425,7 @@ static bool try_connect( boost::ptr_vector< stream >& streams, comma::io::select
     std::string what;
     for( unsigned int i = 0; i < streams.size(); ++i )
     {
-        if( streams[i].connected() ) { --unconnected_count; continue; }
+        if( streams[i].connected() ) { continue; }
         try
         {
             comma::saymore() << "stream " << i << " (" << streams[i].address() << "): connecting, attempt " << ( attempts + 1 ) << " of " << ( connect_max_attempts == 0 ? std::string( "unlimited" ) : boost::lexical_cast< std::string >( connect_max_attempts ) ) << "..." << std::endl;
@@ -440,9 +440,10 @@ static bool try_connect( boost::ptr_vector< stream >& streams, comma::io::select
         comma::saymore() << "stream " << i << " (" << streams[i].address() << "): failed to connect" << std::endl;
     }
     ++attempts;
-    connected_all_we_could = unconnected_count == 0 || ( permissive && connect_max_attempts > 0 && attempts >= connect_max_attempts );
-    if( connected_all_we_could ) { return connected_all_we_could; }
-    if( connect_max_attempts == 0 || attempts < connect_max_attempts ) { return connected_all_we_could; }
+    if( unconnected_count == 0 ) { return true; }
+    if( connect_max_attempts == 0 ) { return false; }
+    if( attempts < connect_max_attempts ) { return false; }
+    if( permissive ) { return true; }
     comma::say() << "fatal: after " << attempts << " attempt(s): " << what << std::endl;
     exit( 1 );
 }
@@ -544,42 +545,30 @@ int main( int argc, char** argv )
         const unsigned int max_count = size ? ( size > 65536u ? 1 : 65536u / size ) : 0;
         std::vector< char > buffer( size ? size * max_count : 65536u );        
         unsigned int round_robin_count = unnamed.size() > 1 ? options.value( "--round-robin", 0 ) : 0;
-        comma::say() << "==> A" << std::endl;
         for( bool done = false; !done; )
         {
-            comma::say() << "==> a" << std::endl;
             if( is_shutdown ) { comma::saymore() << "received signal" << std::endl; break; }
-            comma::say() << "==> b" << std::endl;
             bool connected_all_we_could = try_connect( streams, select );
             if( !ready( streams, select, connected_all_we_could, blocking ) ) { continue; }
             done = true;
-            comma::say() << "==> c: streams.size(): " << streams.size() << std::endl;
             for( unsigned int i = 0; i < streams.size(); ++i )
             {
-                comma::say() << "==> d" << std::endl;
                 if( !streams[i].connected() ) { done = connected_all_we_could; continue; }
-                comma::say() << "==> e" << std::endl;
                 if( streams[i].closed() ) { continue; }
-                comma::say() << "==> f" << std::endl;
                 bool ready = streams[i].ready( select );
-                comma::say() << "==> g: ready: " << ready << std::endl;
                 bool empty = streams[i].empty();
                 if( empty && ( ready || streams[i].eof() ) )
                 {
-                    comma::say() << "==> h" << std::endl;
                     comma::saymore() << "stream " << i << " (" << unnamed[i] << "): closed" << std::endl;
                     streams[i].remove_from( select );
                     streams[i].close();
                     if( exit_on_first_closed || ( connected_all_we_could && select.read()().empty() ) ) { done = true; break; }
                     continue;
                 }
-                comma::say() << "==> i" << std::endl;
                 if( !ready && empty ) { done = false; continue; }
-                comma::say() << "==> j" << std::endl;
                 unsigned int countdown = round_robin_count;
                 while( !streams[i].eof() ) // todo? check is_shutdown here as well?
                 {
-                    comma::say() << "==> k" << std::endl;
                     unsigned int bytes_read = streams[i].read_available( buffer, countdown ? countdown : max_count, blocking );
                     if( bytes_read == 0 ) { break; }
                     done = false;
@@ -593,11 +582,8 @@ int main( int argc, char** argv )
                         if( countdown == 0 ) { break; }
                     }
                 }
-                comma::say() << "==> l" << std::endl;
             }
-            comma::say() << "==> m" << std::endl;
         }
-        comma::say() << "==> Z" << std::endl;
         output.finalise( is_shutdown );
         return 0;
     }

From 0229e4bde3f6a3858de918a3db2a00d00806ac95 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 11 Oct 2024 13:41:12 +1100
Subject: [PATCH 0952/1056] comma-test-util:
 comma_test_commands_until_first_error

---
 util/applications/comma-test-util | 56 +++++++++++++++----------------
 1 file changed, 28 insertions(+), 28 deletions(-)

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 508b6bd8e..268669d63 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -39,6 +39,31 @@ readonly comma_test_util_include_guard_=1
 
 source $( type -p comma-name-value-util )
 
+function _comma_test_commands_impl()
+{
+    local key value status output until_first_error=$1 fields=$2
+    while IFS='=' read key value ; do
+        [[ -n "$key" && ! "$key" =~ \#.* ]] || continue
+        value="${value/#\"}"
+        value="${value/%\"}"
+        output=$( eval "$value" )
+        status=$? # eval and bash -c both returns one error code, PIPESTATUS has only one value
+        if (( $( wc -l <<< "$output" ) > 1 )); then # a separate case for backward compatibility
+            local count=0
+            while read line; do
+                if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output/line[$count]" <<< "$line" # todo? escape quote? ${line//\"/\\\"}, otherwise they get removed by bash
+                else echo "$key/output/line[$count]=\"$line\""; fi
+                (( ++count ))
+            done <<< "$output"
+        else
+            if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output" <<< "$output" # todo? escape quotes, otherwise they get removed by bash
+            else echo "$key/output=\"$output\""; fi
+        fi
+        echo "$key/status=$status"
+        if (( status != 0 && until_first_error )); then break; fi
+    done < <( grep '=' ; grep -v '^#' )
+}
+
 # a helper to write tests in the comma-test-run style
 #
 # take line by line on stdin: <test name>="<command>"
@@ -67,34 +92,9 @@ source $( type -p comma-name-value-util )
 # my_basic_test[1]/for/something/output/a="2"
 # my_basic_test[1]/for/something/output/b="4"
 # my_basic_test[1]/for/something/output=0
-#
-function comma_test_commands()
-{
-    local key
-    local value
-    local status
-    local output
-    local fields=$1
-    while IFS='=' read key value ; do
-        [[ -n "$key" && ! "$key" =~ \#.* ]] || continue
-        value="${value/#\"}"
-        value="${value/%\"}"
-        output=$( eval "$value" )
-        status=$?       # eval and bash -c both returns one error code, PIPESTATUS has only one value
-        if (( $( wc -l <<< "$output" ) > 1 )); then # a separate case for backward compatibility
-            local count=0
-            while read line; do
-                if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output/line[$count]" <<< "$line" # todo? escape quote? ${line//\"/\\\"}, otherwise they get removed by bash
-                else echo "$key/output/line[$count]=\"$line\""; fi
-                (( ++count ))
-            done <<< "$output"
-        else
-            if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output" <<< "$output" # todo? escape quotes, otherwise they get removed by bash
-            else echo "$key/output=\"$output\""; fi
-        fi
-        echo "$key/status=$status"
-    done < <( grep '=' ; grep -v '^#' )
-}
+
+function comma_test_commands() { _comma_test_commands_impl 0 "$@" ; }
+function comma_test_commands_until_first_error() { _comma_test_commands_impl 1 "$@" ; }
 
 # run interactive test, something like
 # > cat input

From 82f5b01078e5e421202d3d9eb4e5abbdeaaa8485 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 11 Oct 2024 13:57:55 +1100
Subject: [PATCH 0953/1056] comma-test-util: comma_test_interactive_commands:
 until_first_error flag added

---
 util/applications/comma-test-util | 18 +++++++++++++++---
 1 file changed, 15 insertions(+), 3 deletions(-)

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 268669d63..96f3ee66f 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -96,7 +96,13 @@ function _comma_test_commands_impl()
 function comma_test_commands() { _comma_test_commands_impl 0 "$@" ; }
 function comma_test_commands_until_first_error() { _comma_test_commands_impl 1 "$@" ; }
 
-# run interactive test, something like
+# run interactive test
+#
+# usage: comma_test_interactive_commands [<until_first_error>]
+#        <until_first_error>: 0 (i.e. false) or 1 (i.e. true); default: 0
+#
+# it works as something like
+#
 # > cat input
 # 
 # default/instruction=
@@ -117,6 +123,8 @@ function comma_test_commands_until_first_error() { _comma_test_commands_impl 1 "
 # see for an example: e.g. snark/graphics/applications/test/view-points/colour/scalar/options
 function comma_test_interactive_commands()
 {
+    local until_first_error=$1
+    if [[ -n "$until_first_error" ]]; then until_first_error=1; else until_first_error=0; fi
     (
         function comma_test_interactive_test_case()
         {
@@ -131,7 +139,7 @@ function comma_test_interactive_commands()
             zenity --question --title="testcase $testcase_number of $number_of_testcases: $name" --text="$dialog" --width=600
             result=$?
             echo "$name/status=$result"
-            kill $( pgrep -P $eval_pid )
+            kill $( pgrep -P $eval_pid )break
             wait $eval_pid
             return $result
         }
@@ -148,7 +156,11 @@ function comma_test_interactive_commands()
             [[ -n "$p" ]] || continue
             local n=$( dirname $p )
             if [[ "$n" != "$test_name" ]] ; then
-                [[ -z "$test_name" ]] || comma_test_interactive_test_case $test_name $testcase_number $number_of_testcases <<< "$test_case"
+                if [[ -n "$test_name" ]]; then
+                    comma_test_interactive_test_case $test_name $testcase_number $number_of_testcases <<< "$test_case"
+                    local r=$?
+                    if (( r != 0 && until_first_error )); then return $r; fi
+                fi
                 (( ++testcase_number ))
                 test_name=$n
                 test_case=

From 6731f19141643337f3f6b60e1738d71c40c1435f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 11 Oct 2024 13:59:56 +1100
Subject: [PATCH 0954/1056] comma-test-util:
 comma_test_interactive_commands_until_first_error convenience function added

---
 util/applications/comma-test-util | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 96f3ee66f..522a155a8 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -174,6 +174,8 @@ function comma_test_interactive_commands()
     )
 }
 
+function comma_test_interactive_commands_until_first_error() { comma_test_interactive_commands 1; }
+
 # the tmp directory cleanup for comma_test_run_tarball
 function comma_test_run_tarball_cleanup()
 {

From ca733be365612e7224b371d51a59fafc0af69ead Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 15 Oct 2024 11:52:11 +1100
Subject: [PATCH 0955/1056] io::serial::port: first cut added

---
 io/serial.cpp | 73 +++++++++++++++++++++++++++++++++++++++++++++++++++
 io/serial.h   | 43 ++++++++++++++++++++++++++++++
 2 files changed, 116 insertions(+)
 create mode 100644 io/serial.cpp
 create mode 100644 io/serial.h

diff --git a/io/serial.cpp b/io/serial.cpp
new file mode 100644
index 000000000..9984fc70d
--- /dev/null
+++ b/io/serial.cpp
@@ -0,0 +1,73 @@
+// Copyright (c) 2023 Mission Systems Pty Ltd
+// All rights reserved.
+
+/// @author dave jennings
+
+#include "serial.h"
+
+namespace comma { namespace io { namespace serial {
+
+port::port( const std::string& name ): _port( _service, name ) {}
+
+port::port( const std::string& name, unsigned int baud_rate )
+    : _port( _service, name )
+{
+    set_baud_rate( baud_rate );
+    set_character_size( 8 );
+    set_flow_control( boost::asio::serial_port_base::flow_control::none );
+    set_parity( boost::asio::serial_port_base::parity::none );
+    set_stop_bits( boost::asio::serial_port_base::stop_bits::one );
+}
+
+void port::set_baud_rate( unsigned int baud_rate ) { _port.set_option( boost::asio::serial_port_base::baud_rate( baud_rate )); }
+
+void port::set_character_size( unsigned int character_size ) { _port.set_option( boost::asio::serial_port_base::character_size( character_size )); }
+
+void port::set_flow_control( boost::asio::serial_port_base::flow_control::type flow_control ) { _port.set_option( boost::asio::serial_port_base::flow_control( flow_control )); }
+
+void port::set_parity( boost::asio::serial_port_base::parity::type parity ) { _port.set_option( boost::asio::serial_port_base::parity( parity )); }
+
+void port::set_stop_bits( boost::asio::serial_port_base::stop_bits::type stop_bits ) { _port.set_option( boost::asio::serial_port_base::stop_bits( stop_bits )); }
+
+std::size_t port::read_some( unsigned char* buf, std::size_t buf_size )
+{
+    boost::system::error_code ec;
+    std::size_t count = _port.read_some( boost::asio::buffer( buf, buf_size ), ec );
+    COMMA_ASSERT( !ec, ec.message() );
+    return count;
+}
+
+std::size_t port::read_some( unsigned char* buf
+                           , std::size_t buf_size
+                           , const boost::asio::deadline_timer::duration_type& timeout )
+{
+    boost::optional< boost::system::error_code > timer_result;
+    boost::asio::deadline_timer timer( _service );
+    timer.expires_from_now( timeout );
+    timer.async_wait( [&timer_result]( const boost::system::error_code& error ) { timer_result.reset( error ); });
+
+    boost::optional< boost::system::error_code > read_result;
+    std::size_t count = 0;
+    _port.async_read_some( boost::asio::buffer( buf, buf_size )
+                         , [&read_result, &count]( const boost::system::error_code& error, std::size_t count_ )
+                         {
+                             read_result.reset( error );
+                             count = count_;
+                         });
+    _service.reset();
+    while( _service.run_one() )
+    {
+        if( read_result ) { timer.cancel(); }
+        if( timer_result ) { _port.cancel(); }
+    }
+    if( *read_result )
+    {
+        // https://www.boost.org/doc/libs/1_65_1/libs/system/doc/reference.html#Header-error_code
+        if( read_result->value() != boost::system::errc::operation_canceled ) { throw boost::system::system_error( *read_result ); }
+    }
+    return count;
+}
+
+std::size_t port::write( const unsigned char* buf, std::size_t to_write ) { return boost::asio::write( _port, boost::asio::buffer( buf, to_write )); }
+
+} } } // namespace comma { namespace io { namespace serial {
diff --git a/io/serial.h b/io/serial.h
new file mode 100644
index 000000000..1fb129677
--- /dev/null
+++ b/io/serial.h
@@ -0,0 +1,43 @@
+// Copyright (c) 2023 Mission Systems Pty Ltd
+// All rights reserved.
+
+/// @author dave jennings
+
+#pragma once
+
+#include <boost/asio.hpp>
+#include <boost/optional.hpp>
+#include <comma/base/exception.h>
+
+namespace comma { namespace io { namespace serial {
+
+class port
+{
+    public:
+        port( const std::string& name );
+
+        /// open port as 8N1
+        port( const std::string& name, unsigned int baud_rate );
+
+        void set_baud_rate( unsigned int baud_rate );
+
+        void set_character_size( unsigned int character_size );
+
+        void set_flow_control( boost::asio::serial_port_base::flow_control::type flow_control );
+
+        void set_parity( boost::asio::serial_port_base::parity::type parity );
+
+        void set_stop_bits( boost::asio::serial_port_base::stop_bits::type stop_bits );
+
+        std::size_t read_some( unsigned char* buf, std::size_t buf_size );
+
+        std::size_t read_some( unsigned char* buf, std::size_t buf_size, const boost::asio::deadline_timer::duration_type& timeout );
+
+        std::size_t write( const unsigned char* buf, std::size_t to_write );
+
+    private:
+        boost::asio::io_service _service; // renamed as io_context in Boost 1.66 (io_service remains as typedef)
+        boost::asio::serial_port _port;
+};
+
+} } } // namespace comma { namespace io { namespace serial {

From d0f46a889e2d61554779517eb1ab1b3f89feee4a Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 15 Oct 2024 12:55:31 +1100
Subject: [PATCH 0956/1056] io::serial::port: signed char* read/write methods
 added for convenience

---
 io/serial.cpp | 12 ++++++++++++
 io/serial.h   |  6 ++++++
 2 files changed, 18 insertions(+)

diff --git a/io/serial.cpp b/io/serial.cpp
index 9984fc70d..5a589d860 100644
--- a/io/serial.cpp
+++ b/io/serial.cpp
@@ -29,6 +29,8 @@ void port::set_parity( boost::asio::serial_port_base::parity::type parity ) { _p
 
 void port::set_stop_bits( boost::asio::serial_port_base::stop_bits::type stop_bits ) { _port.set_option( boost::asio::serial_port_base::stop_bits( stop_bits )); }
 
+std::size_t port::read_some( char* buf, std::size_t size ) { return read_some( reinterpret_cast< unsigned char* >( buf ), size ); }
+
 std::size_t port::read_some( unsigned char* buf, std::size_t buf_size )
 {
     boost::system::error_code ec;
@@ -37,9 +39,17 @@ std::size_t port::read_some( unsigned char* buf, std::size_t buf_size )
     return count;
 }
 
+std::size_t port::read_some( char* buf
+                           , std::size_t size
+                           , const boost::asio::deadline_timer::duration_type& timeout )
+{
+    return read_some( reinterpret_cast< unsigned char* >( buf ), size, timeout );
+}
+
 std::size_t port::read_some( unsigned char* buf
                            , std::size_t buf_size
                            , const boost::asio::deadline_timer::duration_type& timeout )
+
 {
     boost::optional< boost::system::error_code > timer_result;
     boost::asio::deadline_timer timer( _service );
@@ -68,6 +78,8 @@ std::size_t port::read_some( unsigned char* buf
     return count;
 }
 
+std::size_t port::write( const char* buf, std::size_t to_write ) { return boost::asio::write( _port, boost::asio::buffer( buf, to_write )); }
+
 std::size_t port::write( const unsigned char* buf, std::size_t to_write ) { return boost::asio::write( _port, boost::asio::buffer( buf, to_write )); }
 
 } } } // namespace comma { namespace io { namespace serial {
diff --git a/io/serial.h b/io/serial.h
index 1fb129677..52393ca72 100644
--- a/io/serial.h
+++ b/io/serial.h
@@ -29,10 +29,16 @@ class port
 
         void set_stop_bits( boost::asio::serial_port_base::stop_bits::type stop_bits );
 
+        std::size_t read_some( char* buf, std::size_t buf_size );
+
         std::size_t read_some( unsigned char* buf, std::size_t buf_size );
 
+        std::size_t read_some( char* buf, std::size_t buf_size, const boost::asio::deadline_timer::duration_type& timeout );
+
         std::size_t read_some( unsigned char* buf, std::size_t buf_size, const boost::asio::deadline_timer::duration_type& timeout );
 
+        std::size_t write( const char* buf, std::size_t to_write );
+
         std::size_t write( const unsigned char* buf, std::size_t to_write );
 
     private:

From da3509f77762467cc3e214e174997a390b0568a4 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 15 Oct 2024 13:11:41 +1100
Subject: [PATCH 0957/1056] io/serial.h: use relative path to base/exception.h

so that the build works on a clean system when base/exception.h is not yet installed
---
 io/serial.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/io/serial.h b/io/serial.h
index 52393ca72..513d618dc 100644
--- a/io/serial.h
+++ b/io/serial.h
@@ -5,9 +5,9 @@
 
 #pragma once
 
+#include "../base/exception.h"
 #include <boost/asio.hpp>
 #include <boost/optional.hpp>
-#include <comma/base/exception.h>
 
 namespace comma { namespace io { namespace serial {
 

From dbcbfd349f1029647b49f62a20652116c3468661 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 15 Oct 2024 15:28:26 +1100
Subject: [PATCH 0958/1056] io::serial::port::properties implemented

---
 io/serial.cpp |  3 +++
 io/serial.h   |  8 ++++++++
 io/traits.h   | 28 ++++++++++++++++++++++++++++
 3 files changed, 39 insertions(+)
 create mode 100644 io/traits.h

diff --git a/io/serial.cpp b/io/serial.cpp
index 5a589d860..db9fcb6a3 100644
--- a/io/serial.cpp
+++ b/io/serial.cpp
@@ -9,9 +9,12 @@ namespace comma { namespace io { namespace serial {
 
 port::port( const std::string& name ): _port( _service, name ) {}
 
+port::port( const port::properties& p ): port( p.name, p.baud_rate ) {}
+
 port::port( const std::string& name, unsigned int baud_rate )
     : _port( _service, name )
 {
+    if( baud_rate == 0 ) { return; } // quick and dirty for now
     set_baud_rate( baud_rate );
     set_character_size( 8 );
     set_flow_control( boost::asio::serial_port_base::flow_control::none );
diff --git a/io/serial.h b/io/serial.h
index 513d618dc..8f27814ae 100644
--- a/io/serial.h
+++ b/io/serial.h
@@ -14,11 +14,19 @@ namespace comma { namespace io { namespace serial {
 class port
 {
     public:
+        struct properties
+        {
+            std::string name;
+            unsigned int baud_rate{0};
+        };
+
         port( const std::string& name );
 
         /// open port as 8N1
         port( const std::string& name, unsigned int baud_rate );
 
+        port( const properties& p );
+
         void set_baud_rate( unsigned int baud_rate );
 
         void set_character_size( unsigned int character_size );
diff --git a/io/traits.h b/io/traits.h
new file mode 100644
index 000000000..40d92a7f9
--- /dev/null
+++ b/io/traits.h
@@ -0,0 +1,28 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include "../visiting/traits.h"
+#include "serial.h"
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::io::serial::port::properties >
+{
+    template< typename K, typename V > static void visit( const K&, comma::io::serial::port::properties& t, V& v )
+    {
+        v.apply( "name", t.name );
+        v.apply( "baud_rate", t.baud_rate );
+    }
+    
+    template< typename K, typename V > static void visit( const K&, const comma::io::serial::port::properties& t, V& v )
+    {
+        v.apply( "name", t.name );
+        v.apply( "baud_rate", t.baud_rate );
+    }
+};
+
+} } // namespace comma { namespace visiting { 

From 0bc103a61f4a14bb25451fba95bbaf8da9e511fd Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 17 Oct 2024 14:19:39 +1100
Subject: [PATCH 0959/1056] comma-test-util: comma_test_interactive_commands:
 if command has neither instruction nor expected, run it as non-interactive

---
 util/applications/comma-test-util | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 522a155a8..a3ecf1522 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -120,6 +120,8 @@ function comma_test_commands_until_first_error() { _comma_test_commands_impl 1 "
 #
 # comma_test_interactive_commands
 #
+# if test case does not have both instruction and expected, it is deemed non-interactive
+#
 # see for an example: e.g. snark/graphics/applications/test/view-points/colour/scalar/options
 function comma_test_interactive_commands()
 {
@@ -134,9 +136,11 @@ function comma_test_interactive_commands()
             [[ -n "$command" ]] || { echo "$name/command not specified" >&2 ; echo "$name/status=1"; return 1 ; }
             eval "$command" &
             local eval_pid=$!
-            [[ $instruction ]] && dialog+="$instruction\n\n"
-            dialog+="do you see $expected?"
-            zenity --question --title="testcase $testcase_number of $number_of_testcases: $name" --text="$dialog" --width=600
+            if [[ -n "$instruction" || -n "$expected" ]]; then
+                [[ -z "$instruction" ]] || dialog+="$instruction\n\n"
+                if [[ -n "$expected" ]]; then dialog+="do you see: $expected?"; else dialog+="does it look good?"; fi
+                zenity --question --title="testcase $testcase_number of $number_of_testcases: $name" --text="$dialog" --width=600
+            fi
             result=$?
             echo "$name/status=$result"
             kill $( pgrep -P $eval_pid )break

From 866b901745bd6682fbca3b5c4a6e391d91b57046 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 18 Oct 2024 12:57:50 +1100
Subject: [PATCH 0960/1056] 
 bash/test/comma_name_value_util/comma_path_value_mangle: basic test for empty
 lines added

---
 .../comma_path_value_mangle/expected                 |  5 ++++-
 .../comma_path_value_mangle/test                     | 12 +++++++++---
 2 files changed, 13 insertions(+), 4 deletions(-)

diff --git a/bash/test/comma_name_value_util/comma_path_value_mangle/expected b/bash/test/comma_name_value_util/comma_path_value_mangle/expected
index 54da3e682..59c377d89 100644
--- a/bash/test/comma_name_value_util/comma_path_value_mangle/expected
+++ b/bash/test/comma_name_value_util/comma_path_value_mangle/expected
@@ -11,4 +11,7 @@ subscript/a_b_0='1'
 subscript_followed_by_path/a_b_0_c='1'
 a="123"
 b="123"
-c="123"
\ No newline at end of file
+c="123"
+
+skip_empty_lines_n='a'
+skip_empty_lines_v='b'
diff --git a/bash/test/comma_name_value_util/comma_path_value_mangle/test b/bash/test/comma_name_value_util/comma_path_value_mangle/test
index 78f608eff..be4561030 100755
--- a/bash/test/comma_name_value_util/comma_path_value_mangle/test
+++ b/bash/test/comma_name_value_util/comma_path_value_mangle/test
@@ -7,12 +7,18 @@ input="var_a=21
 var_b=22"
 
 echo "$input" | comma_path_value_mangle | sed 's|^|basic/|'
-
 echo -n "$input" | comma_path_value_mangle | sed 's|^|no_newline_at_end/|'
-
 echo "a/b/c=1" | comma_path_value_mangle | sed 's|^|path/|'
 echo "a-b-c=1" | comma_path_value_mangle | sed 's|^|dashes/|'
 echo "a/b-c=1" | comma_path_value_mangle | sed 's|^|path_with_dashes/|'
 echo "a/b[0]=1" | comma_path_value_mangle | sed 's|^|subscript/|'
 echo "a/b[0]/c=1" | comma_path_value_mangle | sed 's|^|subscript_followed_by_path/|'
-( echo a; echo b; echo c ) | comma_path_value_mangle '_' 123
\ No newline at end of file
+( echo a; echo b; echo c ) | comma_path_value_mangle '_' 123
+
+cat <<eof | comma_path_value_mangle
+
+skip_empty_lines/n=a
+
+skip_empty_lines/v=b
+
+eof
\ No newline at end of file

From 937e297055a7872988fcfc3e93c5207abc5cf5fd Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 18 Oct 2024 13:28:37 +1100
Subject: [PATCH 0961/1056] comma-test-util: comma_test_interactive_commands:
 fixed, non-interactive test support and actual-vs-expected comparison added;
 basic test implemented

---
 util/applications/comma-test-util       | 100 ++++++++++++------------
 util/test/test_run/interactive/disabled |   2 +-
 util/test/test_run/interactive/expected |  25 ++++++
 util/test/test_run/interactive/input    |  16 ++++
 util/test/test_run/interactive/test     |   6 +-
 5 files changed, 95 insertions(+), 54 deletions(-)
 create mode 100644 util/test/test_run/interactive/expected
 create mode 100644 util/test/test_run/interactive/input

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index a3ecf1522..629bbaf8e 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -39,26 +39,36 @@ readonly comma_test_util_include_guard_=1
 
 source $( type -p comma-name-value-util )
 
+function _comma_test_command_impl()
+{
+    local key="$1" value="$2"
+    value="${value/#\"}"
+    value="${value/%\"}"
+    output=$( eval "$value" )
+    status=$? # eval and bash -c both returns one error code, PIPESTATUS has only one value
+    if (( $( wc -l <<< "$output" ) > 1 )); then # a separate case for backward compatibility
+        local count=0
+        while read line; do
+            if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output/line[$count]" <<< "$line" # todo? escape quote? ${line//\"/\\\"}, otherwise they get removed by bash
+            else echo "$key/output/line[$count]=\"$line\""; fi
+            (( ++count ))
+        done <<< "$output"
+    else
+        if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output" <<< "$output" # todo? escape quotes, otherwise they get removed by bash
+        else echo "$key/output=\"$output\""; fi
+    fi
+    return $status
+}
+
+export -f _comma_test_command_impl
+
 function _comma_test_commands_impl()
 {
     local key value status output until_first_error=$1 fields=$2
     while IFS='=' read key value ; do
         [[ -n "$key" && ! "$key" =~ \#.* ]] || continue
-        value="${value/#\"}"
-        value="${value/%\"}"
-        output=$( eval "$value" )
-        status=$? # eval and bash -c both returns one error code, PIPESTATUS has only one value
-        if (( $( wc -l <<< "$output" ) > 1 )); then # a separate case for backward compatibility
-            local count=0
-            while read line; do
-                if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output/line[$count]" <<< "$line" # todo? escape quote? ${line//\"/\\\"}, otherwise they get removed by bash
-                else echo "$key/output/line[$count]=\"$line\""; fi
-                (( ++count ))
-            done <<< "$output"
-        else
-            if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output" <<< "$output" # todo? escape quotes, otherwise they get removed by bash
-            else echo "$key/output=\"$output\""; fi
-        fi
+        _comma_test_command_impl "$key" "$value"
+        status=$?
         echo "$key/status=$status"
         if (( status != 0 && until_first_error )); then break; fi
     done < <( grep '=' ; grep -v '^#' )
@@ -131,50 +141,40 @@ function comma_test_interactive_commands()
         function comma_test_interactive_test_case()
         {
             local name=$1 testcase_number=$2 number_of_testcases=$3
-            local command instruction expected dialog
-            eval $( comma_path_value_mangle | sed 's/^/local /' )
-            [[ -n "$command" ]] || { echo "$name/command not specified" >&2 ; echo "$name/status=1"; return 1 ; }
-            eval "$command" &
-            local eval_pid=$!
+            local command instruction expected dialog input
+            input=$( comma_path_value_mangle | sed 's/^/local /' )
+            eval "$input"
+            [[ -n "$command" ]] || { echo "$0: $name/command not specified" >&2 ; echo "$name/status=1"; return 1 ; }
             if [[ -n "$instruction" || -n "$expected" ]]; then
+                _comma_test_command_impl "$name" "$command" & # eval "$command" &
+                local eval_pid=$!
                 [[ -z "$instruction" ]] || dialog+="$instruction\n\n"
                 if [[ -n "$expected" ]]; then dialog+="do you see: $expected?"; else dialog+="does it look good?"; fi
                 zenity --question --title="testcase $testcase_number of $number_of_testcases: $name" --text="$dialog" --width=600
+                result=$?
+                echo "$name/status=$result"
+                kill $( pgrep -P $eval_pid )break
+                wait $eval_pid
+            else
+                _comma_test_command_impl "$name" "$command"
+                result=$?
+                echo "$name/status=$result"
             fi
-            result=$?
-            echo "$name/status=$result"
-            kill $( pgrep -P $eval_pid )break
-            wait $eval_pid
             return $result
         }
 
-        local test_case
-        local test_name
-        local path
         local lines=$( cat );
-        local number_of_testcases=$( grep '/command=' <<< "$lines" | wc -l )
-        local testcase_number=0
-        while read line ; do
-            [[ "$line" =~ ^# ]] && continue
-            local p=$( cut -d= -f1 <<< "$line" )
-            [[ -n "$p" ]] || continue
-            local n=$( dirname $p )
-            if [[ "$n" != "$test_name" ]] ; then
-                if [[ -n "$test_name" ]]; then
-                    comma_test_interactive_test_case $test_name $testcase_number $number_of_testcases <<< "$test_case"
-                    local r=$?
-                    if (( r != 0 && until_first_error )); then return $r; fi
-                fi
-                (( ++testcase_number ))
-                test_name=$n
-                test_case=
-            fi
-            n=${n//[/\\[}
-            n=${n//]/\\]}
-            test_case=$( echo "$test_case" ; sed "s#^$n/##" <<< "$line" )
-        done <<< "$lines"
-        if [[ -n "$test_case" ]] ; then comma_test_interactive_test_case $test_name $testcase_number $number_of_testcases <<< "$test_case" ; fi
-        return $?
+        local test_cases=$( grep '/command=' <<< "$lines" | cut -d= -f1 | egrep '^[a-zA-Z0-9_]' | sed 's#/command$##' )
+        local number_of_testcases=$( wc -l <<< "$test_cases" )
+        local testcase_number=0 test_case_name
+        while read test_case_name; do
+            local escaped="${test_case_name//[/\\[}"
+            local test_case=$( grep "^$escaped/" <<< "$lines" | sed "s#^$escaped/##" ) # grep --fixed-strings does not seem to work
+            comma_test_interactive_test_case $test_case_name $testcase_number $number_of_testcases <<< "$test_case"
+            local r=$?
+            if (( r != 0 && until_first_error )); then return $r; fi
+            (( ++testcase_number ))
+        done <<< "$test_cases"
     )
 }
 
diff --git a/util/test/test_run/interactive/disabled b/util/test/test_run/interactive/disabled
index bdee1f276..2808ba79e 100644
--- a/util/test/test_run/interactive/disabled
+++ b/util/test/test_run/interactive/disabled
@@ -1 +1 @@
-this test must be run manually using --interactive mode
+this is an interactive test that is run manually as needed
diff --git a/util/test/test_run/interactive/expected b/util/test/test_run/interactive/expected
new file mode 100644
index 000000000..9c98c5705
--- /dev/null
+++ b/util/test/test_run/interactive/expected
@@ -0,0 +1,25 @@
+interactive/success/output/line[0]="input"
+interactive/success/output/line[1]="test"
+interactive/success/status=0
+
+interactive/failure/by_user/output/line[0]="input"
+interactive/failure/by_user/output/line[1]="test"
+interactive/failure/by_user/status=1
+
+interactive/failure/by_expected/output/line[0]="blah"
+interactive/failure/by_expected/output/line[1]="blah"
+interactive/failure/by_expected/status=0
+
+non_interactive/success[0]/output/line[0]="input"
+non_interactive/success[0]/output/line[1]="test"
+non_interactive/success[0]/status=0
+
+non_interactive/success[1]/output/line[0]="input"
+non_interactive/success[1]/output/line[1]="test"
+non_interactive/success[1]/status=0
+
+non_interactive/failure[0]/output=""
+non_interactive/failure[0]/status=2
+
+non_interactive/failure[1]/output=""
+non_interactive/failure[1]/status=2
diff --git a/util/test/test_run/interactive/input b/util/test/test_run/interactive/input
new file mode 100644
index 000000000..b5cf8d733
--- /dev/null
+++ b/util/test/test_run/interactive/input
@@ -0,0 +1,16 @@
+interactive/success/command="ls input test"
+interactive/success/instruction="will run ls on current directory, press YES for the test to succeed"
+interactive/success/expected="list of files in current directory"
+
+interactive/failure/by_user/command="ls input test"
+interactive/failure/by_user/instruction="will run ls on current directory, press NO for the test to fail"
+interactive/failure/by_user/expected="list of files in current directory"
+
+interactive/failure/by_expected/command="ls input test"
+interactive/failure/by_expected/instruction="will run ls on current directory, press YES, the test still should fail on actual/expected mismatch"
+interactive/failure/by_expected/expected="list of files in current directory"
+
+non_interactive/success[0]/command="ls input test"
+non_interactive/success[1]/command="ls input test"
+non_interactive/failure[0]/command="ls non-existent-file"
+non_interactive/failure[1]/command="ls non-existent-file"
diff --git a/util/test/test_run/interactive/test b/util/test/test_run/interactive/test
index 764e581bc..f70da7533 100755
--- a/util/test/test_run/interactive/test
+++ b/util/test/test_run/interactive/test
@@ -1,7 +1,7 @@
 #!/bin/bash
 
 source $(type -p comma-application-util)
-source $(type -p comma-process-util)
+source $(type -p comma-test-util)
+
+comma_test_interactive_commands
 
-zenity --question --text="Do you want the test to succeed?"
-comma_status_ok || exit 1

From d038eac0a3a66a292f3b68b4cf6cc12c3039037b Mon Sep 17 00:00:00 2001
From: rex <rex@super>
Date: Mon, 21 Oct 2024 15:16:21 +1100
Subject: [PATCH 0962/1056] util/application/comma-test-util:
 comma_test_interactive_commands: behaviour made more consistent (zenity is
 run in background instead of system under test)

---
 util/applications/comma-test-util | 21 ++++++++-------------
 1 file changed, 8 insertions(+), 13 deletions(-)

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 629bbaf8e..96f5a0a19 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -141,25 +141,20 @@ function comma_test_interactive_commands()
         function comma_test_interactive_test_case()
         {
             local name=$1 testcase_number=$2 number_of_testcases=$3
-            local command instruction expected dialog input
+            local command instruction expected dialog input zenity_pid result
             input=$( comma_path_value_mangle | sed 's/^/local /' )
             eval "$input"
             [[ -n "$command" ]] || { echo "$0: $name/command not specified" >&2 ; echo "$name/status=1"; return 1 ; }
-            if [[ -n "$instruction" || -n "$expected" ]]; then
-                _comma_test_command_impl "$name" "$command" & # eval "$command" &
-                local eval_pid=$!
+            if [[ -n "$instruction" || -n "$expected" ]]; then                
                 [[ -z "$instruction" ]] || dialog+="$instruction\n\n"
                 if [[ -n "$expected" ]]; then dialog+="do you see: $expected?"; else dialog+="does it look good?"; fi
-                zenity --question --title="testcase $testcase_number of $number_of_testcases: $name" --text="$dialog" --width=600
-                result=$?
-                echo "$name/status=$result"
-                kill $( pgrep -P $eval_pid )break
-                wait $eval_pid
-            else
-                _comma_test_command_impl "$name" "$command"
-                result=$?
-                echo "$name/status=$result"
+                zenity --question --title="testcase $testcase_number of $number_of_testcases: $name" --text="$dialog" --width=600 &
+                zenity_pid=$!
             fi
+            _comma_test_command_impl "$name" "$command"
+            result=$?
+            if [[ -n "$zenity_pid" ]]; then wait $zenity_pid; result=$?; fi
+            echo "$name/status=$result"
             return $result
         }
 

From a96903fc9c4422292242bb7f672ba060725c01cb Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 22 Oct 2024 11:27:52 +1100
Subject: [PATCH 0963/1056] comma-test-util: comma_test_commands: unquoting
 improved

---
 util/applications/comma-test-util     | 20 ++++++++++++++++++--
 util/test/test_util/commands/expected | 20 ++++++++++++++++++++
 util/test/test_util/commands/input    |  6 ++++++
 util/test/test_util/commands/test     |  6 ++++++
 4 files changed, 50 insertions(+), 2 deletions(-)
 create mode 100644 util/test/test_util/commands/expected
 create mode 100644 util/test/test_util/commands/input
 create mode 100755 util/test/test_util/commands/test

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 96f5a0a19..a51b471be 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -39,11 +39,27 @@ readonly comma_test_util_include_guard_=1
 
 source $( type -p comma-name-value-util )
 
+function _comma_test_util_strip()
+{
+    cat <<eof
+import sys
+v = sys.stdin.readline().strip()
+assert v.startswith( '"' ), f'expected command string starting with double quote; got: {v}'
+assert v.endswith( '"' ), f'expected command string ending with with double quote"; got: {v}'
+print( v[1:-1] )
+eof
+}
+
+readonly _comma_test_util_strip_command="$( _comma_test_util_strip )"
+
+function comma_string_unquote() { python3 -c "$_comma_test_util_strip_command"; } # todo: add comma-string-util, parametrise on strip characters
+
+export -f comma_string_unquote
+
 function _comma_test_command_impl()
 {
     local key="$1" value="$2"
-    value="${value/#\"}"
-    value="${value/%\"}"
+    value=$( comma_string_unquote <<< "$value" )
     output=$( eval "$value" )
     status=$? # eval and bash -c both returns one error code, PIPESTATUS has only one value
     if (( $( wc -l <<< "$output" ) > 1 )); then # a separate case for backward compatibility
diff --git a/util/test/test_util/commands/expected b/util/test/test_util/commands/expected
new file mode 100644
index 000000000..2879510d6
--- /dev/null
+++ b/util/test/test_util/commands/expected
@@ -0,0 +1,20 @@
+basic/output/line[0]="expected"
+basic/output/line[1]="input"
+basic/output/line[2]="output"
+basic/output/line[3]="stats"
+basic/output/line[4]="test"
+basic/status=0
+quoted/single[0]/output/line[0]="input"
+quoted/single[0]/output/line[1]="test"
+quoted/single[0]/status=0
+quoted/single[1]/output/line[0]="input"
+quoted/single[1]/output/line[1]="test"
+quoted/single[1]/status=0
+quoted/double[0]/output/line[0]="input"
+quoted/double[0]/output/line[1]="test"
+quoted/double[0]/status=0
+quoted/double[1]/output/line[0]="input"
+quoted/double[1]/output/line[1]="test"
+quoted/double[1]/status=0
+trailing_spaces/output="input"
+trailing_spaces/status=0
diff --git a/util/test/test_util/commands/input b/util/test/test_util/commands/input
new file mode 100644
index 000000000..1810e53dd
--- /dev/null
+++ b/util/test/test_util/commands/input
@@ -0,0 +1,6 @@
+basic="ls"
+quoted/single[0]="ls 'input' 'test'"
+quoted/single[1]=" ls 'input' 'test' "
+quoted/double[0]="ls \"input\" \"test\""
+quoted/double[1]=" ls \"input\" \"test\" "
+trailing_spaces="ls input"   
diff --git a/util/test/test_util/commands/test b/util/test/test_util/commands/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/util/test/test_util/commands/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands

From dd3c18458cd1553ba4a3d6e8fe952167eb70ac48 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 22 Oct 2024 11:41:54 +1100
Subject: [PATCH 0964/1056] comma-test-util: comma_test_interactive_commands:
 unquoting improved

---
 util/applications/comma-test-util             | 10 ++++++++--
 .../test_util/interactive_commands/expected   | 20 +++++++++++++++++++
 .../test/test_util/interactive_commands/input |  6 ++++++
 util/test/test_util/interactive_commands/test |  6 ++++++
 4 files changed, 40 insertions(+), 2 deletions(-)
 create mode 100644 util/test/test_util/interactive_commands/expected
 create mode 100644 util/test/test_util/interactive_commands/input
 create mode 100755 util/test/test_util/interactive_commands/test

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index a51b471be..a3da5750c 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -158,8 +158,14 @@ function comma_test_interactive_commands()
         {
             local name=$1 testcase_number=$2 number_of_testcases=$3
             local command instruction expected dialog input zenity_pid result
-            input=$( comma_path_value_mangle | sed 's/^/local /' )
-            eval "$input"
+            #input=$( comma_path_value_mangle | sed 's/^/local /' )
+            #eval "$input"
+            while IFS='=' read key value; do # have to do it piecemeal to avoid bash quoting difficulties
+                if [[ "$key" == "command" ]]; then command="$value"
+                elif [[ "$key" == "instruction" ]]; then instruction="$value"
+                elif [[ "$key" == "expected" ]]; then expected="$value"
+                else echo "$0: test '$name': expected 'command', 'instruction', or 'expected', got: '$key'" >&2; return 1; fi
+            done
             [[ -n "$command" ]] || { echo "$0: $name/command not specified" >&2 ; echo "$name/status=1"; return 1 ; }
             if [[ -n "$instruction" || -n "$expected" ]]; then                
                 [[ -z "$instruction" ]] || dialog+="$instruction\n\n"
diff --git a/util/test/test_util/interactive_commands/expected b/util/test/test_util/interactive_commands/expected
new file mode 100644
index 000000000..2879510d6
--- /dev/null
+++ b/util/test/test_util/interactive_commands/expected
@@ -0,0 +1,20 @@
+basic/output/line[0]="expected"
+basic/output/line[1]="input"
+basic/output/line[2]="output"
+basic/output/line[3]="stats"
+basic/output/line[4]="test"
+basic/status=0
+quoted/single[0]/output/line[0]="input"
+quoted/single[0]/output/line[1]="test"
+quoted/single[0]/status=0
+quoted/single[1]/output/line[0]="input"
+quoted/single[1]/output/line[1]="test"
+quoted/single[1]/status=0
+quoted/double[0]/output/line[0]="input"
+quoted/double[0]/output/line[1]="test"
+quoted/double[0]/status=0
+quoted/double[1]/output/line[0]="input"
+quoted/double[1]/output/line[1]="test"
+quoted/double[1]/status=0
+trailing_spaces/output="input"
+trailing_spaces/status=0
diff --git a/util/test/test_util/interactive_commands/input b/util/test/test_util/interactive_commands/input
new file mode 100644
index 000000000..762a7c91b
--- /dev/null
+++ b/util/test/test_util/interactive_commands/input
@@ -0,0 +1,6 @@
+basic/command="ls"
+quoted/single[0]/command="ls 'input' 'test'"
+quoted/single[1]/command=" ls 'input' 'test' "
+quoted/double[0]/command="ls \"input\" \"test\""
+quoted/double[1]/command=" ls \"input\" \"test\" "
+trailing_spaces/command="ls input"   
diff --git a/util/test/test_util/interactive_commands/test b/util/test/test_util/interactive_commands/test
new file mode 100755
index 000000000..8b1bfde81
--- /dev/null
+++ b/util/test/test_util/interactive_commands/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_interactive_commands

From 592755b1196336d4cbb96b4035393ea4e46be2f9 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 22 Oct 2024 12:07:31 +1100
Subject: [PATCH 0965/1056] comma-test-util: comma_test_interactive_commands:
 unquoting improved

---
 util/applications/comma-test-util             | 33 ++++++++++++++-----
 util/test/test_util/commands/expected         |  6 ++++
 util/test/test_util/commands/input            |  3 ++
 .../test_util/interactive_commands/expected   |  9 +++++
 .../test/test_util/interactive_commands/input |  6 +++-
 5 files changed, 48 insertions(+), 9 deletions(-)

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index a3da5750c..db139bd3a 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -39,27 +39,42 @@ readonly comma_test_util_include_guard_=1
 
 source $( type -p comma-name-value-util )
 
+function _comma_test_util_unquote()
+{
+    cat <<eof
+import sys
+for v in sys.stdin.readlines(): 
+    v = v.strip()
+    assert v.startswith( '"' ), f'comma-string-unquote: expected string starting with double quote; got: {v}'
+    assert v.endswith( '"' ), f'comma-string-unquote: expected string ending with with double quote"; got: {v}'
+    print( v[1:-1] )
+eof
+}
+
 function _comma_test_util_strip()
 {
     cat <<eof
 import sys
-v = sys.stdin.readline().strip()
-assert v.startswith( '"' ), f'expected command string starting with double quote; got: {v}'
-assert v.endswith( '"' ), f'expected command string ending with with double quote"; got: {v}'
-print( v[1:-1] )
+for line in sys.stdin.readlines(): print( line.strip() )
 eof
 }
 
 readonly _comma_test_util_strip_command="$( _comma_test_util_strip )"
+readonly _comma_test_util_unquote_command="$( _comma_test_util_unquote )"
+
+function comma-string-strip() { python3 -c "$_comma_test_util_strip_command"; } # todo: add comma-string-util, parametrise on strip characters
+
+export -f comma-string-strip
 
-function comma_string_unquote() { python3 -c "$_comma_test_util_strip_command"; } # todo: add comma-string-util, parametrise on strip characters
+function comma-string-unquote() { python3 -c "$_comma_test_util_unquote_command"; } # todo: add comma-string-util, parametrise on strip characters
 
-export -f comma_string_unquote
+export -f comma-string-unquote
 
 function _comma_test_command_impl()
 {
     local key="$1" value="$2"
-    value=$( comma_string_unquote <<< "$value" )
+    key=$( comma-string-strip <<< "$key" )
+    value=$( comma-string-unquote <<< "$value" )
     output=$( eval "$value" )
     status=$? # eval and bash -c both returns one error code, PIPESTATUS has only one value
     if (( $( wc -l <<< "$output" ) > 1 )); then # a separate case for backward compatibility
@@ -83,6 +98,7 @@ function _comma_test_commands_impl()
     local key value status output until_first_error=$1 fields=$2
     while IFS='=' read key value ; do
         [[ -n "$key" && ! "$key" =~ \#.* ]] || continue
+        key=$( comma-string-strip <<< "$key" )
         _comma_test_command_impl "$key" "$value"
         status=$?
         echo "$key/status=$status"
@@ -161,6 +177,7 @@ function comma_test_interactive_commands()
             #input=$( comma_path_value_mangle | sed 's/^/local /' )
             #eval "$input"
             while IFS='=' read key value; do # have to do it piecemeal to avoid bash quoting difficulties
+                key=$( comma-string-strip <<< "$key" )
                 if [[ "$key" == "command" ]]; then command="$value"
                 elif [[ "$key" == "instruction" ]]; then instruction="$value"
                 elif [[ "$key" == "expected" ]]; then expected="$value"
@@ -181,7 +198,7 @@ function comma_test_interactive_commands()
         }
 
         local lines=$( cat );
-        local test_cases=$( grep '/command=' <<< "$lines" | cut -d= -f1 | egrep '^[a-zA-Z0-9_]' | sed 's#/command$##' )
+        local test_cases=$( cut -d= -f1 <<< "$lines" | grep -v '^#' | comma-string-strip | grep '/command$' | egrep '^[a-zA-Z0-9_]' | sed 's#/command$##' )
         local number_of_testcases=$( wc -l <<< "$test_cases" )
         local testcase_number=0 test_case_name
         while read test_case_name; do
diff --git a/util/test/test_util/commands/expected b/util/test/test_util/commands/expected
index 2879510d6..ca16897d4 100644
--- a/util/test/test_util/commands/expected
+++ b/util/test/test_util/commands/expected
@@ -10,6 +10,12 @@ quoted/single[0]/status=0
 quoted/single[1]/output/line[0]="input"
 quoted/single[1]/output/line[1]="test"
 quoted/single[1]/status=0
+quoted/single[2]/output/line[0]="input"
+quoted/single[2]/output/line[1]="test"
+quoted/single[2]/status=0
+quoted/single[3]/output/line[0]="input"
+quoted/single[3]/output/line[1]="test"
+quoted/single[3]/status=0
 quoted/double[0]/output/line[0]="input"
 quoted/double[0]/output/line[1]="test"
 quoted/double[0]/status=0
diff --git a/util/test/test_util/commands/input b/util/test/test_util/commands/input
index 1810e53dd..6772dad96 100644
--- a/util/test/test_util/commands/input
+++ b/util/test/test_util/commands/input
@@ -1,6 +1,9 @@
 basic="ls"
 quoted/single[0]="ls 'input' 'test'"
 quoted/single[1]=" ls 'input' 'test' "
+quoted/single[2]=    " ls 'input' 'test' "
+quoted/single[3] =    " ls 'input' 'test' "
 quoted/double[0]="ls \"input\" \"test\""
 quoted/double[1]=" ls \"input\" \"test\" "
 trailing_spaces="ls input"   
+# commented_test="exit 1"
\ No newline at end of file
diff --git a/util/test/test_util/interactive_commands/expected b/util/test/test_util/interactive_commands/expected
index 2879510d6..f91213a1a 100644
--- a/util/test/test_util/interactive_commands/expected
+++ b/util/test/test_util/interactive_commands/expected
@@ -10,6 +10,15 @@ quoted/single[0]/status=0
 quoted/single[1]/output/line[0]="input"
 quoted/single[1]/output/line[1]="test"
 quoted/single[1]/status=0
+quoted/single[2]/output/line[0]="input"
+quoted/single[2]/output/line[1]="test"
+quoted/single[2]/status=0
+quoted/single[3]/output/line[0]="input"
+quoted/single[3]/output/line[1]="test"
+quoted/single[3]/status=0
+quoted/single[4]/output/line[0]="input"
+quoted/single[4]/output/line[1]="test"
+quoted/single[4]/status=0
 quoted/double[0]/output/line[0]="input"
 quoted/double[0]/output/line[1]="test"
 quoted/double[0]/status=0
diff --git a/util/test/test_util/interactive_commands/input b/util/test/test_util/interactive_commands/input
index 762a7c91b..0ebad17f4 100644
--- a/util/test/test_util/interactive_commands/input
+++ b/util/test/test_util/interactive_commands/input
@@ -1,6 +1,10 @@
 basic/command="ls"
 quoted/single[0]/command="ls 'input' 'test'"
 quoted/single[1]/command=" ls 'input' 'test' "
+quoted/single[2]/command= " ls 'input' 'test' "
+quoted/single[3]/command =" ls 'input' 'test' "
+quoted/single[4]/command = " ls 'input' 'test' "
 quoted/double[0]/command="ls \"input\" \"test\""
 quoted/double[1]/command=" ls \"input\" \"test\" "
-trailing_spaces/command="ls input"   
+trailing_spaces/command="ls input"
+# commented_test/command="exit 1"  # todo: add checks to expected

From b939e4797e4bccb5c66c40e8cb7d3645aed0b7a7 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 22 Oct 2024 12:10:25 +1100
Subject: [PATCH 0966/1056] util/test/test_util/commands: todo comment added

---
 util/test/test_util/commands/input | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/util/test/test_util/commands/input b/util/test/test_util/commands/input
index 6772dad96..b83463c43 100644
--- a/util/test/test_util/commands/input
+++ b/util/test/test_util/commands/input
@@ -6,4 +6,4 @@ quoted/single[3] =    " ls 'input' 'test' "
 quoted/double[0]="ls \"input\" \"test\""
 quoted/double[1]=" ls \"input\" \"test\" "
 trailing_spaces="ls input"   
-# commented_test="exit 1"
\ No newline at end of file
+# commented_test="exit 1" # todo: add checks to expected
\ No newline at end of file

From f363223ca25643e51764670bb6c0f68ded45f5ef Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 22 Oct 2024 12:24:16 +1100
Subject: [PATCH 0967/1056] name_value/test/name-value-get: escaping fixed

---
 name_value/test/name-value-get/input | 26 +++++++++++++-------------
 1 file changed, 13 insertions(+), 13 deletions(-)

diff --git a/name_value/test/name-value-get/input b/name_value/test/name-value-get/input
index 36a1fce14..9afbc617d 100644
--- a/name_value/test/name-value-get/input
+++ b/name_value/test/name-value-get/input
@@ -1,28 +1,28 @@
-basics[0]=echo a=1 | name-value-get a
-basics[1]=echo '{ "a": 1, "b": 2, "c": 3}' | name-value-get b
+basics[0]="echo a=1 | name-value-get a"
+basics[1]="echo '{ \"a\": 1, \"b\": 2, \"c\": 3}' | name-value-get b"
 
-path[0]=echo '{ "a": 1, "b": 2, "c": { "d": 3 }}' | name-value-get c/d
-path[1]=( echo a/b/c=0; echo a/b/d=-1; ) | name-value-get a/b/d
+path[0]="echo '{ \"a\": 1, \"b\": 2, \"c\": { \"d\": 3 }}' | name-value-get c/d"
+path[1]="( echo a/b/c=0; echo a/b/d=-1; ) | name-value-get a/b/d"
 
-xml[0]=echo '{ "a": 1, "b": 2, "c": { "d": "omega" }}' | name-value-convert --to xml | name-value-get c/d
+xml[0]="echo '{ \"a\": 1, \"b\": 2, \"c\": { \"d\": \"omega\" }}' | name-value-convert --to xml | name-value-get c/d"
 
-non_existant[0]=echo '{ "a": 1, "b": 2, "c": { "d": 3 }}' | name-value-get d
-non_existant[1]=echo '{ "a": 1, "b": 2, "c": { "d": 3 }}' | name-value-get x/b
+non_existant[0]="echo '{ \"a\": 1, \"b\": 2, \"c\": { \"d\": 3 }}' | name-value-get d"
+non_existant[1]="echo '{ \"a\": 1, \"b\": 2, \"c\": { \"d\": 3 }}' | name-value-get x/b"
 
-empty_input[0]=name-value-get x < /dev/null
+empty_input[0]="name-value-get x < /dev/null"
 
 multiple_results[0]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-convert --to json | name-value-get a/b | tr '\\n' ';'"
-multiple_results[1]="( echo a/b/c=0; echo a/b/d=1; echo a/b/e=2; ) | name-value-get a/b | tr \'\\\n\' \';\'"
+multiple_results[1]="( echo a/b/c=0; echo a/b/d=1; echo a/b/e=2; ) | name-value-get a/b | tr '\\n' ';'"
 
 indexed_path[0]="echo a[0]=1 | name-value-get a[0]"
 indexed_path[1]="echo a[0]=1 | name-value-convert --to json | name-value-get a[0]"
-indexed_path[2]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a/b[0] | tr \'\\\n\' \';\'"
+indexed_path[2]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a/b[0] | tr '\\n' ';'"
 indexed_path[3]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a/b[1]/c"
-indexed_path[4]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a | tr \'\\\n\' \';\'"
+indexed_path[4]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a | tr '\\n' ';'"
 
 regex[0]="( echo a/alpha=0 ; echo a/aleph=1 ) | name-value-get 'a/ale.*' "
-regex[1]="( echo a/alpha=0 ; echo a/aleph=1; echo a/chi=2; ) | name-value-get 'a/al.*' | tr \'\\\n\' \';\'"
-regex[2]="( echo a/phi=0 ; echo a/psi=1; echo a/rho=2; ) | name-value-get --regex 'a/[pr]h[io]' | tr \'\\\n\' \';\'"
+regex[1]="( echo a/alpha=0 ; echo a/aleph=1; echo a/chi=2; ) | name-value-get 'a/al.*' | tr '\\n' ';'"
+regex[2]="( echo a/phi=0 ; echo a/psi=1; echo a/rho=2; ) | name-value-get --regex 'a/[pr]h[io]' | tr '\\n' ';'"
 
 whitespace[0]="( echo a/b/c=0; echo; echo a/b/d=1; echo; echo a/b/e=2; ) | name-value-get a/b/e"
 whitespace[1]="( echo a/b/c=0; echo a/b/d=1; echo a/b/ e =2; ) | name-value-get 'a/b/ e '"

From f79ee817cb184eb25323396da37f3d22b291403b Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 22 Oct 2024 13:20:32 +1100
Subject: [PATCH 0968/1056] csv/test/csv-strings: typo in test (missing quote)
 fixed

---
 csv/test/csv-strings/input | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
index f3b123240..3ace06be6 100644
--- a/csv/test/csv-strings/input
+++ b/csv/test/csv-strings/input
@@ -102,7 +102,7 @@ path_common/dirname[0]="{ echo /; } | csv-strings path-common --dirname-on-singl
 path_common/dirname[1]="{ echo /a; } | csv-strings path-common --dirname-on-single-record --once"
 path_common/dirname[2]="{ echo /aaa; } | csv-strings path-common --dirname-on-single-record --once"
 path_common/dirname[3]="{ echo /aaa/; } | csv-strings path-common --dirname-on-single-record --once"
-path_common/dirname[4]="{ echo /aaa/bbb; } | csv-strings path-common --dirname-on-single-record --once
+path_common/dirname[4]="{ echo /aaa/bbb; } | csv-strings path-common --dirname-on-single-record --once"
 path_common/dirname[5]="{ echo /aaa/bbb/ccc; } | csv-strings path-common --dirname-on-single-record --once"
 path_common/dirname[6]="{ echo a; } | csv-strings path-common --dirname-on-single-record --once"
 path_common/dirname[7]="{ echo aaa; } | csv-strings path-common --dirname-on-single-record --once"

From a73fa9958f8d684cff65e35db4016904a7312319 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 22 Oct 2024 13:22:22 +1100
Subject: [PATCH 0969/1056] csv/test/csv-blocks/group/input: typo in test
 (missing closing quote) fixed

---
 csv/test/csv-blocks/group/input | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/csv/test/csv-blocks/group/input b/csv/test/csv-blocks/group/input
index 79d9a03c2..627a1e016 100644
--- a/csv/test/csv-blocks/group/input
+++ b/csv/test/csv-blocks/group/input
@@ -14,11 +14,11 @@ group/scalar/span[5]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from s
 
 group/scalar/gap_and_span[0]="( echo 1; echo 2; echo 5; echo 6; echo 7; echo 8; echo 9 ) | csv-blocks group --fields scalar --gap 2 --span 4"
 
-group/scalar/range[0]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5
-group/scalar/range[1]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --discard-out-of-range
-group/scalar/range[2]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 1.5
-group/scalar/range[3]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 1.5 --discard-out-of-range
-group/scalar/range[4]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --max 2.5
-group/scalar/range[5]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --max 2.5 --discard-out-of-range
-group/scalar/range[6]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 0
-group/scalar/range[7]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 0 --discard-out-of-range
+group/scalar/range[0]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5"
+group/scalar/range[1]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --discard-out-of-range"
+group/scalar/range[2]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 1.5"
+group/scalar/range[3]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 1.5 --discard-out-of-range"
+group/scalar/range[4]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --max 2.5"
+group/scalar/range[5]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --max 2.5 --discard-out-of-range"
+group/scalar/range[6]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 0"
+group/scalar/range[7]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 0 --discard-out-of-range"

From 43f562cc4de71f15c728a38dd039d9f939374da1 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 22 Oct 2024 15:50:14 +1100
Subject: [PATCH 0970/1056] util/test/test_util: expected files fixed

---
 util/test/test_util/commands/expected             | 7 ++-----
 util/test/test_util/commands/input                | 2 +-
 util/test/test_util/interactive_commands/expected | 7 ++-----
 util/test/test_util/interactive_commands/input    | 2 +-
 4 files changed, 6 insertions(+), 12 deletions(-)

diff --git a/util/test/test_util/commands/expected b/util/test/test_util/commands/expected
index ca16897d4..905e619f1 100644
--- a/util/test/test_util/commands/expected
+++ b/util/test/test_util/commands/expected
@@ -1,8 +1,5 @@
-basic/output/line[0]="expected"
-basic/output/line[1]="input"
-basic/output/line[2]="output"
-basic/output/line[3]="stats"
-basic/output/line[4]="test"
+basic/output/line[0]="input"
+basic/output/line[1]="test"
 basic/status=0
 quoted/single[0]/output/line[0]="input"
 quoted/single[0]/output/line[1]="test"
diff --git a/util/test/test_util/commands/input b/util/test/test_util/commands/input
index b83463c43..11ba21a3f 100644
--- a/util/test/test_util/commands/input
+++ b/util/test/test_util/commands/input
@@ -1,4 +1,4 @@
-basic="ls"
+basic="ls input test"
 quoted/single[0]="ls 'input' 'test'"
 quoted/single[1]=" ls 'input' 'test' "
 quoted/single[2]=    " ls 'input' 'test' "
diff --git a/util/test/test_util/interactive_commands/expected b/util/test/test_util/interactive_commands/expected
index f91213a1a..7407a7975 100644
--- a/util/test/test_util/interactive_commands/expected
+++ b/util/test/test_util/interactive_commands/expected
@@ -1,8 +1,5 @@
-basic/output/line[0]="expected"
-basic/output/line[1]="input"
-basic/output/line[2]="output"
-basic/output/line[3]="stats"
-basic/output/line[4]="test"
+basic/output/line[0]="input"
+basic/output/line[1]="test"
 basic/status=0
 quoted/single[0]/output/line[0]="input"
 quoted/single[0]/output/line[1]="test"
diff --git a/util/test/test_util/interactive_commands/input b/util/test/test_util/interactive_commands/input
index 0ebad17f4..f4e02c174 100644
--- a/util/test/test_util/interactive_commands/input
+++ b/util/test/test_util/interactive_commands/input
@@ -1,4 +1,4 @@
-basic/command="ls"
+basic/command="ls input test"
 quoted/single[0]/command="ls 'input' 'test'"
 quoted/single[1]/command=" ls 'input' 'test' "
 quoted/single[2]/command= " ls 'input' 'test' "

From dde8e198e85a206e44677eddff09d35d826b3eba Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 28 Oct 2024 15:44:59 +1100
Subject: [PATCH 0971/1056] csv-play: --help: refactored

---
 csv/applications/csv-play.cpp | 133 +++++++++++++++++-----------------
 1 file changed, 68 insertions(+), 65 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 8e618a287..c392acd82 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -80,73 +80,76 @@ static void interactive_help( std::string prefix )
     std::cerr << prefix << "<q>: quit" << std::endl;
 }
 
-static void usage( bool )
+static void usage( bool verbose )
 {
-    std::cerr << std::endl;
-    std::cerr << "play back timestamped data from standard input in a real time manner" << std::endl;
-    std::cerr << "to standard output or optionally into given files/pipes" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: csv-play [<options>]" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --speed: speed-up playback by a factor, default is 1 (inverse to --slowdown)" << std::endl;
-    std::cerr << "    --slowdown,--slow: slow-down playback by a factor, default is 1 (inverse to --speed)" << std::endl;
-    std::cerr << "    --quiet: don't print warnings when lagging behind" << std::endl;
-    std::cerr << "    --fields <fields> : specify where timestamp is" << std::endl;
-    std::cerr << "                        e.g., if timestamp is the 4th field: --fields=\",,,t\"" << std::endl;
-    std::cerr << "                        default: the timestamp is the first field" << std::endl;
-    std::cerr << "    --binary <format> : use binary format" << std::endl;
-    std::cerr << "    --clients: minimum number of clients to connect to each stream" << std::endl;
-    std::cerr << "               before playback starts; default 0" << std::endl;
-    std::cerr << "               can be specified individually for each client, e.g." << std::endl;
-    std::cerr << "               csv-play file1;pipe;clients=1 file2;tcp:1234;clients=3" << std::endl;
-    std::cerr << "    --interactive,-i: react to key presses:" << std::endl;
+    std::cerr << R"(
+play back timestamped data from standard input in a real time manner
+to standard output or optionally into given files/pipes
+
+usage: csv-play [<options>]
+
+options
+    --speed: speed-up playback by a factor, default is 1 (inverse to --slowdown)
+    --slowdown,--slow: slow-down playback by a factor, default is 1 (inverse to --speed)
+    --quiet: don't print warnings when lagging behind
+    --fields <fields> : specify where timestamp is
+                        e.g., if timestamp is the 4th field: --fields=',,,t'
+                        default: the timestamp is the first field
+    --binary <format> : use binary format
+    --clients: minimum number of clients to connect to each stream
+               before playback starts; default 0
+               can be specified individually for each client, e.g.
+               csv-play file1;pipe;clients=1 file2;tcp:1234;clients=3
+    --interactive,-i: react to key presses:
+)";
     interactive_help( "    --interactive,-i: " );
-    std::cerr << "    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )" << std::endl;
-    std::cerr << "    --paused-at-start,--paused: start playback as paused, implies --interactive" << std::endl;
-    std::cerr << "    --pause-at=[<timestamp>]; pause when timestamp reached, implies --interactive" << std::endl;
-    std::cerr << "    --resolution=<second>: timestamp resolution; timestamps closer than this value will be" << std::endl;
-    std::cerr << "                           played without delay; the rationale is that microsleep used in csv-play" << std::endl;
-    std::cerr << "                           (boost::this_thread::sleep()) is essentially imprecise and may create" << std::endl;
-    std::cerr << "                           unnecessary delays in the data" << std::endl;
-    std::cerr << "                           default 0.01" << std::endl;
-    std::cerr << "    --from <timestamp> : play back data starting at <timestamp> ( iso format )" << std::endl;
-    std::cerr << "    --to <timestamp> : play back data up to <timestamp> ( iso format )" << std::endl;
-    std::cerr << comma::csv::format::usage();
-    std::cerr << std::endl;
-    std::cerr << "output" << std::endl;
-    std::cerr << "    -: write to stdout (default)" << std::endl;
-    std::cerr << "    offset=<offset>: add <offset> seconds to the timestamp of this source" << std::endl;
-    std::cerr << "    <filename>: write to file or named pipe, e.g. csv-play \"points.csv;pipe\"" << std::endl;
-    std::cerr << "    tcp:<port>: open tcp server socket on given port and write to the tcp clients" << std::endl;
-    std::cerr << "    local:<name>: same as tcp, but use unix/linux domain sockets" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << "    output timestamped 3d points in real time manner to stdout (e.g. for visualisation)" << std::endl;
-    std::cerr << "        cat points.csv | csv-play | view-points --fields=,x,y,z" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    play back several files and output to, say, named pipes:" << std::endl;
-    std::cerr << "        mkfifo file1.pipe file2.pipe" << std::endl;
-    std::cerr << "        csv-play \"file1.csv;pipe1\" \"file2.csv;pipe2\" &" << std::endl;
-    std::cerr << "        view-points pipe1 pipe2 --fields=,x,y,z" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    same as above, but block, until all the pipes are connected:" << std::endl;
-    std::cerr << "        csv-play \"file1.csv;pipe1\" \"file2.csv;pipe2\" --clients=1 &" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    output multiple inputs of the same format to stdout:" << std::endl;
-    std::cerr << "        csv-play \"file1.csv;-\" \"file2.csv;-\" &" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    use binary data (try it)" << std::endl;
-    std::cerr << "        > csv-play <( csv-paste line-number | csv-repeat --pace --period 1 | csv-time-amp | csv-to-bin t,ui --flush )';-;binary=t,ui' \\" << std::endl;
-    std::cerr << "                 <( csv-paste line-number value=0 | csv-repeat --pace --period 1 | csv-time-stamp | csv-to-bin t,2ui --flush )';tcp:8888;binary=t,2ui' \\" << std::endl;
-    std::cerr << "            | csv-from-bin t,ui" << std::endl;
-    std::cerr << "        > #in another shell, run" << std::endl;
-    std::cerr << "        > socat tcp:localhost:8888 - | csv-from-bin t,2ui" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    pause and step through output:" << std::endl;
-    std::cerr << "        echo 0 | csv-repeat --period 0.1 --yes | csv-paste - line-number \\" << std::endl;
-    std::cerr << "            | csv-time-stamp | csv-play --interactive" << std::endl;
-    std::cerr << std::endl;
+    std::cerr << R"(    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )
+    --paused-at-start,--paused: start playback as paused, implies --interactive
+    --pause-at=[<timestamp>]; pause when timestamp reached, implies --interactive
+    --resolution=<second>: timestamp resolution; timestamps closer than this value will be
+                           played without delay; the rationale is that microsleep used in csv-play
+                           (boost::this_thread::sleep()) is essentially imprecise and may create
+                           unnecessary delays in the data
+                           default 0.01
+    --from <timestamp> : play back data starting at <timestamp> ( iso format )
+    --to <timestamp> : play back data up to <timestamp> ( iso format )
+)" << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose );
+    std::cerr << R"(
+output
+    -: write to stdout (default)
+    offset=<offset>: add <offset> seconds to the timestamp of this source
+    <filename>: write to file or named pipe, e.g. csv-play 'points.csv;pipe'
+    tcp:<port>: open tcp server socket on given port and write to the tcp clients
+    local:<name>: same as tcp, but use unix/linux domain sockets
+
+examples
+    output timestamped 3d points in real time manner to stdout (e.g. for visualisation)
+        cat points.csv | csv-play | view-points --fields=,x,y,z
+
+    play back several files and output to, say, named pipes:
+        mkfifo file1.pipe file2.pipe
+        csv-play 'file1.csv;pipe1' 'file2.csv;pipe2' &
+        view-points pipe1 pipe2 --fields=,x,y,z
+
+    same as above, but block, until all the pipes are connected:
+        csv-play 'file1.csv;pipe1' 'file2.csv;pipe2' --clients=1 &
+
+    output multiple inputs of the same format to stdout:
+        csv-play 'file1.csv;-' 'file2.csv;-' &
+
+    use binary data (try it)
+        > csv-play <( csv-paste line-number | csv-repeat --pace --period 1 | csv-time-stamp | csv-to-bin t,ui --flush )';-;binary=t,ui' \
+                   <( csv-paste line-number value=0 | csv-repeat --pace --period 1 | csv-time-stamp | csv-to-bin t,2ui --flush )';tcp:8888;binary=t,2ui' \
+            | csv-from-bin t,ui
+        > #in another shell, run
+        > socat tcp:localhost:8888 - | csv-from-bin t,2ui
+
+    pause and step through output:
+        echo 0 | csv-repeat --period 0.1 --yes | csv-paste - line-number | csv-time-stamp | csv-play --interactive
+
+)" << std::endl;
     exit( 0 );
 }
 

From adf36972888c885278660037a899239c28685b51 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 28 Oct 2024 16:08:03 +1100
Subject: [PATCH 0972/1056] csv-play: minor brush-up

---
 csv/applications/csv-play.cpp | 61 ++++++++++-------------------------
 1 file changed, 17 insertions(+), 44 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index c392acd82..cdf57c61b 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -162,16 +162,15 @@ class playback_state_t
     playback_state_t() : state_( state::running ) {}
 
     bool is_running() const { return state_ == state::running; }
+
     bool is_paused() const { return state_ == state::paused; }
 
     void pause( const boost::posix_time::ptime& t = boost::posix_time::not_a_date_time )
     {
-        if( state_ != state::paused )
-        {
-            state_ = state::paused;
-            paused_time_ = boost::posix_time::microsec_clock::universal_time();
-            if( ! t.is_not_a_date_time() ) { std::cerr << "csv-play: paused at " << boost::posix_time::to_iso_string( t ) << std::endl; }
-        }
+        if( state_ == state::paused ) { return; }
+        state_ = state::paused;
+        paused_time_ = boost::posix_time::microsec_clock::universal_time();
+        if( ! t.is_not_a_date_time() ) { std::cerr << "csv-play: paused at " << boost::posix_time::to_iso_string( t ) << std::endl; }
     }
 
     void unpause()
@@ -181,12 +180,10 @@ class playback_state_t
 
     void run()
     {
-        if( state_ != state::running )
-        {
-            if( state_ == state::paused ) { unpause(); }
-            state_ = state::running;
-            std::cerr << "csv-play: resumed" << std::endl;
-        }
+        if( state_ == state::running ) { return; }
+        if( state_ == state::paused ) { unpause(); }
+        state_ = state::running;
+        std::cerr << "csv-play: resumed" << std::endl;
     }
 
     void read_once()
@@ -195,14 +192,10 @@ class playback_state_t
         state_ = state::read_once;
     }
 
-    void has_read_once()
-    {
-        if( state_ == state::read_once ) { pause(); }
-    }
+    void has_read_once() { if( state_ == state::read_once ) { pause(); } }
 
 private:
     enum class state { running, paused, read_once, read_block };
-
     state state_;
     boost::posix_time::ptime paused_time_;
 };
@@ -219,23 +212,11 @@ class key_press_handler_t
         key k = get_key();
         switch( k )
         {
-            case key::space:
-                if( playback.is_running() ) { playback.pause( t ); }
-                else { playback.run(); }
-                break;
-            case key::down_arrow:
-            case key::right_arrow:
-                playback.read_once();
-                break;
-            case key::q:
-                quit = true;
-                break;
-            case key::t:
-                std::cerr << boost::posix_time::to_iso_string( t ) << std::endl;
-                break;
-            case key::none:
-            case key::other:
-                break;
+            case key::space: if( playback.is_running() ) { playback.pause( t ); } else { playback.run(); } break;
+            case key::down_arrow: case key::right_arrow: playback.read_once(); break;
+            case key::q: quit = true; break;
+            case key::t: std::cerr << boost::posix_time::to_iso_string( t ) << std::endl; break;
+            case key::none: case key::other: break;
         }
     }
     
@@ -346,16 +327,8 @@ int main( int argc, char** argv )
         {
             boost::posix_time::ptime now = multiplay->now();
             key_press_handler.update( now );
-            if( pause_at_timestamp && !now.is_not_a_date_time() && *pause_at_timestamp < now )
-            {
-                playback.pause( now );
-                pause_at_timestamp = boost::none;
-            }
-            if( playback.is_paused() )
-            {
-                boost::this_thread::sleep( boost::posix_time::millisec( 200 ) );
-                continue;
-            }
+            if( pause_at_timestamp && !now.is_not_a_date_time() && *pause_at_timestamp < now ) { playback.pause( now ); pause_at_timestamp = boost::none; }
+            if( playback.is_paused() ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); continue; }
             if( !multiplay->read() ) { break; }
             playback.has_read_once();
         }

From 6311331a7f66fc5422d985bd1fbe54f253bcf6bf Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 28 Oct 2024 16:23:29 +1100
Subject: [PATCH 0973/1056] csv-play: minor brush-up

---
 csv/applications/csv-play.cpp       | 10 ++---
 csv/applications/play/multiplay.cpp | 66 +++++++++--------------------
 csv/applications/play/multiplay.h   | 58 ++++++++++---------------
 csv/applications/play/play.cpp      | 22 +++-------
 csv/applications/play/play.h        |  6 +--
 5 files changed, 54 insertions(+), 108 deletions(-)

diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index cdf57c61b..66e513089 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -153,7 +153,7 @@ examples
     exit( 0 );
 }
 
-static boost::scoped_ptr< comma::Multiplay > multiplay;
+static boost::scoped_ptr< comma::csv::applications::play::Multiplay > multiplay;
 static bool quit = false;
 
 class playback_state_t
@@ -308,14 +308,14 @@ int main( int argc, char** argv )
         comma::csv::options csv( argc, argv );
         csv.full_xpath = false;
         comma::name_value::parser name_value("filename,output", ';', '=', false );
-        std::vector< comma::Multiplay::SourceConfig > sourceConfigs( configstrings.size() );
-        comma::Multiplay::SourceConfig defaultConfig( "-", options.value( "--clients", 0 ), csv );
-        for( unsigned int i = 0U; i < configstrings.size(); ++i ) { sourceConfigs[i] = name_value.get< comma::Multiplay::SourceConfig >( configstrings[i], defaultConfig ); }
+        std::vector< comma::csv::applications::play::Multiplay::SourceConfig > source_configs( configstrings.size() );
+        comma::csv::applications::play::Multiplay::SourceConfig defaultConfig( "-", options.value( "--clients", 0 ), csv );
+        for( unsigned int i = 0U; i < configstrings.size(); ++i ) { source_configs[i] = name_value.get< comma::csv::applications::play::Multiplay::SourceConfig >( configstrings[i], defaultConfig ); }
         boost::posix_time::ptime fromtime;
         if( !from.empty() ) { fromtime = boost::posix_time::from_iso_string( from ); }
         boost::posix_time::ptime totime;
         if( !to.empty() ) { totime = boost::posix_time::from_iso_string( to ); }
-        multiplay.reset( new comma::Multiplay( sourceConfigs, speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int>( resolution * 1000000 )), fromtime, totime, flush ));
+        multiplay.reset( new comma::csv::applications::play::Multiplay( source_configs, speed, quiet, boost::posix_time::microseconds( static_cast< unsigned int >( resolution * 1000000 )), fromtime, totime, flush ));
         if( options.exists( "--paused,--paused-at-start" )) { playback.pause(); }
         boost::optional< std::string > pause_at_option = options.optional< std::string >( "--pause-at" );
         boost::optional< boost::posix_time::ptime > pause_at_timestamp = boost::make_optional< boost::posix_time::ptime >( false, boost::posix_time::not_a_date_time );
diff --git a/csv/applications/play/multiplay.cpp b/csv/applications/play/multiplay.cpp
index ac590b0ee..6c22eec26 100644
--- a/csv/applications/play/multiplay.cpp
+++ b/csv/applications/play/multiplay.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
 #include <sstream>
@@ -35,13 +34,8 @@
 #include "../../../string/string.h"
 #include "multiplay.h"
 
-namespace comma {
-
+namespace comma { namespace csv { namespace applications { namespace play {
 
-/*!
-    @brief Constructor
-    @param configs csv options
-*/
 Multiplay::Multiplay( const std::vector< SourceConfig >& configs
                     , double speed
                     , bool quiet
@@ -51,8 +45,8 @@ Multiplay::Multiplay( const std::vector< SourceConfig >& configs
                     , bool flush )
     : m_configs( configs )
     , istreams_( configs.size() )
-    , m_inputStreams( configs.size() )
-    , m_publishers( configs.size() )
+    , _input_streams( configs.size() )
+    , _publishers( configs.size() )
     , m_play( speed, quiet, resolution )
     , m_timestamps( configs.size() )
     , m_started( false )
@@ -66,11 +60,11 @@ Multiplay::Multiplay( const std::vector< SourceConfig >& configs
         // todo: quick and dirty for now: blocking streams for named pipes
         istreams_[i].reset( new io::istream( configs[i].options.filename, m_configs[i].options.binary() ? io::mode::binary : io::mode::ascii, io::mode::blocking ) );
         if( !( *istreams_[i] )() ) { COMMA_THROW( comma::exception, "named pipe " << configs[i].options.filename << " is closed (todo: support closed named pipes)" ); }
-        m_inputStreams[i].reset( new csv::input_stream< time >( *( *istreams_[i] )(), m_configs[i].options ) );
+        _input_streams[i].reset( new csv::input_stream< time >( *( *istreams_[i] )(), m_configs[i].options ) );
         unsigned int j;
         for( j = 0; j < i && configs[j].outputFileName != configs[i].outputFileName; ++j ); // quick and dirty: unique publishers
-        if( j == i ) { m_publishers[i].reset( new io::publisher( configs[i].outputFileName, m_configs[i].options.binary() ? io::mode::binary : io::mode::ascii, true, flush ) ); }
-        else { m_publishers[i] = m_publishers[j]; }
+        if( j == i ) { _publishers[i].reset( new io::publisher( configs[i].outputFileName, m_configs[i].options.binary() ? io::mode::binary : io::mode::ascii, true, flush ) ); }
+        else { _publishers[i] = _publishers[j]; }
         boost::posix_time::time_duration d;
         if( configs[i].offset.total_microseconds() != 0 )
         {
@@ -92,7 +86,7 @@ void Multiplay::close()
     for( unsigned int i = 0U; i < m_configs.size(); i++ )
     {
         istreams_[i]->close();
-        m_publishers[i]->close();
+        _publishers[i]->close();
     }
 }
 
@@ -112,21 +106,14 @@ bool Multiplay::ready() // quick and dirty; should not it be in io::Publisher?
     if( m_started ) { return true; }
     for( unsigned int i = 0; i < m_configs.size(); ++i )
     {
-        m_publishers[i]->accept();
-        if( m_publishers[i]->size() < m_configs[i].minNumberOfClients )
-        {
-            boost::this_thread::sleep( boost::posix_time::millisec( 200 ) );
-            return false;
-        }
+        _publishers[i]->accept();
+        if( _publishers[i]->size() < m_configs[i].minNumberOfClients ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); return false; }
     }
     m_started = true;
     return true;
 }
     
-/*!
-    @brief try to read from all files and write the oldest
-    @return true if at least one file could be read
-*/
+/// @brief try to read from all files and write the oldest; return true if at least one file could be read
 bool Multiplay::read()
 {
     if( !ready() ) { return true; }
@@ -134,19 +121,12 @@ bool Multiplay::read()
     for( unsigned int i = 0U; i < m_configs.size(); ++i )
     {
         if( !m_timestamps[i].is_not_a_date_time() ) { end = false; continue; }
-        const time* time = m_inputStreams[i]->read();
+        const time* time = _input_streams[i]->read();
         if( time == NULL ) { continue; }
         boost::posix_time::ptime t = time->timestamp;
-        if( m_configs[i].offset.total_microseconds() != 0 )
-        {
-            t += m_configs[i].offset;
-        }
+        if( m_configs[i].offset.total_microseconds() != 0 ) { t += m_configs[i].offset; }
         end = false;
-        if( ( ( !m_from.is_not_a_date_time() ) && ( t < m_from ) ) || ( ( !m_to.is_not_a_date_time() ) && ( t > m_to ) ) )
-        {            
-            i--;
-            continue;
-        }
+        if( ( ( !m_from.is_not_a_date_time() ) && ( t < m_from ) ) || ( ( !m_to.is_not_a_date_time() ) && ( t > m_to ) ) ) { i--; continue; }
         m_timestamps[i] = t;
     }
     if( end ) { return false; }
@@ -158,23 +138,20 @@ bool Multiplay::read()
         oldest = m_timestamps[i];
         index = i;
     }
-    if( ( ( !m_from.is_not_a_date_time() ) && ( oldest < m_from ) ) || ( ( !m_to.is_not_a_date_time() ) && ( oldest > m_to ) ) )
-    {
-        return true;
-    }
+    if( ( ( !m_from.is_not_a_date_time() ) && ( oldest < m_from ) ) || ( ( !m_to.is_not_a_date_time() ) && ( oldest > m_to ) ) ) { return true; }
     now_ = oldest;
     m_play.wait( oldest );
     if( m_configs[index].options.binary() )
     {
         if( binary_[index] )
         {
-            ::memcpy( &buf_fer[0], m_inputStreams[index]->binary().last(), buf_fer.size() );
+            ::memcpy( &buf_fer[0], _input_streams[index]->binary().last(), buf_fer.size() );
             binary_[index]->put( time( oldest ), &buf_fer[0] );
-            m_publishers[index]->write( &buf_fer[0], buf_fer.size() );
+            _publishers[index]->write( &buf_fer[0], buf_fer.size() );
         }
         else
         {
-            m_publishers[index]->write( m_inputStreams[index]->binary().last(), m_configs[index].options.format().size() );
+            _publishers[index]->write( _input_streams[index]->binary().last(), m_configs[index].options.format().size() );
         }
     }
     else
@@ -182,18 +159,17 @@ bool Multiplay::read()
         static std::string endl = impl::endl(); // quick and dirty, since publisher is not std::stream
         if( ascii_[index] )
         {
-            std::vector< std::string > last = m_inputStreams[index]->ascii().last();
+            std::vector< std::string > last = _input_streams[index]->ascii().last();
             ascii_[index]->put( time( oldest ), last );
-            ( *m_publishers[index] ) << comma::join( last, m_configs[index].options.delimiter ) << endl;
+            ( *_publishers[index] ) << comma::join( last, m_configs[index].options.delimiter ) << endl;
         }
         else
         {
-            ( *m_publishers[index] ) << comma::join( m_inputStreams[index]->ascii().last(), m_configs[index].options.delimiter ) << endl;
+            ( *_publishers[index] ) << comma::join( _input_streams[index]->ascii().last(), m_configs[index].options.delimiter ) << endl;
         }
     }
     m_timestamps[index] = boost::posix_time::not_a_date_time;
     return true;
 }
 
-} // namespace comma {
-
+} } } } // namespace comma { namespace csv { namespace applications { namespace play {
diff --git a/csv/applications/play/multiplay.h b/csv/applications/play/multiplay.h
index 040db7bcd..ec3816df6 100644
--- a/csv/applications/play/multiplay.h
+++ b/csv/applications/play/multiplay.h
@@ -30,17 +30,17 @@
 
 /// @author cedric wohlleber
 
-#ifndef COMMA_CSV_MULTIPLAY_H
-#define COMMA_CSV_MULTIPLAY_H
+#pragma once
 
 #include <vector>
 #include <boost/thread/thread_time.hpp>
 #include "../../../csv/options.h"
 #include "../../../csv/stream.h"
 #include "../../../io/publisher.h"
+#include "../../../io/stream.h"
 #include "play.h"
 
-namespace comma {
+namespace comma { namespace csv { namespace applications { namespace play {
 
 /// gets data from multiple input files, and output in a real time manner to output files,  using timestamps
 class Multiplay
@@ -59,21 +59,18 @@ class Multiplay
             std::size_t minNumberOfClients;
             csv::options options;
             boost::posix_time::time_duration offset;
-            SourceConfig( const std::string& output, const csv::options& csv ) :
-                outputFileName( output ), minNumberOfClients( 0 ), options( csv ) {}
-            SourceConfig( const std::string& output, std::size_t n, const csv::options& csv ) :
-                outputFileName( output ), minNumberOfClients( n ), options( csv ) {}
+            SourceConfig( const std::string& output, const csv::options& csv ): outputFileName( output ), minNumberOfClients( 0 ), options( csv ) {}
+            SourceConfig( const std::string& output, std::size_t n, const csv::options& csv ): outputFileName( output ), minNumberOfClients( n ), options( csv ) {}
             SourceConfig() { options.full_xpath = false; };
         };
 
         Multiplay( const std::vector< SourceConfig >& configs
-                , double speed = 1.0
-                , bool quiet = false
-                , const boost::posix_time::time_duration& resolution = boost::posix_time::milliseconds( 1 )
-                , boost::posix_time::ptime from = boost::posix_time::not_a_date_time
-                , boost::posix_time::ptime to = boost::posix_time::not_a_date_time
-                , bool flush = true
-                 );
+                 , double speed = 1.0
+                 , bool quiet = false
+                 , const boost::posix_time::time_duration& resolution = boost::posix_time::milliseconds( 1 )
+                 , boost::posix_time::ptime from = boost::posix_time::not_a_date_time
+                 , boost::posix_time::ptime to = boost::posix_time::not_a_date_time
+                 , bool flush = true );
 
         void close();
 
@@ -86,8 +83,8 @@ class Multiplay
     private:
         std::vector<SourceConfig> m_configs;
         std::vector< boost::shared_ptr< comma::io::istream > > istreams_;
-        std::vector< boost::shared_ptr< csv::input_stream< time > > > m_inputStreams;
-        std::vector< boost::shared_ptr< comma::io::publisher > > m_publishers;
+        std::vector< boost::shared_ptr< csv::input_stream< time > > > _input_streams;
+        std::vector< boost::shared_ptr< comma::io::publisher > > _publishers;
         csv::impl::play m_play;
         std::vector< boost::posix_time::ptime > m_timestamps;
         boost::posix_time::ptime now_;
@@ -100,29 +97,21 @@ class Multiplay
         bool ready();
 };
 
-} // namespace comma {
+} } } } // namespace comma { namespace csv { namespace applications { namespace play {
 
 namespace comma { namespace visiting {
 
-template <> struct traits< comma::Multiplay::time >
+template <> struct traits< comma::csv::applications::play::Multiplay::time >
 {
-    template < typename Key, class Visitor >
-    static void visit( Key, comma::Multiplay::time& t, Visitor& v )
-    {
-        v.apply( "t", t.timestamp );
-    }
-
-    template < typename Key, class Visitor >
-    static void visit( Key, const comma::Multiplay::time& t, Visitor& v )
-    {
-        v.apply( "t", t.timestamp );
-    }
+    typedef comma::csv::applications::play::Multiplay::time type_t;
+    template < typename Key, class Visitor > static void visit( Key, type_t& t, Visitor& v ) { v.apply( "t", t.timestamp ); }
+    template < typename Key, class Visitor > static void visit( Key, const type_t& t, Visitor& v ) { v.apply( "t", t.timestamp ); }
 };
 
-template <> struct traits< comma::Multiplay::SourceConfig >
+template <> struct traits< comma::csv::applications::play::Multiplay::SourceConfig >
 {
-    template < typename Key, class Visitor >
-    static void visit( Key, comma::Multiplay::SourceConfig& c, Visitor& v )
+    typedef comma::csv::applications::play::Multiplay::SourceConfig type_t;
+    template < typename Key, class Visitor > static void visit( Key, type_t& c, Visitor& v )
     {
         v.apply( "options", c.options );
         v.apply( "output", c.outputFileName );
@@ -132,8 +121,7 @@ template <> struct traits< comma::Multiplay::SourceConfig >
 		c.offset = boost::posix_time::microseconds( static_cast< boost::int64_t >( duration * 1e6 ) );
     }
 
-    template < typename Key, class Visitor >
-    static void visit( Key, const comma::Multiplay::SourceConfig& c, Visitor& v )
+    template < typename Key, class Visitor > static void visit( Key, const type_t& c, Visitor& v )
     {
         v.apply( "options", c.options );
         v.apply( "output", c.outputFileName );
@@ -145,5 +133,3 @@ template <> struct traits< comma::Multiplay::SourceConfig >
 };
 
 } } // namespace comma { namespace visiting {
-
-#endif // COMMA_CSV_MULTIPLAY_H
diff --git a/csv/applications/play/play.cpp b/csv/applications/play/play.cpp
index 3d794e4b6..f138045e8 100644
--- a/csv/applications/play/play.cpp
+++ b/csv/applications/play/play.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
 #include <boost/thread/thread.hpp>
@@ -54,7 +53,6 @@ play::play( double speed, bool quiet, const boost::posix_time::time_duration& re
 /// @param time timestamp as ptime
 void play::wait( const boost::posix_time::ptime& time )
 {
-
     if ( !m_times_initialized )
     {
         boost::posix_time::ptime systemTime = boost::get_system_time();
@@ -70,7 +68,7 @@ void play::wait( const boost::posix_time::ptime& time )
             boost::posix_time::ptime systemTime = boost::get_system_time();
             const boost::posix_time::ptime target = m_systemFirst + boost::posix_time::milliseconds( static_cast<long>(( time - m_first ).total_milliseconds() / m_speed ) );
             const boost::posix_time::time_duration lag = systemTime - target;
-            if ( !m_quiet && ( lag > m_resolution ) ) // no need to be alarmed for a lag less than the expected accuracy
+            if ( !m_quiet && lag > m_resolution ) // no need to be alarmed for a lag less than the expected accuracy
             {
                 if( !m_lag )
                 {
@@ -83,14 +81,11 @@ void play::wait( const boost::posix_time::ptime& time )
             {
                 if( !m_quiet && m_lag )
                 {
-                    m_lag = false;
                     std::cerr << "csv-play: recovered after " << m_lagCounter << " packets " << std::endl;
+                    m_lag = false;
                     m_lagCounter = 0U;
                 }
-                if ( lag < -m_resolution ) // no need to sleep less than the expected accuracy
-                {
-                    boost::this_thread::sleep( target );
-                }
+                if( lag < -m_resolution ) { boost::this_thread::sleep( target ); } // no need to sleep less than the expected accuracy
             }
             m_last = time;
         }
@@ -103,17 +98,10 @@ void play::wait( const boost::posix_time::ptime& time )
 
 /// wait until a timestamp
 /// @param isoTime timestamp in iso format
-void play::wait( const std::string& isoTime )
-{
-    wait( boost::posix_time::from_iso_string( isoTime ) );
-}
+void play::wait( const std::string& isoTime ) { wait( boost::posix_time::from_iso_string( isoTime ) ); }
 
 /// allow for a pause in playback
 /// @param pause_duration duration of pause
-void play::paused_for( const boost::posix_time::time_duration& pause_duration )
-{
-    if( m_times_initialized ) { m_systemFirst += pause_duration; }
-}
-
+void play::paused_for( const boost::posix_time::time_duration& pause_duration ) { if( m_times_initialized ) { m_systemFirst += pause_duration; } }
 
 } } } // namespace comma { namespace csv { namespace impl {
diff --git a/csv/applications/play/play.h b/csv/applications/play/play.h
index fa9acccbf..e4b0815ff 100644
--- a/csv/applications/play/play.h
+++ b/csv/applications/play/play.h
@@ -27,11 +27,9 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
-#ifndef COMMA_CSV_APPLICATIONS_PLAY_H
-#define COMMA_CSV_APPLICATIONS_PLAY_H
+#pragma once
 
 #include <boost/optional.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
@@ -63,5 +61,3 @@ class play
 };
 
 } } } // namespace comma { namespace csv { namespace impl {
-
-#endif // COMMA_CSV_APPLICATIONS_PLAY_H

From 4af210ae6b7f0a91ce557a74571eb78b25283747 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 28 Oct 2024 17:06:38 +1100
Subject: [PATCH 0974/1056] csv-play: optionally using clients rather than
 servers for output streams; plugging in...

---
 csv/applications/CMakeLists.txt     |  2 +-
 csv/applications/play/multiplay.cpp | 14 +++++-----
 csv/applications/play/multiplay.h   | 41 +++++++++++++++++++++++++++--
 3 files changed, 47 insertions(+), 10 deletions(-)

diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index b0d3ed4fe..9a3b6fa06 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -34,7 +34,7 @@ add_executable( csv-from-bin ${dir}/csv-from-bin.cpp )
 add_executable( csv-calc ${dir}/csv-calc.cpp )
 add_executable( csv-calc-new ${dir}/csv-calc.new.cpp )
 add_executable( csv-crc ${dir}/csv-crc.cpp )
-add_executable( csv-play ${dir}/csv-play.cpp ${dir}/play/multiplay.cpp ${dir}/play/play.cpp )
+add_executable( csv-play ${dir}/csv-play.cpp ${dir}/play/multiplay.h ${dir}/play/multiplay.cpp ${dir}/play/play.h ${dir}/play/play.cpp )
 add_executable( csv-shape ${dir}/csv-shape.cpp )
 add_executable( csv-shuffle ${dir}/csv-shuffle.cpp )
 add_executable( csv-thin ${dir}/csv-thin.cpp )
diff --git a/csv/applications/play/multiplay.cpp b/csv/applications/play/multiplay.cpp
index 6c22eec26..75777355c 100644
--- a/csv/applications/play/multiplay.cpp
+++ b/csv/applications/play/multiplay.cpp
@@ -63,7 +63,7 @@ Multiplay::Multiplay( const std::vector< SourceConfig >& configs
         _input_streams[i].reset( new csv::input_stream< time >( *( *istreams_[i] )(), m_configs[i].options ) );
         unsigned int j;
         for( j = 0; j < i && configs[j].outputFileName != configs[i].outputFileName; ++j ); // quick and dirty: unique publishers
-        if( j == i ) { _publishers[i].reset( new io::publisher( configs[i].outputFileName, m_configs[i].options.binary() ? io::mode::binary : io::mode::ascii, true, flush ) ); }
+        if( j == i ) { _publishers[i].reset( new comma::csv::applications::play::server_publisher( configs[i].outputFileName, m_configs[i].options.binary(), flush ) ); }
         else { _publishers[i] = _publishers[j]; }
         boost::posix_time::time_duration d;
         if( configs[i].offset.total_microseconds() != 0 )
@@ -71,7 +71,7 @@ Multiplay::Multiplay( const std::vector< SourceConfig >& configs
             if( m_configs[i].options.binary() )
             {
                 binary_[i].reset( new csv::binary< time >( m_configs[i].options.fields ) );
-                buf_fer.resize( m_configs[i].options.format().size() );
+                _buffer.resize( m_configs[i].options.format().size() );
             }
             else
             {
@@ -145,9 +145,9 @@ bool Multiplay::read()
     {
         if( binary_[index] )
         {
-            ::memcpy( &buf_fer[0], _input_streams[index]->binary().last(), buf_fer.size() );
-            binary_[index]->put( time( oldest ), &buf_fer[0] );
-            _publishers[index]->write( &buf_fer[0], buf_fer.size() );
+            ::memcpy( &_buffer[0], _input_streams[index]->binary().last(), _buffer.size() );
+            binary_[index]->put( time( oldest ), &_buffer[0] );
+            _publishers[index]->write( &_buffer[0], _buffer.size() );
         }
         else
         {
@@ -161,11 +161,11 @@ bool Multiplay::read()
         {
             std::vector< std::string > last = _input_streams[index]->ascii().last();
             ascii_[index]->put( time( oldest ), last );
-            ( *_publishers[index] ) << comma::join( last, m_configs[index].options.delimiter ) << endl;
+            _publishers[index]->write_line( comma::join( last, m_configs[index].options.delimiter ) );
         }
         else
         {
-            ( *_publishers[index] ) << comma::join( _input_streams[index]->ascii().last(), m_configs[index].options.delimiter ) << endl;
+            _publishers[index]->write_line( comma::join( _input_streams[index]->ascii().last(), m_configs[index].options.delimiter ) );
         }
     }
     m_timestamps[index] = boost::posix_time::not_a_date_time;
diff --git a/csv/applications/play/multiplay.h b/csv/applications/play/multiplay.h
index ec3816df6..5e1e32304 100644
--- a/csv/applications/play/multiplay.h
+++ b/csv/applications/play/multiplay.h
@@ -42,6 +42,43 @@
 
 namespace comma { namespace csv { namespace applications { namespace play {
 
+struct publisher // todo? quick and dirty; improve and put someplace generic
+{
+    virtual ~publisher() = default;
+    virtual unsigned int size() const = 0;
+    virtual void close() = 0;
+    virtual void accept() {}
+    virtual void write( const char* buf, unsigned int size ) = 0;
+    virtual void write_line( const std::string& ) = 0;
+};
+
+class server_publisher: public publisher
+{
+    public:
+        server_publisher( const std::string& name, bool binary, bool flush ): _oserver( name, binary ? io::mode::binary : io::mode::ascii, true, flush || !binary ) {}
+        unsigned int size() const { return _oserver.size(); }
+        void close() { _oserver.close(); }
+        void accept() { _oserver.accept(); }
+        void write( const char* buf, unsigned int size ) { _oserver.write( buf, size ); }
+        void write_line( const std::string& s ) { _oserver.write( &s[0], s.size() ); _oserver.write( "\n", 1 ); }
+    private:
+        io::oserver _oserver;
+};
+
+class client_publisher: public publisher
+{
+    public:
+        client_publisher( const std::string& name, bool binary, bool flush ): _ostream( name, binary ? io::mode::binary : io::mode::ascii, io::mode::non_blocking ), _flush( flush ) {}
+        unsigned int size() const { return 1; }
+        void close() { _ostream.close(); }
+        void accept() {}
+        void write( const char* buf, unsigned int size ) { _ostream->write( buf, size ); if( _flush ) { _ostream->flush(); } }
+        void write_line( const std::string& s ) { _ostream->write( &s[0], s.size() ); if( _flush ) { _ostream->flush(); } ( *_ostream ) << std::endl; }
+    private:
+        io::ostream _ostream;
+        bool _flush{false};
+};
+
 /// gets data from multiple input files, and output in a real time manner to output files,  using timestamps
 class Multiplay
 {
@@ -84,7 +121,7 @@ class Multiplay
         std::vector<SourceConfig> m_configs;
         std::vector< boost::shared_ptr< comma::io::istream > > istreams_;
         std::vector< boost::shared_ptr< csv::input_stream< time > > > _input_streams;
-        std::vector< boost::shared_ptr< comma::io::publisher > > _publishers;
+        std::vector< boost::shared_ptr< comma::csv::applications::play::publisher > > _publishers;
         csv::impl::play m_play;
         std::vector< boost::posix_time::ptime > m_timestamps;
         boost::posix_time::ptime now_;
@@ -93,7 +130,7 @@ class Multiplay
         boost::posix_time::ptime m_to;
         std::vector< boost::shared_ptr< csv::ascii< time > > > ascii_;
         std::vector< boost::shared_ptr< csv::binary< time > > > binary_;
-        std::vector< char > buf_fer;
+        std::vector< char > _buffer;
         bool ready();
 };
 

From 6ad92bec32a325093b7573a4cb62c376bafca0fc Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 28 Oct 2024 17:18:22 +1100
Subject: [PATCH 0975/1056] csv-play: optionally using clients rather than
 servers for output streams; first cut implemented

---
 csv/applications/play/multiplay.cpp | 12 ++++++++++--
 1 file changed, 10 insertions(+), 2 deletions(-)

diff --git a/csv/applications/play/multiplay.cpp b/csv/applications/play/multiplay.cpp
index 75777355c..bdb81e305 100644
--- a/csv/applications/play/multiplay.cpp
+++ b/csv/applications/play/multiplay.cpp
@@ -63,8 +63,16 @@ Multiplay::Multiplay( const std::vector< SourceConfig >& configs
         _input_streams[i].reset( new csv::input_stream< time >( *( *istreams_[i] )(), m_configs[i].options ) );
         unsigned int j;
         for( j = 0; j < i && configs[j].outputFileName != configs[i].outputFileName; ++j ); // quick and dirty: unique publishers
-        if( j == i ) { _publishers[i].reset( new comma::csv::applications::play::server_publisher( configs[i].outputFileName, m_configs[i].options.binary(), flush ) ); }
-        else { _publishers[i] = _publishers[j]; }
+        if( j == i )
+        {
+            const auto& s = comma::split( configs[i].outputFileName, ':' ); // todo: quick and dirty for now; add usage semantics for local sockets
+            if( s.size() > 2 && s[0] == "tcp" ) { _publishers[i].reset( new comma::csv::applications::play::client_publisher( configs[i].outputFileName, m_configs[i].options.binary(), flush ) ); }
+            else { _publishers[i].reset( new comma::csv::applications::play::server_publisher( configs[i].outputFileName, m_configs[i].options.binary(), flush ) ); }
+        }
+        else
+        {
+            _publishers[i] = _publishers[j];
+        }
         boost::posix_time::time_duration d;
         if( configs[i].offset.total_microseconds() != 0 )
         {

From fa092285ffea7a5de2b595e5bf59872c775acc55 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Tue, 29 Oct 2024 16:48:37 +1100
Subject: [PATCH 0976/1056] comma-resources-util: explicitly request
 cpu,core,socket from lscpu

---
 bash/comma-resources-util | 9 ++-------
 1 file changed, 2 insertions(+), 7 deletions(-)

diff --git a/bash/comma-resources-util b/bash/comma-resources-util
index 165b72a0d..85ae2038d 100644
--- a/bash/comma-resources-util
+++ b/bash/comma-resources-util
@@ -168,13 +168,8 @@ export -f comma_queue_is_empty_infile
 # Extract cpu count, cores and sockets from lscpu
 function comma_cpu_resources()
 {
-    local lscpu=$( lscpu --parse )
-    local fields=$( echo "$lscpu" | grep '^#' | tail -1 | sed 's/^[# ]*//' )
-    {
-        # lscpu --parse gives us zero-based indexes. Add one to get the count
-        echo "$lscpu" | tail -1 | csv-shuffle --fields $fields --output CPU,Core,Socket
-        echo "1,1,1"
-    } | csv-calc sum --format 3i | name-value-from-csv --fields cpu,core,socket --prefix cpu
+    local fields='cpu,core,socket'
+    { lscpu --parse="$fields" | grep -v '^#' | tail -n1; echo 1,1,1; } | csv-calc sum --format 3i | name-value-from-csv --fields="$fields" --prefix=cpu
 }
 
 # Output the most commonly used system resources: number of CPUs, total RAM,

From 1196036fc781583db9d482c5efc1c0d4da24259a Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 5 Nov 2024 16:52:15 +1100
Subject: [PATCH 0977/1056] python: dictionary.update(): first cut implemented;
 testing...

---
 python/comma/dictionary/__init__.py           |  2 +-
 .../comma/dictionary/test/test_dictionary.py  |  9 ++++
 python/comma/dictionary/util.py               | 43 ++++++++++++++++++-
 3 files changed, 52 insertions(+), 2 deletions(-)

diff --git a/python/comma/dictionary/__init__.py b/python/comma/dictionary/__init__.py
index fa16bc6a1..3edd02acb 100644
--- a/python/comma/dictionary/__init__.py
+++ b/python/comma/dictionary/__init__.py
@@ -1,3 +1,3 @@
 # Copyright (c) 2023 Vsevolod Vlaskine
 
-from .util import at, has, leaves, parents, set
+from .util import at, has, leaves, parents, set, update
diff --git a/python/comma/dictionary/test/test_dictionary.py b/python/comma/dictionary/test/test_dictionary.py
index ea3605de0..772d276b7 100644
--- a/python/comma/dictionary/test/test_dictionary.py
+++ b/python/comma/dictionary/test/test_dictionary.py
@@ -108,3 +108,12 @@ def test_dictionary_set():
     dictionary.set(f, '[4]/a', 44)
     dictionary.set(f, '[4]/b', 55)
     assert f[4] == {'a': 44, 'b': 55 }
+
+def test_dictionary_update():
+    assert dictionary.update( {}, {} ) == {}
+    assert dictionary.update( { 'a': 1, 'b': 2 }, {} ) == { 'a': 1, 'b': 2 }
+    assert dictionary.update( { 'a': 1, 'b': 2 }, { 'c': 3 } ) == { 'a': 1, 'b': 2, 'c': 3 }
+    assert dictionary.update( { 'a': 1, 'b': 2 }, { 'c': 3, 'd': { 'e': 4 } } ) == { 'a': 1, 'b': 2, 'c': 3, 'd': { 'e': 4 } }
+    assert dictionary.update( {}, { 'c': 3 } ) == { 'c': 3 }
+    assert dictionary.update( {}, { 'c': 3, 'd': { 'e': 4 } } ) == { 'c': 3, 'd': { 'e': 4 } }
+    assert dictionary.update( { 'a': 1, 'b': 2 }, { 'a': 4, 'c': 3 }, verbose=True ) == { 'a': 4, 'b': 2, 'c': 3 }
\ No newline at end of file
diff --git a/python/comma/dictionary/util.py b/python/comma/dictionary/util.py
index affdbe51b..69fec8244 100644
--- a/python/comma/dictionary/util.py
+++ b/python/comma/dictionary/util.py
@@ -131,4 +131,45 @@ def _set( d, p ):
                 if ( len( s ) == 1 or s[0] != '' ) and not s[0] in d: raise KeyError( f'on path {path}: {s[0]} not found' )
                 _set( eval( f'd[{s[1]}' if s[0] == '' else f'd["{s[0]}"][{s[1]}', { 'd': d } ), p[1:])
     _set( d, path.split( delimiter ) )
-    return d
\ No newline at end of file
+    return d
+
+def update( d0, d, verbose=False ):
+    '''
+    nested update of d0 by values in d
+    
+    examples
+    --------
+        >>> todo
+    '''
+    def _update_path( path, k, bracketed=False ):
+        p = copy.deepcopy( path )
+        if bracketed:
+            if len( p ) == 0: p = [ f'[{k}]' ]
+            else: p[-1] = f'{p[-1]}[{k}]'
+        else: p.append( k )
+        return p
+
+    def _update_path_none( path, k, bracketed=False ): return path
+
+    def _assign( _d0, k, v, path, _p ):
+        t = _d0[k]
+        if isinstance( t, typing.Dict ) or isinstance( t, typing.List ): _update( t, v, path, _p )
+        else: _d0[k] = v
+
+    def _update( _d0, _d, path, _p ):
+        if isinstance( _d0, typing.Dict ):
+            assert isinstance( _d, typing.Dict ), f'expected dictionary in d at {"/".join( path )}; got: {type(_d)=}'
+            for k, v in _d.items():
+                if k in _d0: _assign( _d0, k, v, _p( path, k ), _p )
+                else: _d0[k] = copy.deepcopy( v )
+        elif isinstance( _d0, typing.List ):
+            assert isinstance( _d, typing.List ), f'expected list in d at {"/".join( path )}; got: {type(_d)=}'
+            for i, v in enumerate( _d ):
+                if i < len( _d0 ): _update( _d0, i, v, _p( path, i, True ), _p )
+                else: _d0.append( copy.deepcopy( v ) )
+        else:
+            raise NotImplementedError( f'expected list or dictionary in d0 at {"/".join( path )}; got: {type(d0)=}' )
+
+    _p = _update_path if verbose else _update_path_none
+    _update( d0, d, [], _p )
+    return d0

From dd5934299ed747db8b9cd1a91dbbbcb8796b8f9b Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 5 Nov 2024 17:00:27 +1100
Subject: [PATCH 0978/1056] python: dictionary.update(): lists: typo fixed,
 unit tests added

---
 python/comma/dictionary/test/test_dictionary.py | 12 +++++++++++-
 python/comma/dictionary/util.py                 |  2 +-
 2 files changed, 12 insertions(+), 2 deletions(-)

diff --git a/python/comma/dictionary/test/test_dictionary.py b/python/comma/dictionary/test/test_dictionary.py
index 772d276b7..8c462598e 100644
--- a/python/comma/dictionary/test/test_dictionary.py
+++ b/python/comma/dictionary/test/test_dictionary.py
@@ -116,4 +116,14 @@ def test_dictionary_update():
     assert dictionary.update( { 'a': 1, 'b': 2 }, { 'c': 3, 'd': { 'e': 4 } } ) == { 'a': 1, 'b': 2, 'c': 3, 'd': { 'e': 4 } }
     assert dictionary.update( {}, { 'c': 3 } ) == { 'c': 3 }
     assert dictionary.update( {}, { 'c': 3, 'd': { 'e': 4 } } ) == { 'c': 3, 'd': { 'e': 4 } }
-    assert dictionary.update( { 'a': 1, 'b': 2 }, { 'a': 4, 'c': 3 }, verbose=True ) == { 'a': 4, 'b': 2, 'c': 3 }
\ No newline at end of file
+    assert dictionary.update( { 'a': 1, 'b': 2 }, { 'a': 4, 'c': 3 } ) == { 'a': 4, 'b': 2, 'c': 3 }
+    assert dictionary.update( { 'a': 1, 'b': 2, 'd': { 'e': { 'f': 3 }, 'g': { 'h': 4 } } }, { 'd': { 'e': { 'f': 5 }, 'g': { 'h': 4 } } } ) == { 'a': 1, 'b': 2, 'd': { 'e': { 'f': 5 }, 'g': { 'h': 4 } } }
+    assert dictionary.update( [], [] ) == []
+    assert dictionary.update( [1, 2], [] ) == [1, 2]
+    assert dictionary.update( [1, 2], [3, 4, 5] ) == [3, 4, 5]
+    assert dictionary.update( [1, { 'a': 1, 'b': { 'c': 2 } }], [1, {}, 5] ) == [1, { 'a': 1, 'b': { 'c': 2 } }, 5]
+    assert dictionary.update( [1, { 'a': 1, 'b': { 'c': 2 } }], [1, { 'a': 4 }, 5] ) == [1, { 'a': 4, 'b': { 'c': 2 } }, 5]
+    assert dictionary.update( [1, { 'a': 1, 'b': { 'c': 2 } }], [1, { 'a': 4, 'b': { 'c': 6, 'd': 7 } }, 5] ) == [1, { 'a': 4, 'b': { 'c': 6, 'd': 7 } }, 5]
+    assert dictionary.update( [1, 2, [3, 4, 5]], [] ) == [1, 2, [3, 4, 5]]
+    assert dictionary.update( [], [1, 2, [3, 4, 5]] ) == [1, 2, [3, 4, 5]]
+    assert dictionary.update( [1, 2, [3, 4, 5]], [1, 2, [3, 4, 6, 7]] ) == [1, 2, [3, 4, 6, 7]]
diff --git a/python/comma/dictionary/util.py b/python/comma/dictionary/util.py
index 69fec8244..04e8b802b 100644
--- a/python/comma/dictionary/util.py
+++ b/python/comma/dictionary/util.py
@@ -165,7 +165,7 @@ def _update( _d0, _d, path, _p ):
         elif isinstance( _d0, typing.List ):
             assert isinstance( _d, typing.List ), f'expected list in d at {"/".join( path )}; got: {type(_d)=}'
             for i, v in enumerate( _d ):
-                if i < len( _d0 ): _update( _d0, i, v, _p( path, i, True ), _p )
+                if i < len( _d0 ): _assign( _d0, i, v, _p( path, i, True ), _p )
                 else: _d0.append( copy.deepcopy( v ) )
         else:
             raise NotImplementedError( f'expected list or dictionary in d0 at {"/".join( path )}; got: {type(d0)=}' )

From 95ac8a048e4ab559d4eccf9c6a559b531d8a66bd Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 5 Nov 2024 17:59:48 +1100
Subject: [PATCH 0979/1056] python: dictionary.update(): test case and example
 added

---
 python/comma/dictionary/test/test_dictionary.py | 2 ++
 python/comma/dictionary/util.py                 | 4 +++-
 2 files changed, 5 insertions(+), 1 deletion(-)

diff --git a/python/comma/dictionary/test/test_dictionary.py b/python/comma/dictionary/test/test_dictionary.py
index 8c462598e..05f2f0790 100644
--- a/python/comma/dictionary/test/test_dictionary.py
+++ b/python/comma/dictionary/test/test_dictionary.py
@@ -127,3 +127,5 @@ def test_dictionary_update():
     assert dictionary.update( [1, 2, [3, 4, 5]], [] ) == [1, 2, [3, 4, 5]]
     assert dictionary.update( [], [1, 2, [3, 4, 5]] ) == [1, 2, [3, 4, 5]]
     assert dictionary.update( [1, 2, [3, 4, 5]], [1, 2, [3, 4, 6, 7]] ) == [1, 2, [3, 4, 6, 7]]
+    assert dictionary.update( { 'a': 1, 'b': 2, 'c': [3, 4, 5]}, { 'a': 6, 'c': [7, 8, 9, 10] } ) == { 'a': 6, 'b': 2, 'c': [7, 8, 9, 10]}
+    # todo: more tests on corner cases, negative cases, etc
diff --git a/python/comma/dictionary/util.py b/python/comma/dictionary/util.py
index 04e8b802b..b80b6dc0c 100644
--- a/python/comma/dictionary/util.py
+++ b/python/comma/dictionary/util.py
@@ -139,7 +139,9 @@ def update( d0, d, verbose=False ):
     
     examples
     --------
-        >>> todo
+        >>> import comma.dictionary
+        >>> comma.dictionary.update( { 'a': 1, 'b': 2, 'c': [3, 4, 5]}, { 'a': 6, 'c': [7, 8, 9, 10] } )
+        { 'a': 6, 'b': 2, 'c': [7, 8, 9, 10]}
     '''
     def _update_path( path, k, bracketed=False ):
         p = copy.deepcopy( path )

From 8d5f8d7c47a3ec8579867bff0b19667db9c8db95 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Tue, 5 Nov 2024 18:34:25 +1100
Subject: [PATCH 0980/1056] python: dictionary.update(): using old f"{...}"
 notation for backward-compatibility

---
 python/comma/dictionary/util.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/python/comma/dictionary/util.py b/python/comma/dictionary/util.py
index b80b6dc0c..9bc5a69a5 100644
--- a/python/comma/dictionary/util.py
+++ b/python/comma/dictionary/util.py
@@ -160,17 +160,17 @@ def _assign( _d0, k, v, path, _p ):
 
     def _update( _d0, _d, path, _p ):
         if isinstance( _d0, typing.Dict ):
-            assert isinstance( _d, typing.Dict ), f'expected dictionary in d at {"/".join( path )}; got: {type(_d)=}'
+            assert isinstance( _d, typing.Dict ), f'expected dictionary in d at {"/".join( path )}; got: type(_d)={type(_d)}'
             for k, v in _d.items():
                 if k in _d0: _assign( _d0, k, v, _p( path, k ), _p )
                 else: _d0[k] = copy.deepcopy( v )
         elif isinstance( _d0, typing.List ):
-            assert isinstance( _d, typing.List ), f'expected list in d at {"/".join( path )}; got: {type(_d)=}'
+            assert isinstance( _d, typing.List ), f'expected list in d at {"/".join( path )}; got: type(_d)={type(_d)}'
             for i, v in enumerate( _d ):
                 if i < len( _d0 ): _assign( _d0, i, v, _p( path, i, True ), _p )
                 else: _d0.append( copy.deepcopy( v ) )
         else:
-            raise NotImplementedError( f'expected list or dictionary in d0 at {"/".join( path )}; got: {type(d0)=}' )
+            raise NotImplementedError( f'expected list or dictionary in d0 at {"/".join( path )}; got: type(d0)={type(d0)}' )
 
     _p = _update_path if verbose else _update_path_none
     _update( d0, d, [], _p )

From effe588bae0bfc32b7b8c34c9485b092d2ed96d0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 8 Nov 2024 00:18:07 +1100
Subject: [PATCH 0981/1056] containers: cached: first cut implemented

---
 containers/cached.h             | 32 ++++++++++++++++++++++++++++++++
 containers/test/cached_test.cpp | 10 ++++++++++
 2 files changed, 42 insertions(+)
 create mode 100644 containers/cached.h
 create mode 100644 containers/test/cached_test.cpp

diff --git a/containers/cached.h b/containers/cached.h
new file mode 100644
index 000000000..acc9a9196
--- /dev/null
+++ b/containers/cached.h
@@ -0,0 +1,32 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All Rights Reserved
+
+#include <unordered_map>
+
+namespace comma {
+
+template < typename T, typename K >
+class cached
+{
+    public:
+        template < typename... Args >
+        T& operator()( Args... args );
+
+        void clear() { _cache.clear(); }
+
+        const std::unordered_map< K, T >& cache() const { return _cache; }
+
+    private:
+        std::unordered_map< K, T > _cache;
+};
+
+template < typename T, typename K >
+template < typename... Args >
+T& cached< T, K >::operator()( Args... args )
+{
+    K k{ args... };
+    auto i = _cache.find( k );
+    return ( i == _cache.end() ? _cache.insert_emplace( k, T( k ) ).first : i )->second;
+}
+
+} // namespace comma {
diff --git a/containers/test/cached_test.cpp b/containers/test/cached_test.cpp
new file mode 100644
index 000000000..c9c6e410a
--- /dev/null
+++ b/containers/test/cached_test.cpp
@@ -0,0 +1,10 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All Rights Reserved
+
+#include <gtest/gtest.h>
+#include "../cached.h"
+
+TEST( cached, basics )
+{
+    // todo
+}

From 0ab47a0c164963274960f43722681c9477567008 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 8 Nov 2024 11:41:50 +1100
Subject: [PATCH 0982/1056] containers: cached: beefed up; still, usage is
 clunky...

---
 containers/cached.h             | 37 ++++++++++++----
 containers/test/cached_test.cpp | 75 ++++++++++++++++++++++++++++++++-
 2 files changed, 103 insertions(+), 9 deletions(-)

diff --git a/containers/cached.h b/containers/cached.h
index acc9a9196..e88f6cde9 100644
--- a/containers/cached.h
+++ b/containers/cached.h
@@ -1,32 +1,53 @@
 // Copyright (c) 2024 Vsevolod Vlaskine
 // All Rights Reserved
 
+#include <deque>
 #include <unordered_map>
 
 namespace comma {
 
-template < typename T, typename K >
+template < typename T, typename K, typename Hash = std::hash< K > >
 class cached
 {
     public:
+        cached( unsigned int max_size = 0 ): _size( max_size ) {}
+
         template < typename... Args >
         T& operator()( Args... args );
 
-        void clear() { _cache.clear(); }
+        void clear() { _values.clear(); }
+
+        void pop( unsigned int size = 1 );
 
-        const std::unordered_map< K, T >& cache() const { return _cache; }
+        const std::unordered_map< K, T, Hash >& values() const { return _values; }
 
     private:
-        std::unordered_map< K, T > _cache;
+        std::unordered_map< K, T, Hash > _values;
+        std::deque< K > _keys;
+        unsigned int _size{0};
 };
 
-template < typename T, typename K >
+template < typename T, typename K, typename Hash >
 template < typename... Args >
-T& cached< T, K >::operator()( Args... args )
+T& cached< T, K, Hash >::operator()( Args... args )
 {
     K k{ args... };
-    auto i = _cache.find( k );
-    return ( i == _cache.end() ? _cache.insert_emplace( k, T( k ) ).first : i )->second;
+    auto i = _values.find( k );
+    if( i != _values.end() ) { return i->second; }
+    if( _size > 0 && _values.size() == _size ) { pop(); }
+    _keys.emplace_back( k );
+    return _values.emplace( std::make_pair( k, T( k ) ) ).first->second;
+}
+
+template < typename T, typename K, typename Hash >
+inline void cached< T, K, Hash >::pop( unsigned int size )
+{
+    for( unsigned int i = 0; i < size; ++i )
+    {
+        if( _keys.empty() ) { return; }
+        _values.erase( _keys.front() );
+        _keys.pop_front();
+    }
 }
 
 } // namespace comma {
diff --git a/containers/test/cached_test.cpp b/containers/test/cached_test.cpp
index c9c6e410a..999381f87 100644
--- a/containers/test/cached_test.cpp
+++ b/containers/test/cached_test.cpp
@@ -2,9 +2,82 @@
 // All Rights Reserved
 
 #include <gtest/gtest.h>
+#include <boost/functional/hash.hpp>
 #include "../cached.h"
 
+struct square
+{
+    typedef int key;
+
+    square( int x ): a( x ) {}
+
+    int calculate( int x ) const { return a * x; }
+
+    int a{0};
+};
+
 TEST( cached, basics )
 {
-    // todo
+    comma::cached< square, int > c;
+    EXPECT_EQ( c( 5 ).calculate( 5 ), 25 );
+    EXPECT_EQ( c.values().size(), 1 );
+    EXPECT_EQ( c( 5 ).calculate( 5 ), 25 );
+    EXPECT_EQ( c.values().size(), 1 );
+    EXPECT_EQ( c( 10 ).calculate( 10 ), 100 );
+    EXPECT_EQ( c.values().size(), 2 );
+    EXPECT_EQ( c( 10 ).calculate( 10 ), 100 );
+    EXPECT_EQ( c.values().size(), 2 );
+    EXPECT_EQ( c( 20 ).calculate( 20 ), 400 );
+    EXPECT_EQ( c.values().size(), 3 );
+    EXPECT_EQ( c( 20 ).calculate( 20 ), 400 );
+    EXPECT_EQ( c.values().size(), 3 );
+    c.pop();
+    EXPECT_EQ( c.values().size(), 2 );
+    EXPECT_EQ( c.values().size(), 2 );
+    EXPECT_EQ( c( 20 ).calculate( 20 ), 400 );
+    EXPECT_EQ( c.values().size(), 2 );
 }
+
+struct someclass
+{
+    typedef std::pair< int, int > key;
+
+    struct hash
+    {
+        std::size_t operator()( key const& p ) const
+        {
+            std::size_t seed = 0;
+            boost::hash_combine( seed, p.first );
+            boost::hash_combine( seed, p.second );
+            return seed;
+        }
+    };
+
+    someclass( const key& k ) {}
+
+    void dummy( int x, int y ) const {}
+};
+
+// struct pair_hash : public std::unary_function< Array, std::size_t >
+// {
+//     std::size_t operator()( Array const& array ) const
+//     {
+//         std::size_t seed = 0;
+//         for( std::size_t i = 0; i < Size; ++i ) { boost::hash_combine( seed, array[i] ); }
+//         return seed;
+//         // return boost::hash_range( &array[0], &array[Size] ); // not so easy...
+//     }
+// };
+
+TEST( cached, key )
+{
+    comma::cached< someclass, someclass::key, someclass::hash > c;
+    c( 1, 2 ).dummy( 1, 2 );
+    EXPECT_EQ( c.values().size(), 1 );
+    c( 1, 2 ).dummy( 1, 2 );
+    EXPECT_EQ( c.values().size(), 1 );
+    c( 3, 1 ).dummy( 3, 1 );
+    EXPECT_EQ( c.values().size(), 2 );
+    c( 3, 1 ).dummy( 3, 1 );
+    EXPECT_EQ( c.values().size(), 2 );
+}
\ No newline at end of file

From 6b2c64afac2567ee7549532042e7b0c732733250 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 8 Nov 2024 12:18:19 +1100
Subject: [PATCH 0983/1056] containers: cached: usage improved; first cut
 complete

---
 containers/cached.h             |  29 +++++++--
 containers/test/cached_test.cpp | 111 +++++++++++++++++++++++++-------
 2 files changed, 111 insertions(+), 29 deletions(-)

diff --git a/containers/cached.h b/containers/cached.h
index e88f6cde9..250ed5ef2 100644
--- a/containers/cached.h
+++ b/containers/cached.h
@@ -12,8 +12,13 @@ class cached
     public:
         cached( unsigned int max_size = 0 ): _size( max_size ) {}
 
-        template < typename... Args >
-        T& operator()( Args... args );
+        template < typename... Args > T& get( Args... args );
+
+        template < typename... Args > const T& get( Args... args ) const;
+
+        template < typename... Args > auto operator()( Args... args ) { return get( args... )( args... ); }
+
+        template < typename... Args > auto operator()( Args... args ) const { return get( args... )( args... ); }
 
         void clear() { _values.clear(); }
 
@@ -21,15 +26,27 @@ class cached
 
         const std::unordered_map< K, T, Hash >& values() const { return _values; }
 
-    private:
-        std::unordered_map< K, T, Hash > _values;
-        std::deque< K > _keys;
+    protected:
+        mutable std::unordered_map< K, T, Hash > _values;
+        mutable std::deque< K > _keys;
         unsigned int _size{0};
 };
 
 template < typename T, typename K, typename Hash >
 template < typename... Args >
-T& cached< T, K, Hash >::operator()( Args... args )
+T& cached< T, K, Hash >::get( Args... args )
+{
+    K k{ args... };
+    auto i = _values.find( k );
+    if( i != _values.end() ) { return i->second; }
+    if( _size > 0 && _values.size() == _size ) { pop(); }
+    _keys.emplace_back( k );
+    return _values.emplace( std::make_pair( k, T( k ) ) ).first->second;
+}
+
+template < typename T, typename K, typename Hash >
+template < typename... Args >
+const T& cached< T, K, Hash >::get( Args... args ) const
 {
     K k{ args... };
     auto i = _values.find( k );
diff --git a/containers/test/cached_test.cpp b/containers/test/cached_test.cpp
index 999381f87..aa41dbfcf 100644
--- a/containers/test/cached_test.cpp
+++ b/containers/test/cached_test.cpp
@@ -2,6 +2,7 @@
 // All Rights Reserved
 
 #include <gtest/gtest.h>
+#include <vector>
 #include <boost/functional/hash.hpp>
 #include "../cached.h"
 
@@ -19,22 +20,22 @@ struct square
 TEST( cached, basics )
 {
     comma::cached< square, int > c;
-    EXPECT_EQ( c( 5 ).calculate( 5 ), 25 );
+    EXPECT_EQ( c.get( 5 ).calculate( 5 ), 25 );
     EXPECT_EQ( c.values().size(), 1 );
-    EXPECT_EQ( c( 5 ).calculate( 5 ), 25 );
+    EXPECT_EQ( c.get( 5 ).calculate( 5 ), 25 );
     EXPECT_EQ( c.values().size(), 1 );
-    EXPECT_EQ( c( 10 ).calculate( 10 ), 100 );
+    EXPECT_EQ( c.get( 10 ).calculate( 10 ), 100 );
     EXPECT_EQ( c.values().size(), 2 );
-    EXPECT_EQ( c( 10 ).calculate( 10 ), 100 );
+    EXPECT_EQ( c.get( 10 ).calculate( 10 ), 100 );
     EXPECT_EQ( c.values().size(), 2 );
-    EXPECT_EQ( c( 20 ).calculate( 20 ), 400 );
+    EXPECT_EQ( c.get( 20 ).calculate( 20 ), 400 );
     EXPECT_EQ( c.values().size(), 3 );
-    EXPECT_EQ( c( 20 ).calculate( 20 ), 400 );
+    EXPECT_EQ( c.get( 20 ).calculate( 20 ), 400 );
     EXPECT_EQ( c.values().size(), 3 );
     c.pop();
     EXPECT_EQ( c.values().size(), 2 );
     EXPECT_EQ( c.values().size(), 2 );
-    EXPECT_EQ( c( 20 ).calculate( 20 ), 400 );
+    EXPECT_EQ( c.get( 20 ).calculate( 20 ), 400 );
     EXPECT_EQ( c.values().size(), 2 );
 }
 
@@ -58,26 +59,90 @@ struct someclass
     void dummy( int x, int y ) const {}
 };
 
-// struct pair_hash : public std::unary_function< Array, std::size_t >
-// {
-//     std::size_t operator()( Array const& array ) const
-//     {
-//         std::size_t seed = 0;
-//         for( std::size_t i = 0; i < Size; ++i ) { boost::hash_combine( seed, array[i] ); }
-//         return seed;
-//         // return boost::hash_range( &array[0], &array[Size] ); // not so easy...
-//     }
-// };
-
 TEST( cached, key )
 {
     comma::cached< someclass, someclass::key, someclass::hash > c;
-    c( 1, 2 ).dummy( 1, 2 );
+    c.get( 1, 2 ).dummy( 1, 2 );
+    EXPECT_EQ( c.values().size(), 1 );
+    c.get( 1, 2 ).dummy( 1, 2 );
+    EXPECT_EQ( c.values().size(), 1 );
+    c.get( 3, 1 ).dummy( 3, 1 );
+    EXPECT_EQ( c.values().size(), 2 );
+    c.get( 3, 1 ).dummy( 3, 1 );
+    EXPECT_EQ( c.values().size(), 2 );
+}
+
+struct plan
+{
+    struct params
+    {
+        int size{0};
+        bool real{false};
+        bool inverse{false};
+
+        bool operator==( const params& rhs ) const { return size == rhs.size && real == rhs.real && inverse == rhs.inverse; }
+
+        params( const std::vector< int >& v, bool real, bool inverse ): size( v.size() ), real( real ), inverse( inverse ) {}
+
+        params( const std::set< int >& v, bool x ): size( v.size() ), real( x ), inverse( x ) {}
+    };
+
+    plan( const params& ) {}
+
+    void operator()( const std::vector< int >&, bool, bool ) {}
+
+    void operator()( const std::set< int >&, bool ) {}
+
+    void size() {}
+};
+
+namespace std {
+
+template <> struct hash< plan::params >
+{
+    std::size_t operator()( plan::params const& k ) const
+    {
+        std::size_t seed = 0;
+        boost::hash_combine( seed, k.size );
+        boost::hash_combine( seed, k.real );
+        boost::hash_combine( seed, k.inverse );
+        return seed;
+    }
+};
+
+} // namespace std {
+
+TEST( cached, hashing_non_intrusive )
+{
+    comma::cached< plan, plan::params > c;
+    c.get( std::vector{ 1, 2, 3 }, true, false )( std::vector{ 1, 2, 3 }, true, false );
     EXPECT_EQ( c.values().size(), 1 );
-    c( 1, 2 ).dummy( 1, 2 );
+    c.get( std::vector{ 1, 2, 3 }, true, false )( std::vector{ 1, 2, 3 }, true, false );
     EXPECT_EQ( c.values().size(), 1 );
-    c( 3, 1 ).dummy( 3, 1 );
+    c.get( std::vector{ 1, 2 }, true, false )( std::vector{ 1, 2 }, true, false );
     EXPECT_EQ( c.values().size(), 2 );
-    c( 3, 1 ).dummy( 3, 1 );
+    c.get( std::vector{ 1, 2 }, true, false )( std::vector{ 1, 2 }, true, false );
+    c.get( std::vector{ 1, 2 }, true, false ).size();
     EXPECT_EQ( c.values().size(), 2 );
-}
\ No newline at end of file
+}
+
+TEST( cached, operators )
+{
+    comma::cached< plan, plan::params > plans;
+    plans( std::vector{ 1, 2, 3 }, true, false );
+    EXPECT_EQ( plans.values().size(), 1 );
+    plans( std::vector{ 1, 2, 3 }, true, false );
+    EXPECT_EQ( plans.values().size(), 1 );
+    plans( std::vector{ 1, 2 }, true, false );
+    EXPECT_EQ( plans.values().size(), 2 );
+    plans( std::vector{ 1, 2 }, true, false );
+    EXPECT_EQ( plans.values().size(), 2 );
+
+    plans( std::set{ 1, 2 }, true );
+    EXPECT_EQ( plans.values().size(), 3 );
+    plans( std::set{ 1, 2 }, true );
+    EXPECT_EQ( plans.values().size(), 3 );
+    plans( std::vector{ 1, 2 }, true, true );
+    EXPECT_EQ( plans.values().size(), 3 );
+}
+

From 7d99e0cf69c1e28afc82f36fb1e435a01225e71d Mon Sep 17 00:00:00 2001
From: Jared Silbermann <jared.silbermann@missionsystems.com.au>
Date: Fri, 8 Nov 2024 14:26:44 +1100
Subject: [PATCH 0984/1056] containers: cached: using unique_ptr for now;
 proper move semantics: todo

---
 containers/cached.h | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/containers/cached.h b/containers/cached.h
index 250ed5ef2..f30d41193 100644
--- a/containers/cached.h
+++ b/containers/cached.h
@@ -2,8 +2,8 @@
 // All Rights Reserved
 
 #include <deque>
+#include <memory>
 #include <unordered_map>
-
 namespace comma {
 
 template < typename T, typename K, typename Hash = std::hash< K > >
@@ -27,7 +27,7 @@ class cached
         const std::unordered_map< K, T, Hash >& values() const { return _values; }
 
     protected:
-        mutable std::unordered_map< K, T, Hash > _values;
+        mutable std::unordered_map< K, std::unique_ptr< T >, Hash > _values; // todo! use proper move semantics instead of unique_ptr
         mutable std::deque< K > _keys;
         unsigned int _size{0};
 };
@@ -38,10 +38,10 @@ T& cached< T, K, Hash >::get( Args... args )
 {
     K k{ args... };
     auto i = _values.find( k );
-    if( i != _values.end() ) { return i->second; }
+    if( i != _values.end() ) { return *( i->second ); }
     if( _size > 0 && _values.size() == _size ) { pop(); }
     _keys.emplace_back( k );
-    return _values.emplace( std::make_pair( k, T( k ) ) ).first->second;
+    return *( _values.emplace( std::make_pair( k, std::make_unique< T >( k ) ) ).first->second );
 }
 
 template < typename T, typename K, typename Hash >
@@ -50,10 +50,10 @@ const T& cached< T, K, Hash >::get( Args... args ) const
 {
     K k{ args... };
     auto i = _values.find( k );
-    if( i != _values.end() ) { return i->second; }
+    if( i != _values.end() ) { return *( i->second ); }
     if( _size > 0 && _values.size() == _size ) { pop(); }
     _keys.emplace_back( k );
-    return _values.emplace( std::make_pair( k, T( k ) ) ).first->second;
+    return *( _values.emplace( std::make_pair( k, std::make_unique< T >( k ) ) ).first->second );
 }
 
 template < typename T, typename K, typename Hash >

From f452e28ebbb65c9f8b23d056cd2288ca4d8bf4ad Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 8 Nov 2024 14:35:59 +1100
Subject: [PATCH 0985/1056] containers: cached: typo fixed

---
 containers/cached.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/containers/cached.h b/containers/cached.h
index f30d41193..0ec819807 100644
--- a/containers/cached.h
+++ b/containers/cached.h
@@ -24,7 +24,7 @@ class cached
 
         void pop( unsigned int size = 1 );
 
-        const std::unordered_map< K, T, Hash >& values() const { return _values; }
+        const std::unordered_map< K, std::unique_ptr< T >, Hash >& values() const { return _values; }
 
     protected:
         mutable std::unordered_map< K, std::unique_ptr< T >, Hash > _values; // todo! use proper move semantics instead of unique_ptr

From 62b17b3e7e56b2170bea6c10f3656ad769a54c69 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 8 Nov 2024 14:57:15 +1100
Subject: [PATCH 0986/1056] containers/test/cached_test.cpp: typo fixed

---
 containers/test/cached_test.cpp | 22 +++++++++++-----------
 1 file changed, 11 insertions(+), 11 deletions(-)

diff --git a/containers/test/cached_test.cpp b/containers/test/cached_test.cpp
index aa41dbfcf..e3ebc6734 100644
--- a/containers/test/cached_test.cpp
+++ b/containers/test/cached_test.cpp
@@ -115,34 +115,34 @@ template <> struct hash< plan::params >
 TEST( cached, hashing_non_intrusive )
 {
     comma::cached< plan, plan::params > c;
-    c.get( std::vector{ 1, 2, 3 }, true, false )( std::vector{ 1, 2, 3 }, true, false );
+    c.get( std::vector< int >{ 1, 2, 3 }, true, false )( std::vector< int >{ 1, 2, 3 }, true, false );
     EXPECT_EQ( c.values().size(), 1 );
-    c.get( std::vector{ 1, 2, 3 }, true, false )( std::vector{ 1, 2, 3 }, true, false );
+    c.get( std::vector< int >{ 1, 2, 3 }, true, false )( std::vector< int >{ 1, 2, 3 }, true, false );
     EXPECT_EQ( c.values().size(), 1 );
-    c.get( std::vector{ 1, 2 }, true, false )( std::vector{ 1, 2 }, true, false );
+    c.get( std::vector< int >{ 1, 2 }, true, false )( std::vector< int >{ 1, 2 }, true, false );
     EXPECT_EQ( c.values().size(), 2 );
-    c.get( std::vector{ 1, 2 }, true, false )( std::vector{ 1, 2 }, true, false );
-    c.get( std::vector{ 1, 2 }, true, false ).size();
+    c.get( std::vector< int >{ 1, 2 }, true, false )( std::vector< int >{ 1, 2 }, true, false );
+    c.get( std::vector< int >{ 1, 2 }, true, false ).size();
     EXPECT_EQ( c.values().size(), 2 );
 }
 
 TEST( cached, operators )
 {
     comma::cached< plan, plan::params > plans;
-    plans( std::vector{ 1, 2, 3 }, true, false );
+    plans( std::vector< int >{ 1, 2, 3 }, true, false );
     EXPECT_EQ( plans.values().size(), 1 );
-    plans( std::vector{ 1, 2, 3 }, true, false );
+    plans( std::vector< int >{ 1, 2, 3 }, true, false );
     EXPECT_EQ( plans.values().size(), 1 );
-    plans( std::vector{ 1, 2 }, true, false );
+    plans( std::vector< int >{ 1, 2 }, true, false );
     EXPECT_EQ( plans.values().size(), 2 );
-    plans( std::vector{ 1, 2 }, true, false );
+    plans( std::vector< int >{ 1, 2 }, true, false );
     EXPECT_EQ( plans.values().size(), 2 );
 
     plans( std::set{ 1, 2 }, true );
     EXPECT_EQ( plans.values().size(), 3 );
-    plans( std::set{ 1, 2 }, true );
+    plans( std::set< int >{ 1, 2 }, true );
     EXPECT_EQ( plans.values().size(), 3 );
-    plans( std::vector{ 1, 2 }, true, true );
+    plans( std::vector< int >{ 1, 2 }, true, true );
     EXPECT_EQ( plans.values().size(), 3 );
 }
 

From af7e83841336300e80860745c4abc1218f541a5c Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Fri, 8 Nov 2024 15:05:12 +1100
Subject: [PATCH 0987/1056] containers/test/cached_test.cpp: one typo missed in
 last commit

---
 containers/test/cached_test.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/containers/test/cached_test.cpp b/containers/test/cached_test.cpp
index e3ebc6734..68f4238b5 100644
--- a/containers/test/cached_test.cpp
+++ b/containers/test/cached_test.cpp
@@ -138,7 +138,7 @@ TEST( cached, operators )
     plans( std::vector< int >{ 1, 2 }, true, false );
     EXPECT_EQ( plans.values().size(), 2 );
 
-    plans( std::set{ 1, 2 }, true );
+    plans( std::set< int >{ 1, 2 }, true );
     EXPECT_EQ( plans.values().size(), 3 );
     plans( std::set< int >{ 1, 2 }, true );
     EXPECT_EQ( plans.values().size(), 3 );

From 913146047500435dcaf384732e9ef2a42b355421 Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Sat, 23 Nov 2024 18:54:38 +1100
Subject: [PATCH 0988/1056] csv-split.cpp: create correctly sized read buffer
 for larger records

---
 csv/applications/csv-split.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index 9284dc048..504f28ded 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -70,7 +70,7 @@ template < typename T > static int run()
         _setmode( _fileno( stdin ), _O_BINARY );
     #endif
     bool has_size = csv.has_field( "size" );
-    std::vector< char > buffer( 32768 ); // quick and dirty
+    std::vector< char > buffer( std::max< unsigned int >( size, 32768 )); // quick and dirty
     typedef comma::csv::applications::input< T > input_t;
     comma::csv::binary< input_t > binary( csv );
     input_t header;

From b4754692f516a7770a8965652ee5719cf2882eeb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 20 Dec 2024 15:18:24 +1100
Subject: [PATCH 0989/1056] comma::containers::find_or_throw(): first cut
 implemented

---
 containers/find.h | 52 +++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 52 insertions(+)
 create mode 100644 containers/find.h

diff --git a/containers/find.h b/containers/find.h
new file mode 100644
index 000000000..76e7b58a6
--- /dev/null
+++ b/containers/find.h
@@ -0,0 +1,52 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <map>
+#include <unordered_map>
+#include "../base/exception.h"
+
+namespace comma { namespace containers {
+
+/// trivial convenience wrapper: find element, if not found, throw exception
+template < typename K, typename V > const V& find_or_throw( const std::map< K, V >& m, const K& k, const std::string& message = std::string() );
+
+/// trivial convenience wrapper: find element, if not found, throw exception
+template < typename K, typename V > V& find_or_throw( std::map< K, V >& m, const K& k, const std::string& message = std::string() );
+
+/// trivial convenience wrapper: find element, if not found, throw exception
+template < typename K, typename V > const V& find_or_throw( const std::unordered_map< K, V >& m, const K& k, const std::string& message = std::string() );
+
+/// trivial convenience wrapper: find element, if not found, throw exception
+template < typename K, typename V > V& find_or_throw( std::unordered_map< K, V >& m, const K& k, const std::string& message = std::string() );
+
+
+namespace impl {
+
+template < typename M, typename K > inline const auto& find_or_throw( const M& m, const K& k, const std::string& message )
+{
+    auto it = m.find( k );
+    COMMA_ASSERT( it != m.end(), ( message.empty() ? std::string() : ( message + ": " ) ) << "k '" << k << "' not found" );
+    return it->second;
+}
+
+template < typename M, typename K > inline auto& find_or_throw( M& m, const K& k, const std::string& message )
+{
+    auto it = m.find( k );
+    COMMA_ASSERT( it != m.end(), ( message.empty() ? std::string() : ( message + ": " ) ) << "k '" << k << "' not found" );
+    return it->second;
+}
+
+} // namespace impl {
+
+template < typename K, typename V > inline const V& find_or_throw( const std::map< K, V >& m, const K& k, const std::string& message ) { return impl::find_or_throw( m, k, message ); }
+
+template < typename K, typename V > inline V& find_or_throw( std::map< K, V >& m, const K& k, const std::string& message ) { return impl::find_or_throw( m, k, message ); }
+
+template < typename K, typename V > inline const V& find_or_throw( const std::unordered_map< K, V >& m, const K& k, const std::string& message ) { return impl::find_or_throw( m, k, message ); }
+
+template < typename K, typename V > inline V& find_or_throw( std::unordered_map< K, V >& m, const K& k, const std::string& message ) { return impl::find_or_throw( m, k, message ); }
+
+} } // namespace comma { namespace containers {

From 935d0e12a66a2e147b87091dfc01479d2651389f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 20 Dec 2024 16:14:47 +1100
Subject: [PATCH 0990/1056] comma::enums: first cut of a few convenience
 methods implemented

---
 containers/enums.h | 53 ++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 53 insertions(+)
 create mode 100644 containers/enums.h

diff --git a/containers/enums.h b/containers/enums.h
new file mode 100644
index 000000000..b1b1fb572
--- /dev/null
+++ b/containers/enums.h
@@ -0,0 +1,53 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <map>
+#include <string>
+#include <vector>
+#include "find.h"
+
+namespace comma { namespace enums {
+
+/// trivial convenience wrapper; works only for enums with sequential values
+template < typename Enum, typename K = std::string >
+std::map< K, Enum > as_map( const std::vector< K >& keys, unsigned int begin = 0 );
+
+/// trivial convenience wrapper; works only for enums with sequential values
+template < typename Enum, typename K = std::string >
+std::map< Enum, K > as_key_map( const std::vector< K >& keys, unsigned int begin = 0 );
+
+/// trivial convenience wrapper
+template < typename Enum, typename K = std::string >
+Enum find( const K& k, const std::vector< K >& keys, unsigned int begin = 0 );
+
+// todo: visiting traits
+template < typename Enum, typename Names >
+struct named: public Enum, Names
+{
+    const std::string& name() { return this->names()[static_cast< unsigned int >( *this )]; }
+};
+
+
+template < typename Enum, typename K >
+inline std::map< K, Enum > as_map( const std::vector< K >& keys, unsigned int begin )
+{
+    std::map< K, Enum > m;
+    for( unsigned int i{0}, j{begin}; i < keys.size(); ++i, ++j ) { m[keys[i]] = static_cast< Enum >( j ); }
+    return m;
+}
+
+template < typename Enum, typename K >
+inline std::map< Enum, K > as_key_map( const std::vector< K >& keys, unsigned int begin )
+{
+    std::map< Enum, K > m;
+    for( unsigned int i{0}, j{begin}; i < keys.size(); ++i, ++j ) { m[static_cast< Enum >( j )] = keys[i]; }
+    return m;
+}
+
+template < typename Enum, typename K >
+Enum find( const K& k, const std::vector< K >& keys, unsigned int begin ) { return containers::find_or_throw< K, Enum >( as_map< Enum, K >( keys, begin ), k ); }
+
+} } // namespace comma { namespace enums {

From c5b1643787aaa31c040e782b49b236b94b73b7f9 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 23 Dec 2024 14:43:49 +1100
Subject: [PATCH 0991/1056] strings::choice: support for named enums added

---
 string/choice.h             |  3 ++-
 string/test/string_test.cpp | 17 +++++++++++++++++
 2 files changed, 19 insertions(+), 1 deletion(-)

diff --git a/string/choice.h b/string/choice.h
index 35fff959f..623e3a580 100644
--- a/string/choice.h
+++ b/string/choice.h
@@ -12,7 +12,7 @@ template < typename Derived, typename Base = std::string >
 struct choice: public Base
 {
     typedef Base base_t;
-    choice( typename Derived::values rhs = static_cast< typename Derived::values >( 0 ) ): Base( Derived::choices()[rhs] ) {}
+    choice( typename Derived::values rhs = static_cast< typename Derived::values >( 0 ) ): Base( Derived::choices()[static_cast< unsigned int >( rhs )] ) {}
     choice( const std::string& rhs ) { operator=( rhs ); }
     choice& operator=( const std::string& rhs ) { assert_valid( rhs ); Base::operator=( rhs ); return *this; }
     typename Derived::values to_enum() const;
@@ -20,6 +20,7 @@ struct choice: public Base
     static void assert_valid( const std::string& rhs );
     bool valid() const { return valid( std::string( *this ) ); } // quick and dirty for now
     void assert_valid() const { assert_valid( std::string( *this ) ); } // quick and dirty for now
+    operator typename Derived::values() const { return to_enum(); }
 };
 
 template < typename Derived, typename Base >
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index b37dd6603..86f824f51 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -451,9 +451,16 @@ struct fruit
     enum values { apple, orange, juicymambo };
 };
 
+struct veg
+{
+    static std::vector< std::string > choices() { return { "cucumber", "pumpkin" }; }
+    enum class values { cucumber, pumpkin };
+};
+
 struct grocery_store
 {
     strings::choice< comma::fruit > fruit;
+    strings::choice< comma::veg > veg;
 };
 
 namespace visiting {
@@ -463,11 +470,13 @@ template <> struct traits< grocery_store >
     template < typename Key, class Visitor > static void visit( const Key& k, grocery_store& p, Visitor& v )
     {
         v.apply( "fruit", p.fruit );
+        v.apply( "veg", p.veg );
     }
 
     template < typename Key, class Visitor > static void visit( const Key& k, const grocery_store& p, Visitor& v )
     {
         v.apply( "fruit", p.fruit );
+        v.apply( "veg", p.veg );
     }
 };
 
@@ -480,9 +489,17 @@ TEST( strings, choice )
     EXPECT_EQ( strings::choice< fruit >( "orange" ), "orange" );
     EXPECT_EQ( strings::choice< fruit >( fruit::orange ), "orange" );
     EXPECT_EQ( strings::choice< fruit >( fruit::orange ).to_enum(), fruit::orange );
+    EXPECT_EQ( strings::choice< fruit >( fruit::orange ), fruit::orange );
     EXPECT_TRUE( strings::choice< fruit >::valid( "juicymambo" ) );
     EXPECT_FALSE( strings::choice< fruit >::valid( "driedmambo" ) );
     EXPECT_THROW( strings::choice< fruit >( "driedmambo" ), comma::exception );
+
+    EXPECT_EQ( strings::choice< veg >(), "cucumber" );
+    EXPECT_EQ( strings::choice< veg >().to_enum(), veg::values::cucumber );
+    EXPECT_EQ( strings::choice< veg >( veg::values::pumpkin ), "pumpkin" );
+    EXPECT_EQ( strings::choice< veg >( veg::values::pumpkin ).to_enum(), veg::values::pumpkin );
+    EXPECT_EQ( strings::choice< veg >( veg::values::pumpkin ), veg::values::pumpkin );
+
     // todo: test visiting...
 }
 

From caa567eee46aac8154690dd47e517bd57e557ba6 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 23 Dec 2024 15:40:35 +1100
Subject: [PATCH 0992/1056] strings::choice: basic visiting unit test added

---
 string/test/CMakeLists.txt  |  2 +-
 string/test/string_test.cpp | 32 +++++++++++++++++++++++++++-----
 2 files changed, 28 insertions(+), 6 deletions(-)

diff --git a/string/test/CMakeLists.txt b/string/test/CMakeLists.txt
index f6a0e1af7..6d1199d84 100644
--- a/string/test/CMakeLists.txt
+++ b/string/test/CMakeLists.txt
@@ -2,7 +2,7 @@ set( KIT string )
 file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
 set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
 add_executable( ${test_name} ${source} )
-target_link_libraries( ${test_name} comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread )
+target_link_libraries( ${test_name} comma_base comma_string comma_name_value ${GTEST_BOTH_LIBRARIES} pthread )
 add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
 if( INSTALL_TESTS )
     install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index 86f824f51..997e4b72a 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -1,8 +1,10 @@
 // Copyright (c) 2023 vsevolod vlaskine
 
 #include <list>
+#include <sstream>
 #include <gtest/gtest.h>
 #include "../../base/exception.h"
+#include "../../name_value/serialize.h"
 #include "../choice.h"
 #include "../split.h"
 #include "../string.h"
@@ -457,7 +459,7 @@ struct veg
     enum class values { cucumber, pumpkin };
 };
 
-struct grocery_store
+struct groceries
 {
     strings::choice< comma::fruit > fruit;
     strings::choice< comma::veg > veg;
@@ -465,15 +467,15 @@ struct grocery_store
 
 namespace visiting {
 
-template <> struct traits< grocery_store >
+template <> struct traits< groceries >
 {
-    template < typename Key, class Visitor > static void visit( const Key& k, grocery_store& p, Visitor& v )
+    template < typename Key, class Visitor > static void visit( const Key& k, groceries& p, Visitor& v )
     {
         v.apply( "fruit", p.fruit );
         v.apply( "veg", p.veg );
     }
 
-    template < typename Key, class Visitor > static void visit( const Key& k, const grocery_store& p, Visitor& v )
+    template < typename Key, class Visitor > static void visit( const Key& k, const groceries& p, Visitor& v )
     {
         v.apply( "fruit", p.fruit );
         v.apply( "veg", p.veg );
@@ -500,7 +502,27 @@ TEST( strings, choice )
     EXPECT_EQ( strings::choice< veg >( veg::values::pumpkin ).to_enum(), veg::values::pumpkin );
     EXPECT_EQ( strings::choice< veg >( veg::values::pumpkin ), veg::values::pumpkin );
 
-    // todo: test visiting...
+    {
+        std::istringstream iss( R"({})" );
+        auto g = comma::read_json< groceries >( iss );
+        EXPECT_EQ( g.fruit, "apple" );
+        EXPECT_EQ( g.veg, "cucumber" );
+        EXPECT_EQ( comma::json_to_string( g, false ), R"({"fruit":"apple","veg":"cucumber"})" );
+    }
+    {
+        std::istringstream iss( R"({ "fruit": "orange" })" );
+        auto g = comma::read_json< groceries >( iss );
+        EXPECT_EQ( g.fruit, "orange" );
+        EXPECT_EQ( g.veg, "cucumber" );
+        EXPECT_EQ( comma::json_to_string( g, false ), R"({"fruit":"orange","veg":"cucumber"})" );
+    }
+    {
+        std::istringstream iss( R"({ "fruit": "orange", "veg": "pumpkin" })" );
+        auto g = comma::read_json< groceries >( iss );
+        EXPECT_EQ( g.fruit, "orange" );
+        EXPECT_EQ( g.veg, "pumpkin" );
+        EXPECT_EQ( comma::json_to_string( g, false ), R"({"fruit":"orange","veg":"pumpkin"})" );
+    }
 }
 
 } // namespace comma {

From c548c146bbd3a3828dfbc53849ae477cdc64f097 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 24 Dec 2024 11:36:00 +1100
Subject: [PATCH 0993/1056] string: strings::make_choice() convenience function
 implemented, basic unit test added

---
 string/choice.h             | 32 ++++++++++++++++++++++++++------
 string/test/string_test.cpp |  3 +++
 2 files changed, 29 insertions(+), 6 deletions(-)

diff --git a/string/choice.h b/string/choice.h
index 623e3a580..45f19e852 100644
--- a/string/choice.h
+++ b/string/choice.h
@@ -3,6 +3,7 @@
 #pragma once
 
 #include <string>
+#include <vector>
 #include "../base/exception.h"
 #include "string.h"
 
@@ -23,16 +24,35 @@ struct choice: public Base
     operator typename Derived::values() const { return to_enum(); }
 };
 
-template < typename Derived, typename Base >
-typename Derived::values choice< Derived, Base >::to_enum() const
+template < typename Enum >
+Enum make_choice( const std::string& name, const std::vector< std::string >& choices ); // convenience function, quick and dirty for now
+
+namespace impl {
+
+template < typename Enum, typename T, typename V >
+inline Enum make_choice( const T& name, const V& choices ) // quick and dirty for now
 {
     unsigned int i = 0;
-    for( const auto& c: Derived::choices() ) { if( *this == c ) { return static_cast< typename Derived::values >( i ); } ++i; }
-    COMMA_THROW( comma::exception, "could not convert to enum value: '" << std::string( *this ) << "'" ); // in theory never here
+    for( const auto& c: choices ) { if( name == c ) { return static_cast< Enum >( i ); } ++i; }
+    COMMA_THROW( comma::exception, "could not convert to enum value: '" << name << "'" ); // in theory never here
+}
+
+} // namespace impl {
+
+template < typename Enum >
+inline Enum make_choice( const std::string& name, const std::vector< std::string >& choices )
+{
+    return impl::make_choice< Enum >( name, choices );
+}
+
+template < typename Derived, typename Base >
+inline typename Derived::values choice< Derived, Base >::to_enum() const
+{
+    return impl::make_choice< typename Derived::values >( static_cast< const Base& >( *this ), Derived::choices() );
 }
 
 template < typename Derived, typename Base >
-bool choice< Derived, Base >::valid( const std::string& rhs )
+inline bool choice< Derived, Base >::valid( const std::string& rhs )
 {
     unsigned int i = 0;
     for( const auto& c: Derived::choices() ) { if( rhs == c ) { return true; } ++i; }
@@ -40,7 +60,7 @@ bool choice< Derived, Base >::valid( const std::string& rhs )
 }
 
 template < typename Derived, typename Base >
-void choice< Derived, Base >::assert_valid( const std::string& rhs )
+inline void choice< Derived, Base >::assert_valid( const std::string& rhs )
 {
     COMMA_ASSERT( valid( rhs ), "expected one of: " << comma::join( Derived::choices(), ',' ) << "; got: '" << rhs << "'" );
 }
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index 997e4b72a..264093db2 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -523,6 +523,9 @@ TEST( strings, choice )
         EXPECT_EQ( g.veg, "pumpkin" );
         EXPECT_EQ( comma::json_to_string( g, false ), R"({"fruit":"orange","veg":"pumpkin"})" );
     }
+
+    EXPECT_EQ( strings::make_choice< fruit::values >( "orange", { "apple", "orange" } ), fruit::orange );
+    EXPECT_EQ( strings::make_choice< veg::values >( "pumpkin", { "cucumber", "pumpkin" } ), veg::values::pumpkin );
 }
 
 } // namespace comma {

From 74afd887e55b2971b562621ded6d0f3932ea9aed Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Mon, 30 Dec 2024 14:01:18 +1100
Subject: [PATCH 0994/1056] named_variant: more basic tests added

---
 base/test/base_test.cpp         | 34 ++++++++++++++++++++++-
 visiting/test/CMakeLists.txt    |  2 +-
 visiting/test/visiting_test.cpp | 48 +++++++++++++++++++++++++++++++++
 3 files changed, 82 insertions(+), 2 deletions(-)

diff --git a/base/test/base_test.cpp b/base/test/base_test.cpp
index 5e1df090c..ad72c58f5 100644
--- a/base/test/base_test.cpp
+++ b/base/test/base_test.cpp
@@ -26,6 +26,22 @@ TEST( base, variant )
         v.values.t = 2;
         v.values.values.t = 3;
     }
+    {
+        comma::impl::variant< int, float, double > v;
+        EXPECT_FALSE( v );
+        v.set< int >( 5 );
+        EXPECT_TRUE( v );
+        v.reset();
+        EXPECT_FALSE( v );
+        v.set< float >( 5 );
+        EXPECT_TRUE( v );
+        v.reset();
+        EXPECT_FALSE( v );
+        v.set< double >( 5 );
+        EXPECT_TRUE( v );
+        v.reset();
+        EXPECT_FALSE( v );
+    }
     {
         comma::impl::variant< int, float, double > v;
         EXPECT_FALSE( v.is< int >() );
@@ -113,11 +129,27 @@ TEST( base, named_variant )
     {
         struct naming { static std::array< std::string, 3 > names() { return { "a", "b", "c" }; } };
         typedef comma::named_variant< naming, int, float, double > variant_t;
-        variant_t v;
         EXPECT_EQ( variant_t::name_of< int >(), "a" );
         EXPECT_EQ( variant_t::name_of< float >(), "b" );
         EXPECT_EQ( variant_t::name_of< double >(), "c" );
     }
+    {
+        struct naming { static std::array< std::string, 3 > names() { return { "a", "b", "c" }; } };
+        comma::named_variant< naming, int, float, double > v;
+        EXPECT_FALSE( v );
+        v.set< int >( 5 );
+        EXPECT_TRUE( v );
+        v.reset();
+        EXPECT_FALSE( v );
+        v.set< float >( 5 );
+        EXPECT_TRUE( v );
+        v.reset();
+        EXPECT_FALSE( v );
+        v.set< double >( 5 );
+        EXPECT_TRUE( v );
+        v.reset();
+        EXPECT_FALSE( v );
+    }
 }
 
 } // namespace comma {
diff --git a/visiting/test/CMakeLists.txt b/visiting/test/CMakeLists.txt
index 99dbaad9d..398724ecd 100644
--- a/visiting/test/CMakeLists.txt
+++ b/visiting/test/CMakeLists.txt
@@ -2,7 +2,7 @@ set( KIT visiting )
 file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
 set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
 add_executable( ${test_name} ${source} )
-target_link_libraries( ${test_name} ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} pthread )
+target_link_libraries( ${test_name} ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} pthread ) # comma_name_value comma_xpath
 add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
 if( INSTALL_TESTS )
     install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
diff --git a/visiting/test/visiting_test.cpp b/visiting/test/visiting_test.cpp
index 0dd98d8b7..97e66537b 100644
--- a/visiting/test/visiting_test.cpp
+++ b/visiting/test/visiting_test.cpp
@@ -12,6 +12,7 @@
 #include <boost/noncopyable.hpp>
 #include "../../base/optional.h"
 #include "../../base/types.h"
+//#include "../../name_value/serialize.h"
 #include "../apply.h"
 #include "../visit.h"
 
@@ -49,6 +50,7 @@ class o_stream_visitor : public boost::noncopyable
     private:
         std::ostream& m_stream;
         bool empty( const char* name ) { return *name == 0; }
+        bool empty( const std::string& name ) { return name.empty(); }
         bool empty( std::size_t ) { return false; }
 };
 
@@ -255,6 +257,52 @@ TEST( visiting, optional )
     }
 }
 
+struct some_struct
+{
+    struct naming { static std::array< std::string, 3 > names() { return { "a", "b", "c" }; } };
+    typedef comma::named_variant< naming, int, std::pair< std::string, float >, double > named_variant_t;
+    named_variant_t variant;
+};
+
+} } } /// namespace comma { namespace visiting { namespace test {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< test::some_struct >
+{
+    template < typename Key, typename visitor > static void visit( const Key&,       test::some_struct& p, visitor& v ) { v.apply( "variant", p.variant ); }
+    template < typename Key, typename visitor > static void visit( const Key&, const test::some_struct& p, visitor& v ) { v.apply( "variant", p.variant ); }
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace visiting { namespace test {
+
+TEST( visiting, named_variant )
+{
+    {
+        test::some_struct t;
+        std::ostringstream oss;
+        o_stream_visitor v( oss );
+        visiting::apply( v, t );
+        EXPECT_EQ( oss.str(), "{ object:variant={ } }" );
+    }
+    {
+        // test::some_struct t;
+        // t.variant.set( std::pair< std::string, float >( "hello", 5 ) );
+        // std::ostringstream oss;
+        // o_stream_visitor v( oss );
+        // visiting::apply( v, t );
+        // //EXPECT_EQ( oss.str(), "{ object:variant={ } }" );
+        // std::cerr << "=============" << std::endl;
+        // std::cerr << oss.str() << std::endl;
+        // std::cerr << "=============" << std::endl;
+        // write_json( t, std::cerr );
+        // std::cerr << "=============" << std::endl;
+    }
+    // todo! test serialization and deserialization! make test dependent on name_value?
+}
+
 } } } /// namespace comma { namespace visiting { namespace test {
 
 int main( int argc, char* argv[] )

From ebcda93a0343ccec31eec8408b6aa4a307c37e73 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Thu, 2 Jan 2025 13:36:24 +1100
Subject: [PATCH 0995/1056] variant::index() and named_variant::name()
 implemented, basic tests added

---
 base/test/base_test.cpp | 14 ++++++++++++++
 base/variant.h          |  4 ++++
 2 files changed, 18 insertions(+)

diff --git a/base/test/base_test.cpp b/base/test/base_test.cpp
index ad72c58f5..2a2bb343a 100644
--- a/base/test/base_test.cpp
+++ b/base/test/base_test.cpp
@@ -121,6 +121,16 @@ TEST( base, variant )
         EXPECT_EQ( variant_t::index_of< int >(), 0 );
         EXPECT_EQ( variant_t::index_of< float >(), 1 );
         EXPECT_EQ( variant_t::index_of< double >(), 2 );
+        variant_t v;
+        EXPECT_EQ( v.index(), 3 );
+        v.set< int >( 5 );
+        EXPECT_EQ( v.index(), 0 );
+        v.set< float >( 5 );
+        EXPECT_EQ( v.index(), 1 );
+        v.set< double >( 5 );
+        EXPECT_EQ( v.index(), 2 );
+        v.reset();
+        EXPECT_EQ( v.index(), 3 );
     }
 }
 
@@ -139,16 +149,20 @@ TEST( base, named_variant )
         EXPECT_FALSE( v );
         v.set< int >( 5 );
         EXPECT_TRUE( v );
+        EXPECT_EQ( v.name(), "a" );
         v.reset();
         EXPECT_FALSE( v );
         v.set< float >( 5 );
         EXPECT_TRUE( v );
+        EXPECT_EQ( v.name(), "b" );
         v.reset();
         EXPECT_FALSE( v );
         v.set< double >( 5 );
         EXPECT_TRUE( v );
+        EXPECT_EQ( v.name(), "c" );
         v.reset();
         EXPECT_FALSE( v );
+        EXPECT_THROW( v.name(), comma::exception );
     }
 }
 
diff --git a/base/variant.h b/base/variant.h
index 27be453bd..5d0989c8b 100644
--- a/base/variant.h
+++ b/base/variant.h
@@ -56,6 +56,7 @@ template < typename T, typename... Args > struct variant  // todo? use tuple ins
     template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, values ); }
     void reset() { t.reset(); values.reset(); }
     template < typename S > static unsigned int rindex() { return std::is_same< T, S >::value ? size - 1 : variant< Args... >::template rindex< S >(); }
+    unsigned int index( unsigned int i = 0 ) const { return t ? i : values.index( i + 1 ); }
 };
 
 template < typename T > struct variant< T >  // todo? use tuple instead?
@@ -71,6 +72,7 @@ template < typename T > struct variant< T >  // todo? use tuple instead?
     template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, type_is_not_on_type_list() ); }
     void reset() { t.reset(); }
     template < typename S > static unsigned int rindex() { bool same_type = std::is_same< T, S >::value; COMMA_ASSERT( same_type, "type not found in type list" ); return 0; }
+    unsigned int index( unsigned int i = 0 ) const { return t ? i : ( i + 1 ); }
 };
 
 } // namespace impl {
@@ -95,6 +97,7 @@ class variant
         template < typename S > const boost::optional< S >& optional() const { return _values.template optional< S >(); }
         void reset() { _values.reset(); }
         template < typename S > static unsigned int index_of() { return impl::variant< Args... >::size - impl::variant< Args... >::template rindex< S >() - 1; }
+        unsigned int index() const { return _values.index(); }
     protected:
         impl::variant< Args... > _values;
 };
@@ -116,6 +119,7 @@ struct named_variant : public variant< Args... >, public Names
     typedef Names names_t;
     typedef variant< Args... > variant_t;
     template < typename S > static const std::string& name_of() { return Names::names()[ variant_t::template index_of< S >() ]; }
+    auto name() const { COMMA_ASSERT( bool( *this ), "asked for name, but value is not set" ); return this->names()[this->index()]; } // returns by value: names() may return a temporary container, so a reference into it would dangle
 };
 
 template < typename Names >

From 08f53ca9c2fbae7e3370079fade92e5ef158a783 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 21 Jan 2025 20:56:04 +1100
Subject: [PATCH 0996/1056] io-publish: read timeout handling: implementing...

---
 io/applications/io-publish.cpp | 59 +++++++++++++++++++++++++++-------
 1 file changed, 47 insertions(+), 12 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 6c22a873c..3d24bef57 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -9,6 +9,7 @@
 #include "../../io/file_descriptor.h"
 #include "../../io/publisher.h"
 #include "../../io/impl/publish.h"
+#include "../../io/select.h"
 #include "../../name_value/map.h"
 #include "../../string/string.h"
 #include "../../sync/synchronized.h"
@@ -40,6 +41,12 @@ stream options
     --exec=[<command>]: read from <command> rather than stdin
     -- [<command>]: alternate syntax for specifying a command (simplifies quoting)
     --on-demand: only run <command> when a client is connected
+    --timeout-read,--read-timeout=<seconds>; exit or disconnect if no input data
+                                             for longer than <seconds>
+                                             limitation: if an input packet is half-read
+                                                         io-publish still will block on read
+    --timeout-reconnect,--reconnect-on-read-timeout, only if --exec present
+    --timeout-is-error; exit with error on timeout
 
 client options
     --exit-on-no-clients,-e: once the last client disconnects, exit
@@ -92,7 +99,7 @@ class command
     public:
         command( const std::string& command ): command_( command ), child_pid_( -1 )
         {
-            comma::verbose << "launching command: " << command << std::endl;
+            comma::saymore() << "launching command: " << command << std::endl;
             int fd[2];
             if( ::pipe( fd ) == -1 ) { comma::last_error::to_exception( "couldn't open pipe" ); } // create a pipe to send the child stdout to the parent stdin
             fd_ = fd[0];
@@ -109,7 +116,7 @@ class command
                 exit( 1 );
             }
             child_pid_ = pid;
-            comma::verbose << "launched command with pid: " << pid << std::endl;
+            comma::saymore() << "launched command with pid: " << pid << std::endl;
             ::close( STDIN_FILENO );
             ::close( fd[1] ); // don't need pipe input in the parent
         }
@@ -118,14 +125,14 @@ class command
 
         ~command()
         {
-            comma::verbose << "closing file descriptor " << fd_ << " for " << comma::split( command_ )[0] << "..." << std::endl;
+            comma::saymore() << "closing file descriptor " << fd_ << " for " << comma::split( command_ )[0] << "..." << std::endl;
             ::close( fd_ );
-            comma::verbose << "sending SIGTERM to " << comma::split( command_ )[0] << " (pid " << child_pid_ << ")..." << std::endl;
+            comma::saymore() << "sending SIGTERM to " << comma::split( command_ )[0] << " (pid " << child_pid_ << ")..." << std::endl;
             ::kill( -child_pid_, SIGTERM );
-            comma::verbose << "waiting for pid " << child_pid_ << "..." << std::endl;
-            if( ::waitpid( -child_pid_, NULL, 0 ) < 0 ) { comma::verbose << "warning: waiting for pid " << child_pid_ << " failed" << std::endl; }
+            comma::saymore() << "waiting for pid " << child_pid_ << "..." << std::endl;
+            if( ::waitpid( -child_pid_, NULL, 0 ) < 0 ) { comma::saymore() << "warning: waiting for pid " << child_pid_ << " failed" << std::endl; }
             while( std::getchar() >= 0 ); // todo: lame, but select or c-style reading produce bizarre results; investigate sometime
-            comma::verbose << "waiting for pid " << child_pid_ << " done" << std::endl;
+            comma::saymore() << "waiting for pid " << child_pid_ << " done" << std::endl;
         }
 
     private:
@@ -142,21 +149,28 @@ int main( int ac, char** av )
         for( int i = 0; i < ac && std::string( "--" ) != av[i]; ++i ) { head.push_back( av[i] ); }
         for( int i = head.size() + 1; i < ac; ++i ) { tail.push_back( av[i] ); }
         comma::command_line_options options( head, usage );
-        const std::vector< std::string >& names = options.unnamed( "--no-discard,--verbose,-v,--no-flush,--output-number-of-clients,--clients,--exit-on-no-clients,-e,--on-demand", "-.+" );
+        const std::vector< std::string >& names = options.unnamed( "--no-discard,--verbose,-v,--no-flush,--output-number-of-clients,--clients,--exit-on-no-clients,-e,--on-demand,--timeout-reconnect,--reconnect-on-read-timeout,--timeout-is-error", "-.+" );
         if( names.empty() ) { comma::say() << "please specify at least one stream; use '-' for stdout" << std::endl; return 1; }
         options.assert_mutually_exclusive( "--cache-size,--cache", "--on-demand" );
         const boost::array< comma::signal_flag::signals, 2 > signals = { { comma::signal_flag::sigint, comma::signal_flag::sigterm } };
         comma::signal_flag is_shutdown( signals );
         bool on_demand = options.exists( "--on-demand" );
         bool exit_on_no_clients = options.exists( "--exit-on-no-clients,-e" );
+        std::string exec_command = options.value< std::string >( "--exec", "" );
+        bool reconnect_on_read_timeout = options.exists( "--timeout-reconnect,--reconnect-on-read-timeout" );
+        bool timeout_is_error = options.exists( "--timeout-is-error" );
+        boost::optional< double > read_timeout = options.optional< double >( "--timeout-read,--read-timeout" );
+        COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || read_timeout, "--reconnect-on-read-timeout requires --read-timeout <seconds>" );
+        COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || !exec_command.empty(), "--reconnect-on-read-timeout requires --exec <command>" );
+        COMMA_ASSERT_BRIEF( !timeout_is_error || read_timeout, "--timeout-is-error requires --read-timeout <seconds>" );
+        unsigned int size = options.value( "-s,--size", 0 );
         comma::io::impl::publish p( names
-                                  , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
+                                  , size * options.value( "-m,--multiplier", 1 )
                                   , !options.exists( "--no-discard" )
                                   , !options.exists( "--no-flush" )
                                   , options.exists( "--output-number-of-clients,--clients" )
                                   , exit_on_no_clients || on_demand
                                   , options.value( "--cache-size,--cache", 0 ) );
-        std::string exec_command = options.value< std::string >( "--exec", "" );
         if( !tail.empty() )
         {
             COMMA_ASSERT_BRIEF( exec_command.empty(), "expected either --exec or --, got both" );
@@ -166,17 +180,38 @@ int main( int ac, char** av )
         if( exec_command.empty() )
         {
             COMMA_ASSERT_BRIEF( !on_demand, "got --on-demand; please specify --exec <command> or -- <command>, or remove --on-demand" );
-            while( std::cin.good() && !is_shutdown ) { if( !p.read( std::cin ) && exit_on_no_clients ) { break; } }
+            comma::io::select select;
+            if( read_timeout ) { select.read().add( 0 ); }
+            std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
+            std::cin.tie( NULL ); // std::cin is tied to std::cout by default
+            while( std::cin.good() && !is_shutdown )
+            {
+                if( read_timeout )
+                {
+                    auto available = std::cin.rdbuf()->in_avail();
+                    if( available == 0 ) // todo! || ( size > 0 && available < size ) )
+                    {
+                        select.wait( *read_timeout );
+                        if( !select.read().ready( 0 ) )
+                        {
+                            comma::say() << "read: timeout no input after " << *read_timeout << " seconds" << std::endl;
+                            exit( timeout_is_error ? 1 : 0 );
+                        }
+                    }
+                }
+                if( !p.read( std::cin ) && exit_on_no_clients ) { break; }
+            }
         }
         else
         {
+            COMMA_ASSERT_BRIEF( !read_timeout, "--read-timeout with --exec: implementing..." );
             bool done = false;
             int fd[2];
             if( ::pipe( fd ) == -1 ) { comma::last_error::to_exception( "couldn't open pipe" ); } // create a pipe to send the child stdout to the parent stdin
             while( !done && !is_shutdown )
             {
                 if( on_demand && p.num_clients() == 0 ) { ::sleep( 0.1 ); continue; } // todo? make timeout configurable?
-                comma::verbose << "number of clients: " << p.num_clients() << std::endl;
+                comma::saymore() << "number of clients: " << p.num_clients() << std::endl;
                 command cmd( exec_command );
                 typedef boost::iostreams::file_descriptor_source fd_t;
                 boost::iostreams::stream< fd_t > is( fd_t( cmd.fd(), boost::iostreams::never_close_handle ) );

From 1c1ab5c141033a416c6f3cd63e219d7f2299af5a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 21 Jan 2025 22:53:06 +1100
Subject: [PATCH 0997/1056] io-publish: --timeout: first cut implemented; todo:
 test with --exec; decide what to do with ascii input (e.g. throw on
 --timeout?)

---
 io/applications/io-publish.cpp | 39 ++++++++++++++++----------------
 io/impl/publish.cpp            | 35 ++++++++++++++++++++++++-----
 io/impl/publish.h              | 41 ++++++++++++++++++++++------------
 3 files changed, 76 insertions(+), 39 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 3d24bef57..2df96287c 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -163,14 +163,14 @@ int main( int ac, char** av )
         COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || read_timeout, "--reconnect-on-read-timeout requires --read-timeout <seconds>" );
         COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || !exec_command.empty(), "--reconnect-on-read-timeout requires --exec <command>" );
         COMMA_ASSERT_BRIEF( !timeout_is_error || read_timeout, "--timeout-is-error requires --read-timeout <seconds>" );
-        unsigned int size = options.value( "-s,--size", 0 );
         comma::io::impl::publish p( names
-                                  , size * options.value( "-m,--multiplier", 1 )
+                                  , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
                                   , !options.exists( "--no-discard" )
                                   , !options.exists( "--no-flush" )
                                   , options.exists( "--output-number-of-clients,--clients" )
                                   , exit_on_no_clients || on_demand
-                                  , options.value( "--cache-size,--cache", 0 ) );
+                                  , options.value( "--cache-size,--cache", 0 )
+                                  , read_timeout );
         if( !tail.empty() )
         {
             COMMA_ASSERT_BRIEF( exec_command.empty(), "expected either --exec or --, got both" );
@@ -180,26 +180,15 @@ int main( int ac, char** av )
         if( exec_command.empty() )
         {
             COMMA_ASSERT_BRIEF( !on_demand, "got --on-demand; please specify --exec <command> or -- <command>, or remove --on-demand" );
-            comma::io::select select;
-            if( read_timeout ) { select.read().add( 0 ); }
             std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
             std::cin.tie( NULL ); // std::cin is tied to std::cout by default
-            while( std::cin.good() && !is_shutdown )
+            while( std::cin.good() && !is_shutdown && !p.is_timeout() )
             {
-                if( read_timeout )
+                if( !p.read( std::cin ) )
                 {
-                    auto available = std::cin.rdbuf()->in_avail();
-                    if( available == 0 ) // todo! || ( size > 0 && available < size ) )
-                    {
-                        select.wait( *read_timeout );
-                        if( !select.read().ready( 0 ) )
-                        {
-                            comma::say() << "read: timeout no input after " << *read_timeout << " seconds" << std::endl;
-                            exit( timeout_is_error ? 1 : 0 );
-                        }
-                    }
+                    if( exit_on_no_clients ) { break; }
+                    if( read_timeout && p.is_timeout() ) { comma::say() << "timeout: received no data after " << *read_timeout << " seconds" << std::endl; break; }
                 }
-                if( !p.read( std::cin ) && exit_on_no_clients ) { break; }
             }
         }
         else
@@ -215,12 +204,24 @@ int main( int ac, char** av )
                 command cmd( exec_command );
                 typedef boost::iostreams::file_descriptor_source fd_t;
                 boost::iostreams::stream< fd_t > is( fd_t( cmd.fd(), boost::iostreams::never_close_handle ) );
-                while( is.good() && !is_shutdown && p.read( is ) );
+                while( is.good() && !is_shutdown )
+                {
+                    if( !p.read( is, cmd.fd() ) )
+                    {
+                        //if( exit_on_no_clients ) { break; }
+                        if( read_timeout && p.is_timeout() )
+                        {
+                            comma::say() << "timeout: received no data after " << *read_timeout << " seconds" << std::endl;
+                            if( !reconnect_on_read_timeout ) { break; }
+                        }
+                    }
+                }
                 if( !on_demand ) { break; }
                 p.disconnect_all();
             }
         }
         //ProfilerStop(); }
+        if( p.is_timeout() ) { return timeout_is_error ? 1 : 0; }
         if( is_shutdown ) { comma::say() << "interrupted by signal" << std::endl; }
         return 0;
     }
diff --git a/io/impl/publish.cpp b/io/impl/publish.cpp
index c8b64b49b..e97a09d7a 100644
--- a/io/impl/publish.cpp
+++ b/io/impl/publish.cpp
@@ -175,7 +175,8 @@ publish::publish( const std::vector< std::string >& endpoints
                 , bool flush
                 , bool output_number_of_clients
                 , bool update_no_clients
-                , unsigned int cache_size )
+                , unsigned int cache_size
+                , const boost::optional< double >& timeout )
     : multiserver< comma::io::oserver >( endpoints
                                        , packet_size
                                        , discard
@@ -183,6 +184,7 @@ publish::publish( const std::vector< std::string >& endpoints
                                        , output_number_of_clients
                                        , update_no_clients
                                        , cache_size )
+    , _timeout( timeout )
 {
 }
 
@@ -203,18 +205,39 @@ bool publish::write( const char* buf, unsigned int size )
     return write( std::string( buf, size ) ); // todo: quick and dirty, watch performance
 }
 
-bool publish::read( std::istream& input )
+static bool _enough( std::istream& is, unsigned int size ) // true if the stream buffer already holds data to read: any data if size is 0, otherwise at least size bytes
 {
+    const std::streamsize available = is.rdbuf()->in_avail(); // signed: in_avail() may return -1 when no more data is available
+    return ( size == 0 && available > 0 ) || ( size > 0 && available >= static_cast< std::streamsize >( size ) ); // compare as signed, so that a negative count never converts to a huge unsigned value
+}
+
+bool publish::read( std::istream& is, io::file_descriptor fd )
+{
+    if( _timeout )
+    {
+        _is_timeout = false;
+        if( !_enough( is, packet_size_ ) && !is.eof() )
+        {
+            if( _select.read()().empty() || *_select.read()().begin() != fd )
+            {
+                _select.read().clear(); // todo: quick and dirty, watch performance
+                _select.read().add( fd );
+            }
+            _select.wait( *_timeout );
+            _is_timeout = !_enough( is, packet_size_ ) && !_select.read().ready( fd );
+            if( _is_timeout ) { return false; }
+        }
+    }
     if( is_binary_() )
     {
-        input.read( &buffer_[0], buffer_.size() );
-        if( input.gcount() < int( buffer_.size() ) || !input.good() ) { return false; }
+        is.read( &buffer_[0], buffer_.size() );
+        if( is.gcount() < int( buffer_.size() ) || !is.good() || is.eof() ) { return false; }
     }
     else
     {
-        std::getline( input, buffer_ );
+        std::getline( is, buffer_ );
         buffer_ += '\n';
-        if( !input.good() ) { return false; }
+        if( !is.good() || is.eof() ) { return false; }
     }
     return write( buffer_ );
 }
diff --git a/io/impl/publish.h b/io/impl/publish.h
index c245bb4bf..a21db620b 100644
--- a/io/impl/publish.h
+++ b/io/impl/publish.h
@@ -14,8 +14,11 @@
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/iostreams/device/file_descriptor.hpp>
 #include <boost/iostreams/stream.hpp>
+#include <boost/optional.hpp>
 #include <boost/thread.hpp>
+#include "../../base/none.h"
 #include "../../io/file_descriptor.h"
+#include "../../io/select.h"
 #include "../../io/server.h"
 #include "../../string/string.h"
 #include "../../sync/synchronized.h"
@@ -74,21 +77,31 @@ class multiserver
         void accept_();
 };
 
-struct publish : public multiserver< comma::io::oserver >
+class publish : public multiserver< comma::io::oserver >
 {
-    publish( const std::vector< std::string >& endpoints
-            , unsigned int packet_size
-            , bool discard
-            , bool flush
-            , bool output_number_of_clients
-            , bool update_no_clients
-            , unsigned int cache_size );
-    
-    bool read( std::istream& input );
-
-    bool write( const std::string& s );
-
-    bool write( const char* buf, unsigned int size );
+    public:
+        publish( const std::vector< std::string >& endpoints
+               , unsigned int packet_size
+               , bool discard
+               , bool flush
+               , bool output_number_of_clients
+               , bool update_no_clients
+               , unsigned int cache_size
+               , const boost::optional< double >& timeout = comma::silent_none< double >() );
+        
+        bool read( std::istream& input, io::file_descriptor fd = 0 );
+
+        bool write( const std::string& s );
+
+        bool write( const char* buf, unsigned int size );
+
+        bool is_timeout() const { return _is_timeout; }
+
+    protected:
+        comma::io::select _select;
+        boost::optional< double > _timeout;
+        io::file_descriptor _fd{0};
+        bool _is_timeout{false};
 };
 
 class receive : public multiserver< comma::io::iserver >

From 81b1e020443be8eaebbc02e8bc11d8d14cf5b711 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 21 Jan 2025 22:58:17 +1100
Subject: [PATCH 0998/1056] io-publish: --exec: inadvertently introduced bug
 fixed: break on read() returning false

---
 io/applications/io-publish.cpp | 13 ++++++-------
 1 file changed, 6 insertions(+), 7 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 2df96287c..2c0c05dc6 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -206,15 +206,14 @@ int main( int ac, char** av )
                 boost::iostreams::stream< fd_t > is( fd_t( cmd.fd(), boost::iostreams::never_close_handle ) );
                 while( is.good() && !is_shutdown )
                 {
-                    if( !p.read( is, cmd.fd() ) )
+                    if( p.read( is, cmd.fd() ) ) { continue; }
+                    //if( exit_on_no_clients ) { break; }
+                    if( read_timeout && p.is_timeout() )
                     {
-                        //if( exit_on_no_clients ) { break; }
-                        if( read_timeout && p.is_timeout() )
-                        {
-                            comma::say() << "timeout: received no data after " << *read_timeout << " seconds" << std::endl;
-                            if( !reconnect_on_read_timeout ) { break; }
-                        }
+                        comma::say() << "timeout: received no data after " << *read_timeout << " seconds" << std::endl;
+                        if( !reconnect_on_read_timeout ) { break; }
                     }
+                    break;
                 }
                 if( !on_demand ) { break; }
                 p.disconnect_all();

From 022f4f4093556e2bce9a56273cb7e161a6f6d91a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 22 Jan 2025 11:32:24 +1100
Subject: [PATCH 0999/1056] io-publish: --reconnect-on-read-timeout renamed to
 --reconnect-on-timeout; io-topics: timeout and reconnect_on_timeout added to
 topic configuration; debugging...

---
 io/applications/io-publish.cpp | 10 +++++-----
 io/applications/io-topics      | 36 ++++++++++++++++++++--------------
 2 files changed, 26 insertions(+), 20 deletions(-)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 2c0c05dc6..70b0ad760 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -45,7 +45,7 @@ stream options
                                              for longer than <seconds>
                                              limitation: if an input packet is half-read
                                                          io-publish still will block on read
-    --timeout-reconnect,--reconnect-on-read-timeout, only if --exec present
+    --timeout-reconnect,--reconnect-on-timeout; reconnect on read timeout only if --exec present
     --timeout-is-error; exit with error on timeout
 
 client options
@@ -149,7 +149,7 @@ int main( int ac, char** av )
         for( int i = 0; i < ac && std::string( "--" ) != av[i]; ++i ) { head.push_back( av[i] ); }
         for( int i = head.size() + 1; i < ac; ++i ) { tail.push_back( av[i] ); }
         comma::command_line_options options( head, usage );
-        const std::vector< std::string >& names = options.unnamed( "--no-discard,--verbose,-v,--no-flush,--output-number-of-clients,--clients,--exit-on-no-clients,-e,--on-demand,--timeout-reconnect,--reconnect-on-read-timeout,--timeout-is-error", "-.+" );
+        const std::vector< std::string >& names = options.unnamed( "--no-discard,--verbose,-v,--no-flush,--output-number-of-clients,--clients,--exit-on-no-clients,-e,--on-demand,--timeout-reconnect,--reconnect-on-timeout,--timeout-is-error", "-.+" );
         if( names.empty() ) { comma::say() << "please specify at least one stream; use '-' for stdout" << std::endl; return 1; }
         options.assert_mutually_exclusive( "--cache-size,--cache", "--on-demand" );
         const boost::array< comma::signal_flag::signals, 2 > signals = { { comma::signal_flag::sigint, comma::signal_flag::sigterm } };
@@ -157,11 +157,11 @@ int main( int ac, char** av )
         bool on_demand = options.exists( "--on-demand" );
         bool exit_on_no_clients = options.exists( "--exit-on-no-clients,-e" );
         std::string exec_command = options.value< std::string >( "--exec", "" );
-        bool reconnect_on_read_timeout = options.exists( "--timeout-reconnect,--reconnect-on-read-timeout" );
+        bool reconnect_on_read_timeout = options.exists( "--timeout-reconnect,--reconnect-on-timeout" );
         bool timeout_is_error = options.exists( "--timeout-is-error" );
         boost::optional< double > read_timeout = options.optional< double >( "--timeout-read,--read-timeout" );
-        COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || read_timeout, "--reconnect-on-read-timeout requires --read-timeout <seconds>" );
-        COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || !exec_command.empty(), "--reconnect-on-read-timeout requires --exec <command>" );
+        COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || read_timeout, "--reconnect-on-timeout requires --read-timeout <seconds>" );
+        COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || !exec_command.empty(), "--reconnect-on-timeout requires --exec <command>" );
         COMMA_ASSERT_BRIEF( !timeout_is_error || read_timeout, "--timeout-is-error requires --read-timeout <seconds>" );
         comma::io::impl::publish p( names
                                   , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
diff --git a/io/applications/io-topics b/io/applications/io-topics
index 0dd42e1fa..6f1f17218 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -200,20 +200,22 @@ function publish_topic_fields() { publish_topic_fields_help | grep -v '^ ' | cut
 function publish_topic_fields_help()
 {
     cat <<eof
-address;           passed verbatim to io-publish, port attribute will be ignored
-binary;            for binary data, binary format of data, overrides size
-cache_size;        same meaning as io-publish --cache-size
-command;           command for the publisher to run
-input;             input topic for publish command to read on stdin
-multiplier;        passed to io-publish
-on_demand;         same meaning as io-publish --on-demand
-on_exit;           command to run when publisher stops
-port;              tcp port for publishing, unless address field is present
-secondary/address; passed verbatim to io-publish as '<address>;secondary',
-                   in this case port attribute ignored
-secondary/port;    secondary tcp port for publishing, unless address field is
-                   present, io-publish as 'tcp:<port>;secondary'
-size;              for binary data, size of the binary record
+address;              passed verbatim to io-publish, port attribute will be ignored
+binary;               for binary data, binary format of data, overrides size
+cache_size;           same meaning as io-publish --cache-size
+command;              command for the publisher to run
+input;                input topic for publish command to read on stdin
+multiplier;           passed to io-publish
+on_demand;            same meaning as io-publish --on-demand
+on_exit;              command to run when publisher stops
+port;                 tcp port for publishing, unless address field is present
+reconnect_on_timeout; same meaning as io-publish --reconnect-on-timeout
+secondary/address;    passed verbatim to io-publish as '<address>;secondary',
+                      in this case port attribute ignored
+secondary/port;       secondary tcp port for publishing, unless address field is
+                      present, io-publish as 'tcp:<port>;secondary'
+size;                 for binary data, size of the binary record
+timeout;              same meaning as io-publish --timeout=<seconds>
 eof
 }
 
@@ -333,8 +335,10 @@ function publish_command()
     [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
     if [[ -n "$topic_multiplier" ]]; then multiplier="--multiplier $topic_multiplier"; else unset multiplier; fi
     if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
+    if [[ "$topic_timeout" == 1 || "$topic_timeout" == "true" ]]; then timeout="--timeout=$timeout"; else unset timeout; fi
+    if [[ "$topic_reconnect_on_timeout" == 1 || "$topic_reconnect_on_timeout" == "true" ]]; then reconnect_on_timeout="--reconnect-on-timeout"; else unset reconnect_on_timeout; fi
     if [[ -n "$topic_cache_size" ]]; then cache_size="--cache-size=$topic_cache_size"; else unset cache_size; fi
-    local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand $cache_size -- "
+    local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand $cache_size $timeout $reconnect_on_timeout -- "
     verbose "publish topic_command: $topic_command"
     local expanded_topic_command=$( expanded_command "$topic_command" )
     verbose "publish expanded_topic_command: $expanded_topic_command"
@@ -351,6 +355,8 @@ function cat_command()
     (( ignore_command )) || [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
     set_topic_address
     if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi # todo? remove? is it even used anywhere?
+    if [[ "$topic_timeout" == 1 || "$topic_timeout" == "true" ]]; then timeout="--timeout=$timeout"; else unset timeout; fi
+    if [[ "$topic_reconnect_on_timeout" == 1 || "$topic_reconnect_on_timeout" == "true" ]]; then reconnect_on_timeout="--reconnect-on-timeout"; else unset reconnect_on_timeout; fi
     if [[ -n "$topic_cache_size" ]]; then cache_size=$topic_cache_size; else unset cache_size; fi
     if [[ -n "$topic_flush" ]]; then flush_option="--flush"; else unset flush_option; fi # todo! make flush default?!
     if [[ -n "$topic_connect_attempts" ]]; then connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi

From 88a26098c83765dc5cb22ef27e4947d708ca4556 Mon Sep 17 00:00:00 2001
From: seva <seva@tinbox>
Date: Fri, 24 Jan 2025 15:31:55 +1100
Subject: [PATCH 1000/1056] python: files/namespaces privatised

---
 python/comma/application/__init__.py                        | 3 ++-
 .../comma/application/{command_line.py => _command_line.py} | 0
 python/comma/csv/__init__.py                                | 6 +++---
 python/comma/csv/{options.py => _options.py}                | 0
 python/comma/csv/{stream.py => _stream.py}                  | 2 +-
 python/comma/csv/{struct.py => _struct.py}                  | 0
 python/comma/dictionary/__init__.py                         | 2 +-
 python/comma/dictionary/{util.py => _util.py}               | 0
 python/comma/filesystem/__init__.py                         | 2 +-
 python/comma/filesystem/{impl.py => _impl.py}               | 0
 python/comma/io/__init__.py                                 | 2 +-
 .../{readlines_unbuffered.py => _readlines_unbuffered.py}   | 1 -
 python/comma/io/windows_binary.py                           | 6 ++----
 python/comma/numpy/__init__.py                              | 2 +-
 python/comma/numpy/{functions.py => _functions.py}          | 0
 python/comma/signal/__init__.py                             | 2 +-
 python/comma/signal/{signal.py => _signal.py}               | 0
 python/comma/util/__init__.py                               | 4 ++--
 python/comma/util/{help_formatter.py => _help_formatter.py} | 0
 python/comma/util/{warning.py => _warning.py}               | 0
 20 files changed, 15 insertions(+), 17 deletions(-)
 rename python/comma/application/{command_line.py => _command_line.py} (100%)
 rename python/comma/csv/{options.py => _options.py} (100%)
 rename python/comma/csv/{stream.py => _stream.py} (99%)
 rename python/comma/csv/{struct.py => _struct.py} (100%)
 rename python/comma/dictionary/{util.py => _util.py} (100%)
 rename python/comma/filesystem/{impl.py => _impl.py} (100%)
 rename python/comma/io/{readlines_unbuffered.py => _readlines_unbuffered.py} (99%)
 rename python/comma/numpy/{functions.py => _functions.py} (100%)
 rename python/comma/signal/{signal.py => _signal.py} (100%)
 rename python/comma/util/{help_formatter.py => _help_formatter.py} (100%)
 rename python/comma/util/{warning.py => _warning.py} (100%)

diff --git a/python/comma/application/__init__.py b/python/comma/application/__init__.py
index 3ba012175..d7233de96 100644
--- a/python/comma/application/__init__.py
+++ b/python/comma/application/__init__.py
@@ -27,4 +27,5 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .command_line import *
+from ._command_line import set_dictionary_action, remove_argparse_options
+
diff --git a/python/comma/application/command_line.py b/python/comma/application/_command_line.py
similarity index 100%
rename from python/comma/application/command_line.py
rename to python/comma/application/_command_line.py
diff --git a/python/comma/csv/__init__.py b/python/comma/csv/__init__.py
index 53598c0bc..b21d6aceb 100644
--- a/python/comma/csv/__init__.py
+++ b/python/comma/csv/__init__.py
@@ -29,6 +29,6 @@
 
 from . import format
 from . import time
-from .struct import struct
-from .stream import stream, numpy_scalar_to_string
-from .options import add as add_options
+from ._struct import struct
+from ._stream import stream, numpy_scalar_to_string
+from ._options import add as add_options
diff --git a/python/comma/csv/options.py b/python/comma/csv/_options.py
similarity index 100%
rename from python/comma/csv/options.py
rename to python/comma/csv/_options.py
diff --git a/python/comma/csv/stream.py b/python/comma/csv/_stream.py
similarity index 99%
rename from python/comma/csv/stream.py
rename to python/comma/csv/_stream.py
index 3bdc89b81..8e5064a59 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/_stream.py
@@ -14,7 +14,7 @@
 from ..io import readlines_unbuffered
 from ..numpy import merge_arrays, types_of_dtype, structured_dtype
 from . import time as csv_time
-from .struct import struct
+from ._struct import struct
 
 DEFAULT_PRECISION = 12
 NUMPY_VERSION_MAJOR_, NUMPY_VERSION_MINOR_, NUMPY_VERSION_PATCH_ = ( int( _ ) for _ in np.__version__.split( '.' ) )
diff --git a/python/comma/csv/struct.py b/python/comma/csv/_struct.py
similarity index 100%
rename from python/comma/csv/struct.py
rename to python/comma/csv/_struct.py
diff --git a/python/comma/dictionary/__init__.py b/python/comma/dictionary/__init__.py
index 3edd02acb..4705183ed 100644
--- a/python/comma/dictionary/__init__.py
+++ b/python/comma/dictionary/__init__.py
@@ -1,3 +1,3 @@
 # Copyright (c) 2023 Vsevolod Vlaskine
 
-from .util import at, has, leaves, parents, set, update
+from ._util import at, has, leaves, parents, set, update
diff --git a/python/comma/dictionary/util.py b/python/comma/dictionary/_util.py
similarity index 100%
rename from python/comma/dictionary/util.py
rename to python/comma/dictionary/_util.py
diff --git a/python/comma/filesystem/__init__.py b/python/comma/filesystem/__init__.py
index ecf88f4d4..bd07fc5c1 100644
--- a/python/comma/filesystem/__init__.py
+++ b/python/comma/filesystem/__init__.py
@@ -1 +1 @@
-from .impl import find, walk
\ No newline at end of file
+from ._impl import find, walk
\ No newline at end of file
diff --git a/python/comma/filesystem/impl.py b/python/comma/filesystem/_impl.py
similarity index 100%
rename from python/comma/filesystem/impl.py
rename to python/comma/filesystem/_impl.py
diff --git a/python/comma/io/__init__.py b/python/comma/io/__init__.py
index 9acc4e680..477c16ed9 100644
--- a/python/comma/io/__init__.py
+++ b/python/comma/io/__init__.py
@@ -27,4 +27,4 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .readlines_unbuffered import readlines_unbuffered
+from ._readlines_unbuffered import readlines_unbuffered
diff --git a/python/comma/io/readlines_unbuffered.py b/python/comma/io/_readlines_unbuffered.py
similarity index 99%
rename from python/comma/io/readlines_unbuffered.py
rename to python/comma/io/_readlines_unbuffered.py
index 94ec2a389..b8c158524 100644
--- a/python/comma/io/readlines_unbuffered.py
+++ b/python/comma/io/_readlines_unbuffered.py
@@ -31,7 +31,6 @@
 if sys.version_info.major < 3: from itertools import ifilter
 else: ifilter = filter # quick and dirty, tired of googling...
 
-
 def readlines_unbuffered(size, source=sys.stdin, skip_blank_lines=True):
     """
     read the given number of lines from source, such as stdin, without buffering
diff --git a/python/comma/io/windows_binary.py b/python/comma/io/windows_binary.py
index 85249fa0d..3123fc897 100644
--- a/python/comma/io/windows_binary.py
+++ b/python/comma/io/windows_binary.py
@@ -6,10 +6,8 @@
 '''
 import sys
 
-
 # todo check this still allows ascii
 # todo if not, provide a function instead
 if sys.platform == "win32":
-        import os
-        import msvcrt
-        msvcrt.setmode(sys.stdout.fileno(), os.O_BINARY)
+    import os, msvcrt
+    msvcrt.setmode(sys.stdout.fileno(), os.O_BINARY)
diff --git a/python/comma/numpy/__init__.py b/python/comma/numpy/__init__.py
index fca93ccd7..8cc2cc9dd 100644
--- a/python/comma/numpy/__init__.py
+++ b/python/comma/numpy/__init__.py
@@ -27,4 +27,4 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .functions import *
+from ._functions import merge_arrays, strip_byte_order_prefix, shape_to_string, types_of_dtype, structured_dtype, type_to_string
diff --git a/python/comma/numpy/functions.py b/python/comma/numpy/_functions.py
similarity index 100%
rename from python/comma/numpy/functions.py
rename to python/comma/numpy/_functions.py
diff --git a/python/comma/signal/__init__.py b/python/comma/signal/__init__.py
index c2a318e96..af8770deb 100644
--- a/python/comma/signal/__init__.py
+++ b/python/comma/signal/__init__.py
@@ -27,4 +27,4 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .signal import is_shutdown
+from ._signal import is_shutdown
diff --git a/python/comma/signal/signal.py b/python/comma/signal/_signal.py
similarity index 100%
rename from python/comma/signal/signal.py
rename to python/comma/signal/_signal.py
diff --git a/python/comma/util/__init__.py b/python/comma/util/__init__.py
index 000e7ad61..3d4c43554 100644
--- a/python/comma/util/__init__.py
+++ b/python/comma/util/__init__.py
@@ -27,5 +27,5 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .help_formatter import argparse_fmt
-from .warning import warning
\ No newline at end of file
+from ._help_formatter import argparse_fmt
+from ._warning import warning
\ No newline at end of file
diff --git a/python/comma/util/help_formatter.py b/python/comma/util/_help_formatter.py
similarity index 100%
rename from python/comma/util/help_formatter.py
rename to python/comma/util/_help_formatter.py
diff --git a/python/comma/util/warning.py b/python/comma/util/_warning.py
similarity index 100%
rename from python/comma/util/warning.py
rename to python/comma/util/_warning.py

From 705d78aac28acfc2e64fa3cfa17bfd6024d13065 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 20 Feb 2025 23:42:36 +1100
Subject: [PATCH 1001/1056] python/comma/numpy/test/test_functions.py:
 namespace problem for ubuntu 18.04

---
 python/comma/numpy/test/test_functions.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/python/comma/numpy/test/test_functions.py b/python/comma/numpy/test/test_functions.py
index d049183fd..636b61a0e 100644
--- a/python/comma/numpy/test/test_functions.py
+++ b/python/comma/numpy/test/test_functions.py
@@ -174,8 +174,8 @@ def test_structure_out_of_order(self):
             self.assertEqual( sorted_fields1, sorted_fields2 )
             self.assertEqual( len( ndtype1.descr ), 4 )
             self.assertEqual( len( ndtype2.descr ), 5 )  # shall be 4
-            self.assertEqual( len( functions.types_of_dtype( ndtype1 ) ), 4 )
-            self.assertEqual( len( functions.types_of_dtype( ndtype2 ) ), 5 )  # shall be 4
+            self.assertEqual( len( types_of_dtype( ndtype1 ) ), 4 )
+            self.assertEqual( len( types_of_dtype( ndtype2 ) ), 5 )  # shall be 4
         except ValueError:
             import sys
             print( file = sys.stderr )

From a99a0ce031705c468557d65bc5002a0b10a265b3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 24 Mar 2025 12:12:24 +1100
Subject: [PATCH 1002/1056] base: exception method implementation moved to cpp

---
 base/exception.cpp             | 49 ++++++++++++++++++++++++++++++++++
 base/exception.h               | 44 +-----------------------------
 base/test/CMakeLists.txt       |  2 +-
 containers/test/CMakeLists.txt |  2 +-
 dynamic/shared_library.h       |  4 +--
 dynamic/test/include_test.cpp  |  1 +
 6 files changed, 55 insertions(+), 47 deletions(-)
 create mode 100644 base/exception.cpp

diff --git a/base/exception.cpp b/base/exception.cpp
new file mode 100644
index 000000000..2cf93c5b9
--- /dev/null
+++ b/base/exception.cpp
@@ -0,0 +1,49 @@
+// Copyright (c) 2011 The University of Sydney
+
+#include "exception.h"
+
+namespace comma {
+
+exception::exception( const char *message, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : std::runtime_error( message )
+    , _message( message )
+    , _filename( filename )
+    , _line( line_number )
+    , _function( function_name )
+{
+    _formatted_string( brief );
+}
+
+exception::exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : std::runtime_error( message.c_str() )
+    , _message( message )
+    , _filename( filename )
+    , _line( line_number )
+    , _function( function_name )
+{
+    _formatted_string( brief );
+}
+
+const char* exception::what() const throw()
+{
+    const char* string = "exception::what() _formatted_message.c_str() threw exception";
+    try { string = _formatted_message.c_str(); } catch( ... ) {}
+    return string;
+}
+
+void exception::_formatted_string( bool brief )
+{
+    std::ostringstream oss;
+    oss << error() << std::endl;
+    if( !brief )
+    {
+        oss << "============================================" << std::endl
+            << "file: "     << _filename << std::endl
+            << "line: "     << _line << std::endl
+            << "function: " << _function << std::endl
+            << "============================================" << std::endl;
+    }
+    _formatted_message = oss.str();
+}
+
+}  // namespace comma
diff --git a/base/exception.h b/base/exception.h
index 1a2746c15..5b92b0e92 100644
--- a/base/exception.h
+++ b/base/exception.h
@@ -89,51 +89,9 @@ class exception : public std::runtime_error
 
         std::string     _message;
         std::string     _filename;
-        unsigned long   _line;
+        unsigned long   _line{0};
         std::string     _function;
         std::string     _formatted_message;
 };
 
-inline exception::exception( const char *message, const char *filename, unsigned long line_number, const char *function_name, bool brief )
-    : std::runtime_error( message )
-    , _message( message )
-    , _filename( filename )
-    , _line( line_number )
-    , _function( function_name )
-{
-    _formatted_string( brief );
-}
-
-inline exception::exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name, bool brief )
-    : std::runtime_error( message.c_str() )
-    , _message( message )
-    , _filename( filename )
-    , _line( line_number )
-    , _function( function_name )
-{
-    _formatted_string( brief );
-}
-
-inline const char* exception::what() const throw()
-{
-    const char* string = "exception::what() _formatted_message.c_str() threw exception";
-    try { string = _formatted_message.c_str(); } catch( ... ) {}
-    return string;
-}
-
-inline void exception::_formatted_string( bool brief )
-{
-    std::ostringstream oss;
-    oss << error() << std::endl;
-    if( !brief )
-    {
-        oss << "============================================" << std::endl
-            << "file: "     << _filename << std::endl
-            << "line: "     << _line << std::endl
-            << "function: " << _function << std::endl
-            << "============================================" << std::endl;
-    }
-    _formatted_message = oss.str();
-}
-
 }  // namespace comma
diff --git a/base/test/CMakeLists.txt b/base/test/CMakeLists.txt
index 0e78c696c..9fb546dd8 100644
--- a/base/test/CMakeLists.txt
+++ b/base/test/CMakeLists.txt
@@ -2,7 +2,7 @@ set( KIT base )
 file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
 set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
 add_executable( ${test_name} ${source} )
-target_link_libraries( ${test_name} ${GTEST_BOTH_LIBRARIES} pthread )
+target_link_libraries( ${test_name} comma_base ${GTEST_BOTH_LIBRARIES} pthread )
 add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
 if( INSTALL_TESTS )
     install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
diff --git a/containers/test/CMakeLists.txt b/containers/test/CMakeLists.txt
index b9b7a7532..4442cc2c5 100644
--- a/containers/test/CMakeLists.txt
+++ b/containers/test/CMakeLists.txt
@@ -2,7 +2,7 @@ set( KIT containers )
 file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
 set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
 add_executable( ${test_name} ${source} )
-target_link_libraries( ${test_name} ${GTEST_BOTH_LIBRARIES} pthread ) # target_link_libraries( ${test_name} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
+target_link_libraries( ${test_name} ${GTEST_BOTH_LIBRARIES} comma_base pthread ) # target_link_libraries( ${test_name} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
 add_test( NAME ${test_name} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
 if( INSTALL_TESTS )
     install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
diff --git a/dynamic/shared_library.h b/dynamic/shared_library.h
index 38c3246d8..ac908cbb0 100644
--- a/dynamic/shared_library.h
+++ b/dynamic/shared_library.h
@@ -45,9 +45,9 @@ inline shared_library::shared_library( const std::string& lib, std::vector<std::
 template < typename T, typename... Args >
 inline T* shared_library::make( const std::string& library_symbol, Args... args ) const
 {
-    char* error;
+    char* error{nullptr};
     auto symbol = dlsym(handle_, &library_symbol[0]);
-    COMMA_ASSERT( error == NULL, error );
+    COMMA_ASSERT( error == nullptr, error );
     if( symbol == nullptr ) { std::cerr << dlerror() << std::endl; }
     COMMA_ASSERT( symbol, "Shared library loading failed: could not find "+library_symbol+" symbol; on library: \"" + lib_ + "\"");
     T* (*create_)(Args...) = reinterpret_cast<T*(*)(Args...)>(symbol);
diff --git a/dynamic/test/include_test.cpp b/dynamic/test/include_test.cpp
index dd696fcd0..dbe7b6d29 100644
--- a/dynamic/test/include_test.cpp
+++ b/dynamic/test/include_test.cpp
@@ -14,6 +14,7 @@ TEST( initialise, no_args )
 {
     comma::dynamic::shared_library library( "libcomma_dynamic_test_classes.so", {"/home/aspen/src/comma/build/lib"} );
     auto p = library.make< comma::dynamic::test::simple >( "comma_dynamic_test_create_simple" );
+    ( void )p;
 }
 
 
From 8cc2876ff37473ceb0f1bc48b188c6455f857eda Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Sun, 6 Apr 2025 22:00:49 +1000
Subject: [PATCH 1003/1056] comma-test-run: --until-first-failure:
 --assert-status alias added

---
 util/applications/comma-test-run  |  2 +-
 util/applications/comma-test-util | 28 ++++++++++++++++++----------
 2 files changed, 19 insertions(+), 11 deletions(-)

diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index ea92fece4..34e958dc0 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -68,7 +68,7 @@ function description_test_selection()
 --tags-excluded=[<tags>]; |-separated tags or regular expressions, do not run tests with given tags (see below)
 --tags-list; list tags for all subdirectories as <dir>,<tags>
 --to=[<dir>]; run tests up to a given test, the latter included, where test directories are ordered lexicographically
---until-first-failure; exit after the first failure (works only when tests run serially)
+--until-first-failure,--assert-status; exit after the first failure i.e. test script or command returning non-zero (works only when tests run serially)
 --white-list=[<file>]; only run these tests mentioned in the <file>, applied first before black list;
   comment lines starting with # are ignored; each entry in the list matches to a sub-directory or
   directories name using pattern ^<subdir>; see examples
diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index db139bd3a..41937c579 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -95,15 +95,23 @@ export -f _comma_test_command_impl
 
 function _comma_test_commands_impl()
 {
-    local key value status output until_first_error=$1 fields=$2
+    local key value status output until_first_failure=$1 fields=$2 assert_status=0
+    local input=$( grep '=' ; grep -v '^#' )
+    # local critical_tests=()
+    # while IFS='=' read key value ; do
+    #     [[ -n "$key" && ! "$key" =~ \#.* ]] || continue
+    #     key=$( comma-string-strip <<< "$key" )
+    #     # todo: if $key is $blah/assert_status=1, then critical_tests+=( "$blah" )  
+    # done <<< "$input"
     while IFS='=' read key value ; do
         [[ -n "$key" && ! "$key" =~ \#.* ]] || continue
         key=$( comma-string-strip <<< "$key" )
         _comma_test_command_impl "$key" "$value"
         status=$?
         echo "$key/status=$status"
-        if (( status != 0 && until_first_error )); then break; fi
-    done < <( grep '=' ; grep -v '^#' )
+        if (( status != 0 && until_first_failure )); then break; fi
+        # todo: if (( status != 0 && $key in critical tests )); then break; - or maybe it should be: return 1
+    done <<< "$input"
 }
 
 # a helper to write tests in the comma-test-run style
@@ -136,12 +144,12 @@ function _comma_test_commands_impl()
 # my_basic_test[1]/for/something/output=0
 
 function comma_test_commands() { _comma_test_commands_impl 0 "$@" ; }
-function comma_test_commands_until_first_error() { _comma_test_commands_impl 1 "$@" ; }
+function comma_test_commands_until_first_failure() { _comma_test_commands_impl 1 "$@" ; }
 
 # run interactive test
 #
-# usage: comma_test_interactive_commands [<until_first_error>]
-#        <until_first_error>: 0 (i.e. false) or 1 (i.e. true); default: 0
+# usage: comma_test_interactive_commands [<until_first_failure>]
+#        <until_first_failure>: 0 (i.e. false) or 1 (i.e. true); default: 0
 #
 # it works as something like
 #
@@ -167,8 +175,8 @@ function comma_test_commands_until_first_error() { _comma_test_commands_impl 1 "
 # see for an example: e.g. snark/graphics/applications/test/view-points/colour/scalar/options
 function comma_test_interactive_commands()
 {
-    local until_first_error=$1
-    if [[ -n "$until_first_error" ]]; then until_first_error=1; else until_first_error=0; fi
+    local until_first_failure=$1
+    if [[ -n "$until_first_failure" ]]; then until_first_failure=1; else until_first_failure=0; fi
     (
         function comma_test_interactive_test_case()
         {
@@ -206,13 +214,13 @@ function comma_test_interactive_commands()
             local test_case=$( grep "^$escaped/" <<< "$lines" | sed "s#^$escaped/##" ) # grep --fixed-strings does not seem to work
             comma_test_interactive_test_case $test_case_name $testcase_number $number_of_testcases <<< "$test_case"
             local r=$?
-            if (( r != 0 && until_first_error )); then return $r; fi
+            if (( r != 0 && until_first_failure )); then return $r; fi
             (( ++testcase_number ))
         done <<< "$test_cases"
     )
 }
 
-function comma_test_interactive_commands_until_first_error() { comma_test_interactive_commands 1; }
+function comma_test_interactive_commands_until_first_failure() { comma_test_interactive_commands 1; }
 
 # the tmp directory cleanup for comma_test_run_tarball
 function comma_test_run_tarball_cleanup()

From c5826e5bb4a53839306f0c7e9bddaea7bfaf4727 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 7 Apr 2025 18:26:30 +1000
Subject: [PATCH 1004/1056] csv-calc, io-ls: comma::verbose phased out

---
 csv/applications/csv-calc.cpp | 15 +++++++--------
 io/applications/io-ls.cpp     | 25 ++++++++++---------------
 2 files changed, 17 insertions(+), 23 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 00cac2faa..f0cf64087 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -21,7 +21,6 @@
 #include <boost/scoped_ptr.hpp>
 #include <boost/unordered_map.hpp>
 #include <boost/date_time/posix_time/posix_time_types.hpp>
-#include "../../application/verbose.h"
 #include "../../base/exception.h"
 #include "../../base/none.h"
 #include "../../csv/format.h"
@@ -49,7 +48,7 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "column-wise calculation, optionally by id and block" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "usage: cat data.csv | " << comma::verbose.app_name() << " <what> [<options>] > calc.csv" << std::endl;
+    std::cerr << "usage: cat data.csv | csv-calc <what> [<options>] > calc.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "<what>: comma-separated list of operations" << std::endl;
     std::cerr << "        results will be output in the same order" << std::endl;
@@ -115,13 +114,13 @@ static void usage( bool verbose )
         std::cerr << std::endl;
     }
     std::cerr << "examples" << std::endl;
-    std::cerr << "    seq 1 1000 | " << comma::verbose.app_name() << " percentile=0.9" << std::endl;
-    std::cerr << "    seq 1 1000 | " << comma::verbose.app_name() << " percentile=0.1,percentile=0.9" << std::endl;
-    std::cerr << "    seq 1 1000 | " << comma::verbose.app_name() << " percentile=0.9:interpolate --verbose" << std::endl;
+    std::cerr << "    seq 1 1000 | csv-calc percentile=0.9" << std::endl;
+    std::cerr << "    seq 1 1000 | csv-calc percentile=0.1,percentile=0.9" << std::endl;
+    std::cerr << "    seq 1 1000 | csv-calc percentile=0.9:interpolate --verbose" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | " << comma::verbose.app_name() << " --fields=a,block percentile=0.9" << std::endl;
+    std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | csv-calc --fields=a,block percentile=0.9" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | " << comma::verbose.app_name() << " --fields=a,id percentile=0.9" << std::endl;
+    std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | csv-calc --fields=a,id percentile=0.9" << std::endl;
     std::cerr << std::endl;
     std::cerr << std::endl;
     exit( -1 );
@@ -353,7 +352,7 @@ template < typename T, typename V > struct map_traits
 
 template < typename V > struct map_traits< boost::posix_time::ptime, V >
 {
-    struct hash : public std::unary_function< boost::posix_time::ptime, std::size_t >
+    struct hash
     {
         std::size_t operator()( const boost::posix_time::ptime& t ) const
         {
diff --git a/io/applications/io-ls.cpp b/io/applications/io-ls.cpp
index 05ad1fe2a..916b8ad2e 100644
--- a/io/applications/io-ls.cpp
+++ b/io/applications/io-ls.cpp
@@ -169,12 +169,12 @@ void process_tcp(std::istream& is, const comma::csv::options& csv)
     comma::csv::output_stream<output_t> os(std::cout, csv);
     //first line is header
     std::getline(is,line);
-    comma::verbose<<line<<std::endl;
-    while(is.good())
+    comma::saymore() << line << std::endl;
+    while( is.good() )
     {
         std::getline(is,line);
-        comma::verbose<<line<<std::endl;
-        output.scan(line);
+        comma::saymore() << line << std::endl;
+        output.scan( line );
         if(port && output.local.port != *port) {continue;}
         if(state && output.state != *state) {continue;}
         os.write(output);
@@ -184,7 +184,7 @@ void usage(bool detail)
 {
     std::cerr << "    list tcp connections; reads and parses lines from /proc/net/tcp file and outputs them in csv format" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "usage:  " << comma::verbose.app_name() << " [ <options> ]" << std::endl;
+    std::cerr << "usage:  io-ls [ <options> ]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: show help" << std::endl;
@@ -201,7 +201,7 @@ void usage(bool detail)
     }
     else { std::cerr << "    see --help --verbose for more details" << std::endl<< std::endl; }
     std::cerr << "example" << std::endl;
-    std::cerr << "    (" << comma::verbose.app_name() << " --output-fields; "<<comma::verbose.app_name() << ") | column -ts, " << std::endl;
+    std::cerr << "    (io-ls --output-fields; io-ls) | column -ts, " << std::endl;
     std::cerr << std::endl;
     std::cerr << "    io-ls --fields=local,state | csv-join --fields=,,state <(io-ls --enum-state)\";fields=state\"" << std::endl;
     std::cerr << std::endl;
@@ -221,14 +221,9 @@ int main( int ac, char** av )
         state=options.optional<unsigned int>("--state");
         std::fstream file("/proc/net/tcp", std::ios::in);
         process_tcp(file, csv);
+        return 0;
     }
-    catch( std::exception& ex )
-    {
-        std::cerr << comma::verbose.app_name() << ": " << ex.what() << std::endl; return 1;
-    }
-    catch( ... )
-    {
-        std::cerr << comma::verbose.app_name() << ": " << "unknown exception" << std::endl; return 1;
-    }
-    return 0;
+    catch( std::exception& ex ) { comma::say() << ": " << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << ": unknown exception" << std::endl; }
+    return 1;
 }

From 02d702415a74d0fb96a28be5dc9d24dc4e80df12 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 7 Apr 2025 19:19:37 +1000
Subject: [PATCH 1005/1056] comma-test-util: comma_test_commands: assert
 keyword added; todo: add to interactive commands...

---
 util/applications/comma-test-util             | 41 +++++++++++--------
 util/test/test_util/commands/assert/expected  |  6 +++
 util/test/test_util/commands/assert/input     |  4 ++
 util/test/test_util/commands/assert/test      | 10 +++++
 .../test_util/commands/{ => quoting}/expected |  0
 .../test_util/commands/{ => quoting}/input    |  0
 .../test_util/commands/{ => quoting}/test     |  0
 7 files changed, 44 insertions(+), 17 deletions(-)
 create mode 100644 util/test/test_util/commands/assert/expected
 create mode 100644 util/test/test_util/commands/assert/input
 create mode 100755 util/test/test_util/commands/assert/test
 rename util/test/test_util/commands/{ => quoting}/expected (100%)
 rename util/test/test_util/commands/{ => quoting}/input (100%)
 rename util/test/test_util/commands/{ => quoting}/test (100%)

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 41937c579..b460ae7ed 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -95,23 +95,20 @@ export -f _comma_test_command_impl
 
 function _comma_test_commands_impl()
 {
-    local key value status output until_first_failure=$1 fields=$2 assert_status=0
-    local input=$( grep '=' ; grep -v '^#' )
-    # local critical_tests=()
-    # while IFS='=' read key value ; do
-    #     [[ -n "$key" && ! "$key" =~ \#.* ]] || continue
-    #     key=$( comma-string-strip <<< "$key" )
-    #     # todo: if $key is $blah/assert_status=1, then critical_tests+=( "$blah" )  
-    # done <<< "$input"
-    while IFS='=' read key value ; do
-        [[ -n "$key" && ! "$key" =~ \#.* ]] || continue
-        key=$( comma-string-strip <<< "$key" )
+    local lhs key value status output until_first_failure=$1 fields=$2 predicate
+    while IFS='=' read lhs value ; do
+        [[ -n "$lhs" && ! "$lhs" =~ \#.* ]] || continue
+        local a=( $lhs )
+        if (( ${#a[@]} == 1 )); then predicate=; key=${a[0]}
+        elif (( ${#a[@]} == 2 )); then predicate=${a[0]}; key=${a[1]}
+        else echo "$0: expected [<predicate>] <test_name>=<command>, got: '$lhs=$value'" >&2; return 1; fi
         _comma_test_command_impl "$key" "$value"
         status=$?
         echo "$key/status=$status"
-        if (( status != 0 && until_first_failure )); then break; fi
-        # todo: if (( status != 0 && $key in critical tests )); then break; - or maybe it should be: return 1
-    done <<< "$input"
+        (( status != 0 )) || continue
+        if (( until_first_failure )); then return 1; fi 
+        if [[ "$predicate" == 'assert' ]]; then return 1; fi
+    done < <( grep '=' ; grep -v '^#' )
 }
 
 # a helper to write tests in the comma-test-run style
@@ -130,7 +127,6 @@ function _comma_test_commands_impl()
 #
 # if output fields are specified then the output will be split by field
 #
-#
 # e.g:
 # 
 # source $( type -p comma-test-util )
@@ -142,6 +138,17 @@ function _comma_test_commands_impl()
 # my_basic_test[1]/for/something/output/a="2"
 # my_basic_test[1]/for/something/output/b="4"
 # my_basic_test[1]/for/something/output=0
+#
+# 'assert' keyword: if present, do not run the remaining tests in the input file
+#
+# e.g, in the following example, the second test case my/test[1] does NOT run because
+#      the first failing test case my/test[0] has 'assert' in front of it
+#
+# source $( type -p comma-test-util )
+# ( echo 'assert my/test[0]="ls non-existent"'; echo 'my/test[1]="ls ."' ) | comma_test_commands
+# ls: cannot access 'non-existent': No such file or directory
+# my/test[0]/output=""
+# my/test[0]/status=2
 
 function comma_test_commands() { _comma_test_commands_impl 0 "$@" ; }
 function comma_test_commands_until_first_failure() { _comma_test_commands_impl 1 "$@" ; }
@@ -180,7 +187,7 @@ function comma_test_interactive_commands()
     (
         function comma_test_interactive_test_case()
         {
-            local name=$1 testcase_number=$2 number_of_testcases=$3
+            local name="$1" testcase_number=$2 number_of_testcases=$3
             local command instruction expected dialog input zenity_pid result
             #input=$( comma_path_value_mangle | sed 's/^/local /' )
             #eval "$input"
@@ -212,7 +219,7 @@ function comma_test_interactive_commands()
         while read test_case_name; do
             local escaped="${test_case_name//[/\\[}"
             local test_case=$( grep "^$escaped/" <<< "$lines" | sed "s#^$escaped/##" ) # grep --fixed-strings does not seem to work
-            comma_test_interactive_test_case $test_case_name $testcase_number $number_of_testcases <<< "$test_case"
+            comma_test_interactive_test_case "$test_case_name" $testcase_number $number_of_testcases <<< "$test_case"
             local r=$?
             if (( r != 0 && until_first_failure )); then return $r; fi
             (( ++testcase_number ))
diff --git a/util/test/test_util/commands/assert/expected b/util/test/test_util/commands/assert/expected
new file mode 100644
index 000000000..444ca4026
--- /dev/null
+++ b/util/test/test_util/commands/assert/expected
@@ -0,0 +1,6 @@
+basics[0]/output=""
+basics[0]/status=2
+basics[1]/output=""
+basics[1]/status=2
+status=1
+output/lines/count=4
diff --git a/util/test/test_util/commands/assert/input b/util/test/test_util/commands/assert/input
new file mode 100644
index 000000000..71d7b29b0
--- /dev/null
+++ b/util/test/test_util/commands/assert/input
@@ -0,0 +1,4 @@
+basics[0]="ls ./non-existent-file"
+assert basics[1]="ls ./non-existent-file"
+basics[1]="ls"
+basics[2]="ls ./non-existent-file"
diff --git a/util/test/test_util/commands/assert/test b/util/test/test_util/commands/assert/test
new file mode 100755
index 000000000..1a4e681a8
--- /dev/null
+++ b/util/test/test_util/commands/assert/test
@@ -0,0 +1,10 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+output=$( comma_test_commands )
+status=$?
+echo "$output"
+echo "status=$status"
+echo "output/lines/count=$( wc -l <<< "$output" )"
\ No newline at end of file
diff --git a/util/test/test_util/commands/expected b/util/test/test_util/commands/quoting/expected
similarity index 100%
rename from util/test/test_util/commands/expected
rename to util/test/test_util/commands/quoting/expected
diff --git a/util/test/test_util/commands/input b/util/test/test_util/commands/quoting/input
similarity index 100%
rename from util/test/test_util/commands/input
rename to util/test/test_util/commands/quoting/input
diff --git a/util/test/test_util/commands/test b/util/test/test_util/commands/quoting/test
similarity index 100%
rename from util/test/test_util/commands/test
rename to util/test/test_util/commands/quoting/test

From 4120704140fb609cabf324891535d23cd603e672 Mon Sep 17 00:00:00 2001
From: rex <rex@super>
Date: Mon, 14 Apr 2025 08:52:45 +1000
Subject: [PATCH 1006/1056] comma-test-util: assert keyword for interactive
 tests

---
 util/applications/comma-test-util             | 126 +++++++++++++++---
 .../interactive_commands/assert/expected      |   6 +
 .../interactive_commands/assert/input         |   5 +
 .../interactive_commands/assert/test          |  10 ++
 4 files changed, 125 insertions(+), 22 deletions(-)
 create mode 100644 util/test/test_util/interactive_commands/assert/expected
 create mode 100644 util/test/test_util/interactive_commands/assert/input
 create mode 100755 util/test/test_util/interactive_commands/assert/test

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index b460ae7ed..9b03f7824 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -59,8 +59,40 @@ for line in sys.stdin.readlines(): print( line.strip() )
 eof
 }
 
+function _comma_test_util_test_case_name()
+{
+     cat <<eof
+import sys
+import re
+for line in sys.stdin:
+    match = re.match(r'(?:\S+\s+)?([^\s=]+)/command$', line)
+    if match:
+        print(match.group(1))
+eof
+}
+
+function _comma_test_util_test_case()
+{
+    cat <<eof
+import sys
+import re
+test_case_name = sys.argv[1]
+lines = sys.stdin.read().splitlines()
+for line in lines:
+    match = re.match(r'(?:(\S+)\s+)?(' + re.escape(test_case_name) + r')/(.+?)=(.*)', line)
+    if match:
+        predicate = match.group(1)
+        key = match.group(3)
+        val = match.group(4)
+        prefix = (predicate + ' ') if predicate else ''
+        print(f'{prefix}{key}={val}')
+eof
+}
+
 readonly _comma_test_util_strip_command="$( _comma_test_util_strip )"
 readonly _comma_test_util_unquote_command="$( _comma_test_util_unquote )"
+readonly _comma_test_util_test_case_name_command="$( _comma_test_util_test_case_name )"
+readonly _comma_test_util_test_case_command="$( _comma_test_util_test_case )"
 
 function comma-string-strip() { python3 -c "$_comma_test_util_strip_command"; } # todo: add comma-string-util, parametrise on strip characters
 
@@ -70,6 +102,14 @@ function comma-string-unquote() { python3 -c "$_comma_test_util_unquote_command"
 
 export -f comma-string-unquote
 
+function comma-string-test-case-name() { python3 -c "$_comma_test_util_test_case_name_command"; } # todo: add comma-string-util, parametrise on strip characters
+
+export -f comma-string-test-case-name
+
+function comma-string-test-case() { local name="$1"; python3 -c "$_comma_test_util_test_case_command" "$name"; } # todo: add comma-string-util, parametrise on strip characters
+
+export -f comma-string-test-case
+
 function _comma_test_command_impl()
 {
     local key="$1" value="$2"
@@ -180,48 +220,90 @@ function comma_test_commands_until_first_failure() { _comma_test_commands_impl 1
 # if test case does not have both instruction and expected, it is deemed non-interactive
 #
 # see for an example: e.g. snark/graphics/applications/test/view-points/colour/scalar/options
+#
+# 'assert' keyword: if present, do not run the remaining tests in the input file
+# predicates (like assert) are individually associated with command | instruction | expected
+#
+# in the following example, my/test[1] will NOT run if
+#   - command returns non-zero status (assert command)
+#   - zenity prompt returns non-zero status (assert expected)
+# there is currently no implementation for assert instruction
+# 
+# > cat input
+# 
+# assert my/test[0]/command=<command>
+# my/test[0]/instruction=<instruction>
+# assert my/test[0]/expected=<expected >
+# my/test[1]/command=<command>
 function comma_test_interactive_commands()
 {
     local until_first_failure=$1
     if [[ -n "$until_first_failure" ]]; then until_first_failure=1; else until_first_failure=0; fi
-    (
+    (   
         function comma_test_interactive_test_case()
-        {
+        {   
             local name="$1" testcase_number=$2 number_of_testcases=$3
-            local command instruction expected dialog input zenity_pid result
-            #input=$( comma_path_value_mangle | sed 's/^/local /' )
-            #eval "$input"
-            while IFS='=' read key value; do # have to do it piecemeal to avoid bash quoting difficulties
+            declare -A interactive_test
+            local lhs value dialog zenity_pid command_result zenity_result result
+            while IFS='=' read lhs value; do
+                local a predicate key
+                a=( $lhs )
+                if (( ${#a[@]} == 1 )); then predicate=""; key=${a[0]};
+                elif (( ${#a[@]} == 2 )); then predicate=${a[0]}; key=${a[1]};
+                else echo "$0: expected [<predicate>] <key>=<value>, got: '$lhs=$value'" >&2; return 1; fi
                 key=$( comma-string-strip <<< "$key" )
-                if [[ "$key" == "command" ]]; then command="$value"
-                elif [[ "$key" == "instruction" ]]; then instruction="$value"
-                elif [[ "$key" == "expected" ]]; then expected="$value"
-                else echo "$0: test '$name': expected 'command', 'instruction', or 'expected', got: '$key'" >&2; return 1; fi
+                case "$key" in
+                    command|instruction|expected)
+                        interactive_test["$key"]="$value"
+                        interactive_test["${key}_predicate"]="$predicate"
+                        ;;
+                    *)
+                        echo "$0: test '$name': expected 'command', 'instruction', or 'expected', got: '$key'" >&2; 
+                        return 2
+                        ;;
+                esac
             done
-            [[ -n "$command" ]] || { echo "$0: $name/command not specified" >&2 ; echo "$name/status=1"; return 1 ; }
-            if [[ -n "$instruction" || -n "$expected" ]]; then                
-                [[ -z "$instruction" ]] || dialog+="$instruction\n\n"
-                if [[ -n "$expected" ]]; then dialog+="do you see: $expected?"; else dialog+="does it look good?"; fi
+
+            [[ -n "${interactive_test[command]}" ]] || { echo "$0: $name/command not specified" >&2; return 3; }
+            if [[ -n "${interactive_test[instruction]}" || -n "${interactive_test[expected]}" ]]; then
+                [[ -z "${interactive_test[instruction]}" ]] || dialog+="${interactive_test[instruction]}\n\n"
+                if [[ -n "${interactive_test[expected]}" ]]; then dialog+="do you see: ${interactive_test[expected]}?"; else dialog+="does it look good?"; fi
                 zenity --question --title="testcase $testcase_number of $number_of_testcases: $name" --text="$dialog" --width=600 &
                 zenity_pid=$!
             fi
-            _comma_test_command_impl "$name" "$command"
-            result=$?
-            if [[ -n "$zenity_pid" ]]; then wait $zenity_pid; result=$?; fi
+
+            _comma_test_command_impl "$name" "${interactive_test[command]}"
+            command_result=$?
+            if [[ -n "$zenity_pid" ]]; then
+                wait $zenity_pid
+                zenity_result=$?
+                result=$(( command_result != 0 || zenity_result != 0 ? 1 : 0 ))
+            else
+                result=$command_result
+            fi
             echo "$name/status=$result"
-            return $result
+            
+            (( result != 0 )) || return $result
+            if (( until_first_failure )); then return 4; fi
+            if [[ "${interactive_test[command_predicate]}" == "assert" ]]; then
+                (( command_result != 0 )) && return 5
+            fi
+            [[ -n "$zenity_result" ]] || return 0
+            if [[ "${interactive_test[expected_predicate]}" == "assert" ]]; then
+                (( zenity_result != 0 )) && return 6
+            fi
+            return 0
         }
 
         local lines=$( cat );
-        local test_cases=$( cut -d= -f1 <<< "$lines" | grep -v '^#' | comma-string-strip | grep '/command$' | egrep '^[a-zA-Z0-9_]' | sed 's#/command$##' )
+        local test_cases=$( cut -d= -f1 <<< "$lines" | grep -v '^#' | comma-string-strip | grep '/command$' | egrep '^[a-zA-Z0-9_]' | comma-string-test-case-name )
         local number_of_testcases=$( wc -l <<< "$test_cases" )
         local testcase_number=0 test_case_name
         while read test_case_name; do
-            local escaped="${test_case_name//[/\\[}"
-            local test_case=$( grep "^$escaped/" <<< "$lines" | sed "s#^$escaped/##" ) # grep --fixed-strings does not seem to work
+            local test_case=$(comma-string-test-case "$test_case_name" <<< "$lines")
             comma_test_interactive_test_case "$test_case_name" $testcase_number $number_of_testcases <<< "$test_case"
             local r=$?
-            if (( r != 0 && until_first_failure )); then return $r; fi
+            (( r == 0 )) || return $r;
             (( ++testcase_number ))
         done <<< "$test_cases"
     )
diff --git a/util/test/test_util/interactive_commands/assert/expected b/util/test/test_util/interactive_commands/assert/expected
new file mode 100644
index 000000000..b5adf5dca
--- /dev/null
+++ b/util/test/test_util/interactive_commands/assert/expected
@@ -0,0 +1,6 @@
+basics[0]/output=""
+basics[0]/status=2
+basics[2]/output=""
+basics[2]/status=2
+status=5
+output/lines/count=4
diff --git a/util/test/test_util/interactive_commands/assert/input b/util/test/test_util/interactive_commands/assert/input
new file mode 100644
index 000000000..83164c4c0
--- /dev/null
+++ b/util/test/test_util/interactive_commands/assert/input
@@ -0,0 +1,5 @@
+basics[0]/command="ls ./non-existent-file"
+assert basics[1]="ls ./non-existent-file"
+assert basics[2]/command="ls ./non-existent-file"
+basics[3]/command="ls"
+basics[4]/command="ls ./non-existent-file"
diff --git a/util/test/test_util/interactive_commands/assert/test b/util/test/test_util/interactive_commands/assert/test
new file mode 100755
index 000000000..78a402201
--- /dev/null
+++ b/util/test/test_util/interactive_commands/assert/test
@@ -0,0 +1,10 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+output=$( comma_test_interactive_commands )
+status=$?
+echo "$output"
+echo "status=$status"
+echo "output/lines/count=$( wc -l <<< "$output" )"
\ No newline at end of file

From 87931d1ae763f8e244cc69cd3f7a20b00aeb1f38 Mon Sep 17 00:00:00 2001
From: rex <rexcrisp@outlook.com.au>
Date: Mon, 14 Apr 2025 20:08:11 +1000
Subject: [PATCH 1007/1056] rename  _comma_test_case_name and 
 _comma_test_name_parse; unquote instruction/expected strings in zenity
 dialogue; add user prompt test case

---
 util/applications/comma-test-util               | 17 +++++++----------
 .../interactive_commands/assert/disabled        |  1 +
 .../interactive_commands/assert/expected        |  6 +++---
 .../test_util/interactive_commands/assert/input |  9 +++++----
 4 files changed, 16 insertions(+), 17 deletions(-)
 create mode 100644 util/test/test_util/interactive_commands/assert/disabled

diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 9b03f7824..69393582d 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -71,7 +71,7 @@ for line in sys.stdin:
 eof
 }
 
-function _comma_test_util_test_case()
+function _comma_test_util_test_name_parse()
 {
     cat <<eof
 import sys
@@ -92,7 +92,7 @@ eof
 readonly _comma_test_util_strip_command="$( _comma_test_util_strip )"
 readonly _comma_test_util_unquote_command="$( _comma_test_util_unquote )"
 readonly _comma_test_util_test_case_name_command="$( _comma_test_util_test_case_name )"
-readonly _comma_test_util_test_case_command="$( _comma_test_util_test_case )"
+readonly _comma_test_util_test_name_parse_command="$( _comma_test_util_test_name_parse )"
 
 function comma-string-strip() { python3 -c "$_comma_test_util_strip_command"; } # todo: add comma-string-util, parametrise on strip characters
 
@@ -102,13 +102,9 @@ function comma-string-unquote() { python3 -c "$_comma_test_util_unquote_command"
 
 export -f comma-string-unquote
 
-function comma-string-test-case-name() { python3 -c "$_comma_test_util_test_case_name_command"; } # todo: add comma-string-util, parametrise on strip characters
+function _comma_test_case_name() { python3 -c "$_comma_test_util_test_case_name_command"; } # todo: add comma-string-util, parametrise on strip characters
 
-export -f comma-string-test-case-name
-
-function comma-string-test-case() { local name="$1"; python3 -c "$_comma_test_util_test_case_command" "$name"; } # todo: add comma-string-util, parametrise on strip characters
-
-export -f comma-string-test-case
+function _comma_test_name_parse() { local name="$1"; python3 -c "$_comma_test_util_test_name_parse_command" "$name"; } # todo: add comma-string-util, parametrise on strip characters
 
 function _comma_test_command_impl()
 {
@@ -254,6 +250,7 @@ function comma_test_interactive_commands()
                 key=$( comma-string-strip <<< "$key" )
                 case "$key" in
                     command|instruction|expected)
+                        if [[ "$key" == "instruction" || "$key" == "expected" ]]; then value=$(echo "$value" | sed -E "s/^(['\"])(.*)\1$/\2/"); fi
                         interactive_test["$key"]="$value"
                         interactive_test["${key}_predicate"]="$predicate"
                         ;;
@@ -296,11 +293,11 @@ function comma_test_interactive_commands()
         }
 
         local lines=$( cat );
-        local test_cases=$( cut -d= -f1 <<< "$lines" | grep -v '^#' | comma-string-strip | grep '/command$' | egrep '^[a-zA-Z0-9_]' | comma-string-test-case-name )
+        local test_cases=$( cut -d= -f1 <<< "$lines" | grep -v '^#' | comma-string-strip | grep '/command$' | egrep '^[a-zA-Z0-9_]' | _comma_test_case_name )
         local number_of_testcases=$( wc -l <<< "$test_cases" )
         local testcase_number=0 test_case_name
         while read test_case_name; do
-            local test_case=$(comma-string-test-case "$test_case_name" <<< "$lines")
+            local test_case=$(_comma_test_name_parse "$test_case_name" <<< "$lines")
             comma_test_interactive_test_case "$test_case_name" $testcase_number $number_of_testcases <<< "$test_case"
             local r=$?
             (( r == 0 )) || return $r;
diff --git a/util/test/test_util/interactive_commands/assert/disabled b/util/test/test_util/interactive_commands/assert/disabled
new file mode 100644
index 000000000..2808ba79e
--- /dev/null
+++ b/util/test/test_util/interactive_commands/assert/disabled
@@ -0,0 +1 @@
+this is an interactive test that is run manually as needed
diff --git a/util/test/test_util/interactive_commands/assert/expected b/util/test/test_util/interactive_commands/assert/expected
index b5adf5dca..cac43217b 100644
--- a/util/test/test_util/interactive_commands/assert/expected
+++ b/util/test/test_util/interactive_commands/assert/expected
@@ -1,6 +1,6 @@
 basics[0]/output=""
-basics[0]/status=2
-basics[2]/output=""
-basics[2]/status=2
+basics[0]/status=1
+basics[1]/output=""
+basics[1]/status=2
 status=5
 output/lines/count=4
diff --git a/util/test/test_util/interactive_commands/assert/input b/util/test/test_util/interactive_commands/assert/input
index 83164c4c0..35ea63842 100644
--- a/util/test/test_util/interactive_commands/assert/input
+++ b/util/test/test_util/interactive_commands/assert/input
@@ -1,5 +1,6 @@
 basics[0]/command="ls ./non-existent-file"
-assert basics[1]="ls ./non-existent-file"
-assert basics[2]/command="ls ./non-existent-file"
-basics[3]/command="ls"
-basics[4]/command="ls ./non-existent-file"
+basics[0]/instruction="this test command will FAIL safely, press YES for the user test to pass"
+assert basics[0]/expected="'ls: cannot access 'non-existent': No such file or directory'"
+assert basics[1]/command="ls ./non-existent-file"
+basics[2]/command="ls"
+basics[3]/command="ls ./non-existent-file"

From c6e03dbb512795ceb7cf1f63948de7043b5253ff Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 14 Apr 2025 20:26:25 +1000
Subject: [PATCH 1008/1056] util/test/test_util/interactive_commands: test
 moved to util/test/test_util/interactive_commands/command

---
 util/test/test_util/interactive_commands/{ => command}/expected | 0
 util/test/test_util/interactive_commands/{ => command}/input    | 0
 util/test/test_util/interactive_commands/{ => command}/test     | 0
 3 files changed, 0 insertions(+), 0 deletions(-)
 rename util/test/test_util/interactive_commands/{ => command}/expected (100%)
 rename util/test/test_util/interactive_commands/{ => command}/input (100%)
 rename util/test/test_util/interactive_commands/{ => command}/test (100%)

diff --git a/util/test/test_util/interactive_commands/expected b/util/test/test_util/interactive_commands/command/expected
similarity index 100%
rename from util/test/test_util/interactive_commands/expected
rename to util/test/test_util/interactive_commands/command/expected
diff --git a/util/test/test_util/interactive_commands/input b/util/test/test_util/interactive_commands/command/input
similarity index 100%
rename from util/test/test_util/interactive_commands/input
rename to util/test/test_util/interactive_commands/command/input
diff --git a/util/test/test_util/interactive_commands/test b/util/test/test_util/interactive_commands/command/test
similarity index 100%
rename from util/test/test_util/interactive_commands/test
rename to util/test/test_util/interactive_commands/command/test

From 46584986fe1b1323309c336c805519ad885bf29f Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 14 Apr 2025 20:33:29 +1000
Subject: [PATCH 1009/1056] util/test/test_util/interactive_commands/assert:
 made it optional instead of disabled

---
 .../test_util/interactive_commands/assert/{disabled => optional}  | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename util/test/test_util/interactive_commands/assert/{disabled => optional} (100%)

diff --git a/util/test/test_util/interactive_commands/assert/disabled b/util/test/test_util/interactive_commands/assert/optional
similarity index 100%
rename from util/test/test_util/interactive_commands/assert/disabled
rename to util/test/test_util/interactive_commands/assert/optional

From a293ecbaeafbffb357d91bcbd54a4a3e7abcc714 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 00:33:41 +0000
Subject: [PATCH 1010/1056] comma-progress: using stl functional instead of
 boost functional

---
 util/applications/comma-progress.cpp | 32 +++++++++++-----------------
 1 file changed, 13 insertions(+), 19 deletions(-)

diff --git a/util/applications/comma-progress.cpp b/util/applications/comma-progress.cpp
index 1e10392b3..43127b312 100644
--- a/util/applications/comma-progress.cpp
+++ b/util/applications/comma-progress.cpp
@@ -27,23 +27,19 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-#include <boost/date_time/posix_time/ptime.hpp>
-#include <vector>
-#include <boost/unordered_map.hpp>
 #include <deque>
-#include <boost/unordered_set.hpp>
 #include <functional>
-#include <boost/functional.hpp>
+#include <vector>
+#include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/math/special_functions/round.hpp>
+#include <boost/unordered_map.hpp>
+#include <boost/unordered_set.hpp>
 #include "../../csv/stream.h"
 #include "../../visiting/traits.h"
 #include "../../application/command_line_options.h"
 #include "../../name_value/ptree.h"
 
-static const std::string& name() {
-    static const std::string name = "comma-progress";
-    return name;
-}
+static const char* name() { return "comma-progress"; }
 
 static char delimiter = ';';
 static const char equal_sign = '=';
@@ -422,8 +418,8 @@ int main( int ac, char** av )
         }
         else if( options.exists( "--elapsed" ) )
         {
-            boost::function< void( const impl_::log&, const impl_::log&, const std::string&) > outputting( &output_elapsed );
-            boost::function< const impl_::log*() > extractor( &get_log );
+            std::function< void( const impl_::log&, const impl_::log&, const std::string&) > outputting( &output_elapsed );
+            std::function< const impl_::log*() > extractor( &get_log );
             if( options.exists( "--from-path-value,--from-pv" ) )
             {
                 extractor = &get_log_path_value;
@@ -434,18 +430,16 @@ int main( int ac, char** av )
         }
         else
         {
-            boost::function< const impl_::log*() > extractor( &get_log );
-            boost::function< void( const impl_::log&, const impl_::log&, const std::string&) > outputting( &output );
+            std::function< const impl_::log*() > extractor( &get_log );
+            std::function< void( const impl_::log&, const impl_::log&, const std::string&) > outputting( &output );
             impl_::process_begin_end< impl_::log >( extractor , outputting );
             
             return 0;
         }
         
     }
-    catch( std::exception& e ) {
-        std::cerr << name() << ": exception caught - " << e.what() << std::endl;
-    }
-    catch(...) {
-        std::cerr << name() << ": unknown exception caught, terminating." << std::endl;
-    }
+    catch( std::exception& e ) { comma::say() << "exception caught - " << e.what() << std::endl; }
+    catch(...) { comma::say() << "unknown exception" << std::endl; }
+    return 1;
 }
+

From bd8bce09ba725c80268b47338c7cf6308a39b957 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 00:38:07 +0000
Subject: [PATCH 1011/1056] application: command_line_options: getting rid of
 boost functional

---
 application/command_line_options.h | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/application/command_line_options.h b/application/command_line_options.h
index b5efa142f..ca3f51270 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -5,11 +5,11 @@
 
 #pragma once
 
+#include <functional>
 #include <iostream>
 #include <map>
 #include <string>
 #include <vector>
-#include <boost/function.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
 #include "../base/exception.h"
@@ -71,18 +71,18 @@ class command_line_options
         /// constructor
         /// if --help,-h present, call usage()
         /// if --verbose,-v present, call usage( verbose )
-        command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage = NULL, boost::function< void( int, char** ) > bash_completion = NULL );
+        command_line_options( int argc, char ** argv, std::function< void( bool ) > usage = NULL, std::function< void( int, char** ) > bash_completion = NULL );
 
         /// constructor
         /// if --help,-h present, call usage()
         /// if --verbose,-v present, call usage( verbose )
-        command_line_options( const std::vector< std::string >& argv, boost::function< void( bool ) > usage = NULL );
+        command_line_options( const std::vector< std::string >& argv, std::function< void( bool ) > usage = NULL );
         
         /// constructor
         /// if --help,-h present, call usage()
         /// if --verbose,-v present, call usage( verbose )
         template< typename Iterator >
-        command_line_options( Iterator begin, Iterator end, boost::function< void( bool ) > usage = NULL );
+        command_line_options( Iterator begin, Iterator end, std::function< void( bool ) > usage = NULL );
 
         /// constructor
         command_line_options( const command_line_options& rhs );
@@ -191,7 +191,7 @@ class command_line_options
         
 };
 
-template< typename Iterator > inline command_line_options::command_line_options( Iterator begin, Iterator end, boost::function< void( bool ) > usage )
+template< typename Iterator > inline command_line_options::command_line_options( Iterator begin, Iterator end, std::function< void( bool ) > usage )
 {
     argv_.resize( std::distance( begin, end ) );
     for ( Iterator i = begin; i < end; ++i ) { argv_[i] = *i; }

From aef388fd950d1a9d3fea4b4bc954dc7d3556a36a Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 00:38:49 +0000
Subject: [PATCH 1012/1056] application: command_line_options: getting rid of
 boost functional

---
 application/command_line_options.cpp | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index b63331704..91f1af574 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -5,10 +5,10 @@
 
 #include <algorithm>
 #include <array>
+#include <functional>
 #include <set>
 #include <sstream>
 #include <unordered_map>
-#include <boost/bind/bind.hpp>
 #include <boost/config/warning_disable.hpp>
 #include <boost/iostreams/stream.hpp>
 #include <boost/iostreams/device/null.hpp>
@@ -85,7 +85,7 @@ void command_line_options::_init_verbose( const std::string& path )
     if( exists( "--titlebar-application-name,--tbn" ) ) { comma::io::terminal::titlebar_ostream s; s << comma::application::detail::name; }
 }
 
-command_line_options::command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage, boost::function< void( int, char** ) > bash_completion )
+command_line_options::command_line_options( int argc, char ** argv, std::function< void( bool ) > usage, std::function< void( int, char** ) > bash_completion )
 {
     argv_.resize( argc );
     for( int i = 0; i < argc; ++i ) { argv_[i] = argv[i]; }
@@ -95,7 +95,7 @@ command_line_options::command_line_options( int argc, char ** argv, boost::funct
     if( usage && exists( "--help,-h" ) ) { usage( comma::application::detail::verbosity_level > 0 ); exit( 0 ); }
 }
 
-command_line_options::command_line_options( const std::vector< std::string >& argv, boost::function< void( bool ) > usage )
+command_line_options::command_line_options( const std::vector< std::string >& argv, std::function< void( bool ) > usage )
     : argv_( argv )
 {
     _fill_map( argv_ );
@@ -281,12 +281,12 @@ namespace impl {
         description_t d;
         bool r = boost::spirit::qi::phrase_parse( s.begin()
                                                 , s.end()
-                                                ,      name[ boost::bind( push_back_, boost::ref( d.names ), boost::placeholders::_1 ) ]
-                                                    >> *( ',' >> name[ boost::bind( push_back_, boost::ref( d.names ), boost::placeholders::_1 ) ] )
-                                                    >> -( '=' >> ( value[ boost::bind( got_value, boost::ref( d ), boost::placeholders::_1 ) ]
-                                                                | optional_value[ boost::bind( got_optional_value, boost::ref( d ), boost::placeholders::_1 ) ] ) )
-                                                    >> -( ';' >> default_value[ boost::bind( got_default_value, boost::ref( d ), boost::placeholders::_1 ) ] )
-                                                    >> -( ';' >> *( ascii::space ) >> help[ boost::bind( set_, boost::ref( d.help ), boost::placeholders::_1 ) ] )
+                                                ,      name[ std::bind( push_back_, boost::ref( d.names ), std::placeholders::_1 ) ]
+                                                    >> *( ',' >> name[ std::bind( push_back_, boost::ref( d.names ), std::placeholders::_1 ) ] )
+                                                    >> -( '=' >> ( value[ std::bind( got_value, boost::ref( d ), std::placeholders::_1 ) ]
+                                                                | optional_value[ std::bind( got_optional_value, boost::ref( d ), std::placeholders::_1 ) ] ) )
+                                                    >> -( ';' >> default_value[ std::bind( got_default_value, boost::ref( d ), std::placeholders::_1 ) ] )
+                                                    >> -( ';' >> *( ascii::space ) >> help[ std::bind( set_, boost::ref( d.help ), std::placeholders::_1 ) ] )
                                                     >> qi::eoi
                                                 , ascii::space );
         if( !r ) { COMMA_THROW( comma::exception, "invalid option description: \"" << s << "\"" ); }

From 7a3422daeb981604f5c1f8b8f9bbf3518c42aa15 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 00:40:32 +0000
Subject: [PATCH 1013/1056] csv-calc: getting rid of boost functional

---
 csv/applications/csv-calc.cpp | 41 ++++++++++++++++++-----------------
 1 file changed, 21 insertions(+), 20 deletions(-)

diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index f0cf64087..2d1208ab6 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -10,6 +10,7 @@
 #endif
 
 #include <deque>
+#include <functional>
 #include <iostream>
 #include <map>
 #include <type_traits>
@@ -196,8 +197,8 @@ class Values
         comma::csv::format::element id_element_;
         unsigned int block_;
         unsigned int id_;
-        boost::function< comma::uint32( const char* ) > block_from_bin_;
-        boost::function< comma::uint32( const char* ) > id_from_bin_;
+        std::function< comma::uint32( const char* ) > block_from_bin_;
+        std::function< comma::uint32( const char* ) > id_from_bin_;
         template < typename T > static comma::uint32 from_bin_( const char* buf ) { return comma::csv::format::traits< T >::from_bin( buf ); }
 
         void init_indices_()
@@ -237,15 +238,15 @@ class Values
                 block_element_ = input_format_.offset( *block_index_ );
                 switch( block_element_.type )
                 {
-                    case comma::csv::format::char_t: block_from_bin_ = boost::bind( &Values::from_bin_< char >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::int8: block_from_bin_ = boost::bind( &Values::from_bin_< char >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::uint8: block_from_bin_ = boost::bind( &Values::from_bin_< unsigned char >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::int16: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int16 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::uint16: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint16 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::int32: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int32 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::uint32: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint32 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::int64: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int64 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::uint64: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint64 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::char_t: block_from_bin_ = std::bind( &Values::from_bin_< char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int8: block_from_bin_ = std::bind( &Values::from_bin_< char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint8: block_from_bin_ = std::bind( &Values::from_bin_< unsigned char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int16: block_from_bin_ = std::bind( &Values::from_bin_< comma::int16 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint16: block_from_bin_ = std::bind( &Values::from_bin_< comma::uint16 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int32: block_from_bin_ = std::bind( &Values::from_bin_< comma::int32 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint32: block_from_bin_ = std::bind( &Values::from_bin_< comma::uint32 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int64: block_from_bin_ = std::bind( &Values::from_bin_< comma::int64 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint64: block_from_bin_ = std::bind( &Values::from_bin_< comma::uint64 >, std::placeholders::_1 ); break;
                     default: COMMA_THROW( comma::exception, "expected integer for block id, got format " << input_format_.string() );
                 }
             }
@@ -254,15 +255,15 @@ class Values
                 id_element_ = input_format_.offset( *id_index_ );
                 switch( id_element_.type )
                 {
-                    case comma::csv::format::char_t: id_from_bin_ = boost::bind( &Values::from_bin_< char >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::int8: id_from_bin_ = boost::bind( &Values::from_bin_< char >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::uint8: id_from_bin_ = boost::bind( &Values::from_bin_< unsigned char >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::int16: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int16 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::uint16: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint16 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::int32: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int32 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::uint32: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint32 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::int64: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int64 >, boost::placeholders::_1 ); break;
-                    case comma::csv::format::uint64: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint64 >, boost::placeholders::_1 ); break;
+                    case comma::csv::format::char_t: id_from_bin_ = std::bind( &Values::from_bin_< char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int8: id_from_bin_ = std::bind( &Values::from_bin_< char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint8: id_from_bin_ = std::bind( &Values::from_bin_< unsigned char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int16: id_from_bin_ = std::bind( &Values::from_bin_< comma::int16 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint16: id_from_bin_ = std::bind( &Values::from_bin_< comma::uint16 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int32: id_from_bin_ = std::bind( &Values::from_bin_< comma::int32 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint32: id_from_bin_ = std::bind( &Values::from_bin_< comma::uint32 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int64: id_from_bin_ = std::bind( &Values::from_bin_< comma::int64 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint64: id_from_bin_ = std::bind( &Values::from_bin_< comma::uint64 >, std::placeholders::_1 ); break;
                     default: COMMA_THROW( comma::exception, "expected integer for block id, got format " << input_format_.string() );
                 }
             }

From 0ad93654ad4549772cf040fb485e94212ebc7423 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 00:41:58 +0000
Subject: [PATCH 1014/1056] csv-units: getting rid of boost functional

---
 csv/applications/csv-units.cpp | 19 ++++++++++---------
 1 file changed, 10 insertions(+), 9 deletions(-)

diff --git a/csv/applications/csv-units.cpp b/csv/applications/csv-units.cpp
index 701b2bc0f..fa7addbe8 100644
--- a/csv/applications/csv-units.cpp
+++ b/csv/applications/csv-units.cpp
@@ -3,6 +3,7 @@
 /// @author vsevolod vlaskine
 /// @author kai huang
 
+#include <functional>
 #include <iostream>
 #include <boost/array.hpp>
 #include <boost/bind/bind.hpp>
@@ -272,7 +273,7 @@ namespace units {
 
     /// A type to allow a lookup table for converting units
     //typedef double (* cast_function)( double );
-    typedef boost::function< double( double ) > cast_function;
+    typedef std::function< double( double ) > cast_function;
 
     /// Retrieve a function that will convert between the two given
     /// measurement units.
@@ -311,14 +312,14 @@ namespace units {
             map[metres][feet] = cast< length_t, imperial_us_length_t >;
             map[metres][nautical_miles] = cast< length_t, nautical_mile_t >;
             map[metres][statute_miles] = cast< length_t, statute_mile_t >;
-            map[hours][minutes] = boost::bind( &scale, boost::placeholders::_1, 60.0 );
-            map[hours][seconds] = boost::bind( &scale, boost::placeholders::_1, 3600.0 );
-            map[minutes][seconds] = boost::bind( &scale, boost::placeholders::_1, 60.0 );
-            map[minutes][hours] = boost::bind( &scale, boost::placeholders::_1, 1.0 / 60.0 );
-            map[seconds][hours] = boost::bind( &scale, boost::placeholders::_1, 1.0 / 3600.0 );
-            map[seconds][minutes] = boost::bind( &scale, boost::placeholders::_1, 1.0 / 60.0 );
-            map[percent][fraction] = boost::bind( &scale, boost::placeholders::_1, 0.01 );
-            map[fraction][percent] = boost::bind( &scale, boost::placeholders::_1, 100.0 );
+            map[hours][minutes] = std::bind( &scale, std::placeholders::_1, 60.0 );
+            map[hours][seconds] = std::bind( &scale, std::placeholders::_1, 3600.0 );
+            map[minutes][seconds] = std::bind( &scale, std::placeholders::_1, 60.0 );
+            map[minutes][hours] = std::bind( &scale, std::placeholders::_1, 1.0 / 60.0 );
+            map[seconds][hours] = std::bind( &scale, std::placeholders::_1, 1.0 / 3600.0 );
+            map[seconds][minutes] = std::bind( &scale, std::placeholders::_1, 1.0 / 60.0 );
+            map[percent][fraction] = std::bind( &scale, std::placeholders::_1, 0.01 );
+            map[fraction][percent] = std::bind( &scale, std::placeholders::_1, 100.0 );
         }
         return map[from][to];
     }

From 885777dbd78ea9c93bf03ab117072db49f39df8f Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 00:44:19 +0000
Subject: [PATCH 1015/1056] name_value/impl/json_writer: compilation problem
 fixed: const end (cend) replaced with non-const end when modifying string

---
 name_value/impl/json_writer.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/name_value/impl/json_writer.h b/name_value/impl/json_writer.h
index 4afcfc3ea..a1a33ae9b 100644
--- a/name_value/impl/json_writer.h
+++ b/name_value/impl/json_writer.h
@@ -55,7 +55,7 @@ template< typename C > inline void json_remove_quotes( std::basic_string< C >& j
         *source++ = *next_token++;
         target = next_token;
     }
-    json_text.erase( pretty ? source : ( source - 1 ), json_text.cend() );
+    json_text.erase( pretty ? source : ( source - 1 ), json_text.end() );
 }
 
 template< class PTree > void write_json( std::basic_ostream< typename PTree::key_type::value_type > &stream, const PTree &ptree, bool const pretty = true, bool unquote_numbers = true )

From 4ec4e335395bf5c36ec2f6007864dda981863663 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 06:04:46 +0000
Subject: [PATCH 1016/1056] csv/test/csv-crc/test: bug fixed: variables with
 multiline values quoted

---
 csv/test/csv-crc/test | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/csv/test/csv-crc/test b/csv/test/csv-crc/test
index 0f991b0d5..a36f24dfd 100755
--- a/csv/test/csv-crc/test
+++ b/csv/test/csv-crc/test
@@ -2,8 +2,8 @@
 
 # read individual test parameters and data
 input=$( cat )
-eval "$( grep = <<< $input )"
-data=$( grep -v = <<< $input )
+eval "$( grep = <<< "$input" )"
+data=$( grep -v = <<< "$input" )
 
 [[ $operation ]] || exit 1
 [[ $data ]] || exit 1
@@ -22,4 +22,4 @@ function run_test()
 
 output=$( run_test )
 echo "$output" | name-value-from-csv -f line -d : --line-number -p output
-echo count=$( wc -l <<< $output )
+echo count=$( wc -l <<< "$output" )
\ No newline at end of file

From 5f5d18e5967e349a3ca4506e54099303feaf712c Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 07:51:39 +0000
Subject: [PATCH 1017/1056] name_value/impl: yaml placeholder created

---
 name_value/impl/yaml.cpp | 56 ++++++++++++++++++++++++++++++++++++++++
 1 file changed, 56 insertions(+)
 create mode 100644 name_value/impl/yaml.cpp

diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
new file mode 100644
index 000000000..b081ed60b
--- /dev/null
+++ b/name_value/impl/yaml.cpp
@@ -0,0 +1,56 @@
+#include <yaml.h>
+#include <iostream>
+#include "yaml.h"
+
+namespace comma { namespace property_tree { namespace impl { namespace yaml {
+
+enum storage_flags { VAR, VAL, SEQ };
+
+void process_layer( yaml_parser_t *parser, unsigned int depth = 0 )
+{
+    yaml_event_t event;
+    int storage = VAR; // mapping cannot start with VAL definition w/o VAR key
+    while( true )
+    {
+        yaml_parser_parse( parser, &event );
+        if( event.type == YAML_SCALAR_EVENT ) // parse value either as a new leaf in the mapping or as a leaf value (one of them, in case it's a sequence)
+        {
+            if( storage ) { std::cerr << "==> a: depth: " << depth << " scalar: event.data.scalar.value: " << event.data.scalar.value << std::endl; }
+            else { std::cerr << "==> b: depth: " << depth << " scalar: event.data.scalar.value: " << event.data.scalar.value << std::endl; }
+            storage ^= VAL; // flip VAR/VAL switch for the next event
+        }
+        else if ( event.type == YAML_SEQUENCE_START_EVENT) { std::cerr << "==> c: depth: " << depth << " sequence: start" << std::endl; storage = SEQ; } // sequence - all the following scalars will be appended to the last_leaf
+        else if (event.type == YAML_SEQUENCE_END_EVENT) { std::cerr << "==> d: depth: " << depth << " sequence: end" << std::endl; storage = VAR; }
+        else if ( event.type == YAML_MAPPING_START_EVENT )
+        {
+            std::cerr << "==> e: depth: " << depth << " mapping: start" << std::endl;
+            process_layer( parser, depth + 1 );
+            storage ^= VAL; // flip VAR/VAL, w/o touching SEQ
+        }
+        else if ( event.type == YAML_MAPPING_END_EVENT || event.type == YAML_STREAM_END_EVENT )
+        {
+            std::cerr << "==> e: depth: " << depth << " mapping: end" << std::endl;
+            break;
+        }
+        yaml_event_delete( &event );
+    }
+}
+
+boost::property_tree::ptree to_ptree( const std::string& s )
+{
+    boost::property_tree::ptree t;
+    yaml_parser_t parser;
+    yaml_parser_initialize( &parser );
+    yaml_parser_set_input_string( &parser, reinterpret_cast< const unsigned char* >( &s[0] ), s.size() );
+    process_layer( &parser );
+    yaml_parser_delete( &parser );
+    return t; // todo!!!
+}
+
+std::string from_ptree( const boost::property_tree::ptree& )
+{
+    std::string s;
+    return s;
+}
+
+} } } } // namespace comma { namespace property_tree { namespace impl { namespace yaml {

From 86bacd54f6ba672e4b4748dc268b3900663ebbf4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 19:48:43 +1000
Subject: [PATCH 1018/1056] name_value: property_tree: yaml support: in
 progress...

---
 CMakeLists.txt            |   1 +
 name_value/CMakeLists.txt |   8 ++-
 name_value/impl/yaml.cpp  | 104 ++++++++++++++++++++++++++++----------
 name_value/impl/yaml.h    |  46 +++++++++++++++++
 4 files changed, 132 insertions(+), 27 deletions(-)
 create mode 100644 name_value/impl/yaml.h

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 4d69ec426..357da2d9d 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -153,6 +153,7 @@ OPTION( BUILD_APPLICATIONS "build applications" ON )
 SET( comma_BUILD_APPLICATIONS ${BUILD_APPLICATIONS} )
 
 option( BUILD_SHARED_LIBS "build with shared libraries" ON )
+option( comma_BUILD_NAME_VALUE_YAML "build name_value with yaml support; requires libyaml; e.g. apt install libyaml-dev" OFF )
 option( comma_BUILD_PYTHON "build python" ON )
 option( comma_BUILD_XML "build xml" OFF )
 option( comma_BUILD_ZEROMQ "build io with zeromq support" OFF )
diff --git a/name_value/CMakeLists.txt b/name_value/CMakeLists.txt
index 615d5009f..611545ec9 100644
--- a/name_value/CMakeLists.txt
+++ b/name_value/CMakeLists.txt
@@ -7,12 +7,18 @@ FILE( GLOB impl_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/impl/*.h )
 SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} ${impl_includes} )
 #ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} ${impl_includes} comma_application comma_string comma_xpath )
 
+if( comma_BUILD_NAME_VALUE_YAML )
+    set( source "${source};${SOURCE_CODE_BASE_DIR}/${PROJECT}/impl/yaml.cpp" )
+endif( comma_BUILD_NAME_VALUE_YAML )
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} ) # comma_application
+target_link_libraries( ${TARGET_NAME} comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} ) # comma_application
+if( comma_BUILD_NAME_VALUE_YAML )
+    target_link_libraries( ${TARGET_NAME} yaml )
+endif( comma_BUILD_NAME_VALUE_YAML )
 INSTALL(
     TARGETS ${TARGET_NAME}
     RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
index b081ed60b..3ec996463 100644
--- a/name_value/impl/yaml.cpp
+++ b/name_value/impl/yaml.cpp
@@ -1,50 +1,102 @@
+// This file is part of comma library
+// Copyright (c) 2025 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+// 4. Additionally, source code from this repository produced after 2022
+//    must not be used in training or test datasets for training language
+//    models and/or automated code generation
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
 #include <yaml.h>
 #include <iostream>
+#include "../../base/exception.h"
 #include "yaml.h"
 
 namespace comma { namespace property_tree { namespace impl { namespace yaml {
 
-enum storage_flags { VAR, VAL, SEQ };
-
-void process_layer( yaml_parser_t *parser, unsigned int depth = 0 )
+static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t )
 {
-    yaml_event_t event;
-    int storage = VAR; // mapping cannot start with VAL definition w/o VAR key
+    struct on { enum state { name = 0, value = 1, sequence = 2 }; };
+    int state = on::name; // mapping cannot start with VAL definition w/o VAR key
+    std::string name, value;
     while( true )
     {
+        yaml_event_t event;
         yaml_parser_parse( parser, &event );
-        if( event.type == YAML_SCALAR_EVENT ) // parse value either as a new leaf in the mapping or as a leaf value (one of them, in case it's a sequence)
-        {
-            if( storage ) { std::cerr << "==> a: depth: " << depth << " scalar: event.data.scalar.value: " << event.data.scalar.value << std::endl; }
-            else { std::cerr << "==> b: depth: " << depth << " scalar: event.data.scalar.value: " << event.data.scalar.value << std::endl; }
-            storage ^= VAL; // flip VAR/VAL switch for the next event
-        }
-        else if ( event.type == YAML_SEQUENCE_START_EVENT) { std::cerr << "==> c: depth: " << depth << " sequence: start" << std::endl; storage = SEQ; } // sequence - all the following scalars will be appended to the last_leaf
-        else if (event.type == YAML_SEQUENCE_END_EVENT) { std::cerr << "==> d: depth: " << depth << " sequence: end" << std::endl; storage = VAR; }
-        else if ( event.type == YAML_MAPPING_START_EVENT )
+        switch( event.type )
         {
-            std::cerr << "==> e: depth: " << depth << " mapping: start" << std::endl;
-            process_layer( parser, depth + 1 );
-            storage ^= VAL; // flip VAR/VAL, w/o touching SEQ
-        }
-        else if ( event.type == YAML_MAPPING_END_EVENT || event.type == YAML_STREAM_END_EVENT )
-        {
-            std::cerr << "==> e: depth: " << depth << " mapping: end" << std::endl;
-            break;
+            case YAML_SCALAR_EVENT:
+                ( state ? name : value ) = reinterpret_cast< const char* >( event.data.scalar.value );
+                state ^= on::value; // flip on::name/on::value switch for the next event
+                break;
+            case YAML_SEQUENCE_START_EVENT:
+                // todo: parse sequence
+                state = on::sequence;
+                break;
+            case YAML_SEQUENCE_END_EVENT:
+                // todo: end parsing sequence
+                state = on::name;
+                break;
+            case YAML_MAPPING_START_EVENT:
+            {
+                // todo: create children
+                auto q = t; // todo! pass child instead!
+                parse( parser, t );
+                state ^= on::value; // flip on::name/on::value switch for the next event
+                break;
+            }
+            case YAML_MAPPING_END_EVENT:
+            case YAML_STREAM_END_EVENT:
+                break;
+            default:
+            {
+                auto e = event.type;
+                yaml_event_delete( &event );       
+                COMMA_THROW( comma::exception, "expected yaml event type; got: " << e ); // never here?
+            }
         }
         yaml_event_delete( &event );
     }
 }
 
-boost::property_tree::ptree to_ptree( const std::string& s )
+boost::property_tree::ptree& to_ptree( boost::property_tree::ptree& t, const std::string& s )
 {
-    boost::property_tree::ptree t;
     yaml_parser_t parser;
     yaml_parser_initialize( &parser );
     yaml_parser_set_input_string( &parser, reinterpret_cast< const unsigned char* >( &s[0] ), s.size() );
-    process_layer( &parser );
+    parse( &parser, t );
     yaml_parser_delete( &parser );
-    return t; // todo!!!
+    return t;
+}
+
+boost::property_tree::ptree to_ptree( const std::string& s )
+{
+    boost::property_tree::ptree t;
+    to_ptree( t, s );
+    return t;
 }
 
 std::string from_ptree( const boost::property_tree::ptree& )
diff --git a/name_value/impl/yaml.h b/name_value/impl/yaml.h
new file mode 100644
index 000000000..a1d353028
--- /dev/null
+++ b/name_value/impl/yaml.h
@@ -0,0 +1,46 @@
+// This file is part of comma library
+// Copyright (c) 2025 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+// 4. Additionally, source code from this repository produced after 2022
+//    must not be used in training or test datasets for training language
+//    models and/or automated code generation
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+#pragma once
+
+#include <string>
+#include <boost/property_tree/ptree.hpp>
+
+namespace comma { namespace property_tree { namespace impl { namespace yaml {
+
+boost::property_tree::ptree to_ptree( const std::string& s );
+
+boost::property_tree::ptree& to_ptree( boost::property_tree::ptree& t, const std::string& s );
+
+std::string from_ptree( const boost::property_tree::ptree& t );
+
+} } } } // namespace comma { namespace property_tree { namespace impl { namespace yaml {

From 76952987efd0014006302a4bee3beb11480012d4 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 21:29:01 +1000
Subject: [PATCH 1019/1056] name_value: property_tree: yaml support: in
 progress...

---
 name_value/CMakeLists.txt                     |  2 +
 .../applications/name-value-convert.cpp       | 41 ++++++----
 name_value/impl/yaml.cpp                      | 66 ++++++++++++----
 name_value/impl/yaml.h                        |  8 +-
 name_value/ptree.cpp                          | 77 ++++++++++++++++++-
 name_value/ptree.h                            | 10 +++
 6 files changed, 166 insertions(+), 38 deletions(-)

diff --git a/name_value/CMakeLists.txt b/name_value/CMakeLists.txt
index 611545ec9..c61830fed 100644
--- a/name_value/CMakeLists.txt
+++ b/name_value/CMakeLists.txt
@@ -8,6 +8,8 @@ SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} ${impl_includes} )
 #ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} ${impl_includes} comma_application comma_string comma_xpath )
 
 if( comma_BUILD_NAME_VALUE_YAML )
+    # find_package( yaml REQUIRED ) # todo
+    set( CMAKE_CXX_FLAGS "-Dcomma_BUILD_NAME_VALUE_YAML ${CMAKE_CXX_FLAGS}" ) # todo? move to the main CMakeLists.txt?
     set( source "${source};${SOURCE_CODE_BASE_DIR}/${PROJECT}/impl/yaml.cpp" )
 endif( comma_BUILD_NAME_VALUE_YAML )
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
diff --git a/name_value/applications/name-value-convert.cpp b/name_value/applications/name-value-convert.cpp
index e61acd5e7..4c80d0d1d 100644
--- a/name_value/applications/name-value-convert.cpp
+++ b/name_value/applications/name-value-convert.cpp
@@ -37,12 +37,13 @@ static void usage( bool verbose = false )
     std::cerr << "    --strict: return error if path specified in --path not found" << std::endl;
     std::cerr << std::endl;
     std::cerr << "formats" << std::endl;
-    std::cerr << "    info: info data (see boost::property_tree)" << std::endl;
-    std::cerr << "    ini: ini data" << std::endl;
-    std::cerr << "    json: json data" << std::endl;
-    std::cerr << "    xml: xml data" << std::endl;
-    std::cerr << "    path-value: path=value-style data; e.g. x/a=1,x/b=2,y=3" << std::endl;
-    std::cerr << "    dot: as graphviz dot language, see: https://graphviz.org/doc/info/lang.html" << std::endl;
+    std::cerr << "    dot        : as graphviz dot language, see: https://graphviz.org/doc/info/lang.html" << std::endl;
+    std::cerr << "    info       : info data (see boost::property_tree)" << std::endl;
+    std::cerr << "    ini        : ini data" << std::endl;
+    std::cerr << "    json       : json data" << std::endl;
+    std::cerr << "    path-value : path=value-style data; e.g. x/a=1,x/b=2,y=3" << std::endl;
+    std::cerr << "    xml        : xml data" << std::endl;
+    std::cerr << "    yaml       : implementing..." << std::endl;
     std::cerr << std::endl;
     std::cerr << "name/path-value options" << std::endl;
     std::cerr << "    --equal-sign,-e=<equal sign>: default '='" << std::endl;
@@ -99,7 +100,7 @@ static path_mode indices_mode = comma::property_tree::disabled;
 static bool use_index = true;
 static comma::property_tree::path_value::check_repeated_paths check_type( comma::property_tree::path_value::no_check );
 
-enum Types { ini, info, json, xml, path_value, dot, void_t };
+enum Types { ini, info, json, xml, yaml, path_value, dot, void_t };
 
 template < Types Type > struct traits {};
 
@@ -126,6 +127,12 @@ template <> struct traits< json >
     static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode ) { comma::name_value::impl::write_json( os, ptree, !minify_json, !quote_numbers ); }
 };
 
+template <> struct traits< yaml > // yaml format: input and output delegate to comma::property_tree::read_yaml() and write_yaml()
+{
+    static void input( std::istream& is, boost::property_tree::ptree& ptree ) { comma::property_tree::read_yaml( is, ptree ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode ) { comma::property_tree::write_yaml( os, ptree ); } // path_mode parameter is unnamed and unused here
+};
+
 template <> struct traits< xml >
 {
     static void input( std::istream& is, boost::property_tree::ptree& ptree ) { comma::property_tree::read_xml( is, ptree ); }
@@ -222,22 +229,24 @@ int main( int ac, char** av )
             else if( *from == "info" ) { input = &traits< info >::input; }
             else if( *from == "json" ) { input = &traits< json >::input; }
             else if( *from == "xml" ) { input = &traits< xml >::input; }
+            else if( *from == "yaml" ) { input = &traits< yaml >::input; }
             else if( *from == "path-value" || *from == "pv" ) { input = &traits< path_value >::input; }
             else if( *from == "dot" ) { input = &traits< dot >::input; }
-            else { std::cerr << "name-value-convert: expected --from format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
+            else { comma::say() << "expected --from format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
         }
         else
         {
-            if( linewise ) {  std::cerr << "name-value-convert: if --linewise is present, --from must be given" << std::endl; return 1; }
+            if( linewise ) {  comma::say() << "if --linewise is present, --from must be given" << std::endl; return 1; }
             input = &traits< void_t >::input;
         }
         if( to == "ini" ) { output = &traits< ini >::output; }
         else if( to == "info" ) { output = &traits< info >::output; }
         else if( to == "json" ) { output = &traits< json >::output; }
+        else if( to == "yaml" ) { output = &traits< yaml >::output; }
         else if( to == "xml" ) { output = &traits< xml >::output; }
         else if( to == "path-value" || to == "pv" ) { output = &traits< path_value >::output; }
         else if( to == "dot" ) { output = &traits< dot >::output; }
-        else { std::cerr << "name-value-convert: expected --to format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
+        else { comma::say() << "expected --to format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
         if( use_index )
         {
             if( options.exists( "--no-brackets" ) ) { indices_mode = comma::property_tree::without_brackets; }
@@ -288,7 +297,7 @@ int main( int ac, char** av )
                 for( const auto& path: paths )
                 {
                     auto child = comma::property_tree::get_tree( ptree, path ); // paths[i] = boost::property_tree::ptree::path_type( path_strings[i], '/' )
-                    if( !child ) { if( strict ) { std::cerr << "name-value-convert: path \"" << path << "\" not found" << std::endl; return 1; } else { continue; } }
+                    if( !child ) { if( strict ) { comma::say() << "path \"" << path << "\" not found" << std::endl; return 1; } else { continue; } }
                     boost::optional< std::string > value = child->get_optional< std::string >( "" );
                     std::cout << eol;
                     if( value && !value->empty() ) // todo? output empty values?
@@ -307,10 +316,10 @@ int main( int ac, char** av )
         }
         return 0;
     }
-    catch( boost::property_tree::ptree_bad_data& ex ) { std::cerr << "name-value-convert: bad data: " << ex.what() << std::endl; }
-    catch( boost::property_tree::ptree_bad_path& ex ) { std::cerr << "name-value-convert: bad path: " << ex.what() << std::endl; }
-    catch( boost::property_tree::ptree_error& ex ) { boost::regex e( "<unspecified file>" ); std::cerr << "name-value-convert: parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl; }
-    catch( std::exception& ex ) { std::cerr << "name-value-convert: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "name-value-convert: unknown exception" << std::endl; }
+    catch( boost::property_tree::ptree_bad_data& ex ) { comma::say() << "bad data: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_bad_path& ex ) { comma::say() << "bad path: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_error& ex ) { boost::regex e( "<unspecified file>" ); comma::say() << "parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }
diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
index 3ec996463..efdbaf1d6 100644
--- a/name_value/impl/yaml.cpp
+++ b/name_value/impl/yaml.cpp
@@ -35,33 +35,69 @@
 #include "../../base/exception.h"
 #include "yaml.h"
 
-namespace comma { namespace property_tree { namespace impl { namespace yaml {
+namespace comma { namespace name_value { namespace impl { namespace yaml {
+
+// static boost::property_tree::ptree xml_to_ptree_( boost::property_tree::ptree& ptree)
+// {
+//     boost::property_tree::ptree out= boost::property_tree::ptree();
+//     boost::property_tree::ptree unnamed_array= boost::property_tree::ptree();
+//     for ( boost::property_tree::ptree::iterator i=ptree.begin(); i!=ptree.end(); i++ )
+//     {
+//         //look ahead for duplicate name
+//         boost::property_tree::ptree::iterator lah = i;
+//         if ( ++lah != ptree.end() && i->first == lah->first )
+//         {
+//             //add to unnamed array
+//             unnamed_array.push_back( std::make_pair( "", xml_to_ptree_( i->second ) ) );
+//         }
+//         else
+//         {
+//             if(unnamed_array.size()!=0)
+//             {
+//                 //assert((i-1)->first==i->first);
+//                 //the last of duplicated name
+//                 unnamed_array.push_back( std::make_pair( "", xml_to_ptree_( i->second ) ) );
+//                 out.add_child(i->first,unnamed_array);
+//                 unnamed_array= boost::property_tree::ptree();
+//             }
+//             else
+//             {
+//                 out.add_child(i->first, xml_to_ptree_(i->second) );
+//             }
+//         }
+//     }
+//     out.put_value( comma::strip( ptree.get_value<std::string>(), " \n\t" ));
+//     return out;
+// }
 
 static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t )
 {
-    struct on { enum state { name = 0, value = 1, sequence = 2 }; };
+    struct on { enum state { name, value, sequence }; };
     int state = on::name; // mapping cannot start with VAL definition w/o VAR key
     std::string name, value;
     while( true )
     {
         yaml_event_t event;
         yaml_parser_parse( parser, &event );
+        std::cerr << "==> a: " << event.type << std::endl;
         switch( event.type )
         {
             case YAML_SCALAR_EVENT:
+                std::cerr << "==> b: on: " << event.data.scalar.value << std::endl;
                 ( state ? name : value ) = reinterpret_cast< const char* >( event.data.scalar.value );
                 state ^= on::value; // flip on::name/on::value switch for the next event
                 break;
             case YAML_SEQUENCE_START_EVENT:
-                // todo: parse sequence
+                std::cerr << "==> c" << std::endl; 
                 state = on::sequence;
                 break;
             case YAML_SEQUENCE_END_EVENT:
-                // todo: end parsing sequence
+                std::cerr << "==> d" << std::endl; 
                 state = on::name;
                 break;
             case YAML_MAPPING_START_EVENT:
             {
+                std::cerr << "==> e" << std::endl;
                 // todo: create children
                 auto q = t; // todo! pass child instead!
                 parse( parser, t );
@@ -69,8 +105,17 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t )
                 break;
             }
             case YAML_MAPPING_END_EVENT:
+                std::cerr << "==> f" << std::endl;
             case YAML_STREAM_END_EVENT:
+                std::cerr << "==> g" << std::endl;
                 break;
+            case YAML_NO_EVENT:
+            case YAML_DOCUMENT_START_EVENT:
+            case YAML_DOCUMENT_END_EVENT:
+            case YAML_STREAM_START_EVENT:
+            case YAML_ALIAS_EVENT:
+                std::cerr << "==> h" << std::endl;
+                continue; // todo? handle?
             default:
             {
                 auto e = event.type;
@@ -78,11 +123,12 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t )
                 COMMA_THROW( comma::exception, "expected yaml event type; got: " << e ); // never here?
             }
         }
+        std::cerr << "==> z" << std::endl;
         yaml_event_delete( &event );
     }
 }
 
-boost::property_tree::ptree& to_ptree( boost::property_tree::ptree& t, const std::string& s )
+boost::property_tree::ptree& to_ptree( const std::string& s, boost::property_tree::ptree& t )
 {
     yaml_parser_t parser;
     yaml_parser_initialize( &parser );
@@ -92,17 +138,11 @@ boost::property_tree::ptree& to_ptree( boost::property_tree::ptree& t, const std
     return t;
 }
 
-boost::property_tree::ptree to_ptree( const std::string& s )
-{
-    boost::property_tree::ptree t;
-    to_ptree( t, s );
-    return t;
-}
-
 std::string from_ptree( const boost::property_tree::ptree& )
 {
     std::string s;
+    // todo
     return s;
 }
 
-} } } } // namespace comma { namespace property_tree { namespace impl { namespace yaml {
+} } } } // namespace comma { namespace name_value { namespace impl { namespace yaml {
diff --git a/name_value/impl/yaml.h b/name_value/impl/yaml.h
index a1d353028..1af05093a 100644
--- a/name_value/impl/yaml.h
+++ b/name_value/impl/yaml.h
@@ -35,12 +35,10 @@
 #include <string>
 #include <boost/property_tree/ptree.hpp>
 
-namespace comma { namespace property_tree { namespace impl { namespace yaml {
+namespace comma { namespace name_value { namespace impl { namespace yaml {
 
-boost::property_tree::ptree to_ptree( const std::string& s );
-
-boost::property_tree::ptree& to_ptree( boost::property_tree::ptree& t, const std::string& s );
+boost::property_tree::ptree& to_ptree( const std::string& s, boost::property_tree::ptree& t );
 
 std::string from_ptree( const boost::property_tree::ptree& t );
 
-} } } } // namespace comma { namespace property_tree { namespace impl { namespace yaml {
+} } } } // namespace comma { namespace name_value { namespace impl { namespace yaml {
diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index cc8b56e02..986e116bd 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -20,6 +20,7 @@
 #include "../xpath/xpath.h"
 #include "../visiting/visit.h"
 #include "../visiting/while.h"
+#include "impl/yaml.h"
 #include "ptree.h"
 
 namespace comma {
@@ -421,7 +422,7 @@ void property_tree::from_unknown_seekable( std::istream& stream, boost::property
         return;
     }
     catch( const boost::property_tree::ptree_error&  ex ) {}
-    catch(...) { throw; }
+    catch( ... ) { throw; }
     try
     {
         stream.clear();
@@ -430,7 +431,7 @@ void property_tree::from_unknown_seekable( std::istream& stream, boost::property
         return;
     }
     catch( const boost::property_tree::ptree_error&  ex ) {}
-    catch(...) { throw; }
+    catch( ... ) { throw; }
     try
     {
         stream.clear();
@@ -439,10 +440,78 @@ void property_tree::from_unknown_seekable( std::istream& stream, boost::property
         return;
     }
     catch( const boost::property_tree::ptree_error&  ex ) {}
-    catch( const comma::exception&  ex ) {}
-    catch(...) { throw; }
+    catch( const comma::exception& ex ) {}
+    catch( ... ) { throw; }
+    try
+    {
+        stream.clear();
+        stream.seekg( 0, std::ios::beg );
+        comma::property_tree::read_yaml( stream, ptree );
+        return;
+    }
+    catch( const boost::property_tree::ptree_error&  ex ) {}
+    catch( const comma::exception& ex ) {}
+    catch( ... ) { throw; }
     // TODO: add try for ini format (currently the problem is that path-value treats ini sections and comments as valid entries; possible solution: make path-value parser stricter)
     COMMA_THROW( comma::exception, "failed to guess format" );
 }
 
+#if defined comma_BUILD_NAME_VALUE_YAML
+
+boost::property_tree::ptree property_tree::from_yaml( const std::string& s ) // convenience overload: parses yaml text s into a new tree and returns it by value
+{
+    boost::property_tree::ptree t;
+    from_yaml( s, t ); // delegates to the overload that fills an existing tree
+    return t;
+}
+
+void property_tree::read_yaml( std::istream& is, boost::property_tree::ptree& t ) // reads is to its end, dropping empty lines, and parses the collected text as yaml into t
+{
+    std::ostringstream oss; // from_yaml() takes a complete string, hence the whole input is buffered first
+    while( is.good() && !is.eof() ) // quick and dirty, watch performance
+    {
+        std::string line;
+        std::getline( is, line ); // read from the stream passed by the caller (was: std::cin, which ignored is altogether)
+        if( line.empty() ) { continue; }
+        oss << line << std::endl;
+    }
+    from_yaml( oss.str(), t );
+}
+
+void property_tree::write_yaml( std::ostream& os, const boost::property_tree::ptree& t ) { os << to_yaml( t ) << std::endl; } // writes to_yaml( t ) followed by end of line; std::endl also flushes os
+
+boost::property_tree::ptree& property_tree::from_yaml( const std::string& s, boost::property_tree::ptree& t ) // parses yaml text s into the tree t supplied by the caller
+{
+    return comma::name_value::impl::yaml::to_ptree( s, t ); // implementation is in impl/yaml.cpp; to_ptree() returns a reference to t
+}
+
+std::string property_tree::to_yaml( const boost::property_tree::ptree& t ) // conversion of a tree to yaml text: not implemented yet
+{
+    COMMA_THROW( comma::exception, "todo" ); // placeholder: t is not used, nothing is returned
+}
+
+#else // #if defined comma_BUILD_NAME_VALUE_YAML
+
+boost::property_tree::ptree property_tree::from_yaml( const std::string& s ) // stub for builds without comma_BUILD_NAME_VALUE_YAML defined
+{
+    COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" );
+}
+
+boost::property_tree::ptree& property_tree::from_yaml( const std::string& s, boost::property_tree::ptree& t ) // stub for builds without comma_BUILD_NAME_VALUE_YAML defined
+{
+    COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" );
+}
+
+// stream stubs for builds without yaml support: ptree.h declares read_yaml() and write_yaml() (and no std::istream overload of from_yaml()), so these two need definitions here for such builds to compile and link
+void property_tree::read_yaml( std::istream& is, boost::property_tree::ptree& t ) { COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" ); }
+
+void property_tree::write_yaml( std::ostream& os, const boost::property_tree::ptree& t ) { COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" ); }
+
+std::string property_tree::to_yaml( const boost::property_tree::ptree& t ) // stub for builds without comma_BUILD_NAME_VALUE_YAML defined
+{
+    COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" );
+}
+
+#endif // #if defined comma_BUILD_NAME_VALUE_YAML
+
 } // namespace comma {
diff --git a/name_value/ptree.h b/name_value/ptree.h
index 32710fd47..7ab9d69b8 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -102,6 +102,16 @@ struct property_tree // quick and dirty
     /// guess format and read boost property tree from stream (a wrapper for from_unknown_seekable that buffers input from a non-seekable stream)
     static void from_unknown( std::istream& stream, boost::property_tree::ptree& ptree, path_value::check_repeated_paths check_type = path_value::no_check, char equal_sign = '=', char delimiter = ',', bool use_index = true );
 
+    static boost::property_tree::ptree from_yaml( const std::string& s );
+
+    static boost::property_tree::ptree& from_yaml( const std::string& s, boost::property_tree::ptree& t );
+
+    static void read_yaml( std::istream& is, boost::property_tree::ptree& t );
+
+    static std::string to_yaml( const boost::property_tree::ptree& t );
+
+    static void write_yaml( std::ostream& os, const boost::property_tree::ptree& t );
+
     /// guess format and read boost property tree from a seekable stream (pipe or terminal input is not accepted)
     static void from_unknown_seekable( std::istream& stream, boost::property_tree::ptree& ptree, path_value::check_repeated_paths check_type = path_value::no_check, char equal_sign = '=', char delimiter = ',', bool use_index = false  );
 

From 93e2b143952a38353d801b6b309e39bd554da7a0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 23 Apr 2025 21:43:49 +1000
Subject: [PATCH 1020/1056] name_value: property_tree: yaml support: in
 progress...

---
 name_value/impl/yaml.cpp | 22 ++++++++++++----------
 1 file changed, 12 insertions(+), 10 deletions(-)

diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
index efdbaf1d6..f0e273008 100644
--- a/name_value/impl/yaml.cpp
+++ b/name_value/impl/yaml.cpp
@@ -72,14 +72,16 @@ namespace comma { namespace name_value { namespace impl { namespace yaml {
 
 static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t )
 {
+    COMMA_THROW( comma::exception, "implementing..." );
+    std::cerr << "==> A" << std::endl;
     struct on { enum state { name, value, sequence }; };
-    int state = on::name; // mapping cannot start with VAL definition w/o VAR key
+    int state = on::name; // mapping cannot start with on::value definition w/o on::name key
     std::string name, value;
     while( true )
     {
         yaml_event_t event;
         yaml_parser_parse( parser, &event );
-        std::cerr << "==> a: " << event.type << std::endl;
+        std::cerr << "==> a: type : " << event.type << std::endl;
         switch( event.type )
         {
             case YAML_SCALAR_EVENT:
@@ -108,20 +110,20 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t )
                 std::cerr << "==> f" << std::endl;
             case YAML_STREAM_END_EVENT:
                 std::cerr << "==> g" << std::endl;
-                break;
+                return;
             case YAML_NO_EVENT:
             case YAML_DOCUMENT_START_EVENT:
             case YAML_DOCUMENT_END_EVENT:
             case YAML_STREAM_START_EVENT:
             case YAML_ALIAS_EVENT:
                 std::cerr << "==> h" << std::endl;
-                continue; // todo? handle?
-            default:
-            {
-                auto e = event.type;
-                yaml_event_delete( &event );       
-                COMMA_THROW( comma::exception, "expected yaml event type; got: " << e ); // never here?
-            }
+                break; // todo? handle?
+            // default:
+            // {
+            //     auto e = event.type;
+            //     yaml_event_delete( &event );       
+            //     COMMA_THROW( comma::exception, "expected yaml event type; got: " << e ); // never here?
+            // }
         }
         std::cerr << "==> z" << std::endl;
         yaml_event_delete( &event );

From b0a858021f69849387889409e5af35792b9a5186 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 24 Apr 2025 11:35:17 +1000
Subject: [PATCH 1021/1056] name_value: property_tree: yaml support: in
 progress...

---
 name_value/impl/yaml.cpp | 65 +++++++++++++++++++++-------------------
 1 file changed, 35 insertions(+), 30 deletions(-)

diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
index f0e273008..696619898 100644
--- a/name_value/impl/yaml.cpp
+++ b/name_value/impl/yaml.cpp
@@ -70,53 +70,60 @@ namespace comma { namespace name_value { namespace impl { namespace yaml {
 //     return out;
 // }
 
-static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t )
+static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, bool expecting_value = false, bool is_sequence = false )
 {
-    COMMA_THROW( comma::exception, "implementing..." );
-    std::cerr << "==> A" << std::endl;
-    struct on { enum state { name, value, sequence }; };
-    int state = on::name; // mapping cannot start with on::value definition w/o on::name key
-    std::string name, value;
+    //COMMA_THROW( comma::exception, "implementing..." );
+    std::cerr << "==> a" << std::endl; //std::cerr << "==> a: expecting_value: " << expecting_value << " is_sequence: " << is_sequence << std::endl;
+    std::string scalar;
+    std::pair< std::string, boost::property_tree::ptree > seq;
     while( true )
     {
         yaml_event_t event;
         yaml_parser_parse( parser, &event );
-        std::cerr << "==> a: type : " << event.type << std::endl;
-        switch( event.type )
+        auto event_type = event.type;
+        scalar = event.type == YAML_SCALAR_EVENT ? std::string( reinterpret_cast< const char* >( event.data.scalar.value ) ) : "";
+        yaml_event_delete( &event );
+        switch( event_type )
         {
             case YAML_SCALAR_EVENT:
-                std::cerr << "==> b: on: " << event.data.scalar.value << std::endl;
-                ( state ? name : value ) = reinterpret_cast< const char* >( event.data.scalar.value );
-                state ^= on::value; // flip on::name/on::value switch for the next event
+                if( is_sequence )
+                {
+                    std::cerr << "==> nooo" << std::endl;
+                    // todo
+                    // t.add_child( "", boost::property_tree::ptree() ).put_value( scalar )
+                    break;
+                }
+                if( expecting_value )
+                {
+                    std::cerr << "==> b.0: put value: " << scalar << std::endl;
+                    t.put_value( scalar );
+                    return;
+                }
+                std::cerr << "==> b.1: add child: " << scalar << std::endl;
+                parse( parser, scalar.empty() ? t : t.add_child( scalar, boost::property_tree::ptree() ), true );
+                expecting_value = false;
                 break;
             case YAML_SEQUENCE_START_EVENT:
-                std::cerr << "==> c" << std::endl; 
-                state = on::sequence;
+                std::cerr << "==> c: seq start" << std::endl; 
+                //parse( parser, t.add_child( scalar, boost::property_tree::ptree() ), false, true );
+                parse( parser, t, false, true );
                 break;
             case YAML_SEQUENCE_END_EVENT:
-                std::cerr << "==> d" << std::endl; 
-                state = on::name;
-                break;
+                std::cerr << "==> d: seq end" << std::endl;
+                return;
             case YAML_MAPPING_START_EVENT:
-            {
-                std::cerr << "==> e" << std::endl;
-                // todo: create children
-                auto q = t; // todo! pass child instead!
+                std::cerr << "==> e: map start" << std::endl;
                 parse( parser, t );
-                state ^= on::value; // flip on::name/on::value switch for the next event
-                break;
-            }
+                return;
             case YAML_MAPPING_END_EVENT:
-                std::cerr << "==> f" << std::endl;
             case YAML_STREAM_END_EVENT:
-                std::cerr << "==> g" << std::endl;
-                return;
+            case YAML_DOCUMENT_END_EVENT:
             case YAML_NO_EVENT:
+                std::cerr << "==> f: map end" << std::endl;
+                return;
             case YAML_DOCUMENT_START_EVENT:
-            case YAML_DOCUMENT_END_EVENT:
             case YAML_STREAM_START_EVENT:
             case YAML_ALIAS_EVENT:
-                std::cerr << "==> h" << std::endl;
                 break; // todo? handle?
             // default:
             // {
@@ -125,8 +132,6 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t )
             //     COMMA_THROW( comma::exception, "expected yaml event type; got: " << e ); // never here?
             // }
         }
-        std::cerr << "==> z" << std::endl;
-        yaml_event_delete( &event );
     }
 }
 

From 162b36cd5bcddfab952bfb81d5d0a201505fac96 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 24 Apr 2025 12:35:19 +1000
Subject: [PATCH 1022/1056] name_value: property_tree: yaml support: in
 progress...

---
 name_value/impl/yaml.cpp | 24 +++++++++++++++---------
 1 file changed, 15 insertions(+), 9 deletions(-)

diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
index 696619898..50008fc3d 100644
--- a/name_value/impl/yaml.cpp
+++ b/name_value/impl/yaml.cpp
@@ -55,7 +55,7 @@ namespace comma { namespace name_value { namespace impl { namespace yaml {
 //             if(unnamed_array.size()!=0)
 //             {
 //                 //assert((i-1)->first==i->first);
-//                 //the last of duplicated name
+//                 //the previous_scalar of duplicated name
 //                 unnamed_array.push_back( std::make_pair( "", xml_to_ptree_( i->second ) ) );
 //                 out.add_child(i->first,unnamed_array);
 //                 unnamed_array= boost::property_tree::ptree();
@@ -74,7 +74,8 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, bool e
 {
     //COMMA_THROW( comma::exception, "implementing..." );
     std::cerr << "==> a" << std::endl; //std::cerr << "==> a: expecting_value: " << expecting_value << " is_sequence: " << is_sequence << std::endl;
-    std::string scalar;
+    std::string scalar, previous_scalar;
+    bool previous_was_scalar{false};
     std::pair< std::string, boost::property_tree::ptree > seq;
     while( true )
     {
@@ -86,34 +87,39 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, bool e
         switch( event_type )
         {
             case YAML_SCALAR_EVENT:
+                std::cerr << "==> b: scalar: " << scalar << std::endl;
                 if( is_sequence )
                 {
-                    std::cerr << "==> nooo" << std::endl;
-                    // todo
-                    // t.add_child( "", boost::property_tree::ptree() ).put_value( scalar )
+                    std::cerr << "==> b.0: scalar: " << scalar << " previous_was_scalar: " << previous_was_scalar << std::endl;
+                    if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
+                    previous_was_scalar = true;
+                    previous_scalar = scalar;
+                    std::cerr << "==> b.1: scalar: " << scalar << " previous_scalar: " << previous_scalar << std::endl;
                     break;
                 }
                 if( expecting_value )
                 {
-                    std::cerr << "==> b.0: put value: " << scalar << std::endl;
+                    std::cerr << "==> b.2: put value: " << scalar << std::endl;
                     t.put_value( scalar );
                     return;
                 }
-                std::cerr << "==> b.1: add child: " << scalar << std::endl;
+                std::cerr << "==> b.3: add child: " << scalar << std::endl;
                 parse( parser, scalar.empty() ? t : t.add_child( scalar, boost::property_tree::ptree() ), true );
                 expecting_value = false;
                 break;
             case YAML_SEQUENCE_START_EVENT:
+                previous_was_scalar = false;
                 std::cerr << "==> c: seq start" << std::endl; 
-                //parse( parser, t.add_child( scalar, boost::property_tree::ptree() ), false, true );
                 parse( parser, t, false, true );
                 break;
             case YAML_SEQUENCE_END_EVENT:
+                if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
                 std::cerr << "==> d: seq end" << std::endl;
                 return;
             case YAML_MAPPING_START_EVENT:
+                previous_was_scalar = false;
                 std::cerr << "==> e: map start" << std::endl;
-                parse( parser, t );
+                parse( parser, is_sequence ? t.add_child( previous_scalar, boost::property_tree::ptree() ) : t ); // todo
                 return;
             case YAML_MAPPING_END_EVENT:
             case YAML_STREAM_END_EVENT:

From 11006668fbe75a46d12138be8d94cf1f2dcbe894 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 24 Apr 2025 13:45:36 +1000
Subject: [PATCH 1023/1056] name_value: property_tree: yaml support: in
 progress...

---
 name_value/impl/yaml.cpp | 199 +++++++++++++++++++++++++++++++++------
 1 file changed, 169 insertions(+), 30 deletions(-)

diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
index 50008fc3d..5fb4a0acd 100644
--- a/name_value/impl/yaml.cpp
+++ b/name_value/impl/yaml.cpp
@@ -70,13 +70,135 @@ namespace comma { namespace name_value { namespace impl { namespace yaml {
 //     return out;
 // }
 
-static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, bool expecting_value = false, bool is_sequence = false )
+// static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, bool expecting_value = false, bool is_sequence = false )
+// {
+//     //COMMA_THROW( comma::exception, "implementing..." );
+//     std::cerr << "==> A" << std::endl; //std::cerr << "==> a: expecting_value: " << expecting_value << " is_sequence: " << is_sequence << std::endl;
+//     std::string scalar, previous_scalar;
+//     bool previous_was_scalar{false};
+//     while( true )
+//     {
+//         yaml_event_t event;
+//         yaml_parser_parse( parser, &event );
+//         auto event_type = event.type;
+//         scalar = event.type == YAML_SCALAR_EVENT ? std::string( reinterpret_cast< const char* >( event.data.scalar.value ) ) : "";
+//         yaml_event_delete( &event );
+//         //std::cerr << "==> a: scalar: " << scalar << std::endl;
+//         switch( event_type )
+//         {
+//             case YAML_SCALAR_EVENT:
+//                 std::cerr << "==> b: scalar: " << scalar << std::endl;
+//                 if( is_sequence )
+//                 {
+//                     std::cerr << "==> b.0: scalar: " << scalar << " previous_was_scalar: " << previous_was_scalar << std::endl;
+//                     if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
+//                     previous_was_scalar = true;
+//                     previous_scalar = scalar;
+//                     break;
+//                 }
+//                 if( expecting_value )
+//                 {
+//                     std::cerr << "==> b.2: put value: " << scalar << std::endl;
+//                     t.put_value( scalar );
+//                     return;
+//                 }
+//                 std::cerr << "==> b.3: add child: " << scalar << std::endl;
+//                 parse( parser, scalar.empty() ? t : t.add_child( scalar, boost::property_tree::ptree() ), true );
+//                 expecting_value = false;
+//                 break;
+//             case YAML_SEQUENCE_START_EVENT:
+//                 previous_was_scalar = false;
+//                 std::cerr << "==> c: seq start: is_sequence: " << is_sequence << std::endl; 
+//                 parse( parser, is_sequence ? t.add_child( previous_scalar, boost::property_tree::ptree() ) : t, false, true );
+//                 break;
+//             case YAML_SEQUENCE_END_EVENT:
+//                 if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
+//                 std::cerr << "==> d: seq end" << std::endl;
+//                 return;
+//             case YAML_MAPPING_START_EVENT:
+//                 previous_was_scalar = false;
+//                 std::cerr << "==> e: map start" << std::endl;
+//                 parse( parser, is_sequence ? t.add_child( previous_scalar, boost::property_tree::ptree() ) : t ); // todo
+//                 return;
+//             case YAML_MAPPING_END_EVENT:
+//                 std::cerr << "==> f: map end" << std::endl;
+//                 return;
+//             case YAML_STREAM_END_EVENT:
+//             case YAML_DOCUMENT_END_EVENT:
+//             case YAML_NO_EVENT:
+//                 std::cerr << "==> f: stream/document end or no event" << std::endl;
+//                 return;
+//             case YAML_DOCUMENT_START_EVENT:
+//             case YAML_STREAM_START_EVENT:
+//             case YAML_ALIAS_EVENT:
+//                 break; // todo? handle?
+//             // default:
+//             // {
+//             //     auto e = event.type;
+//             //     yaml_event_delete( &event );       
+//             //     COMMA_THROW( comma::exception, "expected yaml event type; got: " << e ); // never here?
+//             // }
+//         }
+//     }
+// }
+
+// static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, bool expecting_value = false, bool is_sequence = false )
+// {
+//     //COMMA_THROW( comma::exception, "implementing..." );
+//     std::cerr << "==> A" << std::endl; //std::cerr << "==> a: expecting_value: " << expecting_value << " is_sequence: " << is_sequence << std::endl;
+//     std::string scalar, previous_scalar;
+//     bool previous_was_scalar{false};
+//     while( true )
+//     {
+//         yaml_event_t event;
+//         yaml_parser_parse( parser, &event );
+//         auto event_type = event.type;
+//         scalar = event.type == YAML_SCALAR_EVENT ? std::string( reinterpret_cast< const char* >( event.data.scalar.value ) ) : "";
+//         yaml_event_delete( &event );
+//         //std::cerr << "==> a: scalar: " << scalar << std::endl;
+//         switch( event_type )
+//         {
+//             case YAML_SCALAR_EVENT:
+//                 std::cerr << "==> b: scalar: " << scalar << std::endl;
+//                 break;
+//             case YAML_SEQUENCE_START_EVENT:
+//                 std::cerr << "==> c: seq start" << std::endl;
+//                 break;
+//             case YAML_SEQUENCE_END_EVENT:
+//                 std::cerr << "==> d: seq end" << std::endl;
+//                 break;
+//             case YAML_MAPPING_START_EVENT:
+//                 std::cerr << "==> e: map start" << std::endl;
+//                 break;
+//             case YAML_MAPPING_END_EVENT:
+//                 std::cerr << "==> f: map end" << std::endl;
+//                 break;
+//             case YAML_STREAM_END_EVENT:
+//             case YAML_DOCUMENT_END_EVENT:
+//             case YAML_NO_EVENT:
+//                 std::cerr << "==> f: stream/document end or no event" << std::endl;
+//                 return;
+//             case YAML_DOCUMENT_START_EVENT:
+//             case YAML_STREAM_START_EVENT:
+//             case YAML_ALIAS_EVENT:
+//                 break; // todo? handle?
+//             // default:
+//             // {
+//             //     auto e = event.type;
+//             //     yaml_event_delete( &event );       
+//             //     COMMA_THROW( comma::exception, "expected yaml event type; got: " << e ); // never here?
+//             // }
+//         }
+//     }
+// }
+
+enum class on { none, scalar, seq, map };
+
+static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on what = on::none, bool is_name = false )
 {
     //COMMA_THROW( comma::exception, "implementing..." );
-    std::cerr << "==> a" << std::endl; //std::cerr << "==> a: expecting_value: " << expecting_value << " is_sequence: " << is_sequence << std::endl;
-    std::string scalar, previous_scalar;
-    bool previous_was_scalar{false};
-    std::pair< std::string, boost::property_tree::ptree > seq;
+    //std::cerr << "==> A" << std::endl; //std::cerr << "==> a: expecting_value: " << expecting_value << " is_sequence: " << is_sequence << std::endl;
+    std::string scalar;
     while( true )
     {
         yaml_event_t event;
@@ -87,45 +209,62 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, bool e
         switch( event_type )
         {
             case YAML_SCALAR_EVENT:
-                std::cerr << "==> b: scalar: " << scalar << std::endl;
-                if( is_sequence )
-                {
-                    std::cerr << "==> b.0: scalar: " << scalar << " previous_was_scalar: " << previous_was_scalar << std::endl;
-                    if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
-                    previous_was_scalar = true;
-                    previous_scalar = scalar;
-                    std::cerr << "==> b.1: scalar: " << scalar << " previous_scalar: " << previous_scalar << std::endl;
-                    break;
-                }
-                if( expecting_value )
+                switch( what )
                 {
-                    std::cerr << "==> b.2: put value: " << scalar << std::endl;
-                    t.put_value( scalar );
-                    return;
+                    case on::none:
+                        COMMA_THROW( comma::exception, "expected map or sequence, got scalar" );
+                    case on::scalar:
+                        // todo
+                        break;
+                    case on::map:
+                        if( is_name ) { parse( parser, t.add_child( scalar, boost::property_tree::ptree() ), on::map, false ); break; }
+                        t.put_value( scalar );
+                        return;
+                    case on::seq:
+                        if( is_name ) {}
+                        t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( scalar );
+                        break;
                 }
-                std::cerr << "==> b.3: add child: " << scalar << std::endl;
-                parse( parser, scalar.empty() ? t : t.add_child( scalar, boost::property_tree::ptree() ), true );
-                expecting_value = false;
+                // std::cerr << "==> b: scalar: " << scalar << std::endl;
+                // if( is_sequence )
+                // {
+                //     std::cerr << "==> b.0: scalar: " << scalar << " previous_was_scalar: " << previous_was_scalar << std::endl;
+                //     if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
+                //     previous_was_scalar = true;
+                //     previous_scalar = scalar;
+                //     break;
+                // }
+                // if( expecting_value )
+                // {
+                //     std::cerr << "==> b.2: put value: " << scalar << std::endl;
+                //     t.put_value( scalar );
+                //     return;
+                // }
+                // std::cerr << "==> b.3: add child: " << scalar << std::endl;
+                // parse( parser, scalar.empty() ? t : t.add_child( scalar, boost::property_tree::ptree() ), true );
+                // expecting_value = false;
                 break;
             case YAML_SEQUENCE_START_EVENT:
-                previous_was_scalar = false;
-                std::cerr << "==> c: seq start" << std::endl; 
-                parse( parser, t, false, true );
-                break;
+                // previous_was_scalar = false;
+                // std::cerr << "==> c: seq start: is_sequence: " << is_sequence << std::endl; 
+                // parse( parser, is_sequence ? t.add_child( previous_scalar, boost::property_tree::ptree() ) : t, false, true );
+                std::cerr << "==> c: seq start" << std::endl;
+                parse( parser, t, on::seq );
+                return;
             case YAML_SEQUENCE_END_EVENT:
-                if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
                 std::cerr << "==> d: seq end" << std::endl;
                 return;
             case YAML_MAPPING_START_EVENT:
-                previous_was_scalar = false;
                 std::cerr << "==> e: map start" << std::endl;
-                parse( parser, is_sequence ? t.add_child( previous_scalar, boost::property_tree::ptree() ) : t ); // todo
+                parse( parser, t, on::map, true );
                 return;
             case YAML_MAPPING_END_EVENT:
+                std::cerr << "==> f: map end" << std::endl;
+                return;
             case YAML_STREAM_END_EVENT:
             case YAML_DOCUMENT_END_EVENT:
             case YAML_NO_EVENT:
-                std::cerr << "==> f: map end" << std::endl;
+                std::cerr << "==> f: stream/document end or no event" << std::endl;
                 return;
             case YAML_DOCUMENT_START_EVENT:
             case YAML_STREAM_START_EVENT:

From ceb6005bccfa0909f92cf2224651a0627a4a4a86 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 24 Apr 2025 13:53:28 +1000
Subject: [PATCH 1024/1056] name_value: property_tree: yaml support: in
 progress...

---
 name_value/impl/yaml.cpp | 53 +---------------------------------------
 1 file changed, 1 insertion(+), 52 deletions(-)

diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
index 5fb4a0acd..d2b168bf3 100644
--- a/name_value/impl/yaml.cpp
+++ b/name_value/impl/yaml.cpp
@@ -142,56 +142,6 @@ namespace comma { namespace name_value { namespace impl { namespace yaml {
 //     }
 // }
 
-// static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, bool expecting_value = false, bool is_sequence = false )
-// {
-//     //COMMA_THROW( comma::exception, "implementing..." );
-//     std::cerr << "==> A" << std::endl; //std::cerr << "==> a: expecting_value: " << expecting_value << " is_sequence: " << is_sequence << std::endl;
-//     std::string scalar, previous_scalar;
-//     bool previous_was_scalar{false};
-//     while( true )
-//     {
-//         yaml_event_t event;
-//         yaml_parser_parse( parser, &event );
-//         auto event_type = event.type;
-//         scalar = event.type == YAML_SCALAR_EVENT ? std::string( reinterpret_cast< const char* >( event.data.scalar.value ) ) : "";
-//         yaml_event_delete( &event );
-//         //std::cerr << "==> a: scalar: " << scalar << std::endl;
-//         switch( event_type )
-//         {
-//             case YAML_SCALAR_EVENT:
-//                 std::cerr << "==> b: scalar: " << scalar << std::endl;
-//                 break;
-//             case YAML_SEQUENCE_START_EVENT:
-//                 std::cerr << "==> c: seq start" << std::endl;
-//                 break;
-//             case YAML_SEQUENCE_END_EVENT:
-//                 std::cerr << "==> d: seq end" << std::endl;
-//                 break;
-//             case YAML_MAPPING_START_EVENT:
-//                 std::cerr << "==> e: map start" << std::endl;
-//                 break;
-//             case YAML_MAPPING_END_EVENT:
-//                 std::cerr << "==> f: map end" << std::endl;
-//                 break;
-//             case YAML_STREAM_END_EVENT:
-//             case YAML_DOCUMENT_END_EVENT:
-//             case YAML_NO_EVENT:
-//                 std::cerr << "==> f: stream/document end or no event" << std::endl;
-//                 return;
-//             case YAML_DOCUMENT_START_EVENT:
-//             case YAML_STREAM_START_EVENT:
-//             case YAML_ALIAS_EVENT:
-//                 break; // todo? handle?
-//             // default:
-//             // {
-//             //     auto e = event.type;
-//             //     yaml_event_delete( &event );       
-//             //     COMMA_THROW( comma::exception, "expected yaml event type; got: " << e ); // never here?
-//             // }
-//         }
-//     }
-// }
-
 enum class on { none, scalar, seq, map };
 
 static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on what = on::none, bool is_name = false )
@@ -221,7 +171,6 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on wha
                         t.put_value( scalar );
                         return;
                     case on::seq:
-                        if( is_name ) {}
                         t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( scalar );
                         break;
                 }
@@ -256,7 +205,7 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on wha
                 return;
             case YAML_MAPPING_START_EVENT:
                 std::cerr << "==> e: map start" << std::endl;
-                parse( parser, t, on::map, true );
+                parse( parser, what == on::seq ? t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second : t, on::map, true );
                 return;
             case YAML_MAPPING_END_EVENT:
                 std::cerr << "==> f: map end" << std::endl;

From dcafd7083c4345dbc4da87e044cc0005f26e29b0 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 24 Apr 2025 14:18:27 +1000
Subject: [PATCH 1025/1056] name_value: property_tree: yaml support: first cut
 done

---
 name_value/impl/yaml.cpp | 147 ++++-----------------------------------
 name_value/ptree.cpp     |   5 +-
 2 files changed, 16 insertions(+), 136 deletions(-)

diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
index d2b168bf3..e25a38cf0 100644
--- a/name_value/impl/yaml.cpp
+++ b/name_value/impl/yaml.cpp
@@ -37,111 +37,6 @@
 
 namespace comma { namespace name_value { namespace impl { namespace yaml {
 
-// static boost::property_tree::ptree xml_to_ptree_( boost::property_tree::ptree& ptree)
-// {
-//     boost::property_tree::ptree out= boost::property_tree::ptree();
-//     boost::property_tree::ptree unnamed_array= boost::property_tree::ptree();
-//     for ( boost::property_tree::ptree::iterator i=ptree.begin(); i!=ptree.end(); i++ )
-//     {
-//         //look ahead for duplicate name
-//         boost::property_tree::ptree::iterator lah = i;
-//         if ( ++lah != ptree.end() && i->first == lah->first )
-//         {
-//             //add to unnamed array
-//             unnamed_array.push_back( std::make_pair( "", xml_to_ptree_( i->second ) ) );
-//         }
-//         else
-//         {
-//             if(unnamed_array.size()!=0)
-//             {
-//                 //assert((i-1)->first==i->first);
-//                 //the previous_scalar of duplicated name
-//                 unnamed_array.push_back( std::make_pair( "", xml_to_ptree_( i->second ) ) );
-//                 out.add_child(i->first,unnamed_array);
-//                 unnamed_array= boost::property_tree::ptree();
-//             }
-//             else
-//             {
-//                 out.add_child(i->first, xml_to_ptree_(i->second) );
-//             }
-//         }
-//     }
-//     out.put_value( comma::strip( ptree.get_value<std::string>(), " \n\t" ));
-//     return out;
-// }
-
-// static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, bool expecting_value = false, bool is_sequence = false )
-// {
-//     //COMMA_THROW( comma::exception, "implementing..." );
-//     std::cerr << "==> A" << std::endl; //std::cerr << "==> a: expecting_value: " << expecting_value << " is_sequence: " << is_sequence << std::endl;
-//     std::string scalar, previous_scalar;
-//     bool previous_was_scalar{false};
-//     while( true )
-//     {
-//         yaml_event_t event;
-//         yaml_parser_parse( parser, &event );
-//         auto event_type = event.type;
-//         scalar = event.type == YAML_SCALAR_EVENT ? std::string( reinterpret_cast< const char* >( event.data.scalar.value ) ) : "";
-//         yaml_event_delete( &event );
-//         //std::cerr << "==> a: scalar: " << scalar << std::endl;
-//         switch( event_type )
-//         {
-//             case YAML_SCALAR_EVENT:
-//                 std::cerr << "==> b: scalar: " << scalar << std::endl;
-//                 if( is_sequence )
-//                 {
-//                     std::cerr << "==> b.0: scalar: " << scalar << " previous_was_scalar: " << previous_was_scalar << std::endl;
-//                     if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
-//                     previous_was_scalar = true;
-//                     previous_scalar = scalar;
-//                     break;
-//                 }
-//                 if( expecting_value )
-//                 {
-//                     std::cerr << "==> b.2: put value: " << scalar << std::endl;
-//                     t.put_value( scalar );
-//                     return;
-//                 }
-//                 std::cerr << "==> b.3: add child: " << scalar << std::endl;
-//                 parse( parser, scalar.empty() ? t : t.add_child( scalar, boost::property_tree::ptree() ), true );
-//                 expecting_value = false;
-//                 break;
-//             case YAML_SEQUENCE_START_EVENT:
-//                 previous_was_scalar = false;
-//                 std::cerr << "==> c: seq start: is_sequence: " << is_sequence << std::endl; 
-//                 parse( parser, is_sequence ? t.add_child( previous_scalar, boost::property_tree::ptree() ) : t, false, true );
-//                 break;
-//             case YAML_SEQUENCE_END_EVENT:
-//                 if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
-//                 std::cerr << "==> d: seq end" << std::endl;
-//                 return;
-//             case YAML_MAPPING_START_EVENT:
-//                 previous_was_scalar = false;
-//                 std::cerr << "==> e: map start" << std::endl;
-//                 parse( parser, is_sequence ? t.add_child( previous_scalar, boost::property_tree::ptree() ) : t ); // todo
-//                 return;
-//             case YAML_MAPPING_END_EVENT:
-//                 std::cerr << "==> f: map end" << std::endl;
-//                 return;
-//             case YAML_STREAM_END_EVENT:
-//             case YAML_DOCUMENT_END_EVENT:
-//             case YAML_NO_EVENT:
-//                 std::cerr << "==> f: stream/document end or no event" << std::endl;
-//                 return;
-//             case YAML_DOCUMENT_START_EVENT:
-//             case YAML_STREAM_START_EVENT:
-//             case YAML_ALIAS_EVENT:
-//                 break; // todo? handle?
-//             // default:
-//             // {
-//             //     auto e = event.type;
-//             //     yaml_event_delete( &event );       
-//             //     COMMA_THROW( comma::exception, "expected yaml event type; got: " << e ); // never here?
-//             // }
-//         }
-//     }
-// }
-
 enum class on { none, scalar, seq, map };
 
 static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on what = on::none, bool is_name = false )
@@ -162,10 +57,8 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on wha
                 switch( what )
                 {
                     case on::none:
-                        COMMA_THROW( comma::exception, "expected map or sequence, got scalar" );
                     case on::scalar:
-                        // todo
-                        break;
+                        COMMA_THROW( comma::exception, "expected map or sequence, got scalar" );
                     case on::map:
                         if( is_name ) { parse( parser, t.add_child( scalar, boost::property_tree::ptree() ), on::map, false ); break; }
                         t.put_value( scalar );
@@ -174,46 +67,30 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on wha
                         t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( scalar );
                         break;
                 }
-                // std::cerr << "==> b: scalar: " << scalar << std::endl;
-                // if( is_sequence )
-                // {
-                //     std::cerr << "==> b.0: scalar: " << scalar << " previous_was_scalar: " << previous_was_scalar << std::endl;
-                //     if( previous_was_scalar ) { t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( previous_scalar ); }
-                //     previous_was_scalar = true;
-                //     previous_scalar = scalar;
-                //     break;
-                // }
-                // if( expecting_value )
-                // {
-                //     std::cerr << "==> b.2: put value: " << scalar << std::endl;
-                //     t.put_value( scalar );
-                //     return;
-                // }
-                // std::cerr << "==> b.3: add child: " << scalar << std::endl;
-                // parse( parser, scalar.empty() ? t : t.add_child( scalar, boost::property_tree::ptree() ), true );
-                // expecting_value = false;
                 break;
             case YAML_SEQUENCE_START_EVENT:
-                // previous_was_scalar = false;
-                // std::cerr << "==> c: seq start: is_sequence: " << is_sequence << std::endl; 
-                // parse( parser, is_sequence ? t.add_child( previous_scalar, boost::property_tree::ptree() ) : t, false, true );
-                std::cerr << "==> c: seq start" << std::endl;
+                //std::cerr << "==> c: seq start" << std::endl;
                 parse( parser, t, on::seq );
                 return;
             case YAML_SEQUENCE_END_EVENT:
-                std::cerr << "==> d: seq end" << std::endl;
+                //std::cerr << "==> d: seq end" << std::endl;
                 return;
             case YAML_MAPPING_START_EVENT:
-                std::cerr << "==> e: map start" << std::endl;
-                parse( parser, what == on::seq ? t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second : t, on::map, true );
+                //std::cerr << "==> e: map start" << std::endl;
+                if( what == on::seq )
+                {
+                    parse( parser, t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second, on::map, true );
+                    break;
+                }
+                parse( parser, t, on::map, true );
                 return;
             case YAML_MAPPING_END_EVENT:
-                std::cerr << "==> f: map end" << std::endl;
+                //std::cerr << "==> f: map end" << std::endl;
                 return;
             case YAML_STREAM_END_EVENT:
             case YAML_DOCUMENT_END_EVENT:
             case YAML_NO_EVENT:
-                std::cerr << "==> f: stream/document end or no event" << std::endl;
+                //std::cerr << "==> f: stream/document end or no event" << std::endl;
                 return;
             case YAML_DOCUMENT_START_EVENT:
             case YAML_STREAM_START_EVENT:
diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index 986e116bd..4d76eefcd 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -487,7 +487,10 @@ boost::property_tree::ptree& property_tree::from_yaml( const std::string& s, boo
 
 std::string property_tree::to_yaml( const boost::property_tree::ptree& t )
 {
-    COMMA_THROW( comma::exception, "todo" );
+    COMMA_THROW( comma::exception, R"(conversion to yaml: todo; in the meantime, do it in python:
+
+cat your.json | python3 -c 'import json, yaml, sys; yaml.dump( json.load( sys.stdin ), sys.stdout )
+)" );
 }
 
 #else // #if defined comma_BUILD_NAME_VALUE_YAML

From 33d1f236e8209b4d135fee5a4e7a05c9d8f0d95a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 24 Apr 2025 14:32:06 +1000
Subject: [PATCH 1026/1056] name_value: serialize: read_yaml() implemented;
 write_yaml() added, but will throw not-implemented exception

---
 name_value/serialize.h | 74 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 74 insertions(+)

diff --git a/name_value/serialize.h b/name_value/serialize.h
index 9c48b100f..c158afa51 100644
--- a/name_value/serialize.h
+++ b/name_value/serialize.h
@@ -135,6 +135,35 @@ template < typename T > void read_xml( T& t, std::istream& stream, const char* r
 template < typename T > void read_xml( T& t, std::istream& stream, bool permissive );
 template < typename T > void read_xml( T& t, std::istream& stream );
 
+/// read object from yaml file or stream
+/// convenience wrappers for comma::property_tree boiler-plate code
+template < typename T > T read_yaml( const std::string& filename, const xpath& root, bool permissive );
+template < typename T > T read_yaml( const std::string& filename, const char* root, bool permissive );
+template < typename T > T read_yaml( const std::string& filename, const xpath& root );
+template < typename T > T read_yaml( const std::string& filename, const char* root );
+template < typename T > T read_yaml( const std::string& filename, bool permissive, bool split_filename );
+template < typename T > T read_yaml( const std::string& filename, bool permissive );
+template < typename T > T read_yaml( const std::string& filename );
+template < typename T > void read_yaml( T& t, const std::string& filename, const xpath& root, bool permissive );
+template < typename T > void read_yaml( T& t, const std::string& filename, const char* root, bool permissive );
+template < typename T > void read_yaml( T& t, const std::string& filename, const xpath& root );
+template < typename T > void read_yaml( T& t, const std::string& filename, const char* root );
+template < typename T > void read_yaml( T& t, const std::string& filename, bool permissive, bool split_filename );
+template < typename T > void read_yaml( T& t, const std::string& filename, bool permissive );
+template < typename T > void read_yaml( T& t, const std::string& filename );
+template < typename T > T read_yaml( std::istream& stream, const xpath& root, bool permissive );
+template < typename T > T read_yaml( std::istream& stream, const char* root, bool permissive );
+template < typename T > T read_yaml( std::istream& stream, const xpath& root );
+template < typename T > T read_yaml( std::istream& stream, const char* root );
+template < typename T > T read_yaml( std::istream& stream, bool permissive );
+template < typename T > T read_yaml( std::istream& stream );
+template < typename T > void read_yaml( T& t, std::istream& stream, const xpath& root, bool permissive );
+template < typename T > void read_yaml( T& t, std::istream& stream, const char* root, bool permissive );
+template < typename T > void read_yaml( T& t, std::istream& stream, const xpath& root );
+template < typename T > void read_yaml( T& t, std::istream& stream, const char* root );
+template < typename T > void read_yaml( T& t, std::istream& stream, bool permissive );
+template < typename T > void read_yaml( T& t, std::istream& stream );
+
 /// read object from path-value file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
 template < typename T > T read_path_value( const std::string& filename, const xpath& root, bool permissive );
@@ -333,6 +362,51 @@ template < typename T > inline void read_xml( T& t, std::istream& stream, const
 template < typename T > inline void read_xml( T& t, std::istream& stream, bool permissive ) { read_xml< T >( t, stream, xpath(), permissive ); }
 template < typename T > inline void read_xml( T& t, std::istream& stream ) { read_xml< T >( t, stream, xpath(), true ); }
 
+template < typename T > inline void read_yaml( T& t, const std::string& filename, const xpath& root, bool permissive )
+{
+    std::ifstream ifs( &filename[0] );
+    if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << filename << "\"" ); }
+    read_yaml< T >( t, ifs, root, permissive );
+    ifs.close();
+}
+
+template < typename T > inline void read_yaml( T& t, std::istream& stream, const xpath& root, bool permissive )
+{
+    boost::property_tree::ptree p;
+    comma::property_tree::read_yaml( stream, p );
+    comma::from_ptree from_ptree( p, root, permissive );
+    comma::visiting::apply( from_ptree ).to( t );
+}
+
+template < typename T > inline T read_yaml( const std::string& filename, const xpath& root, bool permissive ) { T t; read_yaml< T >( t, filename, root, permissive ); return t; }
+template < typename T > inline T read_yaml( const std::string& filename, const char* root, bool permissive ) { return root ? read_yaml< T >( filename, xpath( root ), permissive ) : read_yaml< T >( filename, permissive ); }
+template < typename T > inline T read_yaml( const std::string& filename, const xpath& root ) { return read_yaml< T >( filename, root, true ); }
+template < typename T > inline T read_yaml( const std::string& filename, const char* root ) { return root ? read_yaml< T >( filename, xpath( root ), true ) : read_yaml< T >( filename, true ); }
+template < typename T > inline T read_yaml( const std::string& filename, bool permissive, bool split_filename ) { T t; read_yaml< T >( t, filename, permissive, split_filename ); return t; }
+template < typename T > inline T read_yaml( const std::string& filename, bool permissive ) { return read_yaml< T >( filename, xpath(), permissive ); }
+template < typename T > inline T read_yaml( const std::string& filename ) { return read_yaml< T >( filename, xpath(), true ); }
+template < typename T > inline T read_yaml( std::istream& stream, const xpath& root, bool permissive ) { T t; read_yaml< T >( t, stream, root, permissive ); return t; }
+template < typename T > inline T read_yaml( std::istream& stream, const char* root, bool permissive ) { return root ? read_yaml< T >( stream, xpath( root ), permissive ) : read_yaml< T >( stream, permissive ); }
+template < typename T > inline T read_yaml( std::istream& stream, const xpath& root ) { return read_yaml< T >( stream, root, true ); }
+template < typename T > inline T read_yaml( std::istream& stream, const char* root ) { return root ? read_yaml< T >( stream, xpath( root ), true ) : read_yaml< T >( stream, true ); }
+template < typename T > inline T read_yaml( std::istream& stream, bool permissive ) { return read_yaml< T >( stream, xpath(), permissive ); }
+template < typename T > inline T read_yaml( std::istream& stream ) { return read_yaml< T >( stream, xpath(), true ); }
+template < typename T > inline void read_yaml( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_yaml< T >( t, filename, xpath( root ), permissive ); } else { read_yaml< T >( t, filename, permissive ); } }
+template < typename T > inline void read_yaml( T& t, const std::string& filename, const xpath& root ) { read_yaml< T >( t, filename, root, true ); }
+template < typename T > inline void read_yaml( T& t, const std::string& filename, const char* root ) { if( root ) { read_yaml< T >( t, filename, xpath( root ), true ); } else { read_yaml< T >( t, filename, true ); } }
+template < typename T > inline void read_yaml( T& t, const std::string& filename, bool permissive, bool split_filename )
+{
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_yaml< T >( t, p.first, p.second, permissive );
+}
+template < typename T > inline void read_yaml( T& t, const std::string& filename, bool permissive ) { read_yaml< T >( t, filename, xpath(), permissive ); }
+template < typename T > inline void read_yaml( T& t, const std::string& filename ) { read_yaml< T >( t, filename, xpath(), true ); }
+template < typename T > inline void read_yaml( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_yaml< T >( t, stream, xpath( root ), permissive ); } else { read_yaml< T >( t, stream, permissive ); } }
+template < typename T > inline void read_yaml( T& t, std::istream& stream, const xpath& root ) { read_yaml< T >( t, stream, root, true ); }
+template < typename T > inline void read_yaml( T& t, std::istream& stream, const char* root ) { if( root ) { read_yaml< T >( t, stream, xpath( root ), true ); } else { read_yaml< T >( t, stream, true ); } }
+template < typename T > inline void read_yaml( T& t, std::istream& stream, bool permissive ) { read_yaml< T >( t, stream, xpath(), permissive ); }
+template < typename T > inline void read_yaml( T& t, std::istream& stream ) { read_yaml< T >( t, stream, xpath(), true ); }
+
 template < typename T > inline void read_path_value( T& t, std::istream& stream, const xpath& root, bool permissive )
 {
     boost::property_tree::ptree p;

From 84a5bf0f771dee75bd434bdec9c3b11af7e532d3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 24 Apr 2025 14:33:10 +1000
Subject: [PATCH 1027/1056] name_value: serialize: read_yaml() implemented;
 write_yaml() added, but will throw not-implemented exception

---
 name_value/serialize.h | 32 ++++++++++++++++++++++++++++++++
 1 file changed, 32 insertions(+)

diff --git a/name_value/serialize.h b/name_value/serialize.h
index c158afa51..bc74e1a80 100644
--- a/name_value/serialize.h
+++ b/name_value/serialize.h
@@ -243,6 +243,15 @@ template < typename T > std::ostream& write_xml( const T& t, std::ostream& strea
 template < typename T > std::ostream& write_xml( const T& t, std::ostream& stream, const char* root );
 template < typename T > std::ostream& write_xml( const T& t, std::ostream& stream );
 
+/// write yaml object to file or stream
+/// convenience wrappers for comma::property_tree boiler-plate code
+template < typename T > void write_yaml( const T& t, const std::string& filename, const xpath& root );
+template < typename T > void write_yaml( const T& t, const std::string& filename, const char* root );
+template < typename T > void write_yaml( const T& t, const std::string& filename );
+template < typename T > std::ostream& write_yaml( const T& t, std::ostream& stream, const xpath& root );
+template < typename T > std::ostream& write_yaml( const T& t, std::ostream& stream, const char* root );
+template < typename T > std::ostream& write_yaml( const T& t, std::ostream& stream );
+
 /// write path-value object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
 /// @todo parametrize on equality sign and delimiter?
@@ -553,6 +562,29 @@ template < typename T > inline void write_xml( const T& t, const std::string& fi
 template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream, const char* root ) { return write_xml( t, stream, xpath( root ) ); }
 template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream ) { return write_xml( t, stream, xpath() ); }
 
+template < typename T > inline void write_xml( const T& t, const std::string& filename, const xpath& root )
+{
+    std::ofstream ofs( &filename[0] );
+    if( !ofs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << filename << "\"" ); }
+    write_xml< T >( t, ofs, root );
+    ofs.close();
+}
+
+template < typename T > inline std::ostream& write_yaml( const T& t, std::ostream& stream, const xpath& root )
+{
+    boost::property_tree::ptree p;
+    comma::to_ptree to_ptree( p, root );
+    comma::visiting::apply( to_ptree ).to( t );
+    stream.precision( 16 ); // quick and dirty
+    boost::property_tree::write_yaml( stream, p );
+    return stream;
+}
+
+template < typename T > inline void write_yaml( const T& t, const std::string& filename, const char* root ) { write_yaml( t, filename, xpath( root ) ); }
+template < typename T > inline void write_yaml( const T& t, const std::string& filename ) { write_yaml( t, filename, xpath() ); }
+template < typename T > inline std::ostream& write_yaml( const T& t, std::ostream& stream, const char* root ) { return write_yaml( t, stream, xpath( root ) ); }
+template < typename T > inline std::ostream& write_yaml( const T& t, std::ostream& stream ) { return write_yaml( t, stream, xpath() ); }
+
 template < typename T > inline std::ostream& write_path_value( const T& t, std::ostream& stream, const xpath& root, bool unquote_numbers, const std::string& prefix )
 {
     boost::property_tree::ptree p;

From 3a1634345dcb0427d28475b432f92074fbc28d85 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 28 Apr 2025 11:06:57 +1000
Subject: [PATCH 1028/1056] name_value: yaml support: compilation errors fixed

---
 name_value/ptree.cpp   | 45 +++++++++++-------------------------------
 name_value/serialize.h |  6 +++---
 2 files changed, 15 insertions(+), 36 deletions(-)

diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index 4d76eefcd..e234b25b9 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -456,7 +456,15 @@ void property_tree::from_unknown_seekable( std::istream& stream, boost::property
     COMMA_THROW( comma::exception, "failed to guess format" );
 }
 
-#if defined comma_BUILD_NAME_VALUE_YAML
+void property_tree::write_yaml( std::ostream& os, const boost::property_tree::ptree& t ) { os << to_yaml( t ) << std::endl; }
+
+std::string property_tree::to_yaml( const boost::property_tree::ptree& t )
+{
+    COMMA_THROW( comma::exception, R"(conversion to yaml: todo; in the meantime, do it in python:
+
+cat your.json | python3 -c 'import json, yaml, sys; yaml.dump( json.load( sys.stdin ), sys.stdout )
+)" );
+}
 
 boost::property_tree::ptree property_tree::from_yaml( const std::string& s )
 {
@@ -478,42 +486,13 @@ void property_tree::read_yaml( std::istream& is, boost::property_tree::ptree& t
     from_yaml( oss.str(), t );
 }
 
-void property_tree::write_yaml( std::ostream& os, const boost::property_tree::ptree& t ) { os << to_yaml( t ) << std::endl; }
-
-boost::property_tree::ptree& property_tree::from_yaml( const std::string& s, boost::property_tree::ptree& t )
-{
-    return comma::name_value::impl::yaml::to_ptree( s, t );
-}
-
-std::string property_tree::to_yaml( const boost::property_tree::ptree& t )
-{
-    COMMA_THROW( comma::exception, R"(conversion to yaml: todo; in the meantime, do it in python:
+#if defined comma_BUILD_NAME_VALUE_YAML
 
-cat your.json | python3 -c 'import json, yaml, sys; yaml.dump( json.load( sys.stdin ), sys.stdout )
-)" );
-}
+boost::property_tree::ptree& property_tree::from_yaml( const std::string& s, boost::property_tree::ptree& t ) { return comma::name_value::impl::yaml::to_ptree( s, t ); }
 
 #else // #if defined comma_BUILD_NAME_VALUE_YAML
 
-boost::property_tree::ptree property_tree::from_yaml( const std::string& s )
-{
-    COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" );
-}
-
-boost::property_tree::ptree& property_tree::from_yaml( const std::string& s, boost::property_tree::ptree& t )
-{
-    COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" );
-}
-
-boost::property_tree::ptree& property_tree::from_yaml( std::istream& is, boost::property_tree::ptree& t )
-{
-    COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" );
-}
-
-std::string property_tree::to_yaml( const boost::property_tree::ptree& t )
-{
-    COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" );
-}
+boost::property_tree::ptree& property_tree::from_yaml( const std::string&, boost::property_tree::ptree& ) { COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" ); }
 
 #endif // #if defined comma_BUILD_NAME_VALUE_YAML
 
diff --git a/name_value/serialize.h b/name_value/serialize.h
index bc74e1a80..4a88dd46c 100644
--- a/name_value/serialize.h
+++ b/name_value/serialize.h
@@ -562,11 +562,11 @@ template < typename T > inline void write_xml( const T& t, const std::string& fi
 template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream, const char* root ) { return write_xml( t, stream, xpath( root ) ); }
 template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream ) { return write_xml( t, stream, xpath() ); }
 
-template < typename T > inline void write_xml( const T& t, const std::string& filename, const xpath& root )
+template < typename T > inline void write_yaml( const T& t, const std::string& filename, const xpath& root )
 {
     std::ofstream ofs( &filename[0] );
     if( !ofs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << filename << "\"" ); }
-    write_xml< T >( t, ofs, root );
+    write_yaml< T >( t, ofs, root );
     ofs.close();
 }
 
@@ -576,7 +576,7 @@ template < typename T > inline std::ostream& write_yaml( const T& t, std::ostrea
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
-    boost::property_tree::write_yaml( stream, p );
+    comma::property_tree::write_yaml( stream, p );
     return stream;
 }
 

From c62953b7506ad3ec5dae922fc0d6751b8d75d9bd Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 29 Apr 2025 18:41:14 +1000
Subject: [PATCH 1029/1056] name_value: yaml: typo bug fixed: std::cin replaced
 with input stream parameter; unit test: negative test made more outrageous,
 otherwise yaml swallows anything

---
 name_value/impl/yaml.cpp                 | 39 +++++++++++++++++++-----
 name_value/ptree.cpp                     |  2 +-
 name_value/test/serialise_guess_test.cpp |  2 +-
 3 files changed, 33 insertions(+), 10 deletions(-)

diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
index e25a38cf0..87a0cb688 100644
--- a/name_value/impl/yaml.cpp
+++ b/name_value/impl/yaml.cpp
@@ -39,7 +39,26 @@ namespace comma { namespace name_value { namespace impl { namespace yaml {
 
 enum class on { none, scalar, seq, map };
 
-static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on what = on::none, bool is_name = false )
+const char* event_to_string( yaml_event_type_e e )
+{
+    switch( e )
+    {
+        case YAML_NO_EVENT: return "no";
+        case YAML_STREAM_START_EVENT: return "stream start";
+        case YAML_STREAM_END_EVENT: return "stream end";
+        case YAML_DOCUMENT_START_EVENT: return "document start";
+        case YAML_DOCUMENT_END_EVENT: return "document end";
+        case YAML_ALIAS_EVENT: return "alias";
+        case YAML_SCALAR_EVENT: return "scalar";
+        case YAML_SEQUENCE_START_EVENT: return "sequence start";
+        case YAML_SEQUENCE_END_EVENT: return "sequence end";
+        case YAML_MAPPING_START_EVENT: return "mapping start";
+        case YAML_MAPPING_END_EVENT: return "mapping end";
+    }
+    return "unknown"; // never here
+}
+
+static yaml_event_type_e parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on what = on::none, bool is_name = false )
 {
     //COMMA_THROW( comma::exception, "implementing..." );
     //std::cerr << "==> A" << std::endl; //std::cerr << "==> a: expecting_value: " << expecting_value << " is_sequence: " << is_sequence << std::endl;
@@ -47,7 +66,7 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on wha
     while( true )
     {
         yaml_event_t event;
-        yaml_parser_parse( parser, &event );
+        COMMA_ASSERT( yaml_parser_parse( parser, &event ) == 1, "yaml_parser_parse() failed" );
         auto event_type = event.type;
         scalar = event.type == YAML_SCALAR_EVENT ? std::string( reinterpret_cast< const char* >( event.data.scalar.value ) ) : "";
         yaml_event_delete( &event );
@@ -62,7 +81,7 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on wha
                     case on::map:
                         if( is_name ) { parse( parser, t.add_child( scalar, boost::property_tree::ptree() ), on::map, false ); break; }
                         t.put_value( scalar );
-                        return;
+                        return YAML_SCALAR_EVENT;
                     case on::seq:
                         t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( scalar );
                         break;
@@ -71,10 +90,10 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on wha
             case YAML_SEQUENCE_START_EVENT:
                 //std::cerr << "==> c: seq start" << std::endl;
                 parse( parser, t, on::seq );
-                return;
+                return YAML_SEQUENCE_START_EVENT;
             case YAML_SEQUENCE_END_EVENT:
                 //std::cerr << "==> d: seq end" << std::endl;
-                return;
+                return YAML_SEQUENCE_END_EVENT;
             case YAML_MAPPING_START_EVENT:
                 //std::cerr << "==> e: map start" << std::endl;
                 if( what == on::seq )
@@ -83,15 +102,17 @@ static void parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on wha
                     break;
                 }
                 parse( parser, t, on::map, true );
-                return;
+                return YAML_MAPPING_START_EVENT;
             case YAML_MAPPING_END_EVENT:
                 //std::cerr << "==> f: map end" << std::endl;
-                return;
+                return YAML_MAPPING_END_EVENT;
             case YAML_STREAM_END_EVENT:
+                return YAML_STREAM_END_EVENT;
             case YAML_DOCUMENT_END_EVENT:
+                return YAML_DOCUMENT_END_EVENT;
             case YAML_NO_EVENT:
                 //std::cerr << "==> f: stream/document end or no event" << std::endl;
-                return;
+                return YAML_NO_EVENT;
             case YAML_DOCUMENT_START_EVENT:
             case YAML_STREAM_START_EVENT:
             case YAML_ALIAS_EVENT:
@@ -112,6 +133,8 @@ boost::property_tree::ptree& to_ptree( const std::string& s, boost::property_tre
     yaml_parser_initialize( &parser );
     yaml_parser_set_input_string( &parser, reinterpret_cast< const unsigned char* >( &s[0] ), s.size() );
     parse( &parser, t );
+    // auto r = parse( &parser, t );
+    // COMMA_ASSERT( r == YAML_STREAM_END_EVENT, "expected YAML_STREAM_END_EVENT; got: " << event_to_string( r ) << " event" );
     yaml_parser_delete( &parser );
     return t;
 }
diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index e234b25b9..fb678791f 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -479,7 +479,7 @@ void property_tree::read_yaml( std::istream& is, boost::property_tree::ptree& t
     while( is.good() && !is.eof() ) // quick and dirty, watch performance
     {
         std::string line;
-        std::getline( std::cin, line );
+        std::getline( is, line );
         if( line.empty() ) { continue; }
         oss << line << std::endl;
     }
diff --git a/name_value/test/serialise_guess_test.cpp b/name_value/test/serialise_guess_test.cpp
index c8a40bf60..f6f8f67a5 100644
--- a/name_value/test/serialise_guess_test.cpp
+++ b/name_value/test/serialise_guess_test.cpp
@@ -233,7 +233,7 @@ TEST( serialise, guess_path_value_root ) { std::istringstream iss( path_value_ro
 
 TEST( serialise, guess_corrupted_json )
 {
-    std::istringstream iss( "{ \"name\": \"dummy\", }" );
+    std::istringstream iss( "{ \"name\": \"dummy\"," );
     config c; 
     ASSERT_THROW( comma::read< config >( c, iss ), comma::exception );
 }

From 2d4703fc5a0764b7137cc5c0fbc62d5b492ed703 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 1 May 2025 03:51:01 +0000
Subject: [PATCH 1030/1056] cmake: -std=c++20 added as an option

---
 CMakeFiles/check.c++.standard.cmake | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CMakeFiles/check.c++.standard.cmake b/CMakeFiles/check.c++.standard.cmake
index c8ae95f44..f17089638 100644
--- a/CMakeFiles/check.c++.standard.cmake
+++ b/CMakeFiles/check.c++.standard.cmake
@@ -1,4 +1,4 @@
-    SET( CXX_STANDARDS "0x;11;14;17" CACHE STRING "list of known c++ standards" )
+    SET( CXX_STANDARDS "0x;11;14;17;20" CACHE STRING "list of known c++ standards" )
     MARK_AS_ADVANCED( FORCE CXX_STANDARDS )
     STRING( REGEX REPLACE ";" "," CXX_STANDARDS_READABLE "${CXX_STANDARDS}" )
     SET( CXX_STANDARD_DEFAULT "17" CACHE STRING "default c++ standard to use" )

From 521337e293a87ebcd1e8d405b095ebddbe77ad18 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 1 May 2025 04:07:44 +0000
Subject: [PATCH 1031/1056] csv::options: compile warning silenced, bug fixed:
 quote sign size switch statement: case 2: replaced with default:

---
 csv/options.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/csv/options.cpp b/csv/options.cpp
index 21718bd83..8fd16e0db 100644
--- a/csv/options.cpp
+++ b/csv/options.cpp
@@ -31,6 +31,7 @@
 
 #include <boost/regex.hpp>
 #include "../base/exception.h"
+#include "../base/none.h"
 #include "../csv/options.h"
 #include "../string/split.h"
 #include "../string/string.h"
@@ -69,9 +70,9 @@ static void init( comma::csv::options& csv_options
     {
         switch( quote_character->size() )
         {
-            case 0: csv_options.quote.reset(); break;
+            case 0: csv_options.quote = silent_none< char >(); break;
             case 1: csv_options.quote = ( *quote_character )[0]; break;
-            case 2: COMMA_THROW( comma::exception, "expected a quote character, got \"" << *quote_character << "\"" );
+            default: COMMA_THROW( comma::exception, "expected a quote character, got \"" << *quote_character << "\"" );
         }
     }
     csv_options.flush = options.exists( "--flush" );

From bab98277c3bf242df1fc924c279251f26f2383be Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 2 May 2025 00:27:25 +0000
Subject: [PATCH 1032/1056] containers::multidimensional::map::find(point)
 renamed to ...::at(point); otherwise, it does not compile if point and index
 types are the same

---
 containers/multidimensional/map.h | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/containers/multidimensional/map.h b/containers/multidimensional/map.h
index 6742c5305..493cdcab2 100644
--- a/containers/multidimensional/map.h
+++ b/containers/multidimensional/map.h
@@ -72,15 +72,15 @@ class map : public std::unordered_map< std::array< comma::int32, Size >, V, arra
         static key_type index_of( const point_type& point, const point_type& resolution );
         
         /// find value by point
-        iterator find( const point_type& point );
+        iterator at( const point_type& point );
         
         /// find value by point
-        const_iterator find( const point_type& point ) const;
+        const_iterator at( const point_type& point ) const;
         
         /// find value by key
         iterator find( const key_type& index );
         
-        /// find voxel by key
+        /// find value by key
         const_iterator find( const key_type& index ) const;
         
         /// return origin
@@ -142,14 +142,14 @@ inline typename map< K, V, Size, P, Traits >::key_type map< K, V, Size, P, Trait
 }
 
 template < typename K, typename V, std::size_t Size, typename P, typename Traits >
-inline typename map< K, V, Size, P, Traits >::iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::point_type& point )
+inline typename map< K, V, Size, P, Traits >::iterator map< K, V, Size, P, Traits >::at( const typename map< K, V, Size, P, Traits >::point_type& point )
 {
     index_type i = index_of( point );
     return this->base_type::find( i );
 }
 
 template < typename K, typename V, std::size_t Size, typename P, typename Traits >
-inline typename map< K, V, Size, P, Traits >::const_iterator map< K, V, Size, P, Traits >::find( const typename map< K, V, Size, P, Traits >::point_type& point ) const
+inline typename map< K, V, Size, P, Traits >::const_iterator map< K, V, Size, P, Traits >::at( const typename map< K, V, Size, P, Traits >::point_type& point ) const
 {
     index_type i = index_of( point );
     return this->base_type::find( i );

From c06585454103658b3bd80a5dd68323d35644a90d Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Fri, 2 May 2025 00:28:43 +0000
Subject: [PATCH 1033/1056] multidimensional_map_test: find(point) renamed to
 at(point)

---
 containers/test/multidimensional_map_test.cpp | 24 +++++++++----------
 1 file changed, 12 insertions(+), 12 deletions(-)

diff --git a/containers/test/multidimensional_map_test.cpp b/containers/test/multidimensional_map_test.cpp
index 7f30a4ced..e0516f19d 100644
--- a/containers/test/multidimensional_map_test.cpp
+++ b/containers/test/multidimensional_map_test.cpp
@@ -62,33 +62,33 @@ TEST( multikey_map, operations )
     typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
     map_type m( {1, 1, 1} );
     {
-        EXPECT_TRUE( ( m.find( map_type::point_type{1., 1., 1.} ) == m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{1., 1., 1.} ) == m.end() ) );
         EXPECT_TRUE( ( m.touch_at( map_type::point_type{1., 1., 1.} ) != m.end() ) );
         EXPECT_EQ( 1, m.size() );
-        EXPECT_TRUE( ( m.find( map_type::point_type{1., 1., 1.} ) != m.end() ) );
-        EXPECT_TRUE( ( m.find( map_type::point_type{1., 1., 1.} ) == m.find( map_type::point_type{1.1, 1.1, 1.1} ) ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{1., 1., 1.} ) != m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{1., 1., 1.} ) == m.at( map_type::point_type{1.1, 1.1, 1.1} ) ) );
         EXPECT_TRUE( ( m.touch_at( {1, 1, 1} ) != m.end() ) );
         EXPECT_EQ( 1, m.size() );
         EXPECT_TRUE( ( m.touch_at( {1.1, 1.1, 1.1} ) != m.end() ) );
         EXPECT_EQ( 1, m.size() );
     }
     {
-        EXPECT_TRUE( ( m.find( map_type::point_type{-1., -1., -1.} ) == m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{-1., -1., -1.} ) == m.end() ) );
         EXPECT_TRUE( ( m.touch_at( {-1., -1., -1.} ) != m.end() ) );
         EXPECT_EQ( 2, m.size() );
-        EXPECT_TRUE( ( m.find( map_type::point_type{-1., -1., -1.} ) != m.end() ) );
-        EXPECT_TRUE( ( m.find( map_type::point_type{-1., -1., -1.} ) == m.find( map_type::point_type{-0.1, -0.1, -0.1} ) ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{-1., -1., -1.} ) != m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{-1., -1., -1.} ) == m.at( map_type::point_type{-0.1, -0.1, -0.1} ) ) );
         EXPECT_TRUE( ( m.touch_at( {-1., -1., -1.} ) != m.end() ) );
         EXPECT_EQ( 2, m.size() );
         EXPECT_TRUE( ( m.touch_at( {-0.1, -0.1, -0.1} ) != m.end() ) );
         EXPECT_EQ( 2, m.size() );
     }
     {
-        EXPECT_TRUE( ( m.find( map_type::point_type{0., 0., 0.} ) == m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{0., 0., 0.} ) == m.end() ) );
         EXPECT_TRUE( ( m.touch_at( {0., 0., 0.} ) != m.end() ) );
         EXPECT_EQ( 3, m.size() );
-        EXPECT_TRUE( ( m.find( map_type::point_type{0., 0, 0} ) != m.end() ) );
-        EXPECT_TRUE( ( m.find( map_type::point_type{0., 0, 0} ) == m.find( map_type::point_type{0.1, 0.1, 0.1} ) ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{0., 0, 0} ) != m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{0., 0, 0} ) == m.at( map_type::point_type{0.1, 0.1, 0.1} ) ) );
         EXPECT_TRUE( ( m.touch_at( {0., 0, 0} ) != m.end() ) );
         EXPECT_EQ( 3, m.size() );
         EXPECT_TRUE( ( m.touch_at( {0.1, 0.1, 0.1} ) != m.end() ) );
@@ -108,12 +108,12 @@ TEST( multikey_map, neighbourhood )
     typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
     map_type m( {1, 1, 1} );
     {
-        EXPECT_TRUE( ( m.find( map_type::point_type{1, 1, 1} ) == m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{1, 1, 1} ) == m.end() ) );
         {
             EXPECT_TRUE( ( m.touch_at( {1, 1, 1} ) != m.end() ) );
             EXPECT_EQ( 1, m.size() );
             m.touch_at( {1, 1, 1} )->second = 111;
-            EXPECT_EQ( 111, m.find( map_type::point_type{1, 1, 1} )->second );
+            EXPECT_EQ( 111, m.at( map_type::point_type{1, 1, 1} )->second );
             map_type::index_type index = {{ 1, 1, 1 }};
             EXPECT_EQ( 111, m.base_type::find( index )->second );
         }
@@ -121,7 +121,7 @@ TEST( multikey_map, neighbourhood )
             EXPECT_TRUE( ( m.touch_at( {2, 2, 2} ) != m.end() ) );
             EXPECT_EQ( 2, m.size() );
             m.touch_at( {2, 2, 2} )->second = 222;
-            EXPECT_EQ( 222, m.find( map_type::point_type{2, 2, 2} )->second );
+            EXPECT_EQ( 222, m.at( map_type::point_type{2, 2, 2} )->second );
             map_type::index_type index = {{ 2, 2, 2 }};
             EXPECT_EQ( 222, m.base_type::find( index )->second );
         }

From 5777545f131fe2bd86714506616d270558399301 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 5 May 2025 08:24:33 +1000
Subject: [PATCH 1034/1056] containers::multidimensional::map: deprecation
 warning fixed

---
 containers/multidimensional/map.h | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/containers/multidimensional/map.h b/containers/multidimensional/map.h
index 493cdcab2..b4347d7d8 100644
--- a/containers/multidimensional/map.h
+++ b/containers/multidimensional/map.h
@@ -5,6 +5,7 @@
 #pragma once
 
 #include <array>
+#include <functional>
 #include <unordered_map>
 #include <boost/functional/hash.hpp>
 #include "../../base/types.h"
@@ -14,7 +15,7 @@ namespace comma { namespace containers { namespace multidimensional {
 
 /// quick and dirty hash for array-like containers (its support is awkward in boost)
 template < typename Array, std::size_t Size >
-struct array_hash : public std::unary_function< Array, std::size_t >
+struct array_hash : public std::function< std::size_t( const Array& ) > // struct array_hash : public std::unary_function< Array, std::size_t >
 {
     std::size_t operator()( Array const& array ) const
     {

From d4db4f89b5c31c89b64ed0e8a578bc48b7861b5a Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 5 May 2025 09:21:13 +1000
Subject: [PATCH 1035/1056] python: containers.multidimensional.Map: in
 progress...

---
 python/CMakeLists.txt                         |   3 +-
 python/bindings/CMakeLists.txt                |  21 +++
 .../containers/multidimensional/map.cpp       | 123 ++++++++++++++++++
 .../containers/multidimensional/map.h         |  21 +++
 python/comma/__init__.py                      |   1 +
 python/comma/containers/__init__.py           |   1 +
 .../containers/multidimensional/__init__.py   |   1 +
 .../comma/containers/multidimensional/_map.py |  26 ++++
 python/setup.py                               |   2 +-
 9 files changed, 197 insertions(+), 2 deletions(-)
 create mode 100644 python/bindings/CMakeLists.txt
 create mode 100644 python/bindings/containers/multidimensional/map.cpp
 create mode 100644 python/bindings/containers/multidimensional/map.h
 create mode 100644 python/comma/containers/__init__.py
 create mode 100644 python/comma/containers/multidimensional/__init__.py
 create mode 100644 python/comma/containers/multidimensional/_map.py

diff --git a/python/CMakeLists.txt b/python/CMakeLists.txt
index 9dc0f284c..4ec896d52 100644
--- a/python/CMakeLists.txt
+++ b/python/CMakeLists.txt
@@ -75,7 +75,8 @@ SET( comma_PYTHON_SOURCE_ROOT_DIR ${CMAKE_CURRENT_SOURCE_DIR} )
 
 set_python_build_lib_directory()
 
-ADD_SUBDIRECTORY( comma )
+add_subdirectory( comma )
+add_subdirectory( bindings )
 
 ADD_CUSTOM_TARGET( python_build ALL
                    ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE}
diff --git a/python/bindings/CMakeLists.txt b/python/bindings/CMakeLists.txt
new file mode 100644
index 000000000..2efe93e47
--- /dev/null
+++ b/python/bindings/CMakeLists.txt
@@ -0,0 +1,21 @@
+SET( PROJECT "python_bindings" )
+SET( TARGET_NAME comma_${PROJECT} )
+SET( dir ${SOURCE_CODE_BASE_DIR}/python/bindings )
+
+FILE( GLOB_RECURSE source ${dir}/*.cpp )
+FILE( GLOB_RECURSE includes ${dir}/*.h )
+
+SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} )
+
+ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_source} ${impl_includes} )
+SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
+target_link_libraries( ${TARGET_NAME} comma_base ${comma_ALL_EXTERNAL_LIBRARIES} )
+
+# INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ )
+# INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
+INSTALL(
+    TARGETS ${TARGET_NAME}
+    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
+    LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
+    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
+)
diff --git a/python/bindings/containers/multidimensional/map.cpp b/python/bindings/containers/multidimensional/map.cpp
new file mode 100644
index 000000000..36e6a3b8f
--- /dev/null
+++ b/python/bindings/containers/multidimensional/map.cpp
@@ -0,0 +1,123 @@
+#include <cstdint>
+#include <vector>
+#include "../../../../base/exception.h"
+#include "../../../../containers/multidimensional/map.h"
+#include "map.h"
+
+namespace comma { namespace python { namespace bindings { namespace containers { namespace multidimensional { namespace map { namespace impl {
+
+class base
+{
+    public:
+        base( void* m ): _m( m ) {}
+        virtual ~base() = default;
+        virtual void insert( const void* p, int v ) = 0;
+        virtual const int* at( const void* p, unsigned int* size ) const = 0;
+        virtual unsigned int size( const void* p ) const = 0;
+    protected:
+        void* _m{nullptr};
+};
+
+template < typename K, unsigned int Dim >
+struct proxy: public base
+{
+    typedef comma::containers::multidimensional::map< K, std::vector< int >, Dim > map_t;
+
+    typedef typename map_t::point_type key_t;
+
+    proxy( const void* o, const void* r, const void* p, int size )
+        : base( new map_t( *reinterpret_cast< const key_t* >( o ), *reinterpret_cast< const key_t* >( r ) ) )
+    {
+        if( !p || size == 0 ) { return; }
+        const K* q = reinterpret_cast< const K* >( p );
+        for( int i = 0; i < size; ++i, q += sizeof( K ) * Dim * size ) { insert( q, i ); }
+    }
+
+    ~proxy() { if( _m ) { delete reinterpret_cast< map_t* >( _m ); } }
+
+    void insert( const void* k, int v ) { map().touch_at( key( k ) )->second.push_back( v ); }
+
+    const int* at( const void* k, unsigned int* size ) const { const auto& i = map().at( key( k ) ); *size = i == map().end() ? 0 : int( i->second.size() ); return i == map().end() || i->second.empty() ? nullptr : &i->second[0]; }
+    
+    unsigned int size( const void* p ) const { return map().size(); }
+
+    map_t& map() { return *reinterpret_cast< map_t* >( _m ); }
+
+    const map_t& map() const { return *reinterpret_cast< const map_t* >( _m ); }
+
+    const key_t& key( const void* p ) const { return *reinterpret_cast< const key_t* >( p ); }
+};
+
+void* make( int key_type, unsigned int dim, const void* o, const void* r, const void* v, unsigned int s )
+{
+    switch( key_type )
+    {
+        case _comma_int32:
+            switch( dim )
+            {
+                case 2: return new proxy< std::int32_t, 2 >( o, r, v, s );
+                case 3: return new proxy< std::int32_t, 3 >( o, r, v, s );
+                case 4: return new proxy< std::int32_t, 4 >( o, r, v, s );
+                case 5: return new proxy< std::int32_t, 5 >( o, r, v, s );
+                case 6: return new proxy< std::int32_t, 6 >( o, r, v, s );
+                default: COMMA_THROW_BRIEF( comma::exception, "multidimensional map with int32 keys supports 2 to 6 dimensions; got: " << dim << "; just ask for more" );
+            }
+            break;
+        case _comma_int64:
+            switch( dim )
+            {
+                case 2: return new proxy< std::int64_t, 2 >( o, r, v, s );
+                case 3: return new proxy< std::int64_t, 3 >( o, r, v, s );
+                case 4: return new proxy< std::int64_t, 4 >( o, r, v, s );
+                case 5: return new proxy< std::int64_t, 5 >( o, r, v, s );
+                case 6: return new proxy< std::int64_t, 6 >( o, r, v, s );
+                default: COMMA_THROW_BRIEF( comma::exception, "multidimensional map with int64 keys supports 2 to 6 dimensions; got: " << dim << "; just ask for more" );
+            }
+            break;
+        case _comma_float32:
+            static_assert( sizeof( float ) == 4 );
+            switch( dim )
+            {
+                case 2: return new proxy< float, 2 >( o, r, v, s );
+                case 3: return new proxy< float, 3 >( o, r, v, s );
+                case 4: return new proxy< float, 4 >( o, r, v, s );
+                case 5: return new proxy< float, 5 >( o, r, v, s );
+                case 6: return new proxy< float, 6 >( o, r, v, s );
+                default: COMMA_THROW_BRIEF( comma::exception, "multidimensional map with float32 keys supports 2 to 6 dimensions; got: " << dim << "; just ask for more" );
+            }
+            break;
+        case _comma_float64:
+            static_assert( sizeof( double ) == 8 );
+            switch( dim )
+            {
+                case 2: return new proxy< double, 2 >( o, r, v, s );
+                case 3: return new proxy< double, 3 >( o, r, v, s );
+                case 4: return new proxy< double, 4 >( o, r, v, s );
+                case 5: return new proxy< double, 5 >( o, r, v, s );
+                case 6: return new proxy< double, 6 >( o, r, v, s );
+                default: COMMA_THROW_BRIEF( comma::exception, "multidimensional map with double keys supports 2 to 6 dimensions; got: " << dim << "; just ask for more" );
+            }
+            break;
+        default:
+            COMMA_THROW_BRIEF( comma::exception, "multidimensional map supports types int32 (0), int64 (1), float32 (2), and float64 (3); got: " << key_type );
+    }
+    return nullptr;
+}
+
+} } } } } } } // namespace comma { namespace python { namespace bindings { namespace containers { namespace multidimensional { namespace map { namespace impl {
+
+static auto as_base( void* p ) { return reinterpret_cast< comma::python::bindings::containers::multidimensional::map::impl::base* >( p ); }
+
+static auto as_base( const void* p ) { return reinterpret_cast< const comma::python::bindings::containers::multidimensional::map::impl::base* >( p ); }
+
+DLL_EXPORT void* comma_containers_multidimensional_map_create( int key_type, unsigned int dim, const void* origin, const void* resolution, const void* values, unsigned int size )
+{
+    return comma::python::bindings::containers::multidimensional::map::impl::make( key_type, dim, origin, resolution, values, size );
+}
+
+DLL_EXPORT void comma_containers_multidimensional_map_destroy( void* p ) { delete as_base( p ); }
+
+DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, void* size ) { return as_base( p )->at( p, reinterpret_cast< unsigned int* >( size ) ); }
+
+DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p ) { return as_base( p )->size( p ); }
+
diff --git a/python/bindings/containers/multidimensional/map.h b/python/bindings/containers/multidimensional/map.h
new file mode 100644
index 000000000..cb561a736
--- /dev/null
+++ b/python/bindings/containers/multidimensional/map.h
@@ -0,0 +1,21 @@
+#pragma once
+
+#ifdef _WIN32
+#define DLL_EXPORT __declspec( dllexport )
+#else
+#define DLL_EXPORT
+#endif
+
+extern "C" {
+
+enum types { _comma_int32 = 0, _comma_int64 = 1, _comma_float32 = 2, _comma_float64 = 3 };
+
+DLL_EXPORT void* comma_containers_multidimensional_map_create( int key_type, unsigned int dim, const void* origin, const void* resolution, const void* values, unsigned int size );
+
+DLL_EXPORT void comma_containers_multidimensional_map_destroy( void* p );
+
+DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, void* size );
+
+DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p );
+
+}
\ No newline at end of file
diff --git a/python/comma/__init__.py b/python/comma/__init__.py
index a06fdb611..878ab83d3 100644
--- a/python/comma/__init__.py
+++ b/python/comma/__init__.py
@@ -1,6 +1,7 @@
 # Copyright (c) 2011 The University of Sydney
 # Copyright (c) 2013 Vsevolod Vlaskine
 
+from . import containers
 from . import csv
 from . import dictionary
 from . import filesystem
diff --git a/python/comma/containers/__init__.py b/python/comma/containers/__init__.py
new file mode 100644
index 000000000..602e6d3b6
--- /dev/null
+++ b/python/comma/containers/__init__.py
@@ -0,0 +1 @@
+from . import multidimensional
diff --git a/python/comma/containers/multidimensional/__init__.py b/python/comma/containers/multidimensional/__init__.py
new file mode 100644
index 000000000..ca579ad56
--- /dev/null
+++ b/python/comma/containers/multidimensional/__init__.py
@@ -0,0 +1 @@
+from ._map import Map
diff --git a/python/comma/containers/multidimensional/_map.py b/python/comma/containers/multidimensional/_map.py
new file mode 100644
index 000000000..4957373e0
--- /dev/null
+++ b/python/comma/containers/multidimensional/_map.py
@@ -0,0 +1,26 @@
+import ctypes, ctypes.util, numpy
+
+class Map:
+    def __init__( self, key_type, dim, resolution, origin=None, values=None ):
+        self._bindings = ctypes.CDLL( ctypes.util.find_library( 'comma_python_bindings' ) )
+        self._create = self._bindings.comma_containers_multidimensional_map_create
+        self._create.argtypes = [ ctypes.c_in, ctypes.c_uint, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_uint ]
+        self._create.restype = None # todo? make callable?
+        key_types = { numpy.int32: 0, numpy.int64: 1, numpy.float32: 2, numpy.float64: 3 }
+        if origin is None: origin = numpy.zero( dim )
+        assert key_type in key_types, TypeError( f'expected key type in {list(key_types.keys())}; got: {key_type}' )
+        self._map = self._create( key_types[key_type]
+                        , dim
+                        , numpy.array( origin, dtype=key_type ).ctypes.data_as( ctypes.c_void_p )
+                        , numpy.array( resolution, dtype=key_type ).ctypes.data_as( ctypes.c_void_p )
+                        , values if isinstance( values, numpy.array ) else numpy.array( [] if values is None else values ).ctypes.data_as( ctypes.c_void_p )
+                        , 0 if value is None else len( values ) )
+        
+        def __enter__( self ): return self
+
+        def __exit__( self, type, value, traceback ):
+            self._bindings.comma_containers_multidimensional_map_destroy( self._map )
+
+        # todo: at()
+
+        # todo: size()
\ No newline at end of file
diff --git a/python/setup.py b/python/setup.py
index 950ebe376..647559a2d 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -30,7 +30,7 @@
         maintainer_email    = 'vsevolod.vlaskine@gmail.com',
         python_requires     = '>=3.6',
         #install_requires    = [ 'numpy' ], # todo? does it need to be uncommented for packaging
-        packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.dictionary', 'comma.filesystem', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
+        packages            = [ 'comma', 'comma.containers', 'comma.containers.multidimensional', 'comma.csv', 'comma.csv.applications', 'comma.dictionary', 'comma.filesystem', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
         package_dir         = { 'comma': 'comma', 'comma.cpp_bindings': 'comma/cpp_bindings' },
         package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] },
         entry_points        = { 'console_scripts': ['csv-eval=comma.csv.applications.csv_eval:main'] } #scripts             = [ "comma/csv/applications/csv-eval" ]

From 8283399c9ad84ca7260e5caa91d36e5359484dc7 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 6 May 2025 09:40:38 +1000
Subject: [PATCH 1036/1056] python: comma.containers.multidimensional.Map: unit
 test placeholder added; in progress...

---
 .../containers/multidimensional/map.cpp       | 10 ++++--
 .../containers/multidimensional/map.h         |  4 +++
 .../comma/containers/multidimensional/_map.py | 35 +++++++++++++------
 .../containers/multidimensional/test/test     |  6 ++++
 .../test/test_multidimensional_map.py         |  8 +++++
 python/comma/dictionary/test/test             |  1 +
 6 files changed, 51 insertions(+), 13 deletions(-)
 create mode 100755 python/comma/containers/multidimensional/test/test
 create mode 100644 python/comma/containers/multidimensional/test/test_multidimensional_map.py

diff --git a/python/bindings/containers/multidimensional/map.cpp b/python/bindings/containers/multidimensional/map.cpp
index 36e6a3b8f..ed795ee39 100644
--- a/python/bindings/containers/multidimensional/map.cpp
+++ b/python/bindings/containers/multidimensional/map.cpp
@@ -13,7 +13,8 @@ class base
         virtual ~base() = default;
         virtual void insert( const void* p, int v ) = 0;
         virtual const int* at( const void* p, unsigned int* size ) const = 0;
-        virtual unsigned int size( const void* p ) const = 0;
+        virtual unsigned int count() const = 0;
+        virtual unsigned int size() const = 0;
     protected:
         void* _m{nullptr};
 };
@@ -39,7 +40,9 @@ struct proxy: public base
 
     const int* at( const void* k, unsigned int* size ) const { const auto& i = map().at( key( k ) ); *size = i == map().end() ? 0 : int( i->second.size() ); return i == map().end() || i->second.empty() ? nullptr : &i->second[0]; }
     
-    unsigned int size( const void* p ) const { return map().size(); }
+    unsigned int size() const { return map().size(); }
+
+    unsigned int count() const { unsigned int c{0}; for( auto i: map() ) { c += i.second.size(); } return c; }
 
     map_t& map() { return *reinterpret_cast< map_t* >( _m ); }
 
@@ -119,5 +122,6 @@ DLL_EXPORT void comma_containers_multidimensional_map_destroy( void* p ) { delet
 
 DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, void* size ) { return as_base( p )->at( p, reinterpret_cast< unsigned int* >( size ) ); }
 
-DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p ) { return as_base( p )->size( p ); }
+DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p ) { return as_base( p )->size(); }
 
+DLL_EXPORT unsigned int comma_containers_multidimensional_map_count( const void* p ) { return as_base( p )->count(); }
diff --git a/python/bindings/containers/multidimensional/map.h b/python/bindings/containers/multidimensional/map.h
index cb561a736..aace23216 100644
--- a/python/bindings/containers/multidimensional/map.h
+++ b/python/bindings/containers/multidimensional/map.h
@@ -16,6 +16,10 @@ DLL_EXPORT void comma_containers_multidimensional_map_destroy( void* p );
 
 DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, void* size );
 
+// todo? DLL_EXPORT const void* comma_containers_multidimensional_map_free( const void* p, void* size );
+
 DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p );
 
+DLL_EXPORT unsigned int comma_containers_multidimensional_map_count( const void* p );
+
 }
\ No newline at end of file
diff --git a/python/comma/containers/multidimensional/_map.py b/python/comma/containers/multidimensional/_map.py
index 4957373e0..3a23c200e 100644
--- a/python/comma/containers/multidimensional/_map.py
+++ b/python/comma/containers/multidimensional/_map.py
@@ -2,25 +2,40 @@
 
 class Map:
     def __init__( self, key_type, dim, resolution, origin=None, values=None ):
+        self._key_type = key_type
         self._bindings = ctypes.CDLL( ctypes.util.find_library( 'comma_python_bindings' ) )
         self._create = self._bindings.comma_containers_multidimensional_map_create
-        self._create.argtypes = [ ctypes.c_in, ctypes.c_uint, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_uint ]
-        self._create.restype = None # todo? make callable?
+        self._create.argtypes = [ ctypes.c_int, ctypes.c_uint, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_uint ]
+        self._create.restype = ctypes.c_void_p
+        self._at = self._bindings.comma_containers_multidimensional_map_at
+        self._at.argtypes = [ ctypes.c_void_p, ctypes.c_void_p ]
+        self._at.restype = ctypes.c_void_p
+        self._count = self._bindings.comma_containers_multidimensional_map_count
+        self._count.argtypes = [ ctypes.c_void_p ]
+        self._count.restype = ctypes.c_uint
+        self._size = self._bindings.comma_containers_multidimensional_map_count
+        self._size.argtypes = [ ctypes.c_void_p ]
+        self._size.restype = ctypes.c_uint
         key_types = { numpy.int32: 0, numpy.int64: 1, numpy.float32: 2, numpy.float64: 3 }
-        if origin is None: origin = numpy.zero( dim )
+        if origin is None: origin = numpy.zeros( dim )
         assert key_type in key_types, TypeError( f'expected key type in {list(key_types.keys())}; got: {key_type}' )
         self._map = self._create( key_types[key_type]
                         , dim
                         , numpy.array( origin, dtype=key_type ).ctypes.data_as( ctypes.c_void_p )
                         , numpy.array( resolution, dtype=key_type ).ctypes.data_as( ctypes.c_void_p )
-                        , values if isinstance( values, numpy.array ) else numpy.array( [] if values is None else values ).ctypes.data_as( ctypes.c_void_p )
-                        , 0 if value is None else len( values ) )
+                        , numpy.array( [] if values is None else values, dtype=key_type ).ctypes.data_as( ctypes.c_void_p )
+                        , 0 if values is None else len( values ) )
         
-        def __enter__( self ): return self
+    def __enter__( self ): return self
 
-        def __exit__( self, type, value, traceback ):
-            self._bindings.comma_containers_multidimensional_map_destroy( self._map )
+    def __exit__( self, type, value, traceback ): self._bindings.comma_containers_multidimensional_map_destroy( self._map )
 
-        # todo: at()
+    def at( self, points ):
+        # todo: call method
+        # todo: 'cast' pointer to int
+        # todo: make numpy array
+        ...
 
-        # todo: size()
\ No newline at end of file
+    def count( self ): return self._count( self._map )
+    
+    def size( self ): return self._size( self._map )
diff --git a/python/comma/containers/multidimensional/test/test b/python/comma/containers/multidimensional/test/test
new file mode 100755
index 000000000..805e29f9b
--- /dev/null
+++ b/python/comma/containers/multidimensional/test/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+# todo! consolidate pytests
+name=$( basename $0 )
+type -p pytest >/dev/null || { echo "$0: pytest not found; to install run: sudo apt install python3-pytest" >&2; exit 1; }
+pytest 1>&2 && echo "$name: succeeded" >&2 || { echo "$name: failed" >&2; exit 1; }
diff --git a/python/comma/containers/multidimensional/test/test_multidimensional_map.py b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
new file mode 100644
index 000000000..5b1e5a465
--- /dev/null
+++ b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
@@ -0,0 +1,8 @@
+import numpy, pytest
+from comma.containers import multidimensional
+
+def test_multidimensional_map_size():
+    assert multidimensional.Map( numpy.float32, 3, resolution=[1, 1, 1] ).size() == 0
+    assert multidimensional.Map( numpy.float32, 3, resolution=[1, 1, 1] ).count() == 0
+    # todo: debug: assert multidimensional.Map( numpy.float32, 3, resolution=[0.5, 0.5, 0.5], values=[[0, 0, 0], [0, 0, 0], [1, 1, 1]] ).size() == 2
+    assert multidimensional.Map( numpy.float32, 3, resolution=[0.5, 0.5, 0.5], values=[[0, 0, 0], [0, 0, 0], [1, 1, 1]] ).count() == 3
diff --git a/python/comma/dictionary/test/test b/python/comma/dictionary/test/test
index e61bd77fb..805e29f9b 100755
--- a/python/comma/dictionary/test/test
+++ b/python/comma/dictionary/test/test
@@ -1,5 +1,6 @@
 #!/bin/bash
 
+# todo! consolidate pytests
 name=$( basename $0 )
 type -p pytest >/dev/null || { echo "$0: pytest not found; to install run: sudo apt install python3-pytest" >&2; exit 1; }
 pytest 1>&2 && echo "$name: succeeded" >&2 || { echo "$name: failed" >&2; exit 1; }

From 8f3023e21b489aa681568c31cfb5edbca27454f5 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 7 May 2025 09:45:10 +1000
Subject: [PATCH 1037/1056] python: comma.containers.multidimensional.Map: a
 few bugs fixed; testing: in progress...

---
 .../containers/multidimensional/map.cpp       |  2 +-
 .../comma/containers/multidimensional/_map.py | 23 ++++++++++---------
 .../test/test_multidimensional_map.py         | 12 ++++++----
 3 files changed, 20 insertions(+), 17 deletions(-)

diff --git a/python/bindings/containers/multidimensional/map.cpp b/python/bindings/containers/multidimensional/map.cpp
index ed795ee39..2d484b04b 100644
--- a/python/bindings/containers/multidimensional/map.cpp
+++ b/python/bindings/containers/multidimensional/map.cpp
@@ -31,7 +31,7 @@ struct proxy: public base
     {
         if( !p || size == 0 ) { return; }
         const K* q = reinterpret_cast< const K* >( p );
-        for( int i = 0; i < size; ++i, q += sizeof( K ) * Dim * size ) { insert( q, i ); }
+        for( int i = 0; i < size; ++i, q += Dim ) { insert( q, i ); }
     }
 
     ~proxy() { if( _m ) { delete reinterpret_cast< map_t* >( _m ); } }
diff --git a/python/comma/containers/multidimensional/_map.py b/python/comma/containers/multidimensional/_map.py
index 3a23c200e..2b46b5451 100644
--- a/python/comma/containers/multidimensional/_map.py
+++ b/python/comma/containers/multidimensional/_map.py
@@ -1,8 +1,9 @@
 import ctypes, ctypes.util, numpy
 
 class Map:
-    def __init__( self, key_type, dim, resolution, origin=None, values=None ):
-        self._key_type = key_type
+    def __init__( self, resolution, origin=None, values=None ):
+        self._dtype = resolution.dtype
+        # todo: if resolution is not numpy array, try origin; if origin is not numpy array, try values
         self._bindings = ctypes.CDLL( ctypes.util.find_library( 'comma_python_bindings' ) )
         self._create = self._bindings.comma_containers_multidimensional_map_create
         self._create.argtypes = [ ctypes.c_int, ctypes.c_uint, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_uint ]
@@ -13,17 +14,17 @@ def __init__( self, key_type, dim, resolution, origin=None, values=None ):
         self._count = self._bindings.comma_containers_multidimensional_map_count
         self._count.argtypes = [ ctypes.c_void_p ]
         self._count.restype = ctypes.c_uint
-        self._size = self._bindings.comma_containers_multidimensional_map_count
+        self._size = self._bindings.comma_containers_multidimensional_map_size
         self._size.argtypes = [ ctypes.c_void_p ]
         self._size.restype = ctypes.c_uint
-        key_types = { numpy.int32: 0, numpy.int64: 1, numpy.float32: 2, numpy.float64: 3 }
-        if origin is None: origin = numpy.zeros( dim )
-        assert key_type in key_types, TypeError( f'expected key type in {list(key_types.keys())}; got: {key_type}' )
-        self._map = self._create( key_types[key_type]
-                        , dim
-                        , numpy.array( origin, dtype=key_type ).ctypes.data_as( ctypes.c_void_p )
-                        , numpy.array( resolution, dtype=key_type ).ctypes.data_as( ctypes.c_void_p )
-                        , numpy.array( [] if values is None else values, dtype=key_type ).ctypes.data_as( ctypes.c_void_p )
+        key_types = { numpy.dtype( 'int32' ): 0, numpy.dtype( 'int64' ): 1, numpy.dtype( 'float32' ): 2, numpy.dtype( 'float64' ): 3 }
+        if origin is None: origin = numpy.zeros( resolution.shape[0] )
+        assert self._dtype in key_types, TypeError( f'expected key type in {list(key_types.keys())}; got: {self._dtype}' )
+        self._map = self._create( key_types[self._dtype]
+                        , resolution.shape[0]
+                        , numpy.array( origin, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p )
+                        , numpy.array( resolution, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p )
+                        , numpy.array( [] if values is None else values, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p )
                         , 0 if values is None else len( values ) )
         
     def __enter__( self ): return self
diff --git a/python/comma/containers/multidimensional/test/test_multidimensional_map.py b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
index 5b1e5a465..deeeecb10 100644
--- a/python/comma/containers/multidimensional/test/test_multidimensional_map.py
+++ b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
@@ -1,8 +1,10 @@
-import numpy, pytest
+import numpy, pytest, sys
 from comma.containers import multidimensional
 
 def test_multidimensional_map_size():
-    assert multidimensional.Map( numpy.float32, 3, resolution=[1, 1, 1] ).size() == 0
-    assert multidimensional.Map( numpy.float32, 3, resolution=[1, 1, 1] ).count() == 0
-    # todo: debug: assert multidimensional.Map( numpy.float32, 3, resolution=[0.5, 0.5, 0.5], values=[[0, 0, 0], [0, 0, 0], [1, 1, 1]] ).size() == 2
-    assert multidimensional.Map( numpy.float32, 3, resolution=[0.5, 0.5, 0.5], values=[[0, 0, 0], [0, 0, 0], [1, 1, 1]] ).count() == 3
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).size() == 0
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).count() == 0
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]), values=[[0.5, 0.5, 0.5], [0.5, 0.5, 0.5], [0.5, 0.5, 0.5]] ).size() == 1
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]), values=[[0.5, 0.5, 0.5], [0.5, 0.5, 0.5], [0.5, 0.5, 0.5]] ).count() == 3
+    assert multidimensional.Map( resolution=numpy.array([10, 10, 10], dtype=numpy.float32), values=[[1, 2, 3], [4, 5, 6], [7, 8, 9]] ).size() == 1
+    assert multidimensional.Map( resolution=numpy.array([10, 10, 10], dtype=numpy.float32), values=[[1, 2, 3], [4, 5, 6], [7, 8, 9]] ).count() == 3

From 73b99c0831f74b36024da4abda00679274b75321 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 12 May 2025 10:02:22 +1000
Subject: [PATCH 1038/1056] python: comma.containers.multidimensional.Map.at():
 implemented; debugging: in progress...

---
 python/bindings/containers/multidimensional/map.cpp  |  2 +-
 python/bindings/containers/multidimensional/map.h    |  4 ++--
 python/comma/containers/multidimensional/_map.py     | 12 +++++++-----
 .../test/test_multidimensional_map.py                |  3 +++
 4 files changed, 13 insertions(+), 8 deletions(-)

diff --git a/python/bindings/containers/multidimensional/map.cpp b/python/bindings/containers/multidimensional/map.cpp
index 2d484b04b..812deeb38 100644
--- a/python/bindings/containers/multidimensional/map.cpp
+++ b/python/bindings/containers/multidimensional/map.cpp
@@ -120,7 +120,7 @@ DLL_EXPORT void* comma_containers_multidimensional_map_create( int key_type, uns
 
 DLL_EXPORT void comma_containers_multidimensional_map_destroy( void* p ) { delete as_base( p ); }
 
-DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, void* size ) { return as_base( p )->at( p, reinterpret_cast< unsigned int* >( size ) ); }
+DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, const void* k, void* size ) { return as_base( p )->at( k, reinterpret_cast< unsigned int* >( size ) ); }
 
 DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p ) { return as_base( p )->size(); }
 
diff --git a/python/bindings/containers/multidimensional/map.h b/python/bindings/containers/multidimensional/map.h
index aace23216..bce97a0a9 100644
--- a/python/bindings/containers/multidimensional/map.h
+++ b/python/bindings/containers/multidimensional/map.h
@@ -14,12 +14,12 @@ DLL_EXPORT void* comma_containers_multidimensional_map_create( int key_type, uns
 
 DLL_EXPORT void comma_containers_multidimensional_map_destroy( void* p );
 
-DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, void* size );
-
 // todo? DLL_EXPORT const void* comma_containers_multidimensional_map_free( const void* p, void* size );
 
 DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p );
 
 DLL_EXPORT unsigned int comma_containers_multidimensional_map_count( const void* p );
 
+DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, const void* k, void* size );
+
 }
\ No newline at end of file
diff --git a/python/comma/containers/multidimensional/_map.py b/python/comma/containers/multidimensional/_map.py
index 2b46b5451..dbc0b4a4d 100644
--- a/python/comma/containers/multidimensional/_map.py
+++ b/python/comma/containers/multidimensional/_map.py
@@ -17,6 +17,9 @@ def __init__( self, resolution, origin=None, values=None ):
         self._size = self._bindings.comma_containers_multidimensional_map_size
         self._size.argtypes = [ ctypes.c_void_p ]
         self._size.restype = ctypes.c_uint
+        self._at = self._bindings.comma_containers_multidimensional_map_at
+        self._at.argtypes = [ ctypes.c_void_p, ctypes.c_void_p ]
+        self._at.restype = ctypes.c_void_p
         key_types = { numpy.dtype( 'int32' ): 0, numpy.dtype( 'int64' ): 1, numpy.dtype( 'float32' ): 2, numpy.dtype( 'float64' ): 3 }
         if origin is None: origin = numpy.zeros( resolution.shape[0] )
         assert self._dtype in key_types, TypeError( f'expected key type in {list(key_types.keys())}; got: {self._dtype}' )
@@ -31,11 +34,10 @@ def __enter__( self ): return self
 
     def __exit__( self, type, value, traceback ): self._bindings.comma_containers_multidimensional_map_destroy( self._map )
 
-    def at( self, points ):
-        # todo: call method
-        # todo: 'cast' pointer to int
-        # todo: make numpy array
-        ...
+    def at( self, value ):
+        s = ctypes.POINTER( ctypes.c_int )()
+        p = self._at( self._map, numpy.array( value, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p ), s )
+        return None if p is None else numpy.frombuffer( p, dtype=numpy.int32, count=s.values[0] )
 
     def count( self ): return self._count( self._map )
     
diff --git a/python/comma/containers/multidimensional/test/test_multidimensional_map.py b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
index deeeecb10..f5c46aaba 100644
--- a/python/comma/containers/multidimensional/test/test_multidimensional_map.py
+++ b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
@@ -8,3 +8,6 @@ def test_multidimensional_map_size():
     assert multidimensional.Map( resolution=numpy.array([1, 1, 1]), values=[[0.5, 0.5, 0.5], [0.5, 0.5, 0.5], [0.5, 0.5, 0.5]] ).count() == 3
     assert multidimensional.Map( resolution=numpy.array([10, 10, 10], dtype=numpy.float32), values=[[1, 2, 3], [4, 5, 6], [7, 8, 9]] ).size() == 1
     assert multidimensional.Map( resolution=numpy.array([10, 10, 10], dtype=numpy.float32), values=[[1, 2, 3], [4, 5, 6], [7, 8, 9]] ).count() == 3
+
+# def test_multidimensional_map_at():
+#     assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).at( [0, 0, 0] ) is None

From 3de93f0b2d2bff0cca26069bbc72a40e68c5980e Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 12 May 2025 10:49:08 +1000
Subject: [PATCH 1039/1056] python: comma.containers.multidimensional.Map.at():
 implemented; debugging: in progress...

---
 .../containers/multidimensional/map.cpp        | 18 ++++++++++++++++--
 .../comma/containers/multidimensional/_map.py  | 14 ++++++++++----
 .../test/test_multidimensional_map.py          | 12 ++++++++++--
 3 files changed, 36 insertions(+), 8 deletions(-)

diff --git a/python/bindings/containers/multidimensional/map.cpp b/python/bindings/containers/multidimensional/map.cpp
index 812deeb38..89e3e4b8d 100644
--- a/python/bindings/containers/multidimensional/map.cpp
+++ b/python/bindings/containers/multidimensional/map.cpp
@@ -1,3 +1,5 @@
+#include <iostream>
+
 #include <cstdint>
 #include <vector>
 #include "../../../../base/exception.h"
@@ -31,14 +33,26 @@ struct proxy: public base
     {
         if( !p || size == 0 ) { return; }
         const K* q = reinterpret_cast< const K* >( p );
-        for( int i = 0; i < size; ++i, q += Dim ) { insert( q, i ); }
+        for( int i = 0; i < size; ++i, q += Dim ) { insert( q, i ); std::cerr << "==> proxy: a: i: " << i << std::endl; }
     }
 
     ~proxy() { if( _m ) { delete reinterpret_cast< map_t* >( _m ); } }
 
     void insert( const void* k, int v ) { map().touch_at( key( k ) )->second.push_back( v ); }
 
-    const int* at( const void* k, unsigned int* size ) const { const auto& i = map().at( key( k ) ); *size = i == map().end() ? 0 : int( i->second.size() ); return i == map().end() || i->second.empty() ? nullptr : &i->second[0]; }
+    // const int* at( const void* k, unsigned int* size ) const { const auto& i = map().at( key( k ) ); *size = i == map().end() ? 0 : int( i->second.size() ); return i == map().end() || i->second.empty() ? nullptr : &i->second[0]; }
+
+    const int* at( const void* k, unsigned int* size ) const
+    {
+        std::cerr << "==> a" << std::endl;
+        const auto& i = map().at( key( k ) );
+        std::cerr << "==> b" << std::endl;
+        unsigned int s = i == map().end() ? 0 : int( i->second.size() );
+        *size = s;
+        std::cerr << "==> c" << std::endl;
+        if( s > 0 ) { for( auto j: i->second ) { std::cerr << "==> d: j: " << j << std::endl; } }
+        return i == map().end() || i->second.empty() ? nullptr : &i->second[0];
+    }
     
     unsigned int size() const { return map().size(); }
 
diff --git a/python/comma/containers/multidimensional/_map.py b/python/comma/containers/multidimensional/_map.py
index dbc0b4a4d..6f7123e42 100644
--- a/python/comma/containers/multidimensional/_map.py
+++ b/python/comma/containers/multidimensional/_map.py
@@ -1,4 +1,4 @@
-import ctypes, ctypes.util, numpy
+import ctypes, ctypes.util, numpy, sys
 
 class Map:
     def __init__( self, resolution, origin=None, values=None ):
@@ -35,9 +35,15 @@ def __enter__( self ): return self
     def __exit__( self, type, value, traceback ): self._bindings.comma_containers_multidimensional_map_destroy( self._map )
 
     def at( self, value ):
-        s = ctypes.POINTER( ctypes.c_int )()
-        p = self._at( self._map, numpy.array( value, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p ), s )
-        return None if p is None else numpy.frombuffer( p, dtype=numpy.int32, count=s.values[0] )
+        s = numpy.zeros( 1, dtype=numpy.int32 ) # todo: quick and dirty, figure out the right way
+        print( f'==> Map.at(): a: {s[0]=}', file=sys.stderr )
+        p = self._at( self._map, numpy.array( value, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p ), s.ctypes.data_as( ctypes.c_void_p ) )
+        print( f'==> Map.at(): b: {s[0]=} {p=}', file=sys.stderr )
+        if not p is None:
+            print( f'==> Map.at(): c', file=sys.stderr )
+            a = numpy.frombuffer( bytes( p ), dtype=numpy.int32, count=s[0] )
+            print( f'==> Map.at(): d: {a=}', file=sys.stderr )
+        return None if p is None else numpy.frombuffer( bytes( p ), dtype=numpy.int32, count=s[0] )
 
     def count( self ): return self._count( self._map )
     
diff --git a/python/comma/containers/multidimensional/test/test_multidimensional_map.py b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
index f5c46aaba..fdb8dedea 100644
--- a/python/comma/containers/multidimensional/test/test_multidimensional_map.py
+++ b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
@@ -9,5 +9,13 @@ def test_multidimensional_map_size():
     assert multidimensional.Map( resolution=numpy.array([10, 10, 10], dtype=numpy.float32), values=[[1, 2, 3], [4, 5, 6], [7, 8, 9]] ).size() == 1
     assert multidimensional.Map( resolution=numpy.array([10, 10, 10], dtype=numpy.float32), values=[[1, 2, 3], [4, 5, 6], [7, 8, 9]] ).count() == 3
 
-# def test_multidimensional_map_at():
-#     assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).at( [0, 0, 0] ) is None
+def test_multidimensional_map_at():
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).at( [0, 0, 0] ) is None
+    m = multidimensional.Map( resolution=numpy.array([2, 2, 2]), values=[[0.5, 0.5, 0.5], [1, 1, 1], [3, 3, 3]] )
+    assert m.size() == 2
+    assert m.count() == 3
+    # assert m.at( [-1, -1, -1] ) is None
+    # assert m.at( [0, 0, 0] ).all( [0, 1] )
+    # assert m.at( [1, 1, 1] ).all( [0, 1] )
+    # assert m.at( [2, 2, 2] ) == [2]
+    # assert m.at( [5, 5, 5] ) is None
\ No newline at end of file

From b5f73bad20d5e5d5eb9d72c6e7ef931afe13dbba Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 12 May 2025 18:58:50 +1000
Subject: [PATCH 1040/1056] python: comma.containers.multidimensional.Map.at():
 a few bugs fixed, basics tested; Map.at(point, radius): in progress...

---
 .../containers/multidimensional/map.cpp       | 13 +++---------
 .../comma/containers/multidimensional/_map.py | 16 ++++++---------
 .../test/test_multidimensional_map.py         | 20 +++++++++++--------
 3 files changed, 21 insertions(+), 28 deletions(-)

diff --git a/python/bindings/containers/multidimensional/map.cpp b/python/bindings/containers/multidimensional/map.cpp
index 89e3e4b8d..69e753142 100644
--- a/python/bindings/containers/multidimensional/map.cpp
+++ b/python/bindings/containers/multidimensional/map.cpp
@@ -33,25 +33,18 @@ struct proxy: public base
     {
         if( !p || size == 0 ) { return; }
         const K* q = reinterpret_cast< const K* >( p );
-        for( int i = 0; i < size; ++i, q += Dim ) { insert( q, i ); std::cerr << "==> proxy: a: i: " << i << std::endl; }
+        for( int i = 0; i < size; ++i, q += Dim ) { insert( q, i ); }
     }
 
     ~proxy() { if( _m ) { delete reinterpret_cast< map_t* >( _m ); } }
 
     void insert( const void* k, int v ) { map().touch_at( key( k ) )->second.push_back( v ); }
 
-    // const int* at( const void* k, unsigned int* size ) const { const auto& i = map().at( key( k ) ); *size = i == map().end() ? 0 : int( i->second.size() ); return i == map().end() || i->second.empty() ? nullptr : &i->second[0]; }
-
     const int* at( const void* k, unsigned int* size ) const
     {
-        std::cerr << "==> a" << std::endl;
         const auto& i = map().at( key( k ) );
-        std::cerr << "==> b" << std::endl;
-        unsigned int s = i == map().end() ? 0 : int( i->second.size() );
-        *size = s;
-        std::cerr << "==> c" << std::endl;
-        if( s > 0 ) { for( auto j: i->second ) { std::cerr << "==> d: j: " << j << std::endl; } }
-        return i == map().end() || i->second.empty() ? nullptr : &i->second[0];
+        *size = i == map().end() ? 0 : int( i->second.size() );
+        return *size == 0 ? nullptr : &i->second[0];
     }
     
     unsigned int size() const { return map().size(); }
diff --git a/python/comma/containers/multidimensional/_map.py b/python/comma/containers/multidimensional/_map.py
index 6f7123e42..503e304c8 100644
--- a/python/comma/containers/multidimensional/_map.py
+++ b/python/comma/containers/multidimensional/_map.py
@@ -34,16 +34,12 @@ def __enter__( self ): return self
 
     def __exit__( self, type, value, traceback ): self._bindings.comma_containers_multidimensional_map_destroy( self._map )
 
-    def at( self, value ):
-        s = numpy.zeros( 1, dtype=numpy.int32 ) # todo: quick and dirty, figure out the right way
-        print( f'==> Map.at(): a: {s[0]=}', file=sys.stderr )
-        p = self._at( self._map, numpy.array( value, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p ), s.ctypes.data_as( ctypes.c_void_p ) )
-        print( f'==> Map.at(): b: {s[0]=} {p=}', file=sys.stderr )
-        if not p is None:
-            print( f'==> Map.at(): c', file=sys.stderr )
-            a = numpy.frombuffer( bytes( p ), dtype=numpy.int32, count=s[0] )
-            print( f'==> Map.at(): d: {a=}', file=sys.stderr )
-        return None if p is None else numpy.frombuffer( bytes( p ), dtype=numpy.int32, count=s[0] )
+    def at( self, value, radius=None ):
+        if radius is None:
+            s = numpy.zeros( 1, dtype=numpy.int32 ) # todo: quick and dirty, figure out the right way
+            p = self._at( self._map, numpy.array( value, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p ), s.ctypes.data_as( ctypes.c_void_p ) )
+            return None if p is None else numpy.frombuffer( ctypes.string_at( p, s[0] * 4 ), dtype=numpy.int32, count=s[0] )
+        raise NotImplementedError( 'Map.at(...,radius=...): implementing...' )
 
     def count( self ): return self._count( self._map )
     
diff --git a/python/comma/containers/multidimensional/test/test_multidimensional_map.py b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
index fdb8dedea..936cfa2f1 100644
--- a/python/comma/containers/multidimensional/test/test_multidimensional_map.py
+++ b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
@@ -10,12 +10,16 @@ def test_multidimensional_map_size():
     assert multidimensional.Map( resolution=numpy.array([10, 10, 10], dtype=numpy.float32), values=[[1, 2, 3], [4, 5, 6], [7, 8, 9]] ).count() == 3
 
 def test_multidimensional_map_at():
-    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).at( [0, 0, 0] ) is None
-    m = multidimensional.Map( resolution=numpy.array([2, 2, 2]), values=[[0.5, 0.5, 0.5], [1, 1, 1], [3, 3, 3]] )
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).at([0, 0, 0]) is None
+    m = multidimensional.Map( resolution=numpy.array([2, 2, 2], dtype=float), values=[[0, 0, 0], [0.5, 0.5, 0.5], [1, 1, 1], [2, 2, 2], [3, 3, 3]] )
     assert m.size() == 2
-    assert m.count() == 3
-    # assert m.at( [-1, -1, -1] ) is None
-    # assert m.at( [0, 0, 0] ).all( [0, 1] )
-    # assert m.at( [1, 1, 1] ).all( [0, 1] )
-    # assert m.at( [2, 2, 2] ) == [2]
-    # assert m.at( [5, 5, 5] ) is None
\ No newline at end of file
+    assert m.count() == 5
+    assert m.at( [-1, -1, -1] ) is None
+    assert ( m.at( [0, 0, 0] ) == [0, 1, 2] ).all()
+    assert ( m.at( [2, 2, 2] ) == [3, 4] ).all()
+    assert m.at( [5, 5, 5] ) is None
+    # todo
+    # - single point method? or pass multiple points and decide on shape?
+    # - return list of sizes and list of indices
+    # ? profile performance 
+    # print( m.at( [5, 5, 5], radius=3 ), file=sys.stderr )
\ No newline at end of file

From 262153defa26b9a6cc3dae441a282d596cd789b8 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 15 May 2025 10:18:08 +1000
Subject: [PATCH 1041/1056] python: comma.containers.multidimensional.Map.at():
 a few bugs fixed, basics tested; Map.at(point, radius): in progress...

---
 .../containers/multidimensional/map.cpp       | 49 ++++++++++++++++---
 1 file changed, 41 insertions(+), 8 deletions(-)

diff --git a/python/bindings/containers/multidimensional/map.cpp b/python/bindings/containers/multidimensional/map.cpp
index 69e753142..c73e98f99 100644
--- a/python/bindings/containers/multidimensional/map.cpp
+++ b/python/bindings/containers/multidimensional/map.cpp
@@ -21,12 +21,24 @@ class base
         void* _m{nullptr};
 };
 
+template < unsigned int D > struct _traits
+{ 
+    static unsigned int power( unsigned int b ) { return _traits< D - 1 >::power * b; }
+    static void index( std::array< int, D >& a, unsigned int v, int b, unsigned int i = D )
+    {
+        a[ --i ] = v % b - b / 2;
+        if( i > 0 ) { index( a, v / b, i ); }
+    } 
+};
+
+template <> struct _traits< 0 > { static unsigned int power( unsigned int ) { return 1; } };
+
 template < typename K, unsigned int Dim >
 struct proxy: public base
 {
-    typedef comma::containers::multidimensional::map< K, std::vector< int >, Dim > map_t;
-
-    typedef typename map_t::point_type key_t;
+    typedef std::array< K, Dim > key_t;
+    
+    typedef comma::containers::multidimensional::map< K, std::pair< std::vector< int >, std::vector< key_t > >, Dim > map_t;
 
     proxy( const void* o, const void* r, const void* p, int size )
         : base( new map_t( *reinterpret_cast< const key_t* >( o ), *reinterpret_cast< const key_t* >( r ) ) )
@@ -38,18 +50,39 @@ struct proxy: public base
 
     ~proxy() { if( _m ) { delete reinterpret_cast< map_t* >( _m ); } }
 
-    void insert( const void* k, int v ) { map().touch_at( key( k ) )->second.push_back( v ); }
+    void insert( const void* k, int v )
+    {
+        auto i = map().touch_at( key( k ) );
+        i->second.first.push_back( v );
+        i->second.second.push_back( key( k ) );
+    }
 
     const int* at( const void* k, unsigned int* size ) const
     {
-        const auto& i = map().at( key( k ) );
-        *size = i == map().end() ? 0 : int( i->second.size() );
-        return *size == 0 ? nullptr : &i->second[0];
+        auto i = map().at( key( k ) );
+        *size = i == map().end() ? 0 : int( i->second.first.size() );
+        return *size == 0 ? nullptr : &i->second.first[0];
+    }
+
+    const int* nearest( const void* k, unsigned int neighbourhood, unsigned int count, unsigned int* size ) const
+    {
+        auto i = map().index_of( key( k ) );
+        typename map_t::index_type j;
+        int b = neighbourhood * 2 + 1;
+        for( unsigned int k = 0; k < _traits< Dim >::power( b ); ++k )
+        {
+            _traits< Dim >::index( j, k, b );
+            for( unsigned int m = 0; m < Dim; ++m ) { j[m] += i[m]; }
+            auto n = map().find( j );
+            if( n == map().end() ) { continue; }
+            // todo: for( auto s: n->second )
+        }
+        return nullptr;
     }
     
     unsigned int size() const { return map().size(); }
 
-    unsigned int count() const { unsigned int c{0}; for( auto i: map() ) { c += i.second.size(); } return c; }
+    unsigned int count() const { unsigned int c{0}; for( auto i: map() ) { c += i.second.first.size(); } return c; }
 
     map_t& map() { return *reinterpret_cast< map_t* >( _m ); }
 

From 5da710c8cca265cc1f784ca205a4ea154ebb36cb Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Mon, 19 May 2025 09:26:26 +1000
Subject: [PATCH 1042/1056] python:
 comma.containers.multidimensional.Map.nearest(): first basic cut implemented
 and tested

---
 .../containers/multidimensional/map.cpp       | 38 ++++++++++++++-----
 .../containers/multidimensional/map.h         |  2 +
 .../comma/containers/multidimensional/_map.py |  7 ++++
 .../test/test_multidimensional_map.py         | 11 +++++-
 4 files changed, 47 insertions(+), 11 deletions(-)

diff --git a/python/bindings/containers/multidimensional/map.cpp b/python/bindings/containers/multidimensional/map.cpp
index c73e98f99..991043d27 100644
--- a/python/bindings/containers/multidimensional/map.cpp
+++ b/python/bindings/containers/multidimensional/map.cpp
@@ -1,6 +1,7 @@
 #include <iostream>
 
 #include <cstdint>
+#include <limits>
 #include <vector>
 #include "../../../../base/exception.h"
 #include "../../../../containers/multidimensional/map.h"
@@ -15,6 +16,7 @@ class base
         virtual ~base() = default;
         virtual void insert( const void* p, int v ) = 0;
         virtual const int* at( const void* p, unsigned int* size ) const = 0;
+        virtual const int* nearest( const void* k, unsigned int neighbourhood ) const = 0;
         virtual unsigned int count() const = 0;
         virtual unsigned int size() const = 0;
     protected:
@@ -23,11 +25,12 @@ class base
 
 template < unsigned int D > struct _traits
 { 
-    static unsigned int power( unsigned int b ) { return _traits< D - 1 >::power * b; }
-    static void index( std::array< int, D >& a, unsigned int v, int b, unsigned int i = D )
+    static unsigned int power( unsigned int b ) { return _traits< D - 1 >::power( b ) * b; }
+    static std::array< int, D > index( unsigned int v, int b, unsigned int i = D )
     {
-        a[ --i ] = v % b - b / 2;
-        if( i > 0 ) { index( a, v / b, i ); }
+        std::array< int, D > a;
+        for( int i = D - 1; i >= 0; a[i--] = v % b - b / 2, v /= b );
+        return a;
     } 
 };
 
@@ -64,20 +67,33 @@ struct proxy: public base
         return *size == 0 ? nullptr : &i->second.first[0];
     }
 
-    const int* nearest( const void* k, unsigned int neighbourhood, unsigned int count, unsigned int* size ) const
+    // todo: up to a given number of nearest points
+    // todo: all points in radius
+    // todo: multple input points
+    const int* nearest( const void* k, unsigned int neighbourhood ) const
     {
         auto i = map().index_of( key( k ) );
-        typename map_t::index_type j;
         int b = neighbourhood * 2 + 1;
-        for( unsigned int k = 0; k < _traits< Dim >::power( b ); ++k )
+        double s = std::numeric_limits< double >::max();
+        const int* si{nullptr};
+        for( unsigned int p = 0; p < _traits< Dim >::power( b ); ++p )
         {
-            _traits< Dim >::index( j, k, b );
+            typename map_t::index_type j = _traits< Dim >::index( p, b );
             for( unsigned int m = 0; m < Dim; ++m ) { j[m] += i[m]; }
             auto n = map().find( j );
             if( n == map().end() ) { continue; }
-            // todo: for( auto s: n->second )
+            for( unsigned int q = 0; q < n->second.first.size(); ++q )
+            {
+                double t = 0;
+                for( unsigned int m = 0; m < Dim; ++m )
+                { 
+                    double d = key( k )[m] - n->second.second[q][m]; 
+                    t += d * d;
+                }
+                if( t < s ) { s = t; si = &n->second.first[q]; }
+            }
         }
-        return nullptr;
+        return si;
     }
     
     unsigned int size() const { return map().size(); }
@@ -165,3 +181,5 @@ DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p,
 DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p ) { return as_base( p )->size(); }
 
 DLL_EXPORT unsigned int comma_containers_multidimensional_map_count( const void* p ) { return as_base( p )->count(); }
+
+DLL_EXPORT const void* comma_containers_multidimensional_map_nearest( const void* p, const void* k, unsigned int n ) { return as_base( p )->nearest( k, n ); }
\ No newline at end of file
diff --git a/python/bindings/containers/multidimensional/map.h b/python/bindings/containers/multidimensional/map.h
index bce97a0a9..31c396f7f 100644
--- a/python/bindings/containers/multidimensional/map.h
+++ b/python/bindings/containers/multidimensional/map.h
@@ -22,4 +22,6 @@ DLL_EXPORT unsigned int comma_containers_multidimensional_map_count( const void*
 
 DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, const void* k, void* size );
 
+DLL_EXPORT const void* comma_containers_multidimensional_map_nearest( const void* p, const void* k, unsigned int n );
+
 }
\ No newline at end of file
diff --git a/python/comma/containers/multidimensional/_map.py b/python/comma/containers/multidimensional/_map.py
index 503e304c8..448551a09 100644
--- a/python/comma/containers/multidimensional/_map.py
+++ b/python/comma/containers/multidimensional/_map.py
@@ -20,6 +20,9 @@ def __init__( self, resolution, origin=None, values=None ):
         self._at = self._bindings.comma_containers_multidimensional_map_at
         self._at.argtypes = [ ctypes.c_void_p, ctypes.c_void_p ]
         self._at.restype = ctypes.c_void_p
+        self._nearest = self._bindings.comma_containers_multidimensional_map_nearest
+        self._nearest.argtypes = [ ctypes.c_void_p, ctypes.c_void_p, ctypes.c_uint ]
+        self._nearest.restype = ctypes.c_void_p
         key_types = { numpy.dtype( 'int32' ): 0, numpy.dtype( 'int64' ): 1, numpy.dtype( 'float32' ): 2, numpy.dtype( 'float64' ): 3 }
         if origin is None: origin = numpy.zeros( resolution.shape[0] )
         assert self._dtype in key_types, TypeError( f'expected key type in {list(key_types.keys())}; got: {self._dtype}' )
@@ -41,6 +44,10 @@ def at( self, value, radius=None ):
             return None if p is None else numpy.frombuffer( ctypes.string_at( p, s[0] * 4 ), dtype=numpy.int32, count=s[0] )
         raise NotImplementedError( 'Map.at(...,radius=...): implementing...' )
 
+    def nearest( self, value ):
+        n = self._nearest( self._map, numpy.array( value, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p ), 1 ) # todo? radius?
+        return None if n is None else ctypes.cast( n, ctypes.POINTER( ctypes.c_uint ) )[0]
+
     def count( self ): return self._count( self._map )
     
     def size( self ): return self._size( self._map )
diff --git a/python/comma/containers/multidimensional/test/test_multidimensional_map.py b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
index 936cfa2f1..8f3c39306 100644
--- a/python/comma/containers/multidimensional/test/test_multidimensional_map.py
+++ b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
@@ -22,4 +22,13 @@ def test_multidimensional_map_at():
     # - single point method? or pass multiple points and decide on shape?
     # - return list of sizes and list of indices
     # ? profile performance 
-    # print( m.at( [5, 5, 5], radius=3 ), file=sys.stderr )
\ No newline at end of file
+    # print( m.at( [5, 5, 5], radius=3 ), file=sys.stderr )
+
+def test_multidimensional_map_nearest(): # exercises Map.nearest(): result is used as an index into values; None expected for the far point
+    values=[[0, 0, 0], [0.5, 0.5, 0.5], [1, 1, 1], [2, 2, 2], [3, 3, 3]]
+    m = multidimensional.Map( resolution=numpy.array([2, 2, 2], dtype=float), values=values )
+    assert values[ m.nearest( [0, 0, 0] ) ] == [0, 0, 0]
+    assert values[ m.nearest( [0.4, 0.4, 0.4] ) ] == [0.5, 0.5, 0.5]
+    assert values[ m.nearest( [1.4, 1.4, 1.4] ) ] == [1, 1, 1]
+    assert values[ m.nearest( [5, 5, 5] ) ] == [3, 3, 3]
+    assert m.nearest( [7, 7, 7] ) is None

From 3fad0ed784183dc2471bca0535feae1db3339660 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Tue, 20 May 2025 09:17:24 +1000
Subject: [PATCH 1043/1056] python: bindings: trivial comma_free() added

---
 python/bindings/CMakeLists.txt                | 19 +++++++++----------
 .../containers/multidimensional/map.h         |  9 ++-------
 python/bindings/definitions.h                 |  7 +++++++
 python/bindings/memory.cpp                    |  6 ++++++
 python/bindings/memory.h                      | 15 +++++++++++++++
 5 files changed, 39 insertions(+), 17 deletions(-)
 create mode 100644 python/bindings/definitions.h
 create mode 100644 python/bindings/memory.cpp
 create mode 100644 python/bindings/memory.h

diff --git a/python/bindings/CMakeLists.txt b/python/bindings/CMakeLists.txt
index 2efe93e47..005b21bc7 100644
--- a/python/bindings/CMakeLists.txt
+++ b/python/bindings/CMakeLists.txt
@@ -1,19 +1,18 @@
-SET( PROJECT "python_bindings" )
-SET( TARGET_NAME comma_${PROJECT} )
-SET( dir ${SOURCE_CODE_BASE_DIR}/python/bindings )
+set( PROJECT "python_bindings" )
+set( TARGET_NAME comma_${PROJECT} )
+set( dir ${SOURCE_CODE_BASE_DIR}/python/bindings )
 
-FILE( GLOB_RECURSE source ${dir}/*.cpp )
-FILE( GLOB_RECURSE includes ${dir}/*.h )
+file( GLOB_RECURSE source ${dir}/*.cpp )
+file( GLOB_RECURSE includes ${dir}/*.h )
 
-SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} )
+source_group( ${TARGET_NAME} FILES ${source} ${includes} )
 
-ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_source} ${impl_includes} )
-SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
+add_library( ${TARGET_NAME} ${source} ${includes} )
+set_target_properties( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 target_link_libraries( ${TARGET_NAME} comma_base ${comma_ALL_EXTERNAL_LIBRARIES} )
 
 # INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ )
-# INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
-INSTALL(
+install(
     TARGETS ${TARGET_NAME}
     RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
     LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
diff --git a/python/bindings/containers/multidimensional/map.h b/python/bindings/containers/multidimensional/map.h
index 31c396f7f..c11b4b481 100644
--- a/python/bindings/containers/multidimensional/map.h
+++ b/python/bindings/containers/multidimensional/map.h
@@ -1,10 +1,7 @@
 #pragma once
 
-#ifdef _WIN32
-#define DLL_EXPORT __declspec( dllexport )
-#else
-#define DLL_EXPORT
-#endif
+#include "../../definitions.h"
+#include "../../memory.h"
 
 extern "C" {
 
@@ -14,8 +11,6 @@ DLL_EXPORT void* comma_containers_multidimensional_map_create( int key_type, uns
 
 DLL_EXPORT void comma_containers_multidimensional_map_destroy( void* p );
 
-// todo? DLL_EXPORT const void* comma_containers_multidimensional_map_free( const void* p, void* size );
-
 DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p );
 
 DLL_EXPORT unsigned int comma_containers_multidimensional_map_count( const void* p );
diff --git a/python/bindings/definitions.h b/python/bindings/definitions.h
new file mode 100644
index 000000000..f68b7134b
--- /dev/null
+++ b/python/bindings/definitions.h
@@ -0,0 +1,7 @@
+#pragma once
+
+#ifdef _WIN32
+#define DLL_EXPORT __declspec( dllexport )
+#else
+#define DLL_EXPORT
+#endif
diff --git a/python/bindings/memory.cpp b/python/bindings/memory.cpp
new file mode 100644
index 000000000..66eeda4d6
--- /dev/null
+++ b/python/bindings/memory.cpp
@@ -0,0 +1,6 @@
+#pragma once
+
+#include <stdlib.h>
+#include "memory.h"
+
+DLL_EXPORT void comma_free( void* p ) { ::free( p ); }
diff --git a/python/bindings/memory.h b/python/bindings/memory.h
new file mode 100644
index 000000000..aa43287b4
--- /dev/null
+++ b/python/bindings/memory.h
@@ -0,0 +1,15 @@
+#pragma once
+
+#include "definitions.h"
+
+#ifdef _WIN32
+#define DLL_EXPORT __declspec( dllexport )
+#else
+#define DLL_EXPORT
+#endif
+
+extern "C" {
+
+DLL_EXPORT void comma_free( void* p );
+
+}

From 4907eeab0aec695964c439cdbde4b7761c7b2dbc Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 22 May 2025 02:41:57 +0000
Subject: [PATCH 1044/1056] csv/impl/to_ascii.h: optional-related compile
 warning fixed

---
 csv/impl/to_ascii.h | 10 ++++------
 1 file changed, 4 insertions(+), 6 deletions(-)

diff --git a/csv/impl/to_ascii.h b/csv/impl/to_ascii.h
index 936a07412..37f44cee3 100644
--- a/csv/impl/to_ascii.h
+++ b/csv/impl/to_ascii.h
@@ -29,8 +29,7 @@
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_IMPL_TOASCII_HEADER_GUARD_
-#define COMMA_CSV_IMPL_TOASCII_HEADER_GUARD_
+#pragma once
 
 #include <vector>
 #include <boost/date_time/posix_time/posix_time.hpp>
@@ -40,6 +39,7 @@
 #include <boost/shared_ptr.hpp>
 #include <boost/type_traits.hpp>
 #include "../../base/exception.h"
+#include "../../base/none.h"
 #include "../../string/string.h"
 #include "../../visiting/visit.h"
 #include "../../visiting/while.h"
@@ -84,8 +84,8 @@ class to_ascii
         const std::vector< boost::optional< std::size_t > >& indices_;
         std::vector< std::string >& row_;
         std::size_t index_;
-        boost::optional< unsigned int > precision_;
-        boost::optional< char > quote_;
+        boost::optional< unsigned int > precision_{ comma::silent_none< unsigned int >() };
+        boost::optional< char > quote_{ comma::silent_none< char >() };
 
         std::string as_string_( const boost::posix_time::ptime& v ) { return to_iso_string( v ); }
         std::string as_string_( const std::string& v ) { return quote_ ? *quote_ + v + *quote_ : v; } // todo: escape/unescape
@@ -157,5 +157,3 @@ inline void to_ascii::apply_final( const K&, const T& value )
 }
 
 } } } // namespace comma { namespace csv { namespace impl {
-
-#endif // #ifndef COMMA_CSV_IMPL_TOASCII_HEADER_GUARD_

From b11cb959d80f2d3094ce819075d74d53bec13272 Mon Sep 17 00:00:00 2001
From: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 22 May 2025 02:46:34 +0000
Subject: [PATCH 1045/1056] name-value-to-csv: compile warning fixed

---
 name_value/applications/name-value-to-csv.cpp | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index 19ebb77db..5133a5120 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -10,6 +10,7 @@
 #include <unordered_set>
 #include <boost/optional.hpp>
 #include "../../application/command_line_options.h"
+#include "../../base/none.h"
 #include "../../string/string.h"
 #include "../../xpath/xpath.h"
 
@@ -117,7 +118,7 @@ int main( int ac, char** av )
         std::string prefix = options.value< std::string >( "--prefix,--path,-p", "" );
         values_t values; // quick and dirty; watch performance?
         std::map< unsigned int, values_t > map;
-        boost::optional< unsigned int > index;
+        boost::optional< unsigned int > index{ comma::silent_none< unsigned int >() };
         std::string key;
         bool is_map = options.exists( "--dict,--map" );
         if( is_map && unsorted ) { comma::say() << "combination of --map and --unsorted: todo, just ask" << std::endl; return 1; }

From 247c89fa12a3179f57543f2305eecbae7735d858 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 22 May 2025 19:24:01 +1000
Subject: [PATCH 1046/1056] csv-random: shuffle: std::random_shuffle() replaced
 with std::shuffle() since the former is deprecated and will be removed -
 supposedly from c++17, but gcc seems to still support it

---
 csv/applications/csv-random.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
index 2d6aeb476..745b0c2e8 100644
--- a/csv/applications/csv-random.cpp
+++ b/csv/applications/csv-random.cpp
@@ -370,10 +370,11 @@ template < typename Engine > static int run_impl( const comma::command_line_opti
         {
             if( !records.empty() )
             {
-                std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
+                //std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
                 indices.resize( records.size() ); // quick and dirty
                 for( unsigned int i = 0; i < indices.size(); ++i ) { indices[i] = i; }
-                std::random_shuffle( indices.begin(), indices.end(), [&]( int ) -> int { return distribution( engine ); } ); // quick and dirty, watch performance
+                // deprecated: std::random_shuffle( indices.begin(), indices.end(), [&]( int ) -> int { return distribution( engine ); } ); // quick and dirty, watch performance
+                std::shuffle( indices.begin(), indices.end(), engine );
                 unsigned int s = sample ? ( ratio ? int( records.size() * *ratio ) : size ) : records.size();
                 if( sample ) { std::sort( indices.begin(), indices.begin() + s ); } // quick and dirty
                 for( unsigned int i = 0; i < s; ++i ) { std::cout.write( &records[indices[i]][0], records[indices[i]].size() ); }

From 11b949528c03388e4cd31da1e721231fe13b6a21 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 22 May 2025 19:24:34 +1000
Subject: [PATCH 1047/1056] csv-join, csv-update: compile warnings fixed
 (somewhat)

---
 csv/applications/csv-join.cpp   | 2 +-
 csv/applications/csv-update.cpp | 8 ++++----
 2 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index 9bad81d5b..24d82e877 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -372,7 +372,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         if( filter_id_fields_discard ) { filter_id_fields_flags.resize( w.size(), 0 ); }
         bool got_state = false;
         bool got_next_state = false;
-        std::size_t filter_state_index;
+        std::size_t filter_state_index{0};
         for( std::size_t k = 0; k < w.size() && ( !got_state || !got_next_state ); ++k ) 
         {
             if( w[k] == "state" ) { got_state = true; filter_state_index = k; continue; }
diff --git a/csv/applications/csv-update.cpp b/csv/applications/csv-update.cpp
index decefba96..32b09b537 100644
--- a/csv/applications/csv-update.cpp
+++ b/csv/applications/csv-update.cpp
@@ -119,7 +119,7 @@ struct input_t
 {
     comma::csv::impl::unstructured key;
     comma::csv::impl::unstructured value;
-    comma::uint32 block;
+    comma::uint32 block{0};
 
     input_t() : block( 0 ) {}
     input_t( comma::csv::impl::unstructured key, comma::csv::impl::unstructured value, comma::uint32 block ): key( key ), value( value ), block( block ) {}
@@ -131,8 +131,8 @@ struct map_t
 {
     struct value_type
     {
-        unsigned int index;
-        input_t value;
+        unsigned int index{0};
+        input_t value{};
         std::string string;
 
         value_type() {}
@@ -171,7 +171,7 @@ static bool last_block = false;
 static bool last_only = false;
 static bool matched_only = false;
 static bool update_non_empty = false;
-static input_t default_input;
+static input_t default_input{};
 static comma::csv::impl::unstructured empty;
 static boost::optional< comma::csv::impl::unstructured > erase;
 static map_t::type filter_map;

From 936030fb044e8977558a40d25ef7724429613049 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 28 May 2025 19:39:30 +1000
Subject: [PATCH 1048/1056] application: command_line_options: annoying compile
 warnings fixed

---
 application/command_line_options.cpp | 3 +--
 application/command_line_options.h   | 5 +++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 91f1af574..9a3807046 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -15,7 +15,6 @@
 #include <boost/optional.hpp>
 #include <boost/regex.hpp>
 #include <boost/spirit/include/qi.hpp>
-#include "../base/exception.h"
 #include "../io/impl/filesystem.h"
 #include "../string/split.h"
 #include "command_line_options.h"
@@ -166,7 +165,7 @@ void command_line_options::_fill_map( const std::vector< std::string >& v )
     {
         if( v[i].length() < 2 || v[i].at( 0 ) != '-') { continue; }
         std::string name;
-        boost::optional< std::string > value;
+        boost::optional< std::string > value = comma::silent_none< std::string >();
         std::size_t equal = v[i].find_first_of( '=' );
         if( equal == std::string::npos )
         {
diff --git a/application/command_line_options.h b/application/command_line_options.h
index ca3f51270..f257cbd10 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -13,6 +13,7 @@
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
 #include "../base/exception.h"
+#include "../base/none.h"
 #include "../io/terminal.h"
 #include "../string/string.h"
 #include "verbose.h" // todo: deprecate
@@ -155,7 +156,7 @@ class command_line_options
             std::vector< std::string > names;
             bool is_optional;
             bool has_value;
-            boost::optional< std::string > default_value; // todo: make strongly typed
+            boost::optional< std::string > default_value{ comma::silent_none< std::string >() }; // todo: make strongly typed
             std::string help;
 
             /// default constructor
@@ -231,7 +232,7 @@ template < typename T >
 inline boost::optional< T > command_line_options::optional( const std::string& name ) const
 {
     std::vector< T > v = values< T >( name );
-    return v.empty() ? boost::optional< T >() : boost::optional< T >( v[0] );
+    return v.empty() ? comma::silent_none< T >() : boost::optional< T >( v[0] );
 }
 
 template < typename T >

From d2897b2b9abb6ddfb225464881f82917113fe60f Mon Sep 17 00:00:00 2001
From: Dave Jennings <dave.jennings@missionsystems.com.au>
Date: Fri, 30 May 2025 14:46:21 +1000
Subject: [PATCH 1049/1056] command_line_options.h: change brace-initialization
 to equals

to avoid the most vexing parse which confuses gcc 9
https://en.wikipedia.org/wiki/Most_vexing_parse
---
 application/command_line_options.h | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/application/command_line_options.h b/application/command_line_options.h
index f257cbd10..ea0817879 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -156,7 +156,7 @@ class command_line_options
             std::vector< std::string > names;
             bool is_optional;
             bool has_value;
-            boost::optional< std::string > default_value{ comma::silent_none< std::string >() }; // todo: make strongly typed
+            boost::optional< std::string > default_value = comma::silent_none< std::string >(); // todo: make strongly typed
             std::string help;
 
             /// default constructor

From 31d1ba174f1280c06b44f2409ae79fa0fc16638f Mon Sep 17 00:00:00 2001
From: Rex Crisp <rex.crisp@missionsystems.com.au>
Date: Thu, 11 Sep 2025 08:58:15 +1000
Subject: [PATCH 1050/1056] io/stream: fix istreams EOF behaviour and read
 logic  - eof() returns true only when all files are exhausted  - read() only
 advances to next file when current file reaches EOF  - test cases for
 istreams behaviour with single and multiple files

---
 io/stream.cpp           |  5 ++-
 io/test/stream_test.cpp | 89 +++++++++++++++++++++++++++++++++++++++++
 2 files changed, 92 insertions(+), 2 deletions(-)

diff --git a/io/stream.cpp b/io/stream.cpp
index 8a4d3de2f..fab2b1ab1 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -399,7 +399,7 @@ istreams::istreams( const std::vector< std::string >& names, mode::value mode, m
 {
 }
 
-bool istreams::eof() const { return _index >= _names.size() || _index == _names.size() - 1 || ( *_istream )->eof(); }
+bool istreams::eof() const { return _index >= _names.size(); }
 
 istreams& istreams::operator++()
 {
@@ -412,11 +412,12 @@ istreams& istreams::operator++()
 bool istreams::read( char* buf, std::size_t size )
 {
     std::size_t s = size;
-    for( char* p = buf; s > 0 && !eof(); ++( *this ) )
+    for( char* p = buf; s > 0 && !eof(); )
     {
         auto& is = *( *_istream );
         is.read( p, s );
         if( is.gcount() > 0 ) { s -= is.gcount(); p += is.gcount(); }
+        if( !is.good() ) { ++( *this ); } // short read (eof) or stream error: move on; a failed stream without eofbit would otherwise spin here forever
     }
     return s == 0;
 }
diff --git a/io/test/stream_test.cpp b/io/test/stream_test.cpp
index 1b8cc0b98..30adc818e 100644
--- a/io/test/stream_test.cpp
+++ b/io/test/stream_test.cpp
@@ -38,6 +38,95 @@ TEST( io, file_stream )
     EXPECT_EQ( system( "rm ./test.pipe" ), 0 );
 }
 
+TEST(io, istreams) {
+    std::vector<std::string> files = { "./file1.txt" };
+
+    // --- single file ---
+    {
+        std::ofstream os1(files[0]);
+        os1 << "abc";
+        os1.close();
+
+        comma::io::istreams single(files);
+
+        char buf1[4] = {0};
+
+        // partial read
+        bool ok = single.read(buf1, 2);
+        EXPECT_TRUE(ok);
+        EXPECT_EQ(buf1[0], 'a');
+        EXPECT_EQ(buf1[1], 'b');
+        EXPECT_FALSE(single.eof()); // not at EOF yet
+
+        // read the remainder
+        ok = single.read(buf1 + 2, 1);
+        EXPECT_TRUE(ok);
+        EXPECT_EQ(buf1[2], 'c');
+        EXPECT_FALSE(single.eof()); // EOF not flagged until next attempt
+
+        // attempt to read past EOF
+        ok = single.read(buf1, 1);
+        EXPECT_FALSE(ok);
+        EXPECT_TRUE(single.eof());
+
+        // edge case: zero-size read should succeed and not change EOF
+        ok = single.read(buf1, 0);
+        EXPECT_TRUE(ok);
+        EXPECT_TRUE(single.eof());
+    }
+
+    // --- multiple files ---
+    {
+        files.emplace_back("./file2.txt");
+        std::ofstream os2(files[1]);
+        os2 << "def";
+        os2.close();
+
+        files.emplace_back("./file3.txt");
+        std::ofstream os3(files[2]);
+        os3 << "ghi";
+        os3.close();
+
+        comma::io::istreams multi(files);
+
+        char buf2[10] = {0};
+
+        // first file, partial read
+        bool ok = multi.read(buf2, 3);
+        EXPECT_TRUE(ok);
+        EXPECT_EQ(buf2[0], 'a');
+        EXPECT_EQ(buf2[1], 'b');
+        EXPECT_EQ(buf2[2], 'c');
+        EXPECT_FALSE(multi.eof());
+
+        // read across files 1 -> 2 -> 3
+        ok = multi.read(buf2 + 3, 5);
+        EXPECT_TRUE(ok);
+        EXPECT_EQ(buf2[3], 'd');
+        EXPECT_EQ(buf2[4], 'e');
+        EXPECT_EQ(buf2[5], 'f');
+        EXPECT_EQ(buf2[6], 'g');
+        EXPECT_EQ(buf2[7], 'h');
+        EXPECT_FALSE(multi.eof());
+
+        // read remainder, but request too many
+        ok = multi.read(buf2 + 8, 3); // only 'i' available
+        EXPECT_FALSE(ok);             // not enough to fill request
+        EXPECT_EQ(buf2[8], 'i');
+        EXPECT_EQ(buf2[9], '\0');     // untouched
+        EXPECT_TRUE(multi.eof());
+
+        // edge case: further reads must stay at EOF
+        ok = multi.read(buf2, 1);
+        EXPECT_FALSE(ok);
+        EXPECT_TRUE(multi.eof());
+    }
+
+    // cleanup
+    for (const auto& f : files) { comma::filesystem::remove(f); }
+}
+
+
 TEST( io, std_stream )
 {
     comma::io::istream istream( "-" );

From 2f4f55c8e688110c7be5624a242f2deeb599fc7c Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 6 Nov 2025 11:54:16 +1100
Subject: [PATCH 1051/1056] system/ansible: removed pip install numpy; added
 apt install python3-numpy

---
 system/ansible/install.yml | 7 +------
 1 file changed, 1 insertion(+), 6 deletions(-)

diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index 3be479b03..c15ebf66a 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -12,7 +12,7 @@
   - name: "install comma dependencies"
     become: true
     apt:
-        pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-pip', 'libprocps-dev', 'recode']
+        pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-pip', 'python3-numpy', 'libproc2-dev', 'recode']
         state: present
         update_cache: yes
 
@@ -23,11 +23,6 @@
         state: present
         update_cache: yes
 
-  - name: "install python dependencies using pip"
-    become: true
-    pip:
-        name: numpy
-
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory
     with_items:

From fb97a238eec3e48522eeaf1f7b15beeb3a3c7030 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 6 Nov 2025 12:07:17 +1100
Subject: [PATCH 1052/1056] a few compilation warnings fixed; a few boost
 dependencies removed

---
 base/variant.h                |  4 ++--
 csv/applications/csv-join.cpp | 15 +++++++--------
 python/bindings/memory.cpp    |  2 --
 3 files changed, 9 insertions(+), 12 deletions(-)

diff --git a/base/variant.h b/base/variant.h
index 5d0989c8b..5d2b822bd 100644
--- a/base/variant.h
+++ b/base/variant.h
@@ -118,8 +118,8 @@ struct named_variant : public variant< Args... >, public Names
 {
     typedef Names names_t;
     typedef variant< Args... > variant_t;
-    template < typename S > static const std::string& name_of() { return Names::names()[ variant_t::template index_of< S >() ]; }
-    const auto& name() const { COMMA_ASSERT( bool( *this ), "asked for name, but value is not set" ); return this->names()[this->index()]; }
+    template < typename S > static auto name_of() { return Names::names()[ variant_t::template index_of< S >() ]; }
+    auto name() const { COMMA_ASSERT( bool( *this ), "asked for name, but value is not set" ); return this->names()[this->index()]; }
 };
 
 template < typename Names >
diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index 24d82e877..39fab1839 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -4,18 +4,17 @@
 /// @author vsevolod vlaskine
 
 #include <string.h>
+#include <functional>
 #include <iostream>
 #include <map>
 #include <sstream>
 #include <string>
 #include <type_traits>
+#include <unordered_map>
 #include <vector>
-#include <boost/array.hpp>
 #include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/functional/hash.hpp>
-#include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
-#include <boost/unordered_map.hpp>
 #include "../../application/command_line_options.h"
 #include "../../application/signal_flag.h"
 #include "../../base/exception.h"
@@ -188,7 +187,7 @@ struct input
         return comma::math::less( keys[0], rhs.keys[0] ); //, *radius );
     }
 
-    struct hash : public std::unary_function< input, std::size_t >
+    struct hash // no base class: std::unordered_map only needs the operator()( input const& ) const below
     {
         std::size_t operator()( input const& p ) const
         {
@@ -198,7 +197,7 @@ struct input
         }
     };
 
-    typedef boost::unordered_map< input, std::vector< std::string >, hash > unordered_map;
+    typedef std::unordered_map< input, std::vector< std::string >, hash > unordered_map;
     typedef std::map< input, std::vector< std::string > > map;
 };
 
@@ -393,8 +392,8 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
                 if( !w[k].empty() && w[k] != "block" ) { no_filter_key_fields = false; }
                 if( filter_id_fields_discard && w[k] == "block" ) { filter_id_fields_flags[k] = 1; }
                 if( v[i] != w[k] ) { continue; }
-                v[i] = "keys[" + boost::lexical_cast< std::string >( default_input_keys_count ) + "]";
-                w[k] = "keys[" + boost::lexical_cast< std::string >( default_input_keys_count ) + "]";
+                v[i] = "keys[" + std::to_string( default_input_keys_count ) + "]";
+                w[k] = "keys[" + std::to_string( default_input_keys_count ) + "]";
                 if( filter_id_fields_discard ) { filter_id_fields_flags[k] = 1; }
                 ++default_input_keys_count;
             }
@@ -419,7 +418,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         if( is_state_machine )
         {
             state_index = default_input_keys_count;
-            w[filter_state_index] = "keys[" + boost::lexical_cast< std::string >( state_index ) + "]";
+            w[filter_state_index] = "keys[" + std::to_string( state_index ) + "]";
             ++default_input_keys_count;
         }
         default_input.keys.resize( default_input_keys_count );
diff --git a/python/bindings/memory.cpp b/python/bindings/memory.cpp
index 66eeda4d6..5f971db25 100644
--- a/python/bindings/memory.cpp
+++ b/python/bindings/memory.cpp
@@ -1,5 +1,3 @@
-#pragma once
-
 #include <stdlib.h>
 #include "memory.h"
 

From a7a1cd9bbbf2a71f39acce77087c3fe1ba89e344 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 6 Nov 2025 12:07:35 +1100
Subject: [PATCH 1053/1056] system/ansible/install.yml: libyaml-dev added

---
 system/ansible/install.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index c15ebf66a..4ede9cf02 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -12,7 +12,7 @@
   - name: "install comma dependencies"
     become: true
     apt:
-        pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-pip', 'python3-numpy', 'libproc2-dev', 'recode']
+        pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-pip', 'python3-numpy', 'libproc2-dev', 'libyaml-dev', 'recode']
         state: present
         update_cache: yes
 

From 229ad7f69d3f2183c2c8ca7f2f04452af6720559 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Wed, 26 Nov 2025 16:11:51 +1100
Subject: [PATCH 1054/1056] cmake: minimum required version made dependent on
 the current cmake version for backward compatibility as cmake 4 has
 discontinued support for anything less than 3.5

---
 CMakeLists.txt | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 357da2d9d..9bc598eaf 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -8,7 +8,11 @@ if( USE_ARM_TOOLCHAIN )
     include( ${CMAKE_TOOLCHAIN_FILE} REQUIRED )
 endif( USE_ARM_TOOLCHAIN )
 
-cmake_minimum_required( VERSION 3.1 )
+if( ${CMAKE_MAJOR_VERSION} LESS 4 )
+    cmake_minimum_required( VERSION 3.1 )
+else()
+    cmake_minimum_required( VERSION 3.5 )
+endif()
 cmake_policy( SET CMP0048 NEW )
 project( comma VERSION 1.1.0 LANGUAGES CXX )
 if( NOT DEFINED CMAKE_PROJECT_VERSION )

From fbbe9eb636e681ce1b594f47aca69428042a89e3 Mon Sep 17 00:00:00 2001
From: vsevolod vlaskine <vsevolod.vlaskine@gmail.com>
Date: Thu, 11 Dec 2025 17:28:46 +1100
Subject: [PATCH 1055/1056] io-publish: --exec: SIGPIPE signal handler restored
 to default just before running execlp(); otherwise pipelines like
 yes|csv-thin|csv-time-stamp do not exit if csv-time-stamp crashes (or is
 killed); the reason is that lots of applications (in comma and snark anyway)
 don't enable SIGPIPE handler explicitly and rely on default, which is
 inherited from the process calling exec

---
 io/applications/io-publish.cpp | 17 +++++++++++++++++
 1 file changed, 17 insertions(+)

diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index 70b0ad760..0f46d6d86 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -111,6 +111,23 @@ class command
                 while( ( dup2( fd[1], STDOUT_FILENO ) == -1 ) && ( errno == EINTR ) ) {} // connect pipe input to stdout in child
                 ::close( fd[1] );     // no longer need fd[1], now that it's duped
                 ::close( fd[0] );     // don't need pipe output in the child
+                // quick and dirty as impl/publisher.cpp sets the SIGPIPE handler to ignore
+                // the clean way would be to handle it correctly in impl/publisher.cpp, but
+                // that might be too fiddly for now
+                //
+                // failure example:
+                //     io-publish tcp:1234 --exec "yes | csv-thin --period 0.1 | csv-time-stamp"
+                //     killall csv-time-stamp
+                //     then, if you comment the SIGPIPE-related code below, csv-thin
+                //     will ignore SIGPIPE as exec environment inherits the ignore SIGPIPE
+                //     handler
+                // also, all applications in comma and snark would benefit from setting
+                // the SIGPIPE handling explicitly to avoid similar problems in future
+                struct sigaction new_action{}, old_action{}; // zero-initialised: sa_flags is never assigned below and must not reach sigaction() indeterminate
+                new_action.sa_handler = SIG_DFL;
+                sigemptyset( &new_action.sa_mask );
+                sigaction( SIGPIPE, NULL, &old_action );
+                sigaction( SIGPIPE, &new_action, NULL );
                 ::execlp( "bash", "bash", "-c", &command_[0], NULL );
                 comma::say() << "failed to exec child: errno " << comma::last_error::value() << " - " << comma::last_error::to_string() << std::endl;
                 exit( 1 );

From 4e37c310d1ee7af96a3ca09f6a85c60bc05dfdb3 Mon Sep 17 00:00:00 2001
From: mimhoff <matthew@mimhoff.com>
Date: Fri, 19 Dec 2025 16:55:34 +1100
Subject: [PATCH 1056/1056] add build to .gitignore

---
 .gitignore | 1 +
 1 file changed, 1 insertion(+)

diff --git a/.gitignore b/.gitignore
index 50b820a33..d1bce2041 100644
--- a/.gitignore
+++ b/.gitignore
@@ -14,3 +14,4 @@ compile_commands.json
 .ycm_extra_conf.py
 python/comma_py.egg-info/
 python/dist/
+build