diff --git a/.gitignore b/.gitignore
index ebaa5be7f..d1bce2041 100644
--- a/.gitignore
+++ b/.gitignore
@@ -12,3 +12,6 @@ doc/generated
 tags
 compile_commands.json
 .ycm_extra_conf.py
+python/comma_py.egg-info/
+python/dist/
+build
diff --git a/AUTHORS b/AUTHORS
index 53aaa505a..b3ae456ea 100644
--- a/AUTHORS
+++ b/AUTHORS
@@ -1,4 +1,4 @@
-  Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
-  Cedric Wohlleber <c.wohlleber@acfr.usyd.edu.au>
-  Matthew Herrmann <matthewinrandwick@gmail.com>
-  James Underwood <j.underwood@acfr.usyd.edu.au>
+Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
+Cedric Wohlleber <c.wohlleber@acfr.usyd.edu.au>
+Matthew Herrmann <matthewinrandwick@gmail.com>
+James Underwood <j.underwood@acfr.usyd.edu.au>
diff --git a/CMakeFiles/FindComma.cmake b/CMakeFiles/FindComma.cmake
index 599c3f7f9..12ec30316 100644
--- a/CMakeFiles/FindComma.cmake
+++ b/CMakeFiles/FindComma.cmake
@@ -3,10 +3,10 @@
 # The following variables are set if comma is found.
 #  comma_FOUND         - Set to true when comma is found.
 #  comma_USE_FILE      - CMake file to use comma.
-#  comma_MAJOR_VERSION - The comma major version number.
-#  comma_MINOR_VERSION - The comma minor version number
+#  comma_version_major - The comma major version number.
+#  comma_version_minor - The comma minor version number
 #                       (odd non-release).
-#  comma_BUILD_VERSION - The comma patch level
+#  comma_version_patch - The comma patch level
 #                       (meaningless for odd minor).
 #  comma_INCLUDE_DIRS  - Include directories for comma
 #  comma_LIBRARY_DIRS  - Link directories for comma libraries
@@ -85,4 +85,3 @@ ENDIF ( comma_FOUND )
 IF( NOT comma_FOUND )
   MESSAGE(FATAL_ERROR ${comma_DIR_MESSAGE})
 ENDIF( NOT comma_FOUND )
-
diff --git a/CMakeFiles/check.c++.standard.cmake b/CMakeFiles/check.c++.standard.cmake
index fd1942322..f17089638 100644
--- a/CMakeFiles/check.c++.standard.cmake
+++ b/CMakeFiles/check.c++.standard.cmake
@@ -1,7 +1,7 @@
-    SET( CXX_STANDARDS "0x;11;14;17" CACHE STRING "list of known c++ standards" )
+    SET( CXX_STANDARDS "0x;11;14;17;20" CACHE STRING "list of known c++ standards" )
     MARK_AS_ADVANCED( FORCE CXX_STANDARDS )
     STRING( REGEX REPLACE ";" "," CXX_STANDARDS_READABLE "${CXX_STANDARDS}" )
-    SET( CXX_STANDARD_DEFAULT "11" CACHE STRING "default c++ standard to use" )
+    SET( CXX_STANDARD_DEFAULT "17" CACHE STRING "default c++ standard to use" )
     MARK_AS_ADVANCED( FORCE CXX_STANDARD_DEFAULT )
     SET( CXX_STANDARD_TO_USE "${CXX_STANDARD_DEFAULT}" CACHE STRING "c++ standard to use (one of ${CXX_STANDARDS_READABLE})" )
     SET_PROPERTY( CACHE CXX_STANDARD_TO_USE PROPERTY STRINGS ${CXX_STANDARDS} )
@@ -17,7 +17,6 @@
 	 MARK_AS_ADVANCED( FORCE CXX_STANDARD_FLAGS )
     ENDIF()
 
-    # A much better way to do this is with CXX_STANDARD but that requires CMake 3.1
     include( CheckCXXCompilerFlag )
     IF( ${CXX_STANDARD_TO_USE} MATCHES "0x" )
         message( WARNING "
@@ -28,27 +27,22 @@
  #########################################################################
 " )
     ENDIF()
-    FOREACH( STANDARD ${CXX_STANDARDS} )
-        # message( "Check if using C++${STANDARD}" )
-        IF( ${CXX_STANDARD_TO_USE} MATCHES "${STANDARD}" )
-            # message( "Yes, using C++${STANDARD}" )
-            IF( NOT ( ${CXX_STANDARD_TO_USE} MATCHES ${CXX_STANDARD_LAST} ) )
-                # message( "Have to check if ${CMAKE_CXX_COMPILER} supports C++${STANDARD}" )
-                message( "Attempt to use C++ standard ${STANDARD}" )
-		UNSET( compiler_supports_standard CACHE )
-		UNSET( compiler_flag_to_check CACHE )
-		SET( compiler_flag_to_check "-std=c++${STANDARD}" )
-		if ( CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND ${STANDARD} MATCHES "11" )
-		    set( compiler_flag_to_check "${compiler_flag_to_check} -Wc++11-narrowing" )
-		endif()
-		CHECK_CXX_COMPILER_FLAG( "${compiler_flag_to_check}" compiler_supports_standard )
-		if( NOT compiler_supports_standard )
-		    message( FATAL_ERROR "attempt to use C++ standard ${STANDARD} but ${CMAKE_CXX_COMPILER} does not support it" )
-		endif()
-                STRING( REPLACE " ${CXX_STANDARD_FLAGS}" "" CXX_FLAGS_NO_STANDARD "${CMAKE_CXX_FLAGS}" )
-		SET( CXX_STANDARD_FLAGS ${compiler_flag_to_check} CACHE STRING "updating compiler flags selecting C++ standard" FORCE )
-		SET( CXX_STANDARD_LAST ${CXX_STANDARD_TO_USE} CACHE STRING "updating C++ standard to use option" FORCE )
-                set( CMAKE_CXX_FLAGS "${CXX_FLAGS_NO_STANDARD} ${compiler_flag_to_check}" CACHE STRING "" FORCE )
-            ENDIF()
-        ENDIF()
-    ENDFOREACH()
+
+    IF( NOT ( ${CXX_STANDARD_TO_USE} MATCHES ${CXX_STANDARD_LAST} ) )
+        # the selected standard differs from the one recorded by the previous configure run: verify the compiler accepts it
+        message( "Attempt to use C++ standard ${CXX_STANDARD_TO_USE}" )
+        UNSET( compiler_supports_standard CACHE )
+        UNSET( compiler_flag_to_check CACHE )
+        SET( compiler_flag_to_check "-std=c++${CXX_STANDARD_TO_USE}" )
+        if ( CMAKE_CXX_COMPILER_ID MATCHES "Clang" AND ${CXX_STANDARD_TO_USE} MATCHES "11" )
+            set( extra_compiler_flags "-Wc++11-narrowing" ) # extra flag only: -std=... is supplied by compiler_flag_to_check for the check and by CMAKE_CXX_STANDARD for the build
+        endif()
+        CHECK_CXX_COMPILER_FLAG( "${compiler_flag_to_check} ${extra_compiler_flags}" compiler_supports_standard )
+        if( NOT compiler_supports_standard )
+            message( FATAL_ERROR "attempt to use C++ standard ${CXX_STANDARD_TO_USE} but ${CMAKE_CXX_COMPILER} does not support it" )
+        endif()
+        SET( CXX_STANDARD_LAST ${CXX_STANDARD_TO_USE} CACHE STRING "updating C++ standard to use option" FORCE )
+        set( CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${extra_compiler_flags}" CACHE STRING "" FORCE ) # persists only the extra flags; the standard itself is selected via CMAKE_CXX_STANDARD below
+    ENDIF()
+
+    set( CMAKE_CXX_STANDARD ${CXX_STANDARD_TO_USE} )
diff --git a/CMakeFiles/comma-config.cmake.in b/CMakeFiles/comma-config.cmake.in
index 0b3eda1b6..b9bbcd676 100644
--- a/CMakeFiles/comma-config.cmake.in
+++ b/CMakeFiles/comma-config.cmake.in
@@ -35,9 +35,13 @@ SET(comma_REQUIRED_EXE_LINKER_FLAGS "@comma_REQUIRED_EXE_LINKER_FLAGS@")
 SET(comma_REQUIRED_SHARED_LINKER_FLAGS "@comma_REQUIRED_SHARED_LINKER_FLAGS@")
 SET(comma_REQUIRED_MODULE_LINKER_FLAGS "@comma_REQUIRED_MODULE_LINKER_FLAGS@")
 
-SET(comma_MAJOR_VERSION "@comma_MAJOR_VERSION@")
-SET(comma_MINOR_VERSION "@comma_MINOR_VERSION@")
-SET(comma_BUILD_VERSION "@comma_BUILD_VERSION@")
+SET(comma_version_major "@comma_version_major@")
+SET(comma_version_minor "@comma_version_minor@")
+SET(comma_version_patch "@comma_version_patch@")
+SET(comma_MAJOR_VERSION "@comma_version_major@") # quick and dirty, otherwise comma so library version in dependent packages seem to get messed up
+SET(comma_MINOR_VERSION "@comma_version_minor@") # quick and dirty, otherwise comma so library version in dependent packages seem to get messed up
+SET(comma_BUILD_VERSION "@comma_version_patch@") # quick and dirty, otherwise comma so library version in dependent packages seem to get messed up
+set(comma_version "@comma_version@")
 
 SET(comma_USE_FILE "@comma_USE_FILE@")
 
diff --git a/CMakeFiles/post_install/CMakeLists.txt b/CMakeFiles/post_install/CMakeLists.txt
new file mode 100644
index 000000000..cf00749b3
--- /dev/null
+++ b/CMakeFiles/post_install/CMakeLists.txt
@@ -0,0 +1,6 @@
+if( BUILD_SHARED_LIBS ) # the ldconfig step is registered only when shared libraries are built
+    install( CODE "message( \"ldconfig: running...\" )" )
+    install( CODE "execute_process( COMMAND /sbin/ldconfig )" ) # executed by the generated install script, i.e. at install time, not at configure time
+    install( CODE "message( \"ldconfig: done\" )" )
+endif( BUILD_SHARED_LIBS )
+
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 167b087db..9bc598eaf 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -8,15 +8,30 @@ if( USE_ARM_TOOLCHAIN )
     include( ${CMAKE_TOOLCHAIN_FILE} REQUIRED )
 endif( USE_ARM_TOOLCHAIN )
 
-PROJECT( "comma" )
-
-cmake_minimum_required(VERSION 2.6)
+if( ${CMAKE_MAJOR_VERSION} LESS 4 )
+    cmake_minimum_required( VERSION 3.1 )
+else()
+    cmake_minimum_required( VERSION 3.5 ) # NOTE(review): presumably because CMake 4 no longer accepts minimum versions below 3.5 - confirm
+endif()
+cmake_policy( SET CMP0048 NEW ) # lets project() take the VERSION argument and manage the PROJECT_VERSION* variables
+project( comma VERSION 1.1.0 LANGUAGES CXX )
+if( NOT DEFINED CMAKE_PROJECT_VERSION ) # fallback for CMake releases that do not define CMAKE_PROJECT_VERSION*: mirror the PROJECT_VERSION* values set by project() above
+    set( CMAKE_PROJECT_VERSION ${PROJECT_VERSION} )
+    set( CMAKE_PROJECT_VERSION_MAJOR ${PROJECT_VERSION_MAJOR} )
+    set( CMAKE_PROJECT_VERSION_MINOR ${PROJECT_VERSION_MINOR} )
+    set( CMAKE_PROJECT_VERSION_PATCH ${PROJECT_VERSION_PATCH} )
+endif( NOT DEFINED CMAKE_PROJECT_VERSION )
+
+set( comma_version_major "${CMAKE_PROJECT_VERSION_MAJOR}" ) # quick and dirty; substituted into comma-config.cmake.in and reused for CPACK_PACKAGE_VERSION_MAJOR
+set( comma_version_minor "${CMAKE_PROJECT_VERSION_MINOR}" ) # quick and dirty; substituted into comma-config.cmake.in and reused for CPACK_PACKAGE_VERSION_MINOR
+set( comma_version_patch "${CMAKE_PROJECT_VERSION_PATCH}" ) # quick and dirty; substituted into comma-config.cmake.in and reused for CPACK_PACKAGE_VERSION_PATCH
+set( comma_version "${CMAKE_PROJECT_VERSION}" ) # quick and dirty; full version string, substituted into comma-config.cmake.in
 
 # option( USE_ARM_TOOLCHAIN "Cross compile using arm toolchain" OFF )
 # if( USE_ARM_TOOLCHAIN )
 #     set(CMAKE_TOOLCHAIN_FILE ${SOURCE_CODE_BASE_DIR}/CMakeFiles/arm.toolchain.cmake)
 # endif( USE_ARM_TOOLCHAIN )
-# 
+#
 # option(my_test_option "whatever" OFF)
 # if(my_test_option)
 #     set(my_other_option "is set")
@@ -50,20 +65,15 @@ IF (UNIX AND NOT APPLE)
 		SET ( COMMITHASH "abc" )
 	ENDIF()
 ELSE() # Probably windows; gets hardcoded patch version
-	SET ( COMMITDATE 1 ) 
+	SET ( COMMITDATE 1 )
 	SET ( COMMITHASH "abc" )
 ENDIF()
 
-# ---------------------------------------------------------------------------
-# set compiler and linker flags and variables
+if( NOT CMAKE_BUILD_TYPE )
+  set( CMAKE_BUILD_TYPE Release CACHE STRING "options are: None Debug Release RelWithDebInfo MinSizeRel." FORCE )
+endif( NOT CMAKE_BUILD_TYPE )
 
-IF(NOT CMAKE_BUILD_TYPE)
-  SET(CMAKE_BUILD_TYPE RelWithDebInfo CACHE STRING
-      "Choose the type of build, options are: None Debug Release RelWithDebInfo MinSizeRel."
-      FORCE)
-ENDIF(NOT CMAKE_BUILD_TYPE)
-
-IF(WIN32)
+if( WIN32 )
   SET(CMAKE_CXX_WARNING_LEVEL 4)
   IF(CMAKE_CXX_FLAGS MATCHES "/W[0-4]")
     STRING(REGEX REPLACE "/W[0-4]" "/W4" CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS}")
@@ -78,7 +88,16 @@ IF(WIN32)
   SET (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} /D \"NOMINMAX\"")
   ADD_DEFINITIONS(-D_USE_MATH_DEFINES)
   ADD_DEFINITIONS(-DWIN32_LEAN_AND_MEAN) #used to fix winsock redefinition error
-ENDIF(WIN32)
+else( WIN32 )
+    option( ENABLE_FAST_MATH "enable compiler fast-math; experimental, some tests fail on nan and precision" OFF )
+    if( ENABLE_FAST_MATH )
+        set( CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -ffast-math" )
+    endif( ENABLE_FAST_MATH )
+    option( ENABLE_OPTIMIZATION "enable compiler optimisation" ON )
+    if( ENABLE_OPTIMIZATION )
+        set( CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -O3" ) # quick and dirty; make optimisation level configurable
+    endif( ENABLE_OPTIMIZATION )
+endif( WIN32 )
 
 IF( CMAKE_SIZEOF_VOID_P EQUAL 8 )
   SET( IS_64_BIT TRUE )
@@ -106,33 +125,18 @@ IF(CMAKE_BUILD_TOOL MATCHES "make")
 ENDIF(CMAKE_BUILD_TOOL MATCHES "make")
 
 if( UNIX )
-INCLUDE( CMakeFiles/check.c++.standard.cmake REQUIRED )
-endif()
+    include( CMakeFiles/check.c++.standard.cmake REQUIRED )
+endif( UNIX )
 
 SET( SOURCE_CODE_BASE_DIR ${CMAKE_CURRENT_SOURCE_DIR} )
 SET( LIBRARY_OUTPUT_PATH ${CMAKE_BINARY_DIR}/lib )
 
-SET( EXECUTABLE_OUTPUT_PATH
-     ${PROJECT_BINARY_DIR}/bin CACHE PATH
-     "Single output directory for building all executables." )
-
-SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" )
-
-IF( NOT comma_INSTALL_BIN_DIR )
-  SET( comma_INSTALL_BIN_DIR bin )
-ENDIF( NOT comma_INSTALL_BIN_DIR )
-
-IF( NOT comma_INSTALL_INCLUDE_DIR )
-    SET( comma_INSTALL_INCLUDE_DIR include/${PROJECT_NAME} )
-ENDIF( NOT comma_INSTALL_INCLUDE_DIR )
+set( comma_INSTALL_BIN_DIR bin CACHE PATH "installation directory for binaries" )
+set( comma_INSTALL_INCLUDE_DIR include/comma CACHE PATH "installation directory for include directories" )
+set( comma_INSTALL_LIB_DIR lib CACHE PATH "installation directory for libraries" )
+set( comma_INSTALL_PACKAGE_DIR CMakeFiles CACHE PATH "installation directory for cmake files" )
 
-IF( NOT comma_INSTALL_LIB_DIR)
-  SET( comma_INSTALL_LIB_DIR lib )
-ENDIF( NOT comma_INSTALL_LIB_DIR )
-
-IF( NOT comma_INSTALL_PACKAGE_DIR )
-  SET( comma_INSTALL_PACKAGE_DIR CMakeFiles )
-ENDIF( NOT comma_INSTALL_PACKAGE_DIR )
+SET( comma_LIBRARY_PROPERTIES ${comma_LIBRARY_PROPERTIES} DEBUG_POSTFIX "-d" SOVERSION ${CMAKE_PROJECT_VERSION} LINK_FLAGS_RELEASE -s )
 
 #INCLUDE_DIRECTORIES( ${comma_INSTALL_INCLUDE_DIR}/../ )
 
@@ -143,7 +147,7 @@ ENDIF( APPLE )
 OPTION( BUILD_TESTS "build unit tests" OFF )
 SET( comma_BUILD_TESTS ${BUILD_TESTS} )
 
-OPTION( BUILD_PYTHON_PACKAGES "install comma python packages" ON )
+option( BUILD_PYTHON_PACKAGES "install comma python packages" ON )
 
 INCLUDE( CMakeDependentOption )
 CMAKE_DEPENDENT_OPTION( ADD_PYTHON_PACKAGES_TO_RPM "add comma python packages to rpm" OFF "BUILD_PYTHON_PACKAGES" ON )
@@ -152,11 +156,21 @@ CMAKE_DEPENDENT_OPTION( BUILD_CPP_PYTHON_BINDINGS "build C++/Python bindings" OF
 OPTION( BUILD_APPLICATIONS "build applications" ON )
 SET( comma_BUILD_APPLICATIONS ${BUILD_APPLICATIONS} )
 
-OPTION( comma_BUILD_ZEROMQ "build io with zeromq support" OFF )
-
-OPTION(BUILD_SHARED_LIBS "build with shared libraries" OFF)
-
-OPTION( comma_BUILD_XML "build xml" OFF )
+option( BUILD_SHARED_LIBS "build with shared libraries" ON )
+option( comma_BUILD_NAME_VALUE_YAML "build name_value with yaml support; requires libyaml; e.g. apt install libyaml-dev" OFF )
+option( comma_BUILD_PYTHON "build python" ON )
+option( comma_BUILD_XML "build xml" OFF )
+option( comma_BUILD_ZEROMQ "build io with zeromq support" OFF )
+option( comma_USE_BOOST_FILESYSTEM "use boost::filesystem rather than std::filesystem" OFF )
+
+if( comma_USE_BOOST_FILESYSTEM )
+    set( CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DCOMMA_USE_BOOST_FILESYSTEM -DBOOST_FILESYSTEM_NO_DEPRECATED" )
+else()
+    # see https://gcc.gnu.org/onlinedocs/libstdc++/manual/status.html#status.iso.2017
+    if( CMAKE_CXX_COMPILER_ID STREQUAL "GNU" AND CMAKE_CXX_COMPILER_VERSION VERSION_LESS 9 )
+        link_libraries( "-lstdc++fs" )
+    endif()
+endif()
 
 SET(comma_BUILD_SHARED_LIBS ${BUILD_SHARED_LIBS})
 
@@ -164,6 +178,11 @@ IF( NOT BUILD_SHARED_LIBS )
     SET( Boost_USE_STATIC_LIBS ON )
 ENDIF( NOT BUILD_SHARED_LIBS )
 
+set( comma_boost_components thread system date_time iostreams program_options regex )
+if( comma_USE_BOOST_FILESYSTEM )
+    set( comma_boost_components ${comma_boost_components} filesystem )
+endif()
+
 IF( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
     IF( NOT BUILD_SHARED_LIBS )
         MESSAGE( WARNING "Linking C++/Python bindings with static libraries is requested. If linking fails, recompile required libraries with -fPIC or use shared libraries. Note that this feature has only been tested with shared libraries." )
@@ -171,41 +190,44 @@ IF( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
     SET( Python_ADDITIONAL_VERSIONS 2.7 )
     FIND_PACKAGE( PythonLibs REQUIRED )
     INCLUDE_DIRECTORIES( ${PYTHON_INCLUDE_DIRS} )
-    FIND_PACKAGE( Boost COMPONENTS thread filesystem system date_time program_options regex python )
-ELSE( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
-    FIND_PACKAGE( Boost COMPONENTS thread filesystem system date_time program_options regex )
+    set( comma_boost_components ${comma_boost_components} python )
 ENDIF( BUILD_PYTHON_PACKAGES AND BUILD_CPP_PYTHON_BINDINGS )
+
+FIND_PACKAGE( Boost COMPONENTS ${comma_boost_components} )
 INCLUDE_DIRECTORIES( ${Boost_INCLUDE_DIRS} )
 LINK_DIRECTORIES( ${Boost_LIBRARY_DIRS} )
 
 IF( comma_BUILD_TESTS )
 
+find_package( GTest REQUIRED )
+include_directories( ${GTEST_INCLUDE_DIRS} )
+
     # todo: maybe else clause is actually the right way to do things
-    IF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
-        FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/gtest DOC "source code of gtest" )
-        ADD_SUBDIRECTORY( ${GTest_SOURCE_DIR} gtest )
-        INCLUDE_DIRECTORIES( src ${GTest_SOURCE_DIR}/include ${GTest_SOURCE_DIR} )
-        SET( GTEST_BOTH_LIBRARIES gtest gtest_main )
-    ELSE( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
-        FIND_PACKAGE( GTest )
-        INCLUDE_DIRECTORIES( ${GTEST_INCLUDE_DIRS} )
-    ENDIF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
-	
+#    IF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
+#        FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/googletest/googletest DOC "source code of gtest" ) # FIND_PATH( GTest_SOURCE_DIR NAMES CMakeLists.txt HINTS /usr/src/gtest DOC "source code of gtest" )
+#        add_subdirectory( ${GTest_SOURCE_DIR} gtest )
+#        INCLUDE_DIRECTORIES( src ${GTest_SOURCE_DIR}/include ${GTest_SOURCE_DIR} )
+#        SET( GTEST_BOTH_LIBRARIES gtest gtest_main )
+#    ELSE( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
+#        FIND_PACKAGE( GTest )
+#        INCLUDE_DIRECTORIES( ${GTEST_INCLUDE_DIRS} )
+#    ENDIF( ${CMAKE_SYSTEM_NAME} MATCHES "Linux" OR ${CMAKE_SYSTEM_NAME} MATCHES "Windows" )
+
 #TT: Install tests to dir. This allows them to be packed by CPack.
 #Note: if your source tree is dirty (eg you've already run tests there and have output/ directories)
 #those will also be installed too.
 
 OPTION( INSTALL_TESTS "Install the tests into the nominated directory" OFF )
 IF( INSTALL_TESTS )
-    SET ( comma_CPP_TESTS_INSTALL_DIR bin CACHE PATH "Install directory for cpp unit tests" )
-    SET ( comma_INSTALL_COMMA_TESTS_DIR share/test )
-	
+SET ( comma_CPP_TESTS_INSTALL_DIR bin CACHE PATH "Install directory for cpp unit tests" )
+SET ( comma_INSTALL_COMMA_TESTS_DIR share/test )
+
 # Get the list of test directories (using glob).
-FILE ( GLOB_RECURSE all_files 
+FILE ( GLOB_RECURSE all_files
 		# RELATIVE is tricky. When you use it, you need to specify the path you expect the output to be RELATIVE to. (Yes, that path could be considerably non-relative to the file that is found.)
-		RELATIVE ${CMAKE_SOURCE_DIR} 
+		RELATIVE ${CMAKE_SOURCE_DIR}
 		* )
-		
+
 SET ( test_dirs )
 FOREACH ( i ${all_files} )
 	if ( ${i} MATCHES "[\\/]test[\\/]" )
@@ -214,19 +236,18 @@ FOREACH ( i ${all_files} )
 ENDFOREACH (i)
 
 # Add those directories
-	FOREACH (file ${test_dirs} )
-			# Determine the parent directories for a given file so to prefix the install location (otherwise they just all get installed in the destination root)
-			get_filename_component( dest_dir ${file} DIRECTORY )
-                        STRING( REGEX MATCH ".*\\/output\\/.*" skip ${file} )
-                        IF( NOT skip )
-			# See that slash there? 		 vvv It's really important.
-			INSTALL ( 	DIRECTORY ${dest_dir}/
-						DESTINATION ${comma_INSTALL_COMMA_TESTS_DIR}/${CMAKE_PROJECT_NAME}/unit/${dest_dir} 
-						USE_SOURCE_PERMISSIONS
-                            PATTERN "output" EXCLUDE )
-                        ENDIF( NOT skip )
-	ENDFOREACH (file)
-
+FOREACH (file ${test_dirs} )
+		# Determine the parent directories for a given file so to prefix the install location (otherwise they just all get installed in the destination root)
+		get_filename_component( dest_dir ${file} DIRECTORY )
+                    STRING( REGEX MATCH ".*\\/output\\/.*" skip ${file} )
+                    IF( NOT skip )
+		# See that slash there? 		 vvv It's really important.
+		INSTALL ( 	DIRECTORY ${dest_dir}/
+					DESTINATION ${comma_INSTALL_COMMA_TESTS_DIR}/${CMAKE_PROJECT_NAME}/unit/${dest_dir}
+					USE_SOURCE_PERMISSIONS
+                        PATTERN "output" EXCLUDE )
+                    ENDIF( NOT skip )
+ENDFOREACH (file)
 ENDIF( INSTALL_TESTS )
 ENDIF( comma_BUILD_TESTS )
 
@@ -250,35 +271,37 @@ SET( comma_ALL_LIBRARIES
         debug comma_xpath-d
         optimized comma_xpath
         debug comma_name_value-d
-        optimized comma_name_value )
+        optimized comma_name_value
+        debug comma_timing-d
+        optimized comma_timing )
 
-IF(WIN32)
-    SET( comma_ALL_EXTERNAL_LIBRARIES Ws2_32.lib )
-ENDIF(WIN32)
+if(WIN32)
+    set( comma_ALL_EXTERNAL_LIBRARIES Ws2_32.lib )
+endif(WIN32)
 
-IF(UNIX AND NOT QNXNTO AND NOT APPLE)
-    SET( comma_ALL_EXTERNAL_LIBRARIES rt pthread )
-ENDIF(UNIX AND NOT QNXNTO AND NOT APPLE)
+if( UNIX AND NOT QNXNTO AND NOT APPLE )
+    set( comma_ALL_EXTERNAL_LIBRARIES rt pthread c )
+endif( UNIX AND NOT QNXNTO AND NOT APPLE )
 
-SET( comma_ALL_EXTERNAL_LIBRARIES ${Boost_LIBRARIES} ${comma_ALL_EXTERNAL_LIBRARIES} )
+set( comma_ALL_EXTERNAL_LIBRARIES ${Boost_LIBRARIES} ${comma_ALL_EXTERNAL_LIBRARIES} )
 
-IF( comma_BUILD_ZEROMQ )
-    SET( comma_ALL_EXTERNAL_LIBRARIES ${comma_ALL_EXTERNAL_LIBRARIES} ${ZeroMQ_LIBRARY} )
-ENDIF( comma_BUILD_ZEROMQ )
+if( comma_BUILD_ZEROMQ )
+    set( comma_ALL_EXTERNAL_LIBRARIES ${comma_ALL_EXTERNAL_LIBRARIES} ${ZeroMQ_LIBRARY} )
+endif( comma_BUILD_ZEROMQ )
 
-IF( BUILD_CPP_PYTHON_BINDINGS )
-    SET( comma_ALL_EXTERNAL_LIBRARIES ${comma_ALL_EXTERNAL_LIBRARIES} ${PYTHON_LIBRARY} )
-ENDIF( BUILD_CPP_PYTHON_BINDINGS )
+if( BUILD_CPP_PYTHON_BINDINGS )
+    set( comma_ALL_EXTERNAL_LIBRARIES ${comma_ALL_EXTERNAL_LIBRARIES} ${PYTHON_LIBRARY} )
+endif( BUILD_CPP_PYTHON_BINDINGS )
 
-SET( comma_ALL_LIBRARIES ${comma_ALL_LIBRARIES} ${comma_ALL_LIBRARIES} ${comma_ALL_EXTERNAL_LIBRARIES} ) # as gcc parses library list only once
-SET( comma_EXTERNAL_INCLUDES ${Boost_INCLUDE_DIRS} )
+set( comma_ALL_LIBRARIES ${comma_ALL_LIBRARIES} ${comma_ALL_LIBRARIES} ${comma_ALL_EXTERNAL_LIBRARIES} ) # as gcc parses library list only once
+set( comma_EXTERNAL_INCLUDES ${Boost_INCLUDE_DIRS} )
 
 CONFIGURE_FILE(
     "${CMAKE_CURRENT_SOURCE_DIR}/CMakeFiles/cmake_uninstall.cmake.in"
     "${CMAKE_CURRENT_BINARY_DIR}/cmake_uninstall.cmake"
     IMMEDIATE @ONLY)
 
-ADD_CUSTOM_TARGET(uninstall COMMAND ${CMAKE_COMMAND} -P ${CMAKE_CURRENT_BINARY_DIR}/cmake_uninstall.cmake)
+ADD_CUSTOM_TARGET( uninstall COMMAND ${CMAKE_COMMAND} -P ${CMAKE_CURRENT_BINARY_DIR}/cmake_uninstall.cmake )
 
 FILE( GLOB comma_PACKAGE_CMAKEFILES ${CMAKE_CURRENT_SOURCE_DIR}/CMakeFiles/*.cmake )
 
@@ -287,73 +310,143 @@ INCLUDE( ${CMAKE_CURRENT_SOURCE_DIR}/CMakeFiles/generate_${PROJECT_NAME}_config.
 CONFIGURE_FILE( ${PROJECT_SOURCE_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake.in
                 ${PROJECT_BINARY_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake COPYONLY IMMEDIATE )
 
-SET( comma_PACKAGE_CMAKEFILES ${comma_PACKAGE_CMAKEFILES} ${PROJECT_BINARY_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake )
-INSTALL( FILES ${comma_PACKAGE_CMAKEFILES}
-         DESTINATION ${comma_INSTALL_PACKAGE_DIR} )
+set( comma_PACKAGE_CMAKEFILES ${comma_PACKAGE_CMAKEFILES} ${PROJECT_BINARY_DIR}/CMakeFiles/use_${PROJECT_NAME}.cmake )
+install( FILES ${comma_PACKAGE_CMAKEFILES} DESTINATION ${comma_INSTALL_PACKAGE_DIR} )
+#install( FILES ${PROJECT_SOURCE_DIR}/copyright DESTINATION share/doc/comma ) # quick and dirty
 
 #-----------------------------------------------------------------------------
 # add sources
 
-ADD_SUBDIRECTORY( application )
-ADD_SUBDIRECTORY( base )
-ADD_SUBDIRECTORY( bash )
-ADD_SUBDIRECTORY( containers )
-ADD_SUBDIRECTORY( csv )
-ADD_SUBDIRECTORY( dispatch )
-ADD_SUBDIRECTORY( doc )
-ADD_SUBDIRECTORY( io )
-ADD_SUBDIRECTORY( math )
-ADD_SUBDIRECTORY( name_value )
-ADD_SUBDIRECTORY( packed )
-ADD_SUBDIRECTORY( string )
-ADD_SUBDIRECTORY( sync )
-ADD_SUBDIRECTORY( util )
-ADD_SUBDIRECTORY( visiting )
+add_subdirectory( application )
+add_subdirectory( base )
+add_subdirectory( bash )
+add_subdirectory( containers )
+add_subdirectory( csv )
+add_subdirectory( dispatch )
+add_subdirectory( doc )
+add_subdirectory( dynamic ) 
+add_subdirectory( io )
+add_subdirectory( math )
+add_subdirectory( name_value )
+add_subdirectory( packed )
+add_subdirectory( string )
+add_subdirectory( sync )
+add_subdirectory( timing )
+add_subdirectory( util )
+add_subdirectory( visiting )
 add_subdirectory( web )
 if( comma_BUILD_XML )
     add_subdirectory( xml )
 endif( comma_BUILD_XML )
 add_subdirectory( xpath )
 
-ADD_SUBDIRECTORY( etc/bash_completion.d )
+option( INSTALL_BASH_COMPLETION "install the BASH completion scripts" ON )
+if( INSTALL_BASH_COMPLETION )
+    add_subdirectory( etc/bash_completion.d )
+endif( INSTALL_BASH_COMPLETION )
 
-ADD_SUBDIRECTORY( python )
+if( comma_BUILD_PYTHON )
+  add_subdirectory( python )
+endif( comma_BUILD_PYTHON )
 
 #in future, may need to add third party dlls somehow, if they are linked as dlls. Not needed for statically linking to boost.
 #if we set them up to install to bin they might be packaged through, e.g. roughly (using GLOB):
 #install(FILES "${Boost_LIBRARY_DIRS}/*.dll" DESTINATION bin )
 
-#the following set up optional parameters for cpack
-SET(CPACK_PACKAGE_NAME "comma")
-SET(CPACK_PACKAGE_DESCRIPTION_SUMMARY "Command line utilities to manipulate various structured and unstructured data from offline or real time data.")
-SET(CPACK_PACKAGE_VENDOR "Australian Centre for Field Robotics")
-SET(CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/COPYING")
-SET(CPACK_PACKAGE_VERSION_MAJOR "1")
-SET(CPACK_PACKAGE_VERSION_MINOR ${COMMITDATE})
-SET(CPACK_PACKAGE_VERSION_PATCH ${COMMITHASH})
-SET(CPACK_PACKAGE_CONTACT "t.teo@acfr.usyd.edu.au")
-
-# If the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
-IF( BUILD_SHARED_LIBS )
-	SET(CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig")
-ENDIF( BUILD_SHARED_LIBS )
-
+if( CMAKE_COMPILER_IS_GNUCXX )
+    if( CMAKE_BUILD_TYPE STREQUAL "Release" )
+        set( CMAKE_EXE_LINKER_FLAGS "${CMAKE_EXE_LINKER_FLAGS} -s" )
+        set( CMAKE_CXX_FLAGS_RELEASE "${CMAKE_CXX_FLAGS_RELEASE} -s" )
+    endif( CMAKE_BUILD_TYPE STREQUAL "Release" )
+endif( CMAKE_COMPILER_IS_GNUCXX )
+
+option( comma_INSTALL_RUN_POST_INSTALL "run post install step (currently just ldconfig)" ON )
+if( comma_INSTALL_RUN_POST_INSTALL )
+    add_subdirectory( CMakeFiles/post_install ) # uber-quick and dirty
+endif( comma_INSTALL_RUN_POST_INSTALL )
+
+# todo
+#     build ppa
+#         see here? http://schneegans.github.io/lessons/2011/11/02/ppa-launchpad-cmake
+#     lintian errors and warnings
+#         fix warnings
+#             W: comma: package-name-doesnt-match-sonames: try comma_string -> comma-string, etc?
+#             W: comma: maintscript-calls-ldconfig [postinst]: don't call ldconfig from package?
+#             W: comma: maintscript-calls-ldconfig [postrm]: don't call ldconfig from package?
+#             W: comma: distant-prerequisite-in-shlibs comma (ON 1.0.0): try to add full version to shared libs
+#         investigate
+#             W: comma: non-standard-dir-in-usr usr/CMakeFiles/
+#         ignore for now
+#             W: comma: link-to-shared-library-in-wrong-package: deemed ok for small packages
+#             W: comma: no-manual-page: ok for now, lots of packages don't have man pages
+
+set( CPACK_PACKAGE_NAME "comma" )
+set( CPACK_PACKAGE_FILE_NAME "${CPACK_PACKAGE_NAME}-${comma_version}-${CMAKE_SYSTEM_NAME}" CACHE STRING "package name" ) # uses comma_version/CMAKE_SYSTEM_NAME: CPACK_PACKAGE_VERSION and CPACK_SYSTEM_NAME only get their defaults inside include( CPack ), i.e. after this line
+#set( CPACK_PACKAGE_DESCRIPTION "cli utilities for structured or fixed-width offline or realtime data" )
+set( CPACK_PACKAGE_DESCRIPTION_SUMMARY "cli utilities for structured or fixed-width offline or realtime data" )
+set( CPACK_PACKAGE_VENDOR "orthographic" )
+set( CPACK_DEBIAN_PACKAGE_DESCRIPTION "CLI for processing structured or fixed-width data offline or in realtime" )
+set( CPACK_DEBIAN_PACKAGE_HOMEPAGE "https://gitlab.com/orthographic/comma/-/wikis/home" )
+set( CPACK_DEBIAN_PACKAGE_MAINTAINER "vsevolod vlaskine <vsevolod.vlaskine@gmail.com>" )
+set( CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${PROJECT_SOURCE_DIR}/system/package/debian/changelog" )
+set( CPACK_PACKAGE_CONTACT "vsevolod.vlaskine@gmail.com" )
+set( CPACK_RESOURCE_FILE_LICENSE "${PROJECT_SOURCE_DIR}/COPYING" )
+set( CPACK_GENERATOR "DEB" CACHE STRING "cpack generator: RPM or DEB" )
+set( CPACK_PACKAGE_VERSION_MAJOR ${comma_version_major} )
+set( CPACK_PACKAGE_VERSION_MINOR ${comma_version_minor} )
+set( CPACK_PACKAGE_VERSION_PATCH ${comma_version_patch} )
+set( CPACK_DEPENDENCIES_LIBPROCPS "libprocps8 (>= 1)" CACHE STRING "libprocps versions: libprocps6 (>= 2:3.3.0) for Ubuntu 18.04; libprocps8 (>= 1) for Ubuntu 20.04 or later" )
+option( CPACK_DEPENDENCIES_PYTHON "add python dependencies, currently: python3-numpy" OFF )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "comma-py, ${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc (>=6)" )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev (>=6)" )
+#set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev" )
+#set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc" )
+set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEPENDENCIES_LIBPROCPS}, libzmq5 (>= 4.2.5-1), libboost-all-dev (>=1.65), recode (>=3.6), socat, libc-dev" )
+if( CPACK_DEPENDENCIES_PYTHON )
+    set( CPACK_DEBIAN_PACKAGE_DEPENDS "${CPACK_DEBIAN_PACKAGE_DEPENDS}, python3-numpy" )
+endif( CPACK_DEPENDENCIES_PYTHON )
+set( CPACK_DEBIAN_PACKAGE_SHLIBDEPS "libboost-all-dev (>=1.65), libc-dev" ) # NOTE(review): CPack documents this variable as an ON/OFF switch for dpkg-shlibdeps, not a dependency list - confirm intent
+set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS ON )
+set( CPACK_DEBIAN_PACKAGE_GENERATE_SHLIBS_POLICY ON ) # NOTE(review): CPack documents "=" and ">=" as the values of this policy - confirm that ON is accepted
+
+# if the user builds shared, make sure that the RPM package (that might be generated) runs ldconfig when it's installed.
+if( BUILD_SHARED_LIBS )
+    # CPACK_RPM_POST_INSTALL_SCRIPT_FILE expects the path of a script file, so the scriptlet directive is injected into the spec file instead
+    set( CPACK_RPM_SPEC_MORE_DEFINE "%posttrans -p /sbin/ldconfig" )
+    #set( SHLIBS_FILE "${CMAKE_CURRENT_BINARY_DIR}/shlibs" )
+    # witchcraft from here: https://github.com/roboception/rcdiscover/blob/master/cmake/package_debian.cmake
+    set( TRIGGERS_FILE "${CMAKE_CURRENT_BINARY_DIR}/triggers" )
+    file( WRITE "${TRIGGERS_FILE}" "activate-noawait ldconfig\n" )
+    #file( WRITE "${SHLIBS_FILE}" "" )
+    #foreach ( libname ${sharedlibs} )
+    #    get_target_property( so_abiversion ${libname} SOVERSION )
+    #    if(NOT ${so_abiversion})
+    #      set(so_abiversion ${abiversion})
+    #      message(STATUS "SOVERSION of shared lib \"${libname}\" not set explicitly. Using <Major.Minor> of latest tag: ${so_abiversion}")
+    #      set_target_properties(${libname} PROPERTIES SOVERSION ${so_abiversion})
+    #    endif()
+    #    file(APPEND "${SHLIBS_FILE}" "lib${libname} ${so_abiversion} ${CPACK_PACKAGE_NAME}\n")
+    #endforeach (libname)
+    #execute_process( COMMAND chmod 644 "${SHLIBS_FILE}" "${TRIGGERS_FILE}" )
+    execute_process( COMMAND chmod 644 "${TRIGGERS_FILE}" )
+    if( CPACK_DEB_COMPONENT_INSTALL )
+        list( APPEND CPACK_DEBIAN_BIN_PACKAGE_CONTROL_EXTRA "${TRIGGERS_FILE}" ) # SHLIBS_FILE is never set (its generation is commented out above), so only the triggers file is added
+    else ( CPACK_DEB_COMPONENT_INSTALL )
+        list( APPEND CPACK_DEBIAN_PACKAGE_CONTROL_EXTRA "${TRIGGERS_FILE}" ) # SHLIBS_FILE is never set (its generation is commented out above), so only the triggers file is added
+    endif ( CPACK_DEB_COMPONENT_INSTALL )
+endif( BUILD_SHARED_LIBS )
 
 IF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
-    SET(CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python numpy")
-    SET(CPACK_RPM_POST_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-post-install.sh" )
-    SET(CPACK_RPM_PRE_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-pre-install.sh" )
-	# Prevents /tmp from permission change when installing RPM package
-	SET(CPACK_RPM_EXCLUDE_FROM_AUTO_FILELIST_ADDITION "/tmp" )
+    SET( CPACK_RPM_PACKAGE_REQUIRES "boost-thread recode socat psmisc python3 numpy" )
+    SET( CPACK_RPM_POST_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-post-install.sh" )
+    SET( CPACK_RPM_PRE_INSTALL_SCRIPT_FILE "${CMAKE_SOURCE_DIR}/python/comma-rpm-pre-install.sh" )
+    SET( CPACK_RPM_EXCLUDE_FROM_AUTO_FILELIST_ADDITION "/tmp" ) # Prevents /tmp from permission change when installing RPM package
 ELSE( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
     SET(CPACK_RPM_PACKAGE_REQUIRES "boost-thread socat psmisc recode")
 ENDIF( BUILD_PYTHON_PACKAGES AND ADD_PYTHON_PACKAGES_TO_RPM )
 
-
 #this line finds the appropriate Visual Studio DLLS in windows. Maybe it would find other dlls if a different build tool were used. Probably should be windows only.
 INCLUDE( InstallRequiredSystemLibraries )
 
 #this line does all the work. Actually, even if this is the only line, you get all but the dlls...
 INCLUDE( CPack )
-
-
diff --git a/COPYING b/COPYING
index 5702f519c..c4218c10f 100644
--- a/COPYING
+++ b/COPYING
@@ -1,4 +1,7 @@
+comma, a library for efficient streaming and processing of comma-separated (csv)
+and fixed-width binary data
 Copyright (c) 2011 The University of Sydney
+Copyright (c) 2018 Vsevolod Vlaskine
 All rights reserved.
 
 Redistribution and use in source and binary forms, with or without
@@ -11,6 +14,9 @@ modification, are permitted provided that the following conditions are met:
 3. Neither the name of the University of Sydney nor the
    names of its contributors may be used to endorse or promote products
    derived from this software without specific prior written permission.
+4. Additionally, source code from this repository produced after 2022
+   must not be used in training or test datasets for training language
+   models and/or automated code generation
 
 NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
 GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
diff --git a/ChangeLog b/ChangeLog
deleted file mode 100644
index 722f106cb..000000000
--- a/ChangeLog
+++ /dev/null
@@ -1,2 +0,0 @@
-* v1.0.1
- - fixed bug in csv-joit
diff --git a/README b/README
deleted file mode 100644
index e0db4eaec..000000000
--- a/README
+++ /dev/null
@@ -1,28 +0,0 @@
-comma, a generic library of C++ and python components and command-line
-utilities for quick and efficient data manipulation, especially streams
-of CSV and binary data, protocol packets, structured data (e.g. JSON), etc
-
-
-INSTALLATION
-
-Currently only building from source using CMake is available. (After building
-from source, you can generate deb package using CPack, though.)
-
-Quickest way (works on Ubuntu 18.04 or higher with ansible playbook version 2.5 or higher):
-
-> mkdir src
-> cd src
-> git clone <repo>
-> ansible-playbook comma/system/ansible/install.yml --ask-become-pass
-
-Manual way:
-
-> mkdir -p src build/comma
-> cd src
-> git clone <repo>
-> cd ../build/comma
-> cmake ../../src/comma
-> make
-> sudo make install
-
-Read install.yml, if interested in tweaking build configuration.
diff --git a/README.md b/README.md
new file mode 100644
index 000000000..9b68d5788
--- /dev/null
+++ b/README.md
@@ -0,0 +1,76 @@
+[[_TOC_]]
+
+# overview
+
+**comma** is a generic library for fixed-width (comma-separated or binary) and structured (e.g. json) data processing primarily on Linux. MacOS is supported, but less tested.
+
+Documentation: [https://gitlab.com/orthographic/comma/-/wikis/home](https://gitlab.com/orthographic/comma/-/wikis/home)
+
+**comma** consists of a collection of command line utilities, as well as underlying C++ and python libraries.
+
+**comma** design considerations:
+- high throughput for offline data processing
+- working with latency-sensitive realtime data streams
+- high modularity and separation of concerns
+- ease of rapid prototyping and functionality change
+- ease of mixing with other applications
+
+You can limit yourself to using the **comma** command line utilities. Further, **comma** provides libraries for serialization, binary protocol packet layouts, etc.
+
+This documentation contains no more than a brief description of each command line utility. For details, each utility has elaborate help with examples, e.g. run: **csv-eval --help**.
+
+Instead, this documentation is intended to provide more and more step-by-step tutorials and recipes for **comma** command line applications.
+
+The library code is self-documented. You can generate the library documentation with **doxygen**. Use **git grep** or explore the code of the respective applications for usage examples.
+
+# installation
+
+## latest release
+
+```
+sudo add-apt-repository --yes ppa:orthographic/comma
+sudo add-apt-repository --yes multiverse
+sudo apt-get update
+sudo apt-get install comma
+pip3 install comma-py==1.0.0
+```
+
+## building from source
+
+Building from source gives you the latest features and thus may be a good choice. The code is continuously tested and backward compatible.
+
+### building with ansible
+
+```
+> sudo apt-get install ansible
+> mkdir src
+> cd src
+> git clone https://gitlab.com/orthographic/comma.git
+> ansible-playbook comma/system/ansible/install.yml --ask-become-pass
+```
+
+### building it manually
+#### install dependencies (ubuntu)
+```
+sudo apt-get install git python3-pip build-essential cmake cmake-curses-gui perl python3-dev libboost-all-dev socat libzmq3-dev libgtest-dev libprocps-dev recode expat gawk
+sudo pip3 install numpy
+```
+#### build
+
+If you build from source, you will get the latest features.
+
+Although building from source is more tedious, it is safe, since the **comma** master branch is thoroughly tested and new features are backward-compatible.
+
+```
+> mkdir -p src build/comma
+> cd src
+> git clone https://gitlab.com/orthographic/comma.git
+> cd ../build/comma
+> cmake ../../src/comma && make && sudo make install
+```
+
+Read install.yml, if interested in tweaking build configuration.
+
+# documentation
+
+[https://gitlab.com/orthographic/comma/-/wikis/home](https://gitlab.com/orthographic/comma/-/wikis/home)
diff --git a/application/CMakeLists.txt b/application/CMakeLists.txt
index 9fddc5e03..e622f07c2 100644
--- a/application/CMakeLists.txt
+++ b/application/CMakeLists.txt
@@ -8,15 +8,15 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${comma_ALL_EXTERNAL_LIBRARIES} comma_base comma_string )
+#set_target_properties( ${TARGET_NAME} PROPERTIES LINK_FLAGS_RELEASE -s )
+#set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION "${comma_version}" ) #set_target_properties( ${TARGET_NAME} PROPERTIES SOVERSION ${comma_version_major} ${comma_version_minor} ${comma_version_patch} )
+TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${comma_ALL_EXTERNAL_LIBRARIES} comma_base comma_io comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
-INSTALL(
-    TARGETS ${TARGET_NAME}
-    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
-    LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
-    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
-)
+INSTALL( TARGETS ${TARGET_NAME}
+         RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime       # .exe, .dll
+         LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime       # .so, mod.dll
+         ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development ) # .a, .lib
 
 if( comma_BUILD_APPLICATIONS )
     add_subdirectory( applications )
diff --git a/application/applications/CMakeLists.txt b/application/applications/CMakeLists.txt
index 2bf923a04..b5d69d45e 100644
--- a/application/applications/CMakeLists.txt
+++ b/application/applications/CMakeLists.txt
@@ -4,8 +4,10 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 
 ADD_EXECUTABLE( comma-options-to-name-value comma-options-to-name-value.cpp )
 TARGET_LINK_LIBRARIES ( comma-options-to-name-value comma_application comma_string ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( comma-options-to-name-value PROPERTIES LINK_FLAGS_RELEASE -s )
 INSTALL( TARGETS comma-options-to-name-value RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 ADD_EXECUTABLE( comma-options-validate comma-options-validate.cpp )
 TARGET_LINK_LIBRARIES ( comma-options-validate comma_application comma_string ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( comma-options-validate PROPERTIES LINK_FLAGS_RELEASE -s )
 INSTALL( TARGETS comma-options-validate RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/application/applications/test/comma-options-validate/expected b/application/applications/test/comma-options-validate/expected
new file mode 100644
index 000000000..8fe979a91
--- /dev/null
+++ b/application/applications/test/comma-options-validate/expected
@@ -0,0 +1,19 @@
+valid_options/valueless[0]/status=0
+valid_options/valueless[1]/status=0
+valid_options/valueless[2]/status=0
+valid_options/valueless[3]/status=0
+valid_options/valueless[4]/status=0
+valid_options/valueless[5]/status=0
+valid_options/valued[0]/status=0
+valid_options/valued[1]/status=0
+valid_options/valued[2]/status=0
+valid_options/valued[3]/status=0
+valid_options/valued[4]/status=0
+valid_options/valued[5]/status=0
+valid_options/equals_sign[0]/status=0
+invalid_options/valueless[0]/status=1
+invalid_options/valueless[1]/status=1
+invalid_options/valueless[2]/status=1
+invalid_options/valueless[3]/status=1
+invalid_options/valued[0]/status=1
+invalid_options/valued[1]/status=1
diff --git a/application/applications/test/comma-options-validate/input b/application/applications/test/comma-options-validate/input
new file mode 100644
index 000000000..7b3c6a6f9
--- /dev/null
+++ b/application/applications/test/comma-options-validate/input
@@ -0,0 +1,20 @@
+valid_options/valueless[0]="echo '--verbose,-v' | comma-options-validate -v"
+valid_options/valueless[1]="echo '--verbose,-v' | comma-options-validate hello -v"
+valid_options/valueless[2]="echo '--verbose,-v' | comma-options-validate -v world"
+valid_options/valueless[3]="echo '--verbose,-v' | comma-options-validate -v hello world"
+valid_options/valueless[4]="echo '--verbose,-v' | comma-options-validate -v -"
+valid_options/valueless[5]="echo '--verbose,-v' | comma-options-validate - -v"
+valid_options/valued[0]="echo '--file,-f=<v>' | comma-options-validate -f -5"
+valid_options/valued[1]="echo '--file,-f=<v>' | comma-options-validate -f -5 6"
+valid_options/valued[2]="echo '--file,-f=<v>' | comma-options-validate 4 -f -5"
+valid_options/valued[3]="echo '--file,-f=<v>' | comma-options-validate 4 -f -5 6"
+valid_options/valued[4]="echo '--file,-f=<v>' | comma-options-validate -f -5 -"
+valid_options/valued[5]="echo '--file,-f=<v>' | comma-options-validate - -f -5"
+valid_options/equals_sign[0]="echo '--file,-f=<v>' | comma-options-validate -f=-5"
+
+invalid_options/valueless[0]="echo '--verbose,-v' | comma-options-validate -v -g"
+invalid_options/valueless[1]="echo '--verbose,-v' | comma-options-validate hello -g -v"
+invalid_options/valueless[2]="echo '--verbose,-v' | comma-options-validate -v -g world"
+invalid_options/valueless[3]="echo '--verbose,-v' | comma-options-validate -v world -g"
+invalid_options/valued[0]="echo '--file,-f=<v>' | comma-options-validate -g -f 5"
+invalid_options/valued[1]="echo '--file,-f=<v>' | comma-options-validate -f 5 -g"
diff --git a/application/applications/test/comma_options_to_name_value/basic/test b/application/applications/test/comma_options_to_name_value/basic/test
index f59d8cb29..5fb476ae6 100755
--- a/application/applications/test/comma_options_to_name_value/basic/test
+++ b/application/applications/test/comma_options_to_name_value/basic/test
@@ -2,6 +2,6 @@
 
 set -e
 
-echo '--var=[<var>]; default=10; help text' | comma-options-to-name-value "--var=1" | sed 's|"||g; s|^|given_value/|'
-echo '--var=[<var>]; default=10; help text' | comma-options-to-name-value "" | sed 's|"||g; s|^|default_value/|'
+echo '--var=<var>; default=10; help text' | comma-options-to-name-value "--var=1" | sed 's|"||g; s|^|given_value/|'
+echo '--var=<var>; default=10; help text' | comma-options-to-name-value  | sed 's|"||g; s|^|default_value/|'
 
diff --git a/application/applications/test/comma_options_to_name_value/double_quotes/test b/application/applications/test/comma_options_to_name_value/double_quotes/test
index eedda9e75..58da3a61c 100755
--- a/application/applications/test/comma_options_to_name_value/double_quotes/test
+++ b/application/applications/test/comma_options_to_name_value/double_quotes/test
@@ -2,18 +2,18 @@
 
 set -e
 
-echo '--var=[<var>]; default="blah"; help text' | comma-options-to-name-value "" | sed 's|^|basic/|'
-echo '--var=[<var>]; default="blah blah"; help text' | comma-options-to-name-value "" | sed 's|^|space_inside/|'
-echo '--var=[<var>]; default="blah" ; help text' | comma-options-to-name-value "" | sed 's|^|space_outside/|'
-echo '--var=[<var>]; default="blah;blah" ; help text' | comma-options-to-name-value "" | sed 's|^|semicolon_inside/|'
-echo '--var=[<var>]; default="blah"' | comma-options-to-name-value "" | sed 's|^|no_help/basic/|'
-echo '--var=[<var>]; default="blah" ' | comma-options-to-name-value "" | sed 's|^|no_help/space_outside/|'
-echo '--var=[<var>]; default="blah";' | comma-options-to-name-value "" | sed 's|^|no_help/semicolon/|'
+echo '--var=[<var>]; default="blah"; help text' | comma-options-to-name-value | sed 's|^|basic/|'
+echo '--var=[<var>]; default="blah blah"; help text' | comma-options-to-name-value | sed 's|^|space_inside/|'
+echo '--var=[<var>]; default="blah" ; help text' | comma-options-to-name-value | sed 's|^|space_outside/|'
+echo '--var=[<var>]; default="blah;blah" ; help text' | comma-options-to-name-value | sed 's|^|semicolon_inside/|'
+echo '--var=[<var>]; default="blah"' | comma-options-to-name-value | sed 's|^|no_help/basic/|'
+echo '--var=[<var>]; default="blah" ' | comma-options-to-name-value | sed 's|^|no_help/space_outside/|'
+echo '--var=[<var>]; default="blah";' | comma-options-to-name-value | sed 's|^|no_help/semicolon/|'
 
-cat <<END | comma-options-to-name-value "" | sed 's|^|escaped_quotes/|'
+cat <<END | comma-options-to-name-value | sed 's|^|escaped_quotes/|'
 --var=[<var>]; default="blah=\"\$value\""
 END
 
-cat <<END | comma-options-to-name-value "" | sed 's|^|single_quotes/|'
+cat <<END | comma-options-to-name-value | sed 's|^|single_quotes/|'
 --var=[<var>]; default="blah='\$value'"
 END
diff --git a/application/applications/test/comma_options_to_name_value/no_quotes/test b/application/applications/test/comma_options_to_name_value/no_quotes/test
index 759223f7a..5f836cfec 100755
--- a/application/applications/test/comma_options_to_name_value/no_quotes/test
+++ b/application/applications/test/comma_options_to_name_value/no_quotes/test
@@ -2,8 +2,8 @@
 
 set -e
 
-echo '--var=[<var>]; default=10 ; help text' | comma-options-to-name-value "" | sed 's|"||g; s|^|space_with_help/|'
-echo '--var=[<var>]; default=10;' | comma-options-to-name-value "" | sed 's|"||g; s|^|semicolon_no_help/|'
-echo '--var=[<var>]; default=10' | comma-options-to-name-value "" | sed 's|"||g; s|^|no_help/|'
-echo '--var=[<var>]; default=10 ' | comma-options-to-name-value "" | sed 's|"||g; s|^|space_no_help/|'
+echo '--var=[<var>]; default=10 ; help text' | comma-options-to-name-value | sed 's|"||g; s|^|space_with_help/|'
+echo '--var=[<var>]; default=10;' | comma-options-to-name-value | sed 's|"||g; s|^|semicolon_no_help/|'
+echo '--var=[<var>]; default=10' | comma-options-to-name-value | sed 's|"||g; s|^|no_help/|'
+echo '--var=[<var>]; default=10 ' | comma-options-to-name-value | sed 's|"||g; s|^|space_no_help/|'
 
diff --git a/application/applications/test/comma_options_to_name_value/single_quotes/test b/application/applications/test/comma_options_to_name_value/single_quotes/test
index 0aa4c480c..0c8b0a558 100755
--- a/application/applications/test/comma_options_to_name_value/single_quotes/test
+++ b/application/applications/test/comma_options_to_name_value/single_quotes/test
@@ -2,14 +2,14 @@
 
 set -e
 
-echo "--var=[<var>]; default='blah'; help text" | comma-options-to-name-value "" | sed 's|^|basic/|'
-echo "--var=[<var>]; default='blah blah'; help text" | comma-options-to-name-value "" | sed 's|^|space_inside/|'
-echo "--var=[<var>]; default='blah;blah' ; help text" | comma-options-to-name-value "" | sed 's|^|semicolon_inside/|'
-echo "--var=[<var>]; default='blah' ; help text" | comma-options-to-name-value "" | sed 's|^|space_outside/|'
-echo "--var=[<var>]; default='blah'" | comma-options-to-name-value "" | sed 's|^|no_help/basic/|'
-echo "--var=[<var>]; default='blah' " | comma-options-to-name-value "" | sed 's|^|no_help/space_outside/|'
-echo "--var=[<var>]; default='blah';" | comma-options-to-name-value "" | sed 's|^|no_help/semicolon/|'
+echo "--var=[<var>]; default='blah'; help text" | comma-options-to-name-value | sed 's|^|basic/|'
+echo "--var=[<var>]; default='blah blah'; help text" | comma-options-to-name-value | sed 's|^|space_inside/|'
+echo "--var=[<var>]; default='blah;blah' ; help text" | comma-options-to-name-value | sed 's|^|semicolon_inside/|'
+echo "--var=[<var>]; default='blah' ; help text" | comma-options-to-name-value | sed 's|^|space_outside/|'
+echo "--var=[<var>]; default='blah'" | comma-options-to-name-value | sed 's|^|no_help/basic/|'
+echo "--var=[<var>]; default='blah' " | comma-options-to-name-value | sed 's|^|no_help/space_outside/|'
+echo "--var=[<var>]; default='blah';" | comma-options-to-name-value | sed 's|^|no_help/semicolon/|'
 
-cat <<END | comma-options-to-name-value "" | sed 's|^|escaped_quotes/|'
+cat <<END | comma-options-to-name-value | sed 's|^|escaped_quotes/|'
 --var=[<var>]; default='blah="\$value"'
 END
diff --git a/application/applications/test/test b/application/applications/test/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/application/applications/test/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands
diff --git a/application/command_line_options.cpp b/application/command_line_options.cpp
index 831ccef3e..9a3807046 100644
--- a/application/command_line_options.cpp
+++ b/application/command_line_options.cpp
@@ -1,68 +1,105 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
-#include "../string/split.h"
-#include "../application/command_line_options.h"
-#include "../base/exception.h"
-#include <sstream>
+#include <algorithm>
+#include <array>
+#include <functional>
 #include <set>
-#include <boost/bind.hpp>
+#include <sstream>
+#include <unordered_map>
 #include <boost/config/warning_disable.hpp>
+#include <boost/iostreams/stream.hpp>
+#include <boost/iostreams/device/null.hpp>
 #include <boost/optional.hpp>
 #include <boost/regex.hpp>
 #include <boost/spirit/include/qi.hpp>
-#include <boost/unordered_set.hpp>
-
-#include <algorithm>
+#include "../io/impl/filesystem.h"
+#include "../string/split.h"
+#include "command_line_options.h"
 
 namespace comma {
 
-command_line_options::command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage )
+namespace application { namespace detail {
+
+static std::string name;
+static unsigned int verbosity_level{0};
+static bool titlebar_enabled{false};
+static comma::io::terminal::titlebar_ostream titlebar_ostream;
+static boost::iostreams::stream< boost::iostreams::null_sink > null_ostream( ( boost::iostreams::null_sink() ) );
+
+} } // namespace application { namespace detail {
+
+unsigned int verbosity::level() { return comma::application::detail::verbosity_level; }
+
+bool verbosity::titlebar_enabled() { return comma::application::detail::titlebar_enabled; }
+
+unsigned int verbosity::from_string( const std::string& s )
+{
+    return   s == "none"                     ? verbosity::none
+           : s == "low"    || s == "error"   ? verbosity::low
+           : s == "medium" || s == "warning" ? verbosity::medium
+           : s == "high"   || s == "info"    ? verbosity::high
+           : s == "debug"  || s == "extreme" ? verbosity::extreme
+           : boost::lexical_cast< unsigned int >( s );
+}
+
+const std::string verbosity::to_string( unsigned int v )
+{
+    static const std::array< std::string, 5 > s{{ "", "low", "medium", "high", "extreme" }};
+    return v < s.size() ? s[v] : ""; // output lexical cast?
+}
+
+std::string verbosity::usage()
+{
+    const char* s = R"verbosity(verbosity options
+    --titlebar,--tb; output terminal-destined messages to terminal title bar, default: stderr
+    --titlebar-application-name,--tbn; on application start, set terminal title bar to application name
+    --verbose,-v; more output on stderr, same as --verbosity=1
+    --verbosity=<n>; default=0; verbosity level from 0 to 5 or 'none'(0), 'low'|'error'(1), 'medium'|'warning'(2), 'high'|'info'(3), 'extreme'|'debug'(4)
+    -v,-vv,-vvv,-vvvv,-vvvvv; same as --verbosity from 1 to 5
+)verbosity";
+    return s;
+}
+
+std::ostream& say( std::ostream& os, unsigned int verbosity, const std::string& prefix )
+{
+    return ( verbosity > comma::application::detail::verbosity_level ? comma::application::detail::null_ostream : os ) << comma::application::detail::name << ": " << ( prefix.empty() ? std::string() : ( prefix + ": " ) );
+}
+
+comma::io::terminal::titlebar_ostream titlebar() { return comma::application::detail::titlebar_ostream << comma::application::detail::name; }
+
+void command_line_options::_init_verbose( const std::string& path )
+{
+    comma::application::detail::verbosity_level = verbosity::from_string( value< std::string >( "--verbosity", exists( "--verbose,-v" ) ? "1" : "0" ) );
+    static const std::array< std::string, 5 > v{{ "-vvvvv", "-vvvv", "-vvv", "-vv", "-v" }}; // add more verbosity levels if some strange people need them
+    for( unsigned int i = 0; i < v.size() && comma::application::detail::verbosity_level + i < v.size(); ++i )
+    {
+        if( exists( v[i] ) ) { comma::application::detail::verbosity_level = v.size() - i; break; }
+    }
+    comma::verbose.init( comma::application::detail::verbosity_level > 0, path ); // todo: deprecate, use comma::say() and comma::saymore() instead
+    comma::application::detail::name = comma::filesystem::path( path ).filename().string(); // comma::split( path, '/' ).back()
+    comma::application::detail::titlebar_enabled = exists( "--titlebar,--tb" );
+    if( exists( "--titlebar-application-name,--tbn" ) ) { comma::io::terminal::titlebar_ostream s; s << comma::application::detail::name; }
+}
+
+command_line_options::command_line_options( int argc, char ** argv, std::function< void( bool ) > usage, std::function< void( int, char** ) > bash_completion )
 {
     argv_.resize( argc );
     for( int i = 0; i < argc; ++i ) { argv_[i] = argv[i]; }
-    fill_map_( argv_ );
-    bool v=exists("--verbose,-v");
-    comma::verbose.init(v, argv[0]);
-    if( usage && exists( "--help,-h" ) ) { usage( v ); exit( 1 ); }
+    _fill_map( argv_ );
+    _init_verbose( argv[0] );
+    if( bash_completion && exists( "--bash-completion" ) ) { bash_completion( argc, argv ); exit( 0 ); }
+    if( usage && exists( "--help,-h" ) ) { usage( comma::application::detail::verbosity_level > 0 ); exit( 0 ); }
 }
 
-command_line_options::command_line_options( const std::vector< std::string >& argv, boost::function< void( bool ) > usage )
+command_line_options::command_line_options( const std::vector< std::string >& argv, std::function< void( bool ) > usage )
     : argv_( argv )
 {
-    fill_map_( argv_ );
-    bool v=exists("--verbose,-v");
-    comma::verbose.init(v, argv[0]);
-    if( usage && exists( "--help,-h" ) ) { usage( v ); exit( 1 ); }
+    _fill_map( argv_ ); // parse option names and values from argv_
+    _init_verbose( argv[0] ); // verbosity level, application name and titlebar settings
+    if( usage && exists( "--help,-h" ) ) { usage( comma::application::detail::verbosity_level > 0 ); exit( 0 ); } // asking for help is a successful run: exit 0, same as the argc/argv constructor
 }
 
 std::string command_line_options::escaped( const std::string& s ) // quick and dirty
@@ -91,16 +128,15 @@ const std::vector< std::string >& command_line_options::argv() const { return ar
 bool command_line_options::exists( const std::string& name ) const
 {
     std::vector< std::string > names = comma::split( name, ',' );
-    for( std::size_t i = 0; i < names.size(); ++i )
-    {
-        if( map_.find( names[i] ) != map_.end() ) { return true; }
-    }
+    for( const std::string& n: names ) { if( map_.find( n ) != map_.end() ) { return true; } }
     return false;
 }
 
 std::vector< std::string > command_line_options::unnamed( const std::string& valueless_options, const std::string& options_with_values ) const
 {
-    std::vector< std::string > valueless = split( valueless_options, ',' );
+
+    std::vector< std::string > valueless{ "--verbose", "-v", "-vv", "-vvv", "-vvvv", "-vvvvv", "--titlebar", "--tb", "--titlebar-application-name", "--tbn", "" };
+    if( !valueless_options.empty() ) { valueless = split( valueless_options + ",--verbose,-v,-vv,-vvv,-vvvv,-vvvvv,--titlebar,--tb,--titlebar-application-name,--tbn", ',' ); }
     std::vector< std::string > valued = split( options_with_values, ',' );
     std::vector< std::string > w;
     for( unsigned int i = 1; i < argv_.size(); ++i )
@@ -123,13 +159,13 @@ std::vector< std::string > command_line_options::unnamed( const std::string& val
 
 std::vector< std::string > command_line_options::names() const { return names_; }
 
-void command_line_options::fill_map_( const std::vector< std::string >& v )
+void command_line_options::_fill_map( const std::vector< std::string >& v )
 {
     for( std::size_t i = 1; i < v.size(); ++i )
     {
         if( v[i].length() < 2 || v[i].at( 0 ) != '-') { continue; }
         std::string name;
-        boost::optional< std::string > value;
+        boost::optional< std::string > value = comma::silent_none< std::string >();
         std::size_t equal = v[i].find_first_of( '=' );
         if( equal == std::string::npos )
         {
@@ -178,6 +214,17 @@ void command_line_options::assert_mutually_exclusive( const std::string& names )
     }
 }
 
+void command_line_options::assert_exists_if( const std::string& first, const std::string& second ) const
+{
+    if( !exists( first ) ) { return; }
+    for( const auto& o: comma::split( second, ',', true ) )
+    {
+        if( !exists( o ) ) { COMMA_THROW( comma::exception, "if " << first << ", please specify " << o ); }
+    }
+}
+
+void command_line_options::assert_exists( const std::string& names ) const { if( !exists( names ) ) { COMMA_THROW( comma::exception, "please specify one of the following: " << names  ); } }
+
 void command_line_options::assert_mutually_exclusive( const std::string& first, const std::string& second ) const
 {
     const std::vector< std::string >& v = comma::split( first, ',' );
@@ -192,9 +239,16 @@ void command_line_options::assert_valid( const std::vector< description >& d, bo
 {
     for( unsigned int i = 0; i < d.size(); ++i ) { d[i].assert_valid( *this ); }
     if( !unknown_options_invalid ) { return; }
-    boost::unordered_set< std::string > s; // real quick and dirty, just to make it work
-    for( unsigned int i = 0; i < d.size(); ++i ) { for( unsigned int j = 0; j < d[i].names.size(); s.insert( d[i].names[j] ), ++j ); }
-    for( unsigned int i = 0; i < names_.size(); ++i ) { if( s.find( names_[i] ) == s.end() ) { COMMA_THROW( comma::exception, "unknown option " << names_[i] ); } }
+    std::unordered_map< std::string, bool > m; // real quick and dirty, just to make it work
+    for( unsigned int i = 0; i < d.size(); ++i ) { for( unsigned int j = 0; j < d[i].names.size(); ++j ) { m[ d[i].names[j] ] = d[i].has_value; } }
+    for( unsigned int i = 1; i < argv_.size(); ++i ) // walk the raw command line, skipping argv_[0]
+    {
+        std::string option_name = comma::split( argv_[i], '=' )[0]; // drop an inline value, if any: --name=value -> --name
+        if( !boost::regex_match( option_name, boost::regex( "-.+" ) ) ) { continue; } // does not look like an option, e.g. a free argument or a lone '-'
+        auto it = m.find( option_name );
+        if( it == m.end() ) { COMMA_THROW( comma::exception, "unknown option " << option_name ); }
+        if( it->second && argv_[i].find( '=' ) == std::string::npos ) { ++i; } // the next argument is this option's value only when the value was not given inline as --name=value
+    }
 }
 
 namespace impl {
@@ -226,12 +280,12 @@ namespace impl {
         description_t d;
         bool r = boost::spirit::qi::phrase_parse( s.begin()
                                                 , s.end()
-                                                ,      name[ boost::bind( push_back_, boost::ref( d.names ), _1 ) ]
-                                                    >> *( ',' >> name[ boost::bind( push_back_, boost::ref( d.names ), _1 ) ] )
-                                                    >> -( '=' >> ( value[ boost::bind( got_value, boost::ref( d ), _1 ) ]
-                                                                | optional_value[ boost::bind( got_optional_value, boost::ref( d ), _1 ) ] ) )
-                                                    >> -( ';' >> default_value[ boost::bind( got_default_value, boost::ref( d ), _1 ) ] )
-                                                    >> -( ';' >> *( ascii::space ) >> help[ boost::bind( set_, boost::ref( d.help ), _1 ) ] )
+                                                ,      name[ std::bind( push_back_, boost::ref( d.names ), std::placeholders::_1 ) ]
+                                                    >> *( ',' >> name[ std::bind( push_back_, boost::ref( d.names ), std::placeholders::_1 ) ] )
+                                                    >> -( '=' >> ( value[ std::bind( got_value, boost::ref( d ), std::placeholders::_1 ) ]
+                                                                | optional_value[ std::bind( got_optional_value, boost::ref( d ), std::placeholders::_1 ) ] ) )
+                                                    >> -( ';' >> default_value[ std::bind( got_default_value, boost::ref( d ), std::placeholders::_1 ) ] )
+                                                    >> -( ';' >> *( ascii::space ) >> help[ std::bind( set_, boost::ref( d.help ), std::placeholders::_1 ) ] )
                                                     >> qi::eoi
                                                 , ascii::space );
         if( !r ) { COMMA_THROW( comma::exception, "invalid option description: \"" << s << "\"" ); }
diff --git a/application/command_line_options.h b/application/command_line_options.h
index 8fbdf1dff..ea0817879 100644
--- a/application/command_line_options.h
+++ b/application/command_line_options.h
@@ -1,51 +1,70 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_APPLICATION_COMMAND_LINE_OPTIONS_H_
-#define COMMA_APPLICATION_COMMAND_LINE_OPTIONS_H_
+#pragma once
 
+#include <functional>
+#include <iostream>
 #include <map>
 #include <string>
 #include <vector>
-#include <iostream>
-#include <boost/function.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
 #include "../base/exception.h"
+#include "../base/none.h"
+#include "../io/terminal.h"
 #include "../string/string.h"
-#include "verbose.h"
+#include "verbose.h" // todo: deprecate
 
 namespace comma {
 
+struct verbosity
+{
+    enum levels { none=0, low=1, medium=2, high=3, extreme=4 }; // todo: more levels and/or aliases like warning, info, debug - but when choosing names, remember: verbosity is not the same as logging!
+    enum target { stderr=0, terminal=1 }; // NOTE(review): stderr is a macro in <cstdio>; where it does not expand to a plain identifier this enumerator will not compile - confirm on all supported platforms
+    static unsigned int level(); // current verbosity; _COMMA_SAY emits a message only if its level <= this value
+    static bool titlebar_enabled(); // consulted by COMMA_TITLE and COMMA_TITLE_BARE to choose the title bar over stderr
+    static unsigned int from_string( const std::string& s ); // presumably parses a verbosity level from its textual form - definition not visible here, confirm
+    static const std::string to_string( unsigned int v ); // presumably the inverse of from_string - confirm against the implementation
+    static std::string usage(); // presumably help text for the verbosity command line options - confirm against the implementation
+};
+
+/// @example
+///      in my-application:
+///          say() << "some message";
+///      will print on stderr:
+///          my-application: some message
+std::ostream& say( std::ostream& os, unsigned int verbosity=0, const std::string& prefix="" );
+inline std::ostream& say( unsigned int verbosity=0, const std::string& prefix="" ) { return say( std::cerr, verbosity, prefix ); }
+/// set terminal title bar if --tb option present or force set to true
+/// @example
+///     todo
+comma::io::terminal::titlebar_ostream titlebar();
+
+/// convenience macros
+#define _COMMA_SAY( _level, _message ) { if( _level <= ::comma::verbosity::level() ) { ::comma::say( _level ) << _message; } }
+#define COMMA_SAY( message )         _COMMA_SAY( 0,                message << std::endl )
+#define COMMA_SAY_ERROR( message )   _COMMA_SAY( 0, "error:   "   << message << std::endl )
+#define COMMA_SAY_WARN( message )    _COMMA_SAY( 1, "warning: " << message << std::endl )
+#define COMMA_SAY_INFO( message )    _COMMA_SAY( 2, "info:    "    << message << std::endl )
+#define COMMA_SAY_DEBUG( message )   _COMMA_SAY( 3, "debug:   "   << message << std::endl )
+#define COMMA_SAY_TRACE( message )   _COMMA_SAY( 4, "trace:   "   << __FILE__ << ": " << __FUNCTION__ << ": line " << __LINE__ << ": " << message << std::endl ) // level 4: message prefixed with file, function and line
+#define COMMA_TITLE( message )       { if( ::comma::verbosity::titlebar_enabled() ) { auto t = ::comma::titlebar(); t << message; } else { COMMA_SAY( message ); } } // title bar when enabled, otherwise falls back to COMMA_SAY
+#define COMMA_TITLE_BARE( message )  { if( ::comma::verbosity::titlebar_enabled() ) { ::comma::io::terminal::titlebar_ostream t; t << message; } else { std::cerr << message << std::endl; } }
+
+/// convenience alias of say( verbosity )
+/// @example
+///      in my-application
+///          saymore() << "some debug message";
+///          saymore( 2 ) << "some debug message at medium verbosity";
+///          saymore( comma::verbosity::medium ) << "some debug message at medium verbosity";
+///      if run as: my-application --verbose, will print on stderr:
+///          my-application: some debug message
+///      define verbosity level on command line as --verbosity-level=3 or equivalently --vvv
+inline std::ostream& saymore( unsigned int verbosity=comma::verbosity::low ) { return say( verbosity ); }
+    
 /// a simple command line options class
 class command_line_options
 {
@@ -53,18 +72,18 @@ class command_line_options
         /// constructor
         /// if --help,-h present, call usage()
         /// if --verbose,-v present, call usage( verbose )
-        command_line_options( int argc, char ** argv, boost::function< void( bool ) > usage = NULL );
+        command_line_options( int argc, char ** argv, std::function< void( bool ) > usage = nullptr, std::function< void( int, char** ) > bash_completion = nullptr ); // nullptr: empty std::function, i.e. no callback
 
         /// constructor
         /// if --help,-h present, call usage()
         /// if --verbose,-v present, call usage( verbose )
-        command_line_options( const std::vector< std::string >& argv, boost::function< void( bool ) > usage = NULL );
+        command_line_options( const std::vector< std::string >& argv, std::function< void( bool ) > usage = nullptr ); // nullptr: empty std::function, i.e. no usage callback
         
         /// constructor
         /// if --help,-h present, call usage()
         /// if --verbose,-v present, call usage( verbose )
         template< typename Iterator >
-        command_line_options( Iterator begin, Iterator end, boost::function< void( bool ) > usage = NULL );
+        command_line_options( Iterator begin, Iterator end, std::function< void( bool ) > usage = nullptr ); // nullptr: empty std::function, i.e. no usage callback
 
         /// constructor
         command_line_options( const command_line_options& rhs );
@@ -124,6 +143,12 @@ class command_line_options
         
         /// throw, if at least one option from each set is present
         void assert_mutually_exclusive( const std::string& first, const std::string& second ) const;
+        
+        /// throw, if not at least one of options in the list exists, trivial convenience method
+        void assert_exists( const std::string& comma_separated_names ) const;
+
+        /// throw, if first option is present, but any of options in the csv list in second is not
+        void assert_exists_if( const std::string& first, const std::string& second ) const;
 
         /// description
         struct description
@@ -131,7 +156,7 @@ class command_line_options
             std::vector< std::string > names;
             bool is_optional;
             bool has_value;
-            boost::optional< std::string > default_value; // todo: make strongly typed
+            boost::optional< std::string > default_value = comma::silent_none< std::string >(); // todo: make strongly typed
             std::string help;
 
             /// default constructor
@@ -158,25 +183,25 @@ class command_line_options
 
     private:
         typedef std::map< std::string, std::vector< std::string > > map_type_;
-
-        void fill_map_( const std::vector< std::string >& v );
-        template < typename T > static T lexical_cast_( const std::string& s );
-
         std::vector< std::string > argv_;
         map_type_ map_;
         std::vector< std::string > names_;
+        void _fill_map( const std::vector< std::string >& v );
+        void _init_verbose( const std::string& path );
+        template < typename T > static T lexical_cast_( const std::string& s );
+        
 };
 
-template< typename Iterator > inline command_line_options::command_line_options( Iterator begin, Iterator end, boost::function< void( bool ) > usage )
+template< typename Iterator > inline command_line_options::command_line_options( Iterator begin, Iterator end, std::function< void( bool ) > usage )
 {
-    argv_.resize( std::distance( begin, end ) );
-    for ( Iterator i = begin; i < end; ++i ) { argv_[i] = *i; }
-    fill_map_( argv_ );
-    if ( usage && exists( "--help,-h" ) )
+    // copy all arguments; assign() only needs input iterators (e.g. char** or a container's iterators)
+    argv_.assign( begin, end );
+    _fill_map( argv_ );
+    if( usage && exists( "--help,-h" ) )
     {
-        bool v = exists( "--verbose,-v" );
-        comma::verbose.init( v, *begin );
-        usage( v ); exit( 1 );
+        _init_verbose( *begin );
+        usage( verbosity::level() > 0 );
+        exit( 0 );
     }
 }
 
@@ -207,7 +232,7 @@ template < typename T >
 inline boost::optional< T > command_line_options::optional( const std::string& name ) const
 {
     std::vector< T > v = values< T >( name );
-    return v.empty() ? boost::optional< T >() : boost::optional< T >( v[0] );
+    return v.empty() ? comma::silent_none< T >() : boost::optional< T >( v[0] );
 }
 
 template < typename T >
@@ -234,5 +259,3 @@ inline std::vector< T > command_line_options::values( const std::string& name, T
 }
 
 } // namespace comma {
-
-#endif // COMMA_APPLICATION_COMMAND_LINE_OPTIONS_H_
diff --git a/application/signal_flag.h b/application/signal_flag.h
index 62266f636..f9aad6886 100644
--- a/application/signal_flag.h
+++ b/application/signal_flag.h
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -66,8 +38,8 @@ struct signal_flag : public boost::noncopyable
         /// for those who does not like to type
         operator bool() const { return is_set_; }
 
-        /// reset to false
-        void reset() { is_set_ = false; }
+        /// reset to a given value
+        void reset( bool value = false ) { is_set_ = value; }
 
     private:
         static bool is_set_;
diff --git a/application/test/CMakeLists.txt b/application/test/CMakeLists.txt
index 004a6d1e9..4f56b8487 100644
--- a/application/test/CMakeLists.txt
+++ b/application/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT application )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# unit tests of the application kit: one gtest executable, registered with ctest
+set( KIT application )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp ) # NOTE: new *test.cpp files are picked up only on re-configure
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+# link against the kit library under test and googletest
+target_link_libraries( ${test_name} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
+# COMMAND names the executable target, which cmake replaces with the path of the built binary
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# optionally install the test executable
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/application/test/application_test.cpp b/application/test/application_test.cpp
index 037ae84e0..c8d91faea 100644
--- a/application/test/application_test.cpp
+++ b/application/test/application_test.cpp
@@ -1,32 +1,6 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+#include <cmath>
 #include <limits>
 #include <gtest/gtest.h>
 #include "../command_line_options.h"
@@ -63,8 +37,8 @@ TEST( application, command_line_options )
     EXPECT_TRUE( !options.exists( "--d" ) );
     EXPECT_TRUE( options.values< int >( "-x" ).empty() );
     EXPECT_TRUE( options.values< int >( "-x,-y,-z" ).empty() );
-    EXPECT_EQ( options.optional< int >( "-x" ), boost::optional< int >() );
-    EXPECT_EQ( options.optional< int >( "-x,-y,-z" ), boost::optional< int >() );
+    EXPECT_FALSE( bool( options.optional< int >( "-x" ) ) );
+    EXPECT_FALSE( bool( options.optional< int >( "-x,-y,-z" ) ) );
     EXPECT_EQ( options.value< std::string >( "-a" ), "b" );
     EXPECT_EQ( options.value< bool >( "--a" ), true );
     EXPECT_EQ( options.value< int >( "--b" ), 15 );
@@ -118,6 +92,32 @@ TEST( application, unnamed )
             EXPECT_EQ( free[5], "free5" );
         }
     }
+    {
+        std::vector< std::string > argv;
+        argv.push_back( "application" );
+        argv.push_back( "--no-value" );
+        argv.push_back( "--value" );
+        argv.push_back( "some-value" );
+        comma::command_line_options options( argv );
+        {
+            std::vector< std::string > unnamed = options.unnamed( "--no-value", "-.*" );
+            EXPECT_EQ( 0u, unnamed.size() );
+        }
+    }
+    {
+        std::vector< std::string > argv;
+        argv.push_back( "application" );
+        argv.push_back( "unnamed" );
+        argv.push_back( "--no-value" );
+        argv.push_back( "--value" );
+        argv.push_back( "x,y,z" );
+        comma::command_line_options options( argv );
+        {
+            std::vector< std::string > unnamed = options.unnamed( "--no-value", "-.*" );
+            EXPECT_EQ( 1u, unnamed.size() );
+            EXPECT_EQ( "unnamed", unnamed[0] );
+        }
+    }
     // TODO: definitely more tests!
 }
 
@@ -172,7 +172,7 @@ TEST( command_line_options, optional )
         EXPECT_FALSE( bool( d ) );
         boost::optional< double > e = options.value< double >( "--d", std::numeric_limits< double >::quiet_NaN() );
         EXPECT_TRUE( bool( e ) );
-        EXPECT_FALSE( *e == *e );
+        EXPECT_TRUE( !std::numeric_limits< double >::has_quiet_NaN || std::isnan( *e ) ); // EXPECT_FALSE( *e == *e );
     }
 }
 
@@ -180,7 +180,7 @@ TEST( application, command_line_options_description_parsing )
 {
     {
         comma::command_line_options::description d = comma::command_line_options::description::from_string( "--verbose" );
-        EXPECT_EQ( 1, d.names.size() );
+        EXPECT_EQ( 1u, d.names.size() );
         EXPECT_EQ( "--verbose", d.names[0] );
         EXPECT_FALSE( d.has_value );
         EXPECT_TRUE( d.is_optional );
@@ -188,7 +188,7 @@ TEST( application, command_line_options_description_parsing )
     }
     {
         comma::command_line_options::description d = comma::command_line_options::description::from_string( "--verbose,-v" );
-        EXPECT_EQ( 2, d.names.size() );
+        EXPECT_EQ( 2u, d.names.size() );
         EXPECT_EQ( "--verbose", d.names[0] );
         EXPECT_EQ( "-v", d.names[1] );
         EXPECT_FALSE( d.has_value );
@@ -197,7 +197,7 @@ TEST( application, command_line_options_description_parsing )
     }
     {
         comma::command_line_options::description d = comma::command_line_options::description::from_string( "--filename,-f=<filename>; some filename" );
-        EXPECT_EQ( 2, d.names.size() );
+        EXPECT_EQ( 2u, d.names.size() );
         EXPECT_EQ( "--filename", d.names[0] );
         EXPECT_EQ( "-f", d.names[1] );
         EXPECT_TRUE( d.has_value );
@@ -207,7 +207,7 @@ TEST( application, command_line_options_description_parsing )
     }
     {
         comma::command_line_options::description d = comma::command_line_options::description::from_string( "--filename,-f=[<filename>]; some filename" );
-        EXPECT_EQ( 2, d.names.size() );
+        EXPECT_EQ( 2u, d.names.size() );
         EXPECT_EQ( "--filename", d.names[0] );
         EXPECT_EQ( "-f", d.names[1] );
         EXPECT_TRUE( d.has_value );
@@ -226,7 +226,7 @@ void check_default_value( const std::string& line, const std::string& default_va
 {
     typedef comma::command_line_options::description description;
     description d = description::from_string( line );
-    EXPECT_EQ( 2, d.names.size() );
+    EXPECT_EQ( 2u, d.names.size() );
     EXPECT_EQ( "--filename", d.names[0] );
     EXPECT_EQ( "-f", d.names[1] );
     EXPECT_TRUE( d.has_value );
@@ -264,7 +264,7 @@ TEST( application, command_line_options_description_default_values_double_quotes
     check_default_value( "--filename,-f=[<filename>]; default=\"blah=\\\"$var\\\"\" ; some filename", "blah=\"$var\"" );
     check_default_value( "--filename,-f=[<filename>]; default=\"blah with space \"; some filename", "blah with space " );
 }
-    
+
 int main( int argc, char* argv[] )
 {
     ::testing::InitGoogleTest( &argc, argv );
diff --git a/application/verbose.cpp b/application/verbose.cpp
index b1fb2e394..0e6c12257 100644
--- a/application/verbose.cpp
+++ b/application/verbose.cpp
@@ -1,33 +1,7 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2015 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-#include <boost/filesystem.hpp>
+#include "../io/impl/filesystem.h"
+#include "../string/string.h"
 #include "verbose.h"
 
 namespace comma {
@@ -39,10 +13,7 @@ verbose_t::operator bool () const {return enabled_;}
 const std::string& verbose_t::app_name() const {return app_name_;}
 void verbose_t::init(bool enabled, const std::string& argv0)
 {
-    if(!argv0.empty())
-    {
-        app_name_=boost::filesystem::basename(argv0);
-    }
+    if(!argv0.empty()) { app_name_ = comma::filesystem::path(argv0).filename().string(); } // comma::split( argv0, '/' ).back();
     enabled_=enabled;
     start_of_line=true;
 }
@@ -58,4 +29,3 @@ verbose_t& verbose_t::operator<<(std::basic_ostream<char>& (*pf)(std::basic_ostr
 }
 
 }//namespace comma {
-
diff --git a/application/verbose.h b/application/verbose.h
index 296cd1709..b220f0730 100644
--- a/application/verbose.h
+++ b/application/verbose.h
@@ -31,7 +31,6 @@
 
 #include <iostream>
 
-//prototype for comma::verbose
 namespace comma {
 
 //a pseudo ostream for outputing information to stderr
@@ -39,6 +38,7 @@ namespace comma {
 //examples: 
 //  comma::verbose << "hello!" << std::endl;
 //  if (comma::verbose) { std::cerr << comma::verbose.app_name() << "info" << std::endl; }
+/// @deprecated
 class verbose_t
 {
     bool enabled_;
diff --git a/base/CMakeLists.txt b/base/CMakeLists.txt
index edc0331da..9e2cbd69b 100644
--- a/base/CMakeLists.txt
+++ b/base/CMakeLists.txt
@@ -7,11 +7,12 @@ SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 
-INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
-INSTALL(
-    TARGETS ${TARGET_NAME}
-    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
-    LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
-    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
-)
-     
\ No newline at end of file
+install( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+install( TARGETS ${TARGET_NAME}
+         RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime       # .exe, .dll
+         LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime       # .so, mod.dll
+         ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development ) # .a, .lib
+
+if( comma_BUILD_TESTS ) # the test subdirectory is configured only when tests are requested
+    add_subdirectory( test )
+endif()
diff --git a/base/exception.cpp b/base/exception.cpp
new file mode 100644
index 000000000..2cf93c5b9
--- /dev/null
+++ b/base/exception.cpp
@@ -0,0 +1,49 @@
+// Copyright (c) 2011 The University of Sydney
+
+#include "exception.h"
+
+namespace comma {
+
+exception::exception( const char *message, const char *filename, unsigned long line_number, const char *function_name, bool brief ) // brief: leave file/line/function out of what()
+    : std::runtime_error( message ) // NOTE(review): message is used unchecked - presumably callers never pass a null pointer, confirm
+    , _message( message )
+    , _filename( filename )
+    , _line( line_number )
+    , _function( function_name )
+{
+    _formatted_string( brief ); // compose the text returned by what() once, at construction
+}
+
+exception::exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name, bool brief ) // brief: leave file/line/function out of what()
+    : std::runtime_error( message.c_str() )
+    , _message( message )
+    , _filename( filename )
+    , _line( line_number )
+    , _function( function_name )
+{
+    _formatted_string( brief ); // compose the text returned by what() once, at construction
+}
+
+/// @return the complete formatted message composed at construction time
+const char* exception::what() const throw()
+{
+    // c_str() cannot throw (noexcept since c++11), so no fallback string is needed
+    return _formatted_message.c_str();
+}
+
+/// compose the text returned by what(): the error message, plus the throw site unless brief
+void exception::_formatted_string( bool brief )
+{
+    static const char* const rule = "============================================";
+    std::ostringstream text;
+    text << error() << std::endl;
+    if( !brief )
+    {
+        text << rule << std::endl;
+        text << "file: " << _filename << std::endl << "line: " << _line << std::endl;
+        text << "function: " << _function << std::endl << rule << std::endl;
+    }
+    _formatted_message = text.str();
+}
+
+}  // namespace comma
diff --git a/base/exception.h b/base/exception.h
index d6d388ce7..5b92b0e92 100644
--- a/base/exception.h
+++ b/base/exception.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_BASE_EXCEPTION_H
-#define COMMA_BASE_EXCEPTION_H
+#pragma once
 
 #include <stdexcept>
 #include <sstream>
@@ -50,20 +21,24 @@ namespace comma {
 #ifndef COMMA_THROW
 
 #if defined( WIN32 )
-    #define COMMA_THROW_IMPL_( exception, message )      \
-    throw exception( message, __FILE__, __LINE__, __FUNCSIG__ );
+    #define COMMA_THROW_IMPL_( exception, message, brief )      \
+    throw exception( message, __FILE__, __LINE__, __FUNCSIG__, brief );
 #elif defined( __GNUC__ )
-    #define COMMA_THROW_IMPL_( exception, message )      \
-    throw exception( message, __FILE__, __LINE__, __PRETTY_FUNCTION__ );
+    #define COMMA_THROW_IMPL_( exception, message, brief )      \
+    throw exception( message, __FILE__, __LINE__, __PRETTY_FUNCTION__, brief );
 #else
-    #define COMMA_THROW_IMPL_( exception, message )      \
-    throw exception( message, __FILE__, __LINE__, __FUNCTION__ );
+    #define COMMA_THROW_IMPL_( exception, message, brief )      \
+    throw exception( message, __FILE__, __LINE__, __FUNCTION__, brief );
 #endif
 
-#define COMMA_THROW( exception, strmessage ) { std::ostringstream CommaThrowStr##__LINE__; CommaThrowStr##__LINE__ << strmessage;  COMMA_THROW_IMPL_( exception, CommaThrowStr##__LINE__.str() ); }
+#define COMMA_THROW( exception, strmessage ) { std::ostringstream CommaThrowStr##__LINE__; CommaThrowStr##__LINE__ << strmessage;  COMMA_THROW_IMPL_( exception, CommaThrowStr##__LINE__.str(), false ); }
+
+#define COMMA_THROW_BRIEF( exception, strmessage ) { std::ostringstream CommaThrowStr##__LINE__; CommaThrowStr##__LINE__ << strmessage;  COMMA_THROW_IMPL_( exception, CommaThrowStr##__LINE__.str(), true ); }
 
 #define COMMA_THROW_STREAM( exception, strmessage ) COMMA_THROW( exception, strmessage )
 
+#define COMMA_THROW_STREAM_BRIEF( exception, strmessage ) COMMA_THROW_BRIEF( exception, strmessage )
+
 #endif // COMMA_THROW
 
 #ifndef COMMA_RETHROW
@@ -72,111 +47,51 @@ namespace comma {
 
 #endif // COMMA_RETHROW
 
+#define COMMA_ASSERT( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW( comma::exception, "condition: '" << #condition << "' is false; " << strmessage ); } }
+
+#define COMMA_ASSERT_BRIEF( condition, strmessage ) { if( !( condition ) ) { COMMA_THROW_BRIEF( comma::exception, strmessage ); } }
+
+#define COMMA_THROW_IF( condition, strmessage ) { if( condition ) { COMMA_THROW( comma::exception, "throw because condition: '" << #condition << "' is true; " << strmessage ); } }
+
+#define COMMA_THROW_BRIEF_IF( condition, strmessage ) { if( condition ) { COMMA_THROW_BRIEF( comma::exception, strmessage ); } }
+
 class exception : public std::runtime_error
 {
     public:
 
         /// constructor
-        exception( const char *message, const char *filename, unsigned long line_number, const char *function_name );
+        exception( const char *message, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
 
         /// constructor
-        exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name );
+        exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
 
         /// destructor
         virtual ~exception() throw() {}
 
         /// e.what is the complete formatted info
-        const char*     what(void) const throw();
+        const char*     what() const throw();
 
         /// just the error message
-        const char*     error() const;
+        const char*     error() const { return &_message[0]; }
 
         /// filename
-        const char*     file() const;
+        const char*     file() const { return &_filename[0]; }
 
         /// line number
-        unsigned long   line() const;
+        unsigned long   line() const { return _line; }
 
         /// function name
-        const char*     function() const;
+        const char*     function() const { return &_function[0]; }
 
     protected:
 
-        virtual void    formatted_string_();
+        virtual void    _formatted_string( bool brief );
 
-        std::string     m_message;
-        std::string     m_filename;
-        unsigned long   m_line_number;
-        std::string     m_function_name;
-        std::string     m_formatted_message;
+        std::string     _message;
+        std::string     _filename;
+        unsigned long   _line{0};
+        std::string     _function;
+        std::string     _formatted_message;
 };
 
-inline exception::exception( const char *message, const char *filename, unsigned long line_number, const char *function_name ) :
-    std::runtime_error( message ),
-    m_message( message ),
-    m_filename( filename ),
-    m_line_number( line_number ),
-    m_function_name( function_name )
-{
-    formatted_string_();
-}
-
-inline exception::exception( const std::string& message, const char *filename, unsigned long line_number, const char *function_name ) :
-    std::runtime_error( message.c_str() ),
-    m_message( message ),
-    m_filename( filename ),
-    m_line_number( line_number ),
-    m_function_name( function_name )
-{
-    formatted_string_();
-}
-
-inline const char* exception::what(void) const throw()
-{
-    const char * string = "exception::what() m_formatted_message.c_str() threw exception";
-    try
-    {
-      string = m_formatted_message.c_str();
-    }
-    catch( ... )
-    {}
-    return string;
-}
-
-inline const char* exception::error() const
-{
-    return m_message.c_str();
-}
-
-
-inline const char* exception::file() const
-{
-    return m_filename.c_str();
-}
-
-inline unsigned long exception::line() const
-{
-    return m_line_number;
-}
-
-inline const char* exception::function() const
-{
-    return m_function_name.c_str();
-}
-
-inline void exception::formatted_string_()
-{
-    std::ostringstream oss;
-    oss << error() << std::endl
-        << "============================================" << std::endl
-        << "file: "     << m_filename << std::endl
-        << "line: "     << m_line_number << std::endl
-        << "function: " << m_function_name << std::endl
-        << "============================================" << std::endl;
-    m_formatted_message = oss.str();
-}
-
 }  // namespace comma
-
-#endif //COMMA_BASE_EXCEPTION_H
-
diff --git a/base/last_error.cpp b/base/last_error.cpp
index d62ee22fe..f045465c0 100644
--- a/base/last_error.cpp
+++ b/base/last_error.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -67,43 +39,43 @@ std::string last_error::to_string()
 void last_error::to_exception( const std::string& msg )
 {
     #ifdef WIN32
-    switch( value() )
-    {
-        // TODO: add more exceptions
-        case 0: break;
-        case WSAEINTR: COMMA_THROW( last_error::interrupted_system_call_exception, msg );
-        default: COMMA_THROW( last_error::exception, msg );
-    }
+        switch( value() )
+        {
+            // TODO: add more exceptions
+            case 0: break;
+            case WSAEINTR: COMMA_THROW( last_error::interrupted_system_call_exception, msg );
+            default: COMMA_THROW( last_error::exception, msg );
+        }
     #else
-    switch( value() )
-    {
-        // TODO: add more exceptions
-        case 0: break;
-        case EINTR: COMMA_THROW( last_error::interrupted_system_call_exception, msg );
-        default: COMMA_THROW( last_error::exception, msg );
-    };
+        switch( value() )
+        {
+            // TODO: add more exceptions
+            case 0: break;
+            case EINTR: COMMA_THROW( last_error::interrupted_system_call_exception, msg );
+            default: COMMA_THROW( last_error::exception, msg );
+        }
     #endif
 }
 
-last_error::exception::exception( const char* msg, const char *filename, unsigned long line_number, const char *function_name )
-    : comma::exception( std::string( msg ) + ": errno " + boost::lexical_cast< std::string >( last_error::value() ) + " - " + last_error::to_string(), filename, line_number, function_name )
+last_error::exception::exception( const char* msg, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : comma::exception( std::string( msg ) + ": errno " + boost::lexical_cast< std::string >( last_error::value() ) + " - " + last_error::to_string(), filename, line_number, function_name, brief )
 {
     value = last_error::value();
 }
 
-last_error::exception::exception( const std::string& msg, const char *filename, unsigned long line_number, const char *function_name )
-    : comma::exception( msg + ": errno " + boost::lexical_cast< std::string >( last_error::value() ) + " - " + last_error::to_string(), filename, line_number, function_name )
+last_error::exception::exception( const std::string& msg, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : comma::exception( msg + ": errno " + boost::lexical_cast< std::string >( last_error::value() ) + " - " + last_error::to_string(), filename, line_number, function_name, brief )
 {
     value = last_error::value();
 }
 
-last_error::interrupted_system_call_exception::interrupted_system_call_exception( const char* msg, const char *filename, unsigned long line_number, const char *function_name )
-    : last_error::exception( msg, filename, line_number, function_name )
+last_error::interrupted_system_call_exception::interrupted_system_call_exception( const char* msg, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : last_error::exception( msg, filename, line_number, function_name, brief )
 {
 }
 
-last_error::interrupted_system_call_exception::interrupted_system_call_exception( const std::string& msg, const char *filename, unsigned long line_number, const char *function_name )
-    : last_error::exception( msg, filename, line_number, function_name )
+last_error::interrupted_system_call_exception::interrupted_system_call_exception( const std::string& msg, const char *filename, unsigned long line_number, const char *function_name, bool brief )
+    : last_error::exception( msg, filename, line_number, function_name, brief )
 {
 }
 
diff --git a/base/last_error.h b/base/last_error.h
index ddc54c228..da47c2808 100644
--- a/base/last_error.h
+++ b/base/last_error.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_BASE_LAST_ERROR_HEADER
-#define COMMA_BASE_LAST_ERROR_HEADER
+#pragma once
 
 #include <string>
 #include "exception.h"
@@ -65,18 +36,16 @@ struct last_error
 
 struct last_error::exception : public comma::exception
 {
-    exception( const char*, const char *filename, unsigned long line_number, const char *function_name );
-    exception( const std::string&, const char *filename, unsigned long line_number, const char *function_name );
+    exception( const char*, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
+    exception( const std::string&, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
 
     int value;
 };
 
 struct last_error::interrupted_system_call_exception : public last_error::exception
 {
-    interrupted_system_call_exception( const char*, const char *filename, unsigned long line_number, const char *function_name );
-    interrupted_system_call_exception( const std::string&, const char *filename, unsigned long line_number, const char *function_name );
+    interrupted_system_call_exception( const char*, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
+    interrupted_system_call_exception( const std::string&, const char *filename, unsigned long line_number, const char *function_name, bool brief = false );
 };
 
 } // namespace comma {
-
-#endif // #ifndef COMMA_BASE_LAST_ERROR_HEADER
diff --git a/base/none.h b/base/none.h
new file mode 100644
index 000000000..77ef009fe
--- /dev/null
+++ b/base/none.h
@@ -0,0 +1,25 @@
+// Copyright (c) 2022 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <boost/optional.hpp>
+
+namespace comma {
+
+/// convenience type to use e.g. as a "tag" type in template definitions;
+/// boost::none_t cannot be used for that, since it is designed to be
+/// a singleton type and thus is not default-constructible (see
+/// boost/none_t.hpp for details), so it does not compile in some use cases
+struct none {};
+
+/// a quick fix for annoying boost::optional compilation warning
+/// boost::optional< int > i; // gets compile warning when i first dereferenced
+///                           // even if i is initialized for sure somewhere in the code
+/// boost::optional< int > i{boost::none}; // still same compile warning
+/// boost::optional< int > i = comma::silent_none< int >(); // fine, no warning
+template < typename T >
+inline boost::optional< T > silent_none() { return boost::optional< T >( boost::none ); }
+    
+} // namespace comma {
diff --git a/base/optional.h b/base/optional.h
new file mode 100644
index 000000000..475dc3619
--- /dev/null
+++ b/base/optional.h
@@ -0,0 +1,60 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <type_traits>
+#include <utility>
+
+namespace comma {
+
+/// convenience class when std::optional or boost::optional is not enough
+/// e.g. if in visiting we would like to have an explicit is-set flag field
+/// in csv, json, or alike, where it may be essential in fixed-width data
+/// (e.g. csv) where the optional value may or may not be present
+///
+/// value is always constructed, thus T has to be default-constructible;
+/// is_set only tells whether value is meaningful
+template < typename T >
+struct optional
+{
+    /// value-initialized, so that reading value of an unset optional is well-defined
+    T value{};
+
+    /// true, if value has been set by constructor, assignment, or emplace()
+    bool is_set{false};
+
+    /// construct unset optional
+    optional() = default;
+
+    /// construct from value and mark as set
+    optional( const T& t ): value( t ), is_set( true ) {}
+
+    /// construct value from arbitrary constructor arguments and mark as set
+    /// excluded from overload resolution for a single argument of type optional:
+    /// otherwise, copying from a non-const optional would select this constructor
+    /// and initialize value from the source converted to bool
+    template < class Arg, class... Args, typename std::enable_if< sizeof...( Args ) != 0 || !std::is_same< typename std::decay< Arg >::type, optional >::value, int >::type = 0 >
+    optional( Arg&& arg, Args&&... args ): value( std::forward< Arg >( arg ), std::forward< Args >( args )... ), is_set( true ) {}
+
+    /// replace value with T constructed from args and mark as set
+    template < class... Args > void emplace( Args&&... args ) { T t( std::forward< Args >( args )... ); value = std::move( t ); is_set = true; }
+
+    /// assign value and mark as set
+    optional& operator=( const T& rhs ) { value = rhs; is_set = true; return *this; }
+
+    /// mark as not set; value itself is left unchanged
+    void reset() { is_set = false; }
+
+    /// true, if value is set
+    operator bool() const { return is_set; }
+
+    /// unchecked access to value: is_set is not consulted
+    T* operator->() { return &value; }
+    const T* operator->() const { return &value; }
+    T& operator*() { return value; }
+    const T& operator*() const { return value; }
+};
+
+} // namespace comma {
diff --git a/base/test/CMakeLists.txt b/base/test/CMakeLists.txt
new file mode 100644
index 000000000..9fb546dd8
--- /dev/null
+++ b/base/test/CMakeLists.txt
@@ -0,0 +1,10 @@
+# unit tests for the base kit: one gtest executable built from ${SOURCE_CODE_BASE_DIR}/base/test/*test.cpp
+set( KIT base )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} PRIVATE comma_base ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/base/test/base_test.cpp b/base/test/base_test.cpp
new file mode 100644
index 000000000..2a2bb343a
--- /dev/null
+++ b/base/test/base_test.cpp
@@ -0,0 +1,177 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include <array>
+#include <string>
+#include <gtest/gtest.h>
+#include "../exception.h"
+#include "../variant.h"
+
+namespace comma {
+
+TEST( base, exception )
+{
+    COMMA_ASSERT( true, "all good" );
+    COMMA_ASSERT( 2 * 2 == 4, "all good" );
+    EXPECT_THROW( COMMA_ASSERT( false, "all bad" ), comma::exception );
+    EXPECT_THROW( COMMA_ASSERT( 2 * 2 == 5, "all bad" ), comma::exception );
+    COMMA_THROW_IF( false, "all good" );
+    COMMA_THROW_IF( 2 * 2 == 5, "all good" );
+    EXPECT_THROW( COMMA_THROW_IF( true, "all bad" ), comma::exception );
+    EXPECT_THROW( COMMA_THROW_IF( 2 * 2 == 4, "all bad" ), comma::exception );
+}
+
+TEST( base, variant )
+{
+    {
+        comma::impl::variant< int, float, double > v;
+        v.t = 1;
+        v.values.t = 2;
+        v.values.values.t = 3;
+    }
+    {
+        comma::impl::variant< int, float, double > v;
+        EXPECT_FALSE( v );
+        v.set< int >( 5 );
+        EXPECT_TRUE( v );
+        v.reset();
+        EXPECT_FALSE( v );
+        v.set< float >( 5 );
+        EXPECT_TRUE( v );
+        v.reset();
+        EXPECT_FALSE( v );
+        v.set< double >( 5 );
+        EXPECT_TRUE( v );
+        v.reset();
+        EXPECT_FALSE( v );
+    }
+    {
+        comma::impl::variant< int, float, double > v;
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< int >( 5 );
+        EXPECT_EQ( *v.t, 5 );
+        EXPECT_TRUE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< float >( 5 );
+        EXPECT_EQ( *v.values.t, 5 );
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_TRUE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< double >( 5 );
+        EXPECT_EQ( *v.values.values.t, 5 );
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_TRUE( v.is< double >() );
+        v.set< int >( 5 );
+        EXPECT_EQ( *v.t, 5 );
+        EXPECT_TRUE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+    }
+    {
+        comma::variant< int, float, double > v;
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< int >( 5 );
+        EXPECT_EQ( v.get< int >(), 5 );
+        EXPECT_TRUE( v.optional< int >() );
+        EXPECT_FALSE( v.optional< float >() );
+        EXPECT_FALSE( v.optional< double >() );
+        EXPECT_EQ( *v.optional< int >(), 5 );
+        EXPECT_TRUE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< float >( 5 );
+        EXPECT_EQ( v.get< float >(), 5 );
+        EXPECT_FALSE( v.optional< int >() );
+        EXPECT_TRUE( v.optional< float >() );
+        EXPECT_FALSE( v.optional< double >() );
+        EXPECT_EQ( *v.optional< float >(), 5 );
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_TRUE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+        v.set< double >( 5 );
+        EXPECT_EQ( v.get< double >(), 5 );
+        EXPECT_FALSE( v.optional< int >() );
+        EXPECT_FALSE( v.optional< float >() );
+        EXPECT_TRUE( v.optional< double >() );
+        EXPECT_EQ( *v.optional< double >(), 5 );
+        EXPECT_FALSE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_TRUE( v.is< double >() );
+        v.set< int >( 5 );
+        EXPECT_EQ( v.get< int >(), 5 );
+        EXPECT_TRUE( v.optional< int >() );
+        EXPECT_FALSE( v.optional< float >() );
+        EXPECT_FALSE( v.optional< double >() );
+        EXPECT_EQ( v.index(), 0u );
+        EXPECT_EQ( *v.optional< int >(), 5 );
+        EXPECT_TRUE( v.is< int >() );
+        EXPECT_FALSE( v.is< float >() );
+        EXPECT_FALSE( v.is< double >() );
+    }
+    {
+        { auto size = comma::variant< int >::size; EXPECT_EQ( size, 1 ); }
+        { auto size = comma::variant< int, float >::size; EXPECT_EQ( size, 2 ); }
+        { auto size = comma::variant< int, float, double >::size; EXPECT_EQ( size, 3 ); }
+    }
+    {
+        typedef comma::variant< int, float, double > variant_t;
+        EXPECT_EQ( variant_t::index_of< int >(), 0 );
+        EXPECT_EQ( variant_t::index_of< float >(), 1 );
+        EXPECT_EQ( variant_t::index_of< double >(), 2 );
+        variant_t v;
+        EXPECT_EQ( v.index(), 3 );
+        v.set< int >( 5 );
+        EXPECT_EQ( v.index(), 0 );
+        v.set< float >( 5 );
+        EXPECT_EQ( v.index(), 1 );
+        v.set< double >( 5 );
+        EXPECT_EQ( v.index(), 2 );
+        v.reset();
+        EXPECT_EQ( v.index(), 3 );
+    }
+}
+
+TEST( base, named_variant )
+{
+    {
+        struct naming { static std::array< std::string, 3 > names() { return { "a", "b", "c" }; } };
+        typedef comma::named_variant< naming, int, float, double > variant_t;
+        EXPECT_EQ( variant_t::name_of< int >(), "a" );
+        EXPECT_EQ( variant_t::name_of< float >(), "b" );
+        EXPECT_EQ( variant_t::name_of< double >(), "c" );
+    }
+    {
+        struct naming { static std::array< std::string, 3 > names() { return { "a", "b", "c" }; } };
+        comma::named_variant< naming, int, float, double > v;
+        EXPECT_FALSE( v );
+        v.set< int >( 5 );
+        EXPECT_TRUE( v );
+        EXPECT_EQ( v.name(), "a" );
+        v.reset();
+        EXPECT_FALSE( v );
+        v.set< float >( 5 );
+        EXPECT_TRUE( v );
+        EXPECT_EQ( v.name(), "b" );
+        v.reset();
+        EXPECT_FALSE( v );
+        v.set< double >( 5 );
+        EXPECT_TRUE( v );
+        EXPECT_EQ( v.name(), "c" );
+        v.reset();
+        EXPECT_FALSE( v );
+        EXPECT_THROW( v.name(), comma::exception );
+    }
+}
+
+} // namespace comma {
+
+int main( int argc, char* argv[] )
+{    
+    ::testing::InitGoogleTest( &argc, argv );
+    return RUN_ALL_TESTS();
+}
diff --git a/base/types.h b/base/types.h
index 065547899..22f4f1944 100644
--- a/base/types.h
+++ b/base/types.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_BASE_TYPES_H_
-#define COMMA_BASE_TYPES_H_
+#pragma once
 
 #if defined(__linux__) || defined(__APPLE__) || defined(__QNXNTO__)
 #include <arpa/inet.h>
@@ -45,7 +16,7 @@
 
 #include <cmath>
 #include <limits>
-#include <boost/static_assert.hpp>
+#include <type_traits>
 
 namespace comma {
 
@@ -70,12 +41,12 @@ typedef __int32 int32;
 typedef __int64 int64;
 
 // Windows, you know...
-BOOST_STATIC_ASSERT( sizeof( uint16 ) == 2 );
-BOOST_STATIC_ASSERT( sizeof( uint32 ) == 4 );
-BOOST_STATIC_ASSERT( sizeof( uint64 ) == 8 );
-BOOST_STATIC_ASSERT( sizeof( int16 ) == 2 );
-BOOST_STATIC_ASSERT( sizeof( int32 ) == 4 );
-BOOST_STATIC_ASSERT( sizeof( int64 ) == 8 );
+static_assert( sizeof( uint16 ) == 2, "expected uint16 of size 2" );
+static_assert( sizeof( uint32 ) == 4, "expected uint32 of size 4" );
+static_assert( sizeof( uint64 ) == 8, "expected uint64 of size 8" );
+static_assert( sizeof( int16 ) == 2, "expected int16 of size 2" );
+static_assert( sizeof( int32 ) == 4, "expected int32 of size 4" );
+static_assert( sizeof( int64 ) == 8, "expected int64 of size 8" );
 
 #endif
 
@@ -90,5 +61,3 @@ template <> struct integer< 8, true > { typedef comma::int64 type; };
 template <> struct integer< 8, false > { typedef comma::uint64 type; };
 
 } // namespace comma {
-
-#endif /*COMMA_BASE_TYPES_H_*/
diff --git a/base/variant.h b/base/variant.h
new file mode 100644
index 000000000..5d2b822bd
--- /dev/null
+++ b/base/variant.h
@@ -0,0 +1,131 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+// todo
+// #if __cplusplus >= 201703L
+// #include <optional>
+// #else
+// #include <boost/optional.hpp>
+// #endif
+#include <type_traits>
+#include <boost/optional.hpp>
+#include "exception.h"
+
+namespace comma {
+
+// todo
+//   ? use tuple instead?
+//   - check that types don't repeat
+
+namespace impl {
+
+struct type_is_not_on_type_list{}; // quick and dirty, a tag struct
+
+template < typename T, bool B > struct variant_traits;
+
+template < typename T > struct variant_traits< T, false >
+{
+    template < typename S > static void set( boost::optional< T >& t, const S& ) { t.reset(); }
+    template < typename S > static void set( boost::optional< T >& t, const boost::optional< S >& ) { t.reset(); }
+    template < typename S, typename V > static const S& get( const boost::optional< T >&, const V& v ) { return v.template get< S >(); }
+    template < typename S, typename V > static const boost::optional< S >& optional( const boost::optional< T >&, const V& v ) { return v.template optional< S >(); }
+};
+
+template < typename T > struct variant_traits< T, true >
+{
+    template < typename S > static void set( boost::optional< T >& t, const S& s ) { t = s; }
+    template < typename S > static void set( boost::optional< T >& t, const boost::optional< S >& s ) { t = s; }
+    template < typename S, typename V > static const S& get( const boost::optional< T >& t, const V& ) { return *t; }
+    template < typename S, typename V > static const boost::optional< S >& optional( const boost::optional< T >& t, const V& ) { return t; }
+};
+
+template < typename T, typename... Args > struct variant  // todo? use tuple instead?
+{
+    enum { size = variant< Args... >::size + 1 };
+    boost::optional< T > t;
+    variant< Args... > values;
+
+    template < typename S > bool is() const { return ( std::is_same< T, S >::value && bool( t ) ) || values.template is< S >(); }
+    operator bool() const { return bool( t ) || bool( values ); }
+    template < typename S > void set( const S& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); values.set( s ); }
+    template < typename S > void set( const boost::optional< S >& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); values.set( s ); }
+    template < typename S > const S& get() const { return variant_traits< T, std::is_same< T, S >::value >::template get< S >( t, values ); }
+    template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, values ); }
+    void reset() { t.reset(); values.reset(); }
+    template < typename S > static unsigned int rindex() { return std::is_same< T, S >::value ? size - 1 : variant< Args... >::template rindex< S >(); }
+    unsigned int index( unsigned int i = 0 ) const { return t ? i : values.index( i + 1 ); }
+};
+
+template < typename T > struct variant< T >  // todo? use tuple instead?
+{
+    enum { size = 1 };
+    boost::optional< T > t;
+
+    template < typename S > bool is() const { return std::is_same< T, S >::value && bool( t ); }
+    operator bool() const { return bool( t ); }
+    template < typename S > void set( const S& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); }
+    template < typename S > void set( const boost::optional< S >& s ) { variant_traits< T, std::is_same< T, S >::value >::set( t, s ); }
+    template < typename S > const S& get() const { return variant_traits< T, std::is_same< T, S >::value >::template get< S >( t, type_is_not_on_type_list() ); }
+    template < typename S > const boost::optional< S >& optional() const { return variant_traits< T, std::is_same< T, S >::value >::template optional< S >( t, type_is_not_on_type_list() ); }
+    void reset() { t.reset(); }
+    template < typename S > static unsigned int rindex() { bool same_type = std::is_same< T, S >::value; COMMA_ASSERT( same_type, "type not found in type list" ); return 0; }
+    unsigned int index( unsigned int i = 0 ) const { return t ? i : ( i + 1 ); }
+};
+
+} // namespace impl {
+
+/// @example
+///     struct chirp { int a{1}; int b{2}; };
+///     struct whistle { int a{3}; int b{4}; };
+///     struct warble { int x{5}; int y{6}; };
+///     comma::variant< chirp, whistle, warble > sound;
+template < typename... Args >
+class variant
+{
+    public:
+        enum { size = impl::variant< Args... >::size };
+        variant() = default;
+        template < typename S > variant( const S& s ) { set( s ); }
+        template < typename S > bool is() const { return _values.template is< S >(); }
+        operator bool() const { return bool( _values ); }
+        template < typename S > void set( const S& s ) { _values.set( s ); }
+        template < typename S > void set( const boost::optional< S >& s ) { _values.set( s ); }
+        template < typename S > const S& get() const { return _values.template get< S >(); }
+        template < typename S > const boost::optional< S >& optional() const { return _values.template optional< S >(); }
+        void reset() { _values.reset(); }
+        template < typename S > static unsigned int index_of() { return impl::variant< Args... >::size - impl::variant< Args... >::template rindex< S >() - 1; }
+        unsigned int index() const { return _values.index(); }
+    protected:
+        impl::variant< Args... > _values;
+};
+
+/// @example
+///     struct forest
+///     {
+///         struct chirp { int a{1}; int b{2}; };
+///         struct whistle { int a{3}; int b{4}; };
+///         struct warble { int x{5}; int y{6}; };
+///
+///         struct naming { static std::array< std::string, 3 > names() { return { "chirp", "whistle", "warble" }; } };
+///
+///         comma::named_variant< naming, chirp, whistle, warble > sound;
+///     };
+template < typename Names, typename... Args >
+struct named_variant : public variant< Args... >, public Names
+{
+    typedef Names names_t;
+    typedef variant< Args... > variant_t;
+    template < typename S > static auto name_of() { return Names::names()[ variant_t::template index_of< S >() ]; }
+    auto name() const { COMMA_ASSERT( bool( *this ), "asked for name, but value is not set" ); return this->names()[this->index()]; }
+};
+
+template < typename Names >
+struct make_named_variant
+{
+    template < typename... Args > struct variant { typedef named_variant< Names, Args... > type; };
+};
+
+} // namespace comma {
diff --git a/bash/CMakeLists.txt b/bash/CMakeLists.txt
index 49d6ee611..4f3460a12 100644
--- a/bash/CMakeLists.txt
+++ b/bash/CMakeLists.txt
@@ -1,13 +1,13 @@
-INSTALL( PROGRAMS comma-application-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-log-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-name-value-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-progress-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-resources-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-sync-util DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-units-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-application-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-log-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-name-value-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-progress-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-resources-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-sync-util DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-units-util DESTINATION ${comma_INSTALL_BIN_DIR} )
 
 if( comma_BUILD_APPLICATIONS )
     add_subdirectory( applications )
 endif( comma_BUILD_APPLICATIONS )
-ADD_SUBDIRECTORY( process )
-ADD_SUBDIRECTORY( misc )
+add_subdirectory( process )
+add_subdirectory( misc )
diff --git a/bash/applications/comma-call-graph b/bash/applications/comma-call-graph
index 3ebef826a..d9e916ace 100755
--- a/bash/applications/comma-call-graph
+++ b/bash/applications/comma-call-graph
@@ -108,10 +108,10 @@ load_options $@
 
 if [[ $dot_output && $dot_output != "dot" ]]; then
     type -p dot > /dev/null || {
-        echo "$basename requires graphviz"
-        echo "Install on Ubuntu with:"
-        echo "$ sudo apt-get install graphviz"
-        exit
+        echo "$basename: requires graphviz" >&2
+        echo "$basename: install on ubuntu with:" >&2
+        echo "$basename: sudo apt-get install graphviz" >&2
+        exit 1
     }
     output_fn="dot -T$dot_output"
 else
diff --git a/bash/comma-application-util b/bash/comma-application-util
index ab656d7b8..4f6ff584b 100644
--- a/bash/comma-application-util
+++ b/bash/comma-application-util
@@ -1,33 +1,7 @@
 #!/bin/bash
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+# Copyright (c) 2020 Vsevolod Vlaskine
 
 ## @page comma-application-util comma-application-util
 # this script is designed to be included in another script directly, for example:
@@ -43,8 +17,25 @@
 [[ -n "$comma_application_util_include_guard_" ]] && return 0
 readonly comma_application_util_include_guard_=1
 
-source $( type -p comma-name-value-util ) \
-    || { echo "$name: cannot source 'comma-name-value-util' from '$BASH_SOURCE'" >&2; exit 1; }
+source $( type -p comma-name-value-util ) || { echo "$comma_application_name: cannot source 'comma-name-value-util' from '$BASH_SOURCE'" >&2; exit 1; }
+
+## @page comma-source-relative comma-source-relative
+# @section comma-source-relative
+# @description source relative to the location of the calling
+#              script/subshell (a trivial convenience wrapper)
+# @param whitespace-separated relative paths to source
+#        shell glob patterns permitted, e.g. my/sources/*
+#        as well as directory names, e.g. my/sources, which is the
+#        same as my/sources/*
+function comma-source-relative()
+{
+    local s t dir; dir="$( realpath "$( dirname -- "$0" )" )" || return 1 # directory of the calling script; every path below is resolved against it, not against the current directory
+    for s in "$@"; do
+        if [[ -d "$dir/$s" ]]; then for t in "$dir/$s"/*; do [[ -e "$t" ]] || continue; comma-source-relative "${t#"$dir/"}" || return 1; done # directory: source its entries recursively; an empty directory (unmatched glob) is skipped
+        else source "$dir/$s" || return 1; fi # anything else is sourced as a file; stop at the first failure
+    done
+}
+export -f comma-source-relative
 
 ## @page comma_options_from_name_value comma_options_from_name_value
 # @section comma_options_from_name_value
@@ -120,7 +111,7 @@ export -f comma_pretty_description
 
 ## @page comma_options_names comma_options_names
 # @description converts a standard comma description to a list of names
-# 
+#
 # example
 #   description | comma_options_names
 function comma_options_names()
@@ -132,7 +123,7 @@ export -f comma_options_names
 ## @page comma_options_to_bash_completion comma_options_to_bash_completion
 # @description converts a standard comma description to input
 # for the comma bash completion function
-# 
+#
 # example
 #   description | comma_options_to_bash_completion
 function comma_options_to_bash_completion()
@@ -144,7 +135,7 @@ export -f comma_options_to_bash_completion
 ## @page comma_options_select comma_options_select
 # @description after a set of options have been retrieved as paths convert to
 # options format for a child script
-# 
+#
 # example
 #   comma-test-run $( comma-test-run --description | comma-options-to-name-value $@ | comma_name_value_to_options )
 function comma_name_value_to_options()
@@ -229,3 +220,124 @@ function comma_tee_function()
     io-tee "${file_and_options[@]}" "$functions ${functions:+;} $command" "${command_args[@]}"
 }
 export -f comma_tee_function
+
+function comma-application-common-options()
+{
+    # description of the options appended to every application's own options by comma-application-init and comma-application-swiss-init
+    local description='--verbose,-v; output more messages to stderr'
+    printf '%s\n' "$description"
+}
+
+export -f comma-application-common-options
+
+function comma-application-init()
+{
+    # usage: comma-application-init "$@" < <( application options description )
+    # if comma_options_help succeeds: print prologue, usage, options and epilogue to stderr and exit 0; otherwise define say/saymore/verbose/die and set options_<name> and options_unnamed
+    comma_application_name=$( basename "$0" )
+    local common_options=$( cat )
+    if comma_options_help "$@"; then
+        [[ "$( type -t prologue )" != "function" ]] || { echo; prologue; } >&2
+        cat <<eof >&2
+
+usage: $comma_application_name [<options>]
+
+options
+$( ( [[ -z "$common_options" ]] || echo "$common_options"; comma-application-common-options ) | sed 's#^#    #' )
+
+eof
+        [[ "$( type -t epilogue )" != "function" ]] || { epilogue; echo; } >&2
+        exit 0
+    fi
+    function say() { echo "$comma_application_name: $@" >&2; }
+    function saymore() { (( ! options_verbose )) || echo "$comma_application_name: $@" >&2; }
+    function verbose() { (( ! options_verbose )) || echo "$comma_application_name: $@" >&2; }
+    function die() { say "$@"; exit 1; }
+    local options; options=$( ( echo "$common_options"; comma-application-common-options ) | comma-options-to-name-value "$@" ) || die "invalid options"
+    eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )" # NOTE(review): the values end up in eval'ed code; confirm that a value containing a single quote is escaped upstream
+    # unnamed arguments are the lines of $options that start with a double quote: strip the surrounding quotes and keep them in order
+    mapfile -t options_unnamed < <( grep '^"' <<< "$options" | sed -e 's#^"##' -e 's#"$##' )
+}
+
+export -f comma-application-init
+
+function comma-application-swiss-init()
+{
+    # usage: comma-application-swiss-init "$@" < <( common options description )
+    # the first argument is the operation: <operation>-run must be a function, <operation>-options is optional
+    # if comma_options_help succeeds: print the overall usage (operation is --help or -h) or the usage of the given
+    # operation to stderr and exit 0 (exit 1 if that operation cannot be described)
+    # otherwise: define say/saymore/verbose/die, set options_<name> from common and operation options, fill options_unnamed
+    comma_application_name=$( basename "$0" )
+    local common_options=$( cat )
+    [[ -n "$1" ]] || { echo "$comma_application_name: please specify operation" >&2; exit 1; }
+    comma_application_swiss_operation="$1" # todo? quick and dirty, allow --help anywhere on the command line?
+    if comma_options_help "$@"; then
+        if [[ "${comma_application_swiss_operation}" == "--help" || "${comma_application_swiss_operation}" == "-h" ]]; then
+            [[ "$( type -t prologue )" != "function" ]] || { echo; prologue; }
+            echo "$common_options" | comma-application-swiss-usage >&2
+            [[ "$( type -t epilogue )" != "function" ]] || { epilogue; echo; }
+        else
+            { [[ -z "$common_options" ]] || echo "$common_options"; comma-application-common-options; } | comma-application-swiss-usage-operation "${comma_application_swiss_operation}" || exit 1
+            echo
+        fi >&2
+        exit 0
+    fi
+    function say() { echo "$comma_application_name: ${comma_application_swiss_operation}: $@" >&2; }
+    function saymore() { (( ! options_verbose )) || echo "$comma_application_name: ${comma_application_swiss_operation}: $@" >&2; }
+    function verbose() { (( ! options_verbose )) || echo "$comma_application_name: ${comma_application_swiss_operation}: $@" >&2; }
+    function die() { say "$@"; exit 1; }
+    [[ $( type -t "${comma_application_swiss_operation}-run" ) == "function" ]] || die "expected operation, got '${comma_application_swiss_operation}'" # quick and dirty
+    local options_described=$( echo "$common_options"; comma-application-common-options )
+    local options; options=$( comma-options-to-name-value "$@" <<< "$options_described" ) || die "invalid options"
+    eval "$( grep -v '^"' <<< "$options" | sed 's#^#options_#' | comma_path_value_mangle )"
+    if [[ $( type -t "${comma_application_swiss_operation}-options" ) == "function" ]]; then
+        local operation_options_described=$( "${comma_application_swiss_operation}-options" )
+        local operation_options; operation_options=$( comma-options-to-name-value "$@" <<< "$operation_options_described" ) || die "invalid options"
+        eval "$( grep -v '^"' <<< "$operation_options" | sed 's#^#options_#' | comma_path_value_mangle )"
+    fi
+    mapfile -t options_unnamed < <( ( echo "$options_described"; echo "$operation_options_described"; ) | comma-options-to-name-value "$@" | grep '^"' | sed -e 's#^"##' -e 's#"$##' )
+}
+
+export -f comma-application-swiss-init
+
+function comma-application-swiss-usage-operation()
+{
+    local operation="$1" # operation to describe; the common options description is read from stdin
+    [[ $( type -t "${operation}-run" ) == "function" ]] || { echo "$( basename "$0" ): expected operation, got: '${operation}', see --help with no other options for more information" >&2; return 1; } # quick and dirty
+    local common_options=$( cat )
+    local found=0 # becomes 1 once any of <operation>-description, -usage, -options, -examples is defined
+    if [[ -z "$common_options" ]]; then echo "${operation}"; else echo "$( basename "$0" ) ${operation}"; fi # uber quick and dirty for now
+    [[ $( type -t "${operation}-description" ) != "function" ]] || { "${operation}-description" | sed 's#^#    #'; found=1; }
+    if [[ $( type -t "${operation}-usage" ) == "function" ]]; then echo "    usage"; "${operation}-usage" | sed 's#^#        #'; found=1
+    else echo "    usage: $( basename "$0" ) ${comma_application_swiss_operation} [<options>]"; fi # NOTE(review): prints the command-line operation (e.g. --help), not ${operation}; the expected test output pins this text, fix both together
+    [[ -z "$common_options" ]] || { echo "    common options"; echo "$common_options" | sed 's#^#        #'; }
+    [[ $( type -t "${operation}-options" ) != "function" ]] || { echo "    options"; "${operation}-options" | sed 's#^#        #'; found=1; }
+    [[ $( type -t "${operation}-examples" ) != "function" ]] || { echo "    examples"; "${operation}-examples" | sed 's#^#        #'; found=1; }
+    (( ! found )) || return 0
+    echo "$( basename "$0" ): expected operation, got: '${operation}', see --help with no other options for more information" >&2
+    return 1
+}
+
+export -f comma-application-swiss-usage-operation
+
+function comma-application-swiss-usage()
+{
+    local common_options=$( cat ) # common options description comes on stdin
+    echo
+    if [[ $( type -t usage ) == "function" ]]; then usage; else echo "usage: $( basename "$0" ) <operation> <options>"; fi
+    echo; echo "common options"
+    { [[ -z "$common_options" ]] || echo "$common_options"; comma-application-common-options; } | sed 's#^#   #'
+    echo; echo "available operations: ${operations[@]}"
+    echo; echo "operations"
+    local operation; for operation in "${operations[@]}"; do
+        comma-application-swiss-usage-operation "${operation}" < /dev/null | sed 's#^#    #' # empty stdin on purpose: gives the short heading and omits the common options already printed above
+        echo
+    done
+}
+
+export -f comma-application-swiss-usage
+
+function comma-application-swiss-run() { ${comma_application_swiss_operation}-run "$@"; } # call <operation>-run for the operation recorded by comma-application-swiss-init, forwarding all arguments as given
+
+export -f comma-application-swiss-run
diff --git a/bash/comma-name-value-util b/bash/comma-name-value-util
index 450445d90..1774a7478 100644
--- a/bash/comma-name-value-util
+++ b/bash/comma-name-value-util
@@ -39,6 +39,9 @@ readonly comma_name_value_util_include_guard_=1
     || source $( type -p comma-log-util ) \
     || { echo "$name: cannot source 'comma-log-util' from '$BASH_SOURCE'" >&2; exit 1; }
 
+# usage: echo <path-value pairs> | comma_path_value_mangle [<delimiter>] [<default_value>]
+#        <delimiter>: default='_'
+#
 # take path-value pairs, mangle path to turn them into bash
 # expressions, e.g:
 # echo hello/world=5 | comma_path_value_mangle
@@ -53,15 +56,18 @@ readonly comma_name_value_util_include_guard_=1
 # local hello_world="5"
 function comma_path_value_mangle()
 {
-    local delimiter="$1"
+    local delimiter="$1" default_value="$2"
     [[ -n "$delimiter" ]] || delimiter="_"
     local path name value
     while IFS='=' read -r path value || [[ -n "$path" ]]; do
         [[ -n "$path" && ! "$path" =~ ^[#\"] ]] || continue
         name=${path//\//$delimiter}
         name=${name//-/$delimiter}
-        value=${value#\"}
-        value=${value%\"}
+        name=${name//[/$delimiter}
+        name=${name//]/}        # just remove trailing ] since it's always followed by / or the end of the line
+        value="${value#\"}"
+        value="${value%\"}"
+        [[ -n "$value" || -z "$default_value" ]] || value="$default_value"
         echo "$name='$value'"
     done
 }
@@ -267,15 +273,15 @@ function comma_path_value_to_var()
         name=${name//-/$delimiter}
         # we are occasionally passed bad data in JSON etc
         # don't attempt to eval anything that is not a legal variable name
-        [[ "$name" =~ $regex ]] || { echo "comma-application-util: comma_path_value_to_var skipping invalid variable name '$name'" >&2 ; ret_code=1 ; continue ; }
+        [[ "$name" =~ $regex ]] || { echo "comma-name-value-util: comma_path_value_to_var skipping invalid variable name '$name'" >&2 ; ret_code=1 ; continue ; }
         # Strip quotes then add them back. This ensures consistent behaviour.
         value=${value#\"}
         value=\"${value%\"}\"
         eval "$export_variable $name=$value" \
-            || { echo "comma-application-util: comma_path_value_to_var failed '$export_variable $name=$value'" >&2 ; ret_code=1 ; }
+            || { echo "comma-name-value-util: comma_path_value_to_var failed '$export_variable $name=$value'" >&2 ; ret_code=1 ; }
     done
     if (( $ret_code != 0 )) ; then
-        echo "comma-application-util: comma_path_value_to_var encountered an error, callstack:" >&2
+        echo "comma-name-value-util: comma_path_value_to_var encountered an error, callstack:" >&2
         comma_stacktrace >&2
     fi
     return $ret_code
diff --git a/bash/comma-resources-util b/bash/comma-resources-util
index 165b72a0d..85ae2038d 100644
--- a/bash/comma-resources-util
+++ b/bash/comma-resources-util
@@ -168,13 +168,8 @@ export -f comma_queue_is_empty_infile
 # Extract cpu count, cores and sockets from lscpu
 function comma_cpu_resources()
 {
-    local lscpu=$( lscpu --parse )
-    local fields=$( echo "$lscpu" | grep '^#' | tail -1 | sed 's/^[# ]*//' )
-    {
-        # lscpu --parse gives us zero-based indexes. Add one to get the count
-        echo "$lscpu" | tail -1 | csv-shuffle --fields $fields --output CPU,Core,Socket
-        echo "1,1,1"
-    } | csv-calc sum --format 3i | name-value-from-csv --fields cpu,core,socket --prefix cpu
+    local fields='cpu,core,socket'
+    { lscpu --parse="$fields" | grep -v '^#' | tail -n1; echo 1,1,1; } | csv-calc sum --format 3i | name-value-from-csv --fields="$fields" --prefix=cpu
 }
 
 # Output the most commonly used system resources: number of CPUs, total RAM,
diff --git a/bash/process/comma-process-util b/bash/process/comma-process-util
index 011ca4e26..5cec38f29 100755
--- a/bash/process/comma-process-util
+++ b/bash/process/comma-process-util
@@ -454,9 +454,13 @@ declare -r terminate_comma_execute_and_wait
 # @description runs a given command as a background task and waits for it to terminate
 #
 # Usage:
-#   comma_execute_and_wait command[,command2[,command3]] [--signals=signal1,signal2,...] \
+#   comma_execute_and_wait command[ command2[ command3]] [--signals=signal1,signal2,...] \
 #                          [--max-wait=max_wait] [--process|--group] [--any|--all] \
 #                          [--pid-fifo=<named pipe>]
+# Quick example:
+#   function _hello() { echo "hello $1"; }
+#   export -f _hello
+#   comma_execute_and_wait --group "some-command-line-util --some-option" "bash -c _hello world"
 #
 # The function executes the given command(s) (non-option argument) in a background process(es)
 # and waits for its completion (or timeout, see below).
diff --git a/bash/test/comma-application-util/comma-application-init/application b/bash/test/comma-application-util/comma-application-init/application
new file mode 100755
index 000000000..001411dcf
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-init/application
@@ -0,0 +1,24 @@
+#!/bin/bash
+
+source $( type -p comma-application-util )
+
+function prologue() { echo "sample application: print parsed command line option values and exit"; } # printed before the usage on --help
+
+function epilogue() { echo "example: ./application some unnamed --mandatory blah stuff"; } # printed after the options on --help
+
+function options-description()
+{
+    cat <<eof
+--defaulting,-d=<value>; default=hello; default value
+--flag; flag option
+--mandatory,-m=<value>; this is mandatory option
+--optional,-o=[<value>]; this is optional option
+eof
+}
+
+comma-application-init "$@" < <( options-description ) || exit 1 # quoted so that arguments containing whitespace reach the parser intact
+echo "options/defaulting=$options_defaulting"
+echo "options/flag=$options_flag"
+echo "options/mandatory=$options_mandatory"
+echo "options/optional=$options_optional"
+for (( i = 0; i < ${#options_unnamed[@]}; ++i )); do echo "options/unnamed[$i]=${options_unnamed[$i]}"; done
diff --git a/bash/test/comma-application-util/comma-application-init/expected b/bash/test/comma-application-util/comma-application-init/expected
new file mode 100644
index 000000000..c60f7fcb7
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-init/expected
@@ -0,0 +1,61 @@
+help/output/line[0]=""
+help/output/line[1]="sample application: print parsed command line option values and exit"
+help/output/line[2]=""
+help/output/line[3]="usage: application [<options>]"
+help/output/line[4]=""
+help/output/line[5]="options"
+help/output/line[6]="--defaulting,-d=<value>; default=hello; default value"
+help/output/line[7]="--flag; flag option"
+help/output/line[8]="--mandatory,-m=<value>; this is mandatory option"
+help/output/line[9]="--optional,-o=[<value>]; this is optional option"
+help/output/line[10]="--verbose,-v; output more messages to stderr"
+help/output/line[11]=""
+help/output/line[12]="example: ./application some unnamed --mandatory blah stuff"
+help/status=0
+
+options/mandatory[0]/output/line[0]="options/defaulting=hello"
+options/mandatory[0]/output/line[1]="options/flag="
+options/mandatory[0]/output/line[2]="options/mandatory=blah"
+options/mandatory[0]/output/line[3]="options/optional="
+options/mandatory[0]/status=0
+options/mandatory[1]/output=""
+options/mandatory[1]/status=1
+
+options/optional[0]/output/line[0]="options/defaulting=hello"
+options/optional[0]/output/line[1]="options/flag="
+options/optional[0]/output/line[2]="options/mandatory=blah"
+options/optional[0]/output/line[3]="options/optional="
+options/optional[0]/status=0
+options/optional[1]/output/line[0]="options/defaulting=hello"
+options/optional[1]/output/line[1]="options/flag="
+options/optional[1]/output/line[2]="options/mandatory=blah"
+options/optional[1]/output/line[3]="options/optional=bye"
+options/optional[1]/status=0
+
+options/flag[0]/output/line[0]="options/defaulting=hello"
+options/flag[0]/output/line[1]="options/flag="
+options/flag[0]/output/line[2]="options/mandatory=blah"
+options/flag[0]/output/line[3]="options/optional="
+options/flag[0]/status=0
+options/flag[1]/output/line[0]="options/defaulting=hello"
+options/flag[1]/output/line[1]="options/flag=1"
+options/flag[1]/output/line[2]="options/mandatory=blah"
+options/flag[1]/output/line[3]="options/optional="
+options/flag[1]/status=0
+
+options/unnamed[0]/output/line[0]="options/defaulting=hello"
+options/unnamed[0]/output/line[1]="options/flag="
+options/unnamed[0]/output/line[2]="options/mandatory=blah"
+options/unnamed[0]/output/line[3]="options/optional="
+options/unnamed[0]/output/line[4]="options/unnamed[0]=a"
+options/unnamed[0]/output/line[5]="options/unnamed[1]=b"
+options/unnamed[0]/output/line[6]="options/unnamed[2]=c"
+options/unnamed[0]/status=0
+options/unnamed[1]/output/line[0]="options/defaulting=hello"
+options/unnamed[1]/output/line[1]="options/flag=1"
+options/unnamed[1]/output/line[2]="options/mandatory=blah"
+options/unnamed[1]/output/line[3]="options/optional="
+options/unnamed[1]/output/line[4]="options/unnamed[0]=a"
+options/unnamed[1]/output/line[5]="options/unnamed[1]=b"
+options/unnamed[1]/output/line[6]="options/unnamed[2]=c"
+options/unnamed[1]/status=0
diff --git a/bash/test/comma-application-util/comma-application-init/input b/bash/test/comma-application-util/comma-application-init/input
new file mode 100644
index 000000000..9ab3eccd0
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-init/input
@@ -0,0 +1,9 @@
+help="./application -h 2>&1"
+options/mandatory[0]="./application --mandatory blah"
+options/mandatory[1]="./application"
+options/optional[0]="./application --mandatory blah"
+options/optional[1]="./application --mandatory blah --optional bye"
+options/flag[0]="./application --mandatory blah"
+options/flag[1]="./application --mandatory blah --flag"
+options/unnamed[0]="./application a b --mandatory blah c"
+options/unnamed[1]="./application a b --mandatory blah --flag c"
diff --git a/bash/test/comma-application-util/comma-application-swiss-init/application b/bash/test/comma-application-util/comma-application-swiss-init/application
new file mode 100755
index 000000000..bd9db9fb4
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-swiss-init/application
@@ -0,0 +1,24 @@
+#!/bin/bash
+
+source $( type -p comma-application-util )
+
+operations=( lol roll ) # listed by --help; each needs a <name>-run function
+
+function prologue() { echo "sample application: for a given operation, print parsed command line option values and exit"; }
+
+function epilogue() { echo "example: ./application lol"; }
+
+function options-description() { echo "--some-common-option=[<value>]; default=hello; a sample common option"; }
+
+function lol-description() { echo "laugh out loud"; }
+function lol-usage() { echo "specialised usage: ./application lol [<options>]"; }
+function lol-options() { echo "--how-loud=<value>; default=0; how loud to laugh in dB"; }
+function lol-run() { echo "lol/options/how_loud=$options_how_loud"; }
+
+function roll-description() { echo "roll on the floor"; }
+function roll-options() { echo "--screaming; roll on the floor screaming"; }
+function roll-run() { echo "roll/options/screaming=$options_screaming"; }
+
+comma-application-swiss-init "$@" < <( options-description ) || exit 1 # quoted so that arguments containing whitespace reach the parser intact
+echo "options/some_common_option=$options_some_common_option"
+comma-application-swiss-run "$@"
diff --git a/bash/test/comma-application-util/comma-application-swiss-init/expected b/bash/test/comma-application-util/comma-application-swiss-init/expected
new file mode 100644
index 000000000..38c190c8b
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-swiss-init/expected
@@ -0,0 +1,69 @@
+help[0]/output/line[0]=""
+help[0]/output/line[1]="sample application: for a given operation, print parsed command line option values and exit"
+help[0]/output/line[2]=""
+help[0]/output/line[3]="usage: application <operation> <options>"
+help[0]/output/line[4]=""
+help[0]/output/line[5]="common options"
+help[0]/output/line[6]="--some-common-option=[<value>]; default=hello; a sample common option"
+help[0]/output/line[7]="--verbose,-v; output more messages to stderr"
+help[0]/output/line[8]=""
+help[0]/output/line[9]="available operations: lol roll"
+help[0]/output/line[10]=""
+help[0]/output/line[11]="operations"
+help[0]/output/line[12]="lol"
+help[0]/output/line[13]="laugh out loud"
+help[0]/output/line[14]="usage"
+help[0]/output/line[15]="specialised usage: ./application lol [<options>]"
+help[0]/output/line[16]="options"
+help[0]/output/line[17]="--how-loud=<value>; default=0; how loud to laugh in dB"
+help[0]/output/line[18]=""
+help[0]/output/line[19]="roll"
+help[0]/output/line[20]="roll on the floor"
+help[0]/output/line[21]="usage: application --help [<options>]"
+help[0]/output/line[22]="options"
+help[0]/output/line[23]="--screaming; roll on the floor screaming"
+help[0]/output/line[24]=""
+help[0]/output/line[25]="example: ./application lol"
+help[0]/status=0
+
+help[1]/output/line[0]="application lol"
+help[1]/output/line[1]="laugh out loud"
+help[1]/output/line[2]="usage"
+help[1]/output/line[3]="specialised usage: ./application lol [<options>]"
+help[1]/output/line[4]="common options"
+help[1]/output/line[5]="--some-common-option=[<value>]; default=hello; a sample common option"
+help[1]/output/line[6]="--verbose,-v; output more messages to stderr"
+help[1]/output/line[7]="options"
+help[1]/output/line[8]="--how-loud=<value>; default=0; how loud to laugh in dB"
+help[1]/status=0
+
+help[2]/output/line[0]="application roll"
+help[2]/output/line[1]="roll on the floor"
+help[2]/output/line[2]="usage: application roll [<options>]"
+help[2]/output/line[3]="common options"
+help[2]/output/line[4]="--some-common-option=[<value>]; default=hello; a sample common option"
+help[2]/output/line[5]="--verbose,-v; output more messages to stderr"
+help[2]/output/line[6]="options"
+help[2]/output/line[7]="--screaming; roll on the floor screaming"
+help[2]/status=0
+
+help[3]/status=1
+
+run/lol[0]/output/line[0]="options/some_common_option=hello"
+run/lol[0]/output/line[1]="lol/options/how_loud=0"
+run/lol[0]/status=0
+
+run/lol[1]/output/line[0]="options/some_common_option=blah"
+run/lol[1]/output/line[1]="lol/options/how_loud=120"
+run/lol[1]/status=0
+
+run/roll[0]/output/line[0]="options/some_common_option=hello"
+run/roll[0]/output/line[1]="roll/options/screaming="
+run/roll[0]/status=0
+
+run/roll[1]/output/line[0]="options/some_common_option=hello"
+run/roll[1]/output/line[1]="roll/options/screaming=1"
+run/roll[1]/status=0
+
+run/fall[0]/output=""
+run/fall[0]/status=1
diff --git a/bash/test/comma-application-util/comma-application-swiss-init/input b/bash/test/comma-application-util/comma-application-swiss-init/input
new file mode 100644
index 000000000..2aa5d0237
--- /dev/null
+++ b/bash/test/comma-application-util/comma-application-swiss-init/input
@@ -0,0 +1,10 @@
+help[0]="./application --help 2>&1"
+help[1]="./application lol --help 2>&1"
+help[2]="./application roll --help 2>&1"
+help[3]="./application fall --help 2>&1"
+
+run/lol[0]="./application lol"
+run/lol[1]="./application lol --some-common-option blah --how-loud=120"
+run/roll[0]="./application roll"
+run/roll[1]="./application roll --screaming"
+run/fall[0]="./application fall"
diff --git a/bash/test/comma-application-util/comma-source-relative/a/b/x b/bash/test/comma-application-util/comma-source-relative/a/b/x
new file mode 100644
index 000000000..b2b26ad4d
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/a/b/x
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+echo "a/b/x/sourced=1"
diff --git a/bash/test/comma-application-util/comma-source-relative/a/b/y b/bash/test/comma-application-util/comma-source-relative/a/b/y
new file mode 100644
index 000000000..57886fadc
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/a/b/y
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+echo "a/b/y/sourced=1"
diff --git a/bash/test/comma-application-util/comma-source-relative/a/z b/bash/test/comma-application-util/comma-source-relative/a/z
new file mode 100644
index 000000000..c117c82e6
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/a/z
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+echo "a/z/sourced=1"
diff --git a/bash/test/comma-application-util/comma-source-relative/expected b/bash/test/comma-application-util/comma-source-relative/expected
new file mode 100644
index 000000000..930585d1c
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/expected
@@ -0,0 +1,13 @@
+once/a/b/x/sourced=1
+multiple/a/b/x/sourced=1
+multiple/a/b/y/sourced=1
+multiple/a/z/sourced=1
+wildcard/a/b/x/sourced=1
+wildcard/a/b/y/sourced=1
+directory/a/b/x/sourced=1
+directory/a/b/y/sourced=1
+directories/a/b/x/sourced=1
+directories/a/b/y/sourced=1
+directories/a/b/x/sourced=1
+directories/a/b/y/sourced=1
+directories/a/z/sourced=1
diff --git a/bash/test/comma-application-util/comma-source-relative/test b/bash/test/comma-application-util/comma-source-relative/test
new file mode 100755
index 000000000..5b8a9e95c
--- /dev/null
+++ b/bash/test/comma-application-util/comma-source-relative/test
@@ -0,0 +1,9 @@
+#!/bin/bash
+
+source ../../../comma-application-util || exit 1 # library under test, taken by relative path rather than looked up on PATH
+
+comma-source-relative a/b/x | sed 's#^#once/#' # a single file
+comma-source-relative a/b/x a/b/y a/z | sed 's#^#multiple/#' # several files, sourced in the order given
+comma-source-relative a/b/* | sed 's#^#wildcard/#' # the glob is expanded by this shell before the call
+comma-source-relative a/b | sed 's#^#directory/#' # a directory: its entries are sourced
+comma-source-relative a/b a | sed 's#^#directories/#' # a/b is sourced twice: once directly and once while recursing into a
diff --git a/bash/test/comma_status_ok/expected b/bash/test/comma-application-util/comma_status_ok/expected
similarity index 100%
rename from bash/test/comma_status_ok/expected
rename to bash/test/comma-application-util/comma_status_ok/expected
diff --git a/bash/test/comma_status_ok/test b/bash/test/comma-application-util/comma_status_ok/test
similarity index 100%
rename from bash/test/comma_status_ok/test
rename to bash/test/comma-application-util/comma_status_ok/test
diff --git a/bash/test/comma_background/signature/args/expected b/bash/test/comma_background/signature/args/expected
index 4e62e0068..5acb607de 100644
--- a/bash/test/comma_background/signature/args/expected
+++ b/bash/test/comma_background/signature/args/expected
@@ -1,5 +1,7 @@
 #python
 
+from functools import reduce
+
 # iterate through a path of attributes: "obj/data/member/value"
 def deepgetattr(obj, attr):
     """Recurses through an attribute chain to get the ultimate value."""
diff --git a/bash/test/comma_background/signature/basic/test b/bash/test/comma_background/signature/basic/test
index ad66984bf..f7bad1464 100755
--- a/bash/test/comma_background/signature/basic/test
+++ b/bash/test/comma_background/signature/basic/test
@@ -19,7 +19,7 @@ echo "clock_ticks_per_second=$ticks"
 comma_process_exec_and_validate "$fifo" sleep 100 || { echo "$scriptname: fatal system error, wrong background PID" >&2; exit 1; }
 background_pid=$!
 
-now=$( python -c "import sys; from numpy import int64; a = sys.stdin.readline().split()[0]; print int64(float(a) * $ticks)" < /proc/uptime )
+now=$( python3 -c "import sys; from numpy import int64; a = sys.stdin.readline().split()[0]; print( int64(float(a) * $ticks) )" < /proc/uptime )
 echo "time/now=$now"
 
 signature=$( comma_process_signature "$background_pid" )
diff --git a/bash/test/comma_name_value_to_options/expected b/bash/test/comma_name_value_to_options/expected
index 28464c9e2..b45350421 100644
--- a/bash/test/comma_name_value_to_options/expected
+++ b/bash/test/comma_name_value_to_options/expected
@@ -6,10 +6,16 @@ basic[4]/text=""
 basic[5]/text=""
 basic[6]/text="----hello_world=1 "
 multi[0]/text="--hello_world=1 --hello=world --hello=world ----hello_world=1 "
-co_to_nv[0]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
-co_to_nv[1]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
-co_to_nv[2]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
-co_to_nv[3]/text="debug=|1|@directory=|\|/tmp\||@verbose=|1|@"
+
+#co_to_nv[0]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
+#co_to_nv[1]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
+#co_to_nv[2]/text="debug=|1|@directory=|/tmp|@verbose=|1|@"
+#co_to_nv[3]/text="debug=|1|@directory=|\|/tmp\||@verbose=|1|@"
+co_to_nv[0]/text="debug=__quote__1__quote__&directory=__quote__/tmp__quote__&verbose=__quote__1__quote__&"
+co_to_nv[1]/text="debug=__quote__1__quote__&directory=__quote__/tmp__quote__&verbose=__quote__1__quote__&"
+co_to_nv[2]/text="debug=__quote__1__quote__&directory=__quote__/tmp__quote__&verbose=__quote__1__quote__&"
+co_to_nv[3]/text="debug=__quote__1__quote__&directory=__quote____backslash__quote__/tmp__backslash__quote____quote__&verbose=__quote__1__quote__&"
+
 cnv_to_o[0]/text="--debug=1 --directory=/tmp --verbose=1 "
 cnv_to_o[1]/text="--debug=1 --directory=/tmp --verbose=1 "
 cnv_to_o[2]/text="--debug=1 --directory=/tmp --verbose=1 "
diff --git a/bash/test/comma_name_value_to_options/test b/bash/test/comma_name_value_to_options/test
index e8c1f5369..7e549281c 100755
--- a/bash/test/comma_name_value_to_options/test
+++ b/bash/test/comma_name_value_to_options/test
@@ -58,6 +58,8 @@ echo '--debug; much more debug output
 --verbose,-v; more output'
 }
 
+function escape() { sed -e 's#"#__quote__#g' -e 's#\\#__backslash#g' | tr '\n' '&'; }
+
 echo "basic[0]/text=\"$( comma_name_value_to_options <<< 'hello world' )\""
 echo "basic[1]/text=\"$( comma_name_value_to_options <<< 'hello_world=1' )\""
 echo "basic[2]/text=\"$( comma_name_value_to_options <<< 'hello=world' )\""
@@ -73,14 +75,14 @@ hello="world"
 hello_world
 --hello_world=1' | tr '\n' '@' )\""
 
-echo "co_to_nv[0]/text=\"$( command_description | comma-options-to-name-value --directory "/tmp" --debug --verbose | tr '\n' '@' | tr '"' '|' )\""
-echo "co_to_nv[1]/text=\"$( command_description | comma-options-to-name-value --directory="/tmp" --debug --verbose | tr '\n' '@' | tr '"' '|' )\""
-echo "co_to_nv[2]/text=\"$( command_description | comma-options-to-name-value "--directory=/tmp" --debug --verbose | tr '\n' '@' | tr '"' '|' )\""
-echo "co_to_nv[3]/text=\"$( command_description | comma-options-to-name-value '--directory="/tmp"' --debug --verbose | tr '\n' '@' | tr '"' '|' )\""
+echo "co_to_nv[0]/text=\"$( command_description | comma-options-to-name-value --directory "/tmp"   --debug --verbose | escape )\""
+echo "co_to_nv[1]/text=\"$( command_description | comma-options-to-name-value --directory="/tmp"   --debug --verbose | escape )\""
+echo "co_to_nv[2]/text=\"$( command_description | comma-options-to-name-value "--directory=/tmp"   --debug --verbose | escape )\""
+echo "co_to_nv[3]/text=\"$( command_description | comma-options-to-name-value '--directory="/tmp"' --debug --verbose | escape )\""
 
-echo "cnv_to_o[0]/text=\"$( command_description | comma-options-to-name-value --directory "/tmp" --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
-echo "cnv_to_o[1]/text=\"$( command_description | comma-options-to-name-value --directory="/tmp" --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
-echo "cnv_to_o[2]/text=\"$( command_description | comma-options-to-name-value "--directory=/tmp" --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
+echo "cnv_to_o[0]/text=\"$( command_description | comma-options-to-name-value --directory "/tmp"   --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
+echo "cnv_to_o[1]/text=\"$( command_description | comma-options-to-name-value --directory="/tmp"   --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
+echo "cnv_to_o[2]/text=\"$( command_description | comma-options-to-name-value "--directory=/tmp"   --debug --verbose | comma_name_value_to_options | tr '"' '|' )\""
 
 comma_name_value_to_options <<< 'directory=/tmp
 verbose="1"
diff --git a/bash/test/comma_name_value_util/comma_path_value_mangle/expected b/bash/test/comma_name_value_util/comma_path_value_mangle/expected
index 7c500cc85..59c377d89 100644
--- a/bash/test/comma_name_value_util/comma_path_value_mangle/expected
+++ b/bash/test/comma_name_value_util/comma_path_value_mangle/expected
@@ -4,3 +4,14 @@ basic/var_b='22'
 no_newline_at_end/var_a=basic/var_a
 no_newline_at_end/var_b=basic/var_b
 
+path/a_b_c='1'
+dashes/a_b_c='1'
+path_with_dashes/a_b_c='1'
+subscript/a_b_0='1'
+subscript_followed_by_path/a_b_0_c='1'
+a="123"
+b="123"
+c="123"
+
+skip_empty_lines_n='a'
+skip_empty_lines_v='b'
diff --git a/bash/test/comma_name_value_util/comma_path_value_mangle/test b/bash/test/comma_name_value_util/comma_path_value_mangle/test
index e619aa266..be4561030 100755
--- a/bash/test/comma_name_value_util/comma_path_value_mangle/test
+++ b/bash/test/comma_name_value_util/comma_path_value_mangle/test
@@ -7,6 +7,18 @@ input="var_a=21
 var_b=22"
 
 echo "$input" | comma_path_value_mangle | sed 's|^|basic/|'
-
 echo -n "$input" | comma_path_value_mangle | sed 's|^|no_newline_at_end/|'
+echo "a/b/c=1" | comma_path_value_mangle | sed 's|^|path/|'
+echo "a-b-c=1" | comma_path_value_mangle | sed 's|^|dashes/|'
+echo "a/b-c=1" | comma_path_value_mangle | sed 's|^|path_with_dashes/|'
+echo "a/b[0]=1" | comma_path_value_mangle | sed 's|^|subscript/|'
+echo "a/b[0]/c=1" | comma_path_value_mangle | sed 's|^|subscript_followed_by_path/|'
+( echo a; echo b; echo c ) | comma_path_value_mangle '_' 123
+
+cat <<eof | comma_path_value_mangle
+
+skip_empty_lines/n=a
+
+skip_empty_lines/v=b
 
+eof
\ No newline at end of file
diff --git a/bash/test/examples/expected b/bash/test/examples/expected
new file mode 100644
index 000000000..2027deaff
--- /dev/null
+++ b/bash/test/examples/expected
@@ -0,0 +1,4 @@
+hello/world/output="hello world"
+hello/world/status=0
+hello/jimmy/output="hello jimmy"
+hello/jimmy/status=0
\ No newline at end of file
diff --git a/bash/test/examples/input b/bash/test/examples/input
new file mode 100644
index 000000000..e58f29871
--- /dev/null
+++ b/bash/test/examples/input
@@ -0,0 +1,2 @@
+hello/world="some-function world"
+hello/jimmy="some-function jimmy"
\ No newline at end of file
diff --git a/bash/test/examples/my-util b/bash/test/examples/my-util
new file mode 100644
index 000000000..b27a99881
--- /dev/null
+++ b/bash/test/examples/my-util
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+function some-function() { echo "hello $1"; } # example utility: prints "hello " followed by its first argument
\ No newline at end of file
diff --git a/bash/test/examples/test b/bash/test/examples/test
new file mode 100755
index 000000000..d692563aa
--- /dev/null
+++ b/bash/test/examples/test
@@ -0,0 +1,4 @@
+#!/bin/bash
+source $( type -p comma-test-util ) # test framework stuff: locate comma-test-util on PATH and source it
+source my-util # bash utils under test, sourced relative to the current directory
+comma_test_commands # execute tests defined in the file called 'input' and match output against values in the file called 'expected'
diff --git a/bash/test/test b/bash/test/test
new file mode 100755
index 000000000..bff14d7ad
--- /dev/null
+++ b/bash/test/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+source $( type -p comma-test-util ) # test framework stuff: locate comma-test-util on PATH and source it
+comma_test_commands # execute tests defined in the file called 'input' and match output against values in the file called 'expected'
diff --git a/containers/CMakeLists.txt b/containers/CMakeLists.txt
index 1506e39fb..1e9d5a730 100644
--- a/containers/CMakeLists.txt
+++ b/containers/CMakeLists.txt
@@ -1,16 +1,19 @@
 SET( PROJECT "containers" )
-SET( TARGET_NAME comma${PROJECT} )
+SET( TARGET_NAME comma_${PROJECT} )
 
 FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
+FILE( GLOB multidimensional_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/multidimensional/*.h )
+FILE( GLOB ordered_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/ordered/*.h )
 
-SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
-
-add_custom_target( ${TARGET_NAME} ${source} ${includes} ) # ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
+SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${multidimensional_includes} ${ordered_includes} )
+add_custom_target( ${TARGET_NAME} ${source} ${includes} ${multidimensional_includes} ${ordered_includes} ) # ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_includes} )
 #SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
 #TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_base )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+INSTALL( FILES ${multidimensional_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/multidimensional )
+INSTALL( FILES ${ordered_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ordered )
 #INSTALL(
 #    TARGETS ${TARGET_NAME}
 #    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
@@ -18,6 +21,10 @@ INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 #    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
 #)
 
-IF( comma_BUILD_TESTS )
-    ADD_SUBDIRECTORY( test )
-ENDIF( comma_BUILD_TESTS )
+if( comma_BUILD_TESTS )
+    add_subdirectory( test )
+endif( comma_BUILD_TESTS )
+
+if( comma_BUILD_APPLICATIONS )
+    add_subdirectory( applications )
+endif( comma_BUILD_APPLICATIONS )
diff --git a/containers/applications/CMakeLists.txt b/containers/applications/CMakeLists.txt
new file mode 100644
index 000000000..a7433d78c
--- /dev/null
+++ b/containers/applications/CMakeLists.txt
@@ -0,0 +1,7 @@
+set( dir ${SOURCE_CODE_BASE_DIR}/containers/applications ) # NOTE(review): dir is not referenced anywhere else in this file
+
+add_executable( math-lookup math-lookup.cpp ) # todo! should math-lookup be here at all? does it create circular dependencies?
+#add_dependencies( math-lookup comma_containers )
+target_link_libraries( math-lookup ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_name_value comma_csv comma_string )
+set_target_properties( math-lookup PROPERTIES LINK_FLAGS_RELEASE -s ) # -s is passed to the linker in Release builds only (GNU-style linkers: strip symbols)
+install( TARGETS math-lookup RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/containers/applications/math-lookup.cpp b/containers/applications/math-lookup.cpp
new file mode 100644
index 000000000..fd8886204
--- /dev/null
+++ b/containers/applications/math-lookup.cpp
@@ -0,0 +1,250 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#include <fstream>
+#include <iostream>
+#include <memory>
+#include "../../application/command_line_options.h"
+#include "../../base/exception.h"
+#include "../../csv/stream.h"
+#include "../../csv/traits.h"
+#include "../../name_value/parser.h"
+#include "../multidimensional/array.h"
+#include "../multidimensional/traits.h"
+
+void usage( bool verbose ) // prints help to stderr and terminates the process; verbose is forwarded to comma::csv::options::usage()
+{
+    std::cerr << "operations on a multidimensional lookup table" << std::endl;
+    std::cerr << "lookup tables with up to 4-dimension" << std::endl;
+    std::cerr << "values are currently supported; if you need more, just ask" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: cat input.csv | math-lookup <operation> [<lut-filename>[;<lut-csv-options>]] <options>" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations" << std::endl;
+    std::cerr << "    index: todo: output index for a given input" << std::endl;
+    std::cerr << "    interpolate: output interpolated value for the given input" << std::endl;
+    std::cerr << "    nearest: todo: output table element index and value nearest to the given input" << std::endl;
+    std::cerr << "    query: output table element index and value for the given input" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --origin,-o=<point>; e.g: --origin=0,1,2,3" << std::endl;
+    std::cerr << "    --resolution,-r=<point>; e.g: --resolution=0.5,3,2,3" << std::endl;
+    std::cerr << "    --shape=<point>; e.g: --shape=3,2,5,3, same as in numpy" << std::endl;
+    std::cerr << "                     i.e. shape[0] is the slowest-changing" << std::endl;
+    std::cerr << "                     i.e. expected lookup table memory layout" << std::endl;
+    std::cerr << "                     is rows first" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "input/output options" << std::endl;
+    std::cerr << "    --input-fields; todo: print input fields for an operation to stdout and exit" << std::endl;
+    std::cerr << "    --output-fields; todo: print output fields for an operation to stdout and exit" << std::endl;
+    std::cerr << "    --output-format; todo: print output format for an operation to stdout and exit" << std::endl;
+    std::cerr << "    --permissive; discard inputs outside lookup table" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << std::endl;
+    exit( 0 ); // asking for help is not an error: exit status 0
+}
+
+// todo
+// - 1-dimensional: fix
+// - nearest: fix
+// - regression test: basics
+
+static bool permissive{false}; // set from --permissive in main(); when true, lut::run() discards inputs outside the grid instead of failing
+static bool verbose{false}; // set from --verbose,-v in main(); NOTE(review): not read anywhere in the visible code of this file
+
+// template< typename T, std::size_t D, typename S >
+// std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] *= rhs; } return lhs; } // quick and dirty; let compiler optimize
+
+// template< typename T, std::size_t D, typename S >
+// std::array< T, D > operator*( const std::array< T, D >& lhs, const S& rhs ) { auto r = lhs; r *= rhs; return r; }
+
+// template< typename T, std::size_t D >
+// std::array< T, D >& operator+=( std::array< T, D >& lhs, const std::array< T, D >& rhs ) { for( unsigned int i = 0; i < D; ++i ) { lhs[i] += rhs[i]; } return lhs; } // quick and dirty; let compiler optimize
+
+// template< typename T, std::size_t D >
+// std::array< T, D > operator+( const std::array< T, D >& lhs, const std::array< T, D >& rhs ) { auto r = lhs; r += rhs; return r; }
+
+template< typename T, std::size_t D > // streams the elements of rhs separated by commas, with no trailing delimiter
+std::ostream& operator<<( std::ostream& os, const std::array< T, D >& rhs ) { std::string delimiter; for( std::size_t k = 0; k < D; ++k ) { os << delimiter << rhs[k]; delimiter = ","; } return os; }
+
+namespace comma { namespace applications { namespace lookup { namespace operations {
+
+template< typename T, std::size_t D > // wraps a std::array in a struct with a single member "point", the name under which it is visited for csv
+struct _array { std::array< T, D > point; };
+
+template < typename T, std::size_t D, std::size_t E > // T: scalar type stored in the table; D: number of table dimensions; E: number of scalars per table cell
+struct lut
+{
+    typedef std::array< double, D > point_t;
+    typedef comma::containers::multidimensional::index< D > index_t; // typedef std::array< std::size_t, D > index_t;
+    typedef std::array< T, E > value_t;
+    typedef comma::containers::multidimensional::grid< value_t, D, point_t > grid_t;
+    typedef _array< double, D > input_t;
+    typedef _array< T, D > output_t;
+    /// fill g from the binary file csv.filename; asserts that the file opens and holds at least as many bytes as the grid needs
+    static grid_t& load( grid_t& g, const comma::csv::options& csv )
+    {
+        std::ifstream ifs( csv.filename, std::ios::binary );
+        COMMA_ASSERT_BRIEF( ifs.is_open(), "lookup table: failed to open '" << csv.filename << "'" );
+        std::size_t size = g.data().size() * sizeof( T ) * E; // each grid cell holds E scalars of type T
+        ifs.read( reinterpret_cast< char* >( &g.data()[0] ), size );
+        COMMA_ASSERT_BRIEF( ifs.gcount() > 0, "lookup table: failed to read from '" << csv.filename << "'" );
+        COMMA_ASSERT_BRIEF( std::size_t( ifs.gcount() ) == size, "lookup table: on file '" << csv.filename << "': expected " << size << " bytes; got: " << ifs.gcount() );
+        return g;
+    }
+    /// return g.index_of( p ) paired with the value interpolated at p
+    static std::pair< index_t, value_t > interpolate( const grid_t& g, const point_t& p )
+    {
+        std::pair< index_t, value_t > r;
+        r.first = g.index_of( p );
+        r.second = g.interpolated( p );
+        return r;
+    }
+    /// return g.nearest_to( p ) paired with the value stored there; currently not reachable through run(), which rejects "nearest" as todo
+    static std::pair< index_t, value_t > nearest( const grid_t& g, const point_t& p )
+    {
+        std::pair< index_t, value_t > r;
+        r.first = g.nearest_to( p );
+        r.second = g[r.first];
+        return r;
+    }
+    /// return g.index_of( p ) paired with the value stored at that index
+    static std::pair< index_t, value_t > query( const grid_t& g, const point_t& p )
+    {
+        std::pair< index_t, value_t > r;
+        r.first = g.index_of( p );
+        r.second = g[r.first];
+        return r;
+    }
+    /// load the table, then apply operation to each point read from stdin; returns 0 on success, 1 on an input outside the grid unless permissive
+    static int run( const std::string& operation
+                  , const comma::csv::options& csv
+                  , const comma::csv::options& lut_csv
+                  , const std::vector< double >& origin
+                  , const std::vector< double >& resolution
+                  , const std::vector< std::size_t >& shape )
+    {
+        std::pair< index_t, value_t > ( *f )( const grid_t&, const point_t& ); // assigned in every branch below that does not throw
+        if( operation == "interpolate" ) { f = lut< T, D, E >::interpolate; }
+        else if( operation == "nearest" ) { COMMA_THROW_BRIEF( comma::exception, "nearest: todo" ); } //else if( operation == "nearest" ) { f = lut< T, D, E >::nearest; }
+        else if( operation == "query" ) { f = lut< T, D, E >::query; }
+        else { COMMA_THROW_BRIEF( comma::exception, "expected operation; got: '" << operation << "'" ); }
+        point_t o, r;
+        index_t s;
+        std::memcpy( &o[0], &origin[0], D * sizeof( double ) ); // quick and dirty; relies on the callers having checked that origin has D elements
+        std::memcpy( &r[0], &resolution[0], D * sizeof( double ) ); // quick and dirty; resolution is checked by the caller to match origin in size
+        std::memcpy( &s[0], &shape[0], D * sizeof( std::size_t ) ); // quick and dirty; assumes index_t is laid out as D contiguous std::size_t values
+        grid_t grid( o, r, s );
+        load( grid, lut_csv );
+        input_t zero;
+        zero.point.fill( 0 ); // input points are doubles whatever T is: zeroing size() * sizeof( T ) bytes left half of the default uninitialised for T = float
+        comma::csv::input_stream< input_t > istream( std::cin, csv, zero );
+        comma::csv::output_stream< std::pair< index_t, value_t > > ostream( std::cout, csv.binary() );
+        auto tied = comma::csv::make_tied( istream, ostream ); // presumably ties each output record to the input record it was computed from
+        while( istream.ready() || std::cin.good() )
+        {
+            const auto& p = istream.read();
+            if( !p ) { break; } // no more input
+            if( !grid.has( p->point ) )
+            {
+                if( permissive ) { comma::saymore() << "discarded input outside grid: " << p->point << std::endl; continue; }
+                comma::say() << "input outside grid: " << p->point << "; use --permissive to discard" << std::endl;
+                return 1;
+            }
+            tied.append( f( grid, p->point ) );
+            if( csv.flush ) { std::cout.flush(); }
+        }
+        return 0;
+    }
+};
+
+template < typename T, std::size_t D > static int run_with_dim( const std::string& operation // dispatches on the number of scalars per table cell
+                                                              , const comma::csv::options& csv
+                                                              , const comma::csv::options& lut_csv
+                                                              , const std::vector< double >& origin
+                                                              , const std::vector< double >& resolution
+                                                              , const std::vector< std::size_t >& shape )
+{
+    switch( lut_csv.format().count() ) // field count of the lookup table binary format selects the compile-time cell size E
+    {
+        case 1: return lut< T, D, 1 >::run( operation, csv, lut_csv, origin, resolution, shape );
+        case 2: return lut< T, D, 2 >::run( operation, csv, lut_csv, origin, resolution, shape );
+        case 3: return lut< T, D, 3 >::run( operation, csv, lut_csv, origin, resolution, shape );
+        case 4: return lut< T, D, 4 >::run( operation, csv, lut_csv, origin, resolution, shape );
+        default: COMMA_THROW( comma::exception, "up to 4-dimensional lookup table values currently supported; got: " << lut_csv.format().count() << " dimensions in " << lut_csv.format().string() );
+    }
+    return 1; // presumably unreachable: every switch branch above returns or throws
+}
+
+template < typename T > static int run_as( const std::string& operation // dispatches on the number of table dimensions, taken from the size of origin
+                                         , const comma::csv::options& csv
+                                         , const comma::csv::options& lut_csv
+                                         , const std::vector< double >& origin
+                                         , const std::vector< double >& resolution
+                                         , const std::vector< std::size_t >& shape )
+{
+    switch( origin.size() )
+    {
+        // todo! case 1: return run_with_dim< T, 1 >( operation, csv, lut_csv, origin, resolution, shape );
+        case 2: return run_with_dim< T, 2 >( operation, csv, lut_csv, origin, resolution, shape );
+        case 3: return run_with_dim< T, 3 >( operation, csv, lut_csv, origin, resolution, shape );
+        case 4: return run_with_dim< T, 4 >( operation, csv, lut_csv, origin, resolution, shape );
+        default: COMMA_THROW( comma::exception, "only 2-, 3-, and 4-dimensional lookup tables currently supported; got: " << origin.size() << " dimensions" ); // 1-dimensional is still todo, so "up to 4" would be wrong
+    }
+    return 1; // presumably unreachable: every switch branch above returns or throws
+}
+
+} } } } // namespace comma { namespace applications { namespace lookup { namespace operations {
+
+namespace comma { namespace visiting {
+
+template < typename T, std::size_t D > struct traits< comma::applications::lookup::operations::_array< T, D > > // visiting traits: expose the wrapped array under the field name "point"
+{
+    template < typename Key, class Visitor > static void visit( const Key&, comma::applications::lookup::operations::_array< T, D >& p, Visitor& v ) { v.apply( "point", p.point ); } // mutable visit
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::applications::lookup::operations::_array< T, D >& p, Visitor& v ) { v.apply( "point", p.point ); } // const visit
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace applications { namespace lookup { namespace operations {
+
+static int run( const comma::command_line_options& options, const csv::options& csv, const std::vector< std::string >& unnamed ) // unnamed[0]: operation; unnamed[1]: lookup table as <filename>[;<csv options>]
+{
+    COMMA_ASSERT_BRIEF( unnamed.size() > 1, "please specify lookup table file as: math-lookup <operation> <filename>" );
+    auto lut_csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( unnamed[1] );
+    COMMA_ASSERT_BRIEF( lut_csv.binary(), "lookup table: on file '" << lut_csv.filename << "': only binary files are currently supported, e.g: 'lut.bin;binary=3f'" );
+    const auto& origin = comma::split_as< double >( options.value< std::string >( "--origin,-o" ), ',' );
+    const auto& resolution = comma::split_as< double >( options.value< std::string >( "--resolution,-r" ), ',' );
+    const auto& shape = comma::split_as< std::size_t >( options.value< std::string >( "--shape" ), ',' );
+    COMMA_ASSERT_BRIEF( origin.size() == resolution.size(), "expected --origin and --resolution of the same dimensions; got: " << origin.size() << " and " << resolution.size() );
+    COMMA_ASSERT_BRIEF( origin.size() == shape.size(), "expected --origin and --shape of the same dimensions; got: " << origin.size() << " and " << shape.size() );
+    switch( lut_csv.format().elements()[0].type ) // todo! quick and dirty: only the type of the first format element is inspected
+    {
+        case comma::csv::format::float_t: return comma::applications::lookup::operations::run_as< float >( unnamed[0], csv, lut_csv, origin, resolution, shape );
+        case comma::csv::format::double_t: return comma::applications::lookup::operations::run_as< double >( unnamed[0], csv, lut_csv, origin, resolution, shape );
+        default: COMMA_THROW( comma::exception, "only float and double as lookup table values are supported; got: '" << unnamed[1] << "'" );
+    }
+    return 1; // presumably unreachable: every switch branch above returns or throws
+}
+
+} } } } // namespace comma { namespace applications { namespace lookup { namespace operations {
+
+int main( int ac, char** av ) // returns the status of operations::run(), or 1 if no operation is given or an exception is caught
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        comma::csv::options csv( options );
+        const auto& unnamed = options.unnamed( "--flush,--permissive,--verbose,-v", "-.*" ); // positional arguments: operation first, then the lookup table
+        if( unnamed.empty() ) { comma::say() << "please specify operation" << std::endl; return 1; }
+        permissive = options.exists( "--permissive" );
+        verbose = options.exists( "--verbose,-v" ); // NOTE(review): assigned here, but not read anywhere in the visible code of this file
+        return comma::applications::lookup::operations::run( options, csv, unnamed );
+    }
+    catch( std::exception& ex ) { comma::say() << "caught exception: " << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "caught unknown exception" << std::endl; }
+    return 1; // reached only after an exception has been reported
+}
diff --git a/containers/cached.h b/containers/cached.h
new file mode 100644
index 000000000..0ec819807
--- /dev/null
+++ b/containers/cached.h
@@ -0,0 +1,70 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All Rights Reserved
+#pragma once
+#include <deque>
+#include <memory>
+#include <unordered_map>
+namespace comma {
+
+template < typename T, typename K, typename Hash = std::hash< K > >
+class cached // cache of T values keyed by K; a value is constructed from its key on first access
+{
+    public:
+        cached( unsigned int max_size = 0 ): _size( max_size ) {} // max_size 0: get() never evicts
+        /// return the value cached for the key K{ args... }, constructing it from the key on a miss
+        template < typename... Args > T& get( Args... args );
+
+        template < typename... Args > const T& get( Args... args ) const;
+        /// call the value cached for the key K{ args... } with the same arguments
+        template < typename... Args > auto operator()( Args... args ) { return get( args... )( args... ); }
+
+        template < typename... Args > auto operator()( Args... args ) const { return get( args... )( args... ); }
+        /// drop all values and their insertion-order keys: stale keys left behind would make later evictions erase nothing and let the cache outgrow its limit
+        void clear() { _values.clear(); _keys.clear(); }
+        /// evict up to size entries, oldest inserted first
+        void pop( unsigned int size = 1 );
+
+        const std::unordered_map< K, std::unique_ptr< T >, Hash >& values() const { return _values; }
+
+    protected:
+        mutable std::unordered_map< K, std::unique_ptr< T >, Hash > _values; // todo! use proper move semantics instead of unique_ptr
+        mutable std::deque< K > _keys; // keys in insertion order; the front is evicted first
+        unsigned int _size{0}; // maximum number of cached values; 0 means no limit
+};
+
+template < typename T, typename K, typename Hash >
+template < typename... Args >
+T& cached< T, K, Hash >::get( Args... args ) // returns the cached value for the key built from args, creating it on a miss
+{
+    K key{ args... };
+    auto found = _values.find( key );
+    if( found != _values.end() ) { return *( found->second ); } // hit: nothing to insert
+    if( _size > 0 && _values.size() == _size ) { pop(); } // bounded and full: evict the oldest entry first
+    _keys.emplace_back( key ); // remember insertion order for later eviction
+    return *( _values.emplace( std::make_pair( key, std::make_unique< T >( key ) ) ).first->second );
+}
+
+template < typename T, typename K, typename Hash >
+template < typename... Args >
+const T& cached< T, K, Hash >::get( Args... args ) const // const overload: still fills the cache on a miss, which is why _values and _keys are mutable
+{
+    K k{ args... };
+    auto i = _values.find( k );
+    if( i != _values.end() ) { return *( i->second ); } // hit: nothing to insert
+    if( _size > 0 && _values.size() == _size && !_keys.empty() ) { _values.erase( _keys.front() ); _keys.pop_front(); } // evict the oldest entry inline: pop() is non-const and cannot be called from a const member
+    _keys.emplace_back( k ); // remember insertion order for later eviction
+    return *( _values.emplace( std::make_pair( k, std::make_unique< T >( k ) ) ).first->second );
+}
+
+template < typename T, typename K, typename Hash >
+inline void cached< T, K, Hash >::pop( unsigned int size )
+{
+    // evict in insertion order, oldest first; stop early once no keys are left
+    for( unsigned int remaining = size; remaining > 0 && !_keys.empty(); --remaining )
+    {
+        _values.erase( _keys.front() );
+        _keys.pop_front();
+    }
+}
+
+} // namespace comma {
diff --git a/containers/cyclic_buffer.h b/containers/cyclic_buffer.h
index fdbe97691..bfdbc45a9 100644
--- a/containers/cyclic_buffer.h
+++ b/containers/cyclic_buffer.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CONTAINERS_CYCLIC_BUFFER_H_
-#define COMMA_CONTAINERS_CYCLIC_BUFFER_H_
+#pragma once
 
 #include <vector>
 #include <boost/optional.hpp>
@@ -50,49 +21,42 @@ template < typename T >
 class cyclic_buffer
 {
     public:
-        /// constructor
         cyclic_buffer( std::size_t size, const T& t = T() );
         
-        /// copy constructor
         cyclic_buffer( const cyclic_buffer& rhs ) { operator=( rhs ); }
         
-        /// assignment
         const cyclic_buffer& operator=( const cyclic_buffer& rhs );
         
-        /// return front
         T& front();
         
-        /// return front
         const T& front() const;
         
-        /// return back
         T& back();
         
-        /// return back
-        
         const T& back() const;
+
+        std::size_t front_index() const { return begin_(); }
+
+        std::size_t end_index() const { return end_(); }
         
-        /// push a new element at the end of the list
-        void push( const T& t );
+        void push( const T& t, bool force = false );
         
-        /// push a new element at the end of the list
         template < typename Iterator >
-        void push( Iterator begin, Iterator end );
+        void push( Iterator begin, Iterator end, bool force = false );
         
-        /// pop the new element at the front of the list
         void pop( std::size_t n = 1 );
         
-        /// return current size
         std::size_t size() const;
         
-        /// return capacity
         std::size_t capacity() const;
         
-        /// return true, if empty
         bool empty() const;
         
-        /// clear
         void clear();
+
+        const std::vector< T >& data() const { return vector_; }
+
+        std::vector< T >& data() { return vector_; }
         
     protected:
         std::vector< T > vector_;
@@ -173,19 +137,27 @@ template < typename T >
 inline std::size_t cyclic_buffer< T >::capacity() const { return vector_.size(); }
 
 template < typename T >
-inline void cyclic_buffer< T >::push( const T& t )
+inline void cyclic_buffer< T >::push( const T& t, bool force ) // force: when the buffer is full, overwrite the front element instead of throwing
 {
-    if( size() == vector_.size() ) { COMMA_THROW( comma::exception, "full" ); }
-    vector_[ end_() ] = t;
+    if( size() == vector_.size() )
+    { 
+        if( !force ) { COMMA_THROW( comma::exception, "full" ); }
+        vector_[ begin_() ] = t; // begin_() is the position front_index() reports; its slot is reused for the new element
+        ++begin_; // the front moves on; end_ is advanced below as in the non-full case
+    }
+    else
+    {
+        vector_[ end_() ] = t;
+    }
     ++end_;
     empty_ = false;
 }
 
 template < typename T >
 template < typename Iterator >
-inline void cyclic_buffer< T >::push( Iterator begin, Iterator end )
+inline void cyclic_buffer< T >::push( Iterator begin, Iterator end, bool force ) // pushes [begin, end) one element at a time
 {
-    for( Iterator it = begin; it != end; ++it ) { push( *it ); }
+    for( Iterator it = begin; it != end; ++it ) { push( *it, force ); } // force is handed unchanged to the single-element push
 }
 
 template < typename T >
@@ -244,5 +216,3 @@ inline const T& fixed_cyclic_buffer< T, S >::operator[]( std::size_t i ) const
 }
 
 } // namespace comma {
-
-#endif // COMMA_CONTAINERS_CYCLIC_BUFFER_H_
diff --git a/containers/enums.h b/containers/enums.h
new file mode 100644
index 000000000..b1b1fb572
--- /dev/null
+++ b/containers/enums.h
@@ -0,0 +1,53 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <map>
+#include <string>
+#include <vector>
+#include "find.h"
+
+namespace comma { namespace enums {
+
+/// trivial convenience wrapper; works only for enums with sequential values
+template < typename Enum, typename K = std::string >
+std::map< K, Enum > as_map( const std::vector< K >& keys, unsigned int begin = 0 );
+
+/// trivial convenience wrapper; works only for enums with sequential values
+template < typename Enum, typename K = std::string >
+std::map< Enum, K > as_key_map( const std::vector< K >& keys, unsigned int begin = 0 );
+
+/// trivial convenience wrapper
+template < typename Enum, typename K = std::string >
+Enum find( const K& k, const std::vector< K >& keys, unsigned int begin = 0 );
+
+// todo: visiting traits; name() indexes this->names() with the object itself converted to unsigned int
+template < typename Enum, typename Names >
+struct named: public Enum, Names
+{
+    const std::string& name() { return this->names()[static_cast< unsigned int >( *this )]; }
+};
+
+
+template < typename Enum, typename K >
+inline std::map< K, Enum > as_map( const std::vector< K >& keys, unsigned int begin )
+{
+    std::map< K, Enum > by_key; // keys[0] -> begin, keys[1] -> begin + 1, ...; for a repeated key the later value wins
+    for( const auto& key: keys ) { by_key[key] = static_cast< Enum >( begin++ ); }
+    return by_key;
+}
+
+template < typename Enum, typename K >
+inline std::map< Enum, K > as_key_map( const std::vector< K >& keys, unsigned int begin )
+{
+    std::map< Enum, K > by_value; // begin -> keys[0], begin + 1 -> keys[1], ...
+    for( const auto& key: keys ) { by_value[static_cast< Enum >( begin++ )] = key; }
+    return by_value;
+}
+
+template < typename Enum, typename K > // rebuilds the key -> value map on every call, then looks k up in it through containers::find_or_throw
+Enum find( const K& k, const std::vector< K >& keys, unsigned int begin ) { const std::map< K, Enum >& values = as_map< Enum, K >( keys, begin ); return containers::find_or_throw< K, Enum >( values, k ); }
+
+} } // namespace comma { namespace enums {
diff --git a/containers/find.h b/containers/find.h
new file mode 100644
index 000000000..76e7b58a6
--- /dev/null
+++ b/containers/find.h
@@ -0,0 +1,52 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <map>
+#include <unordered_map>
+#include "../base/exception.h"
+
+namespace comma { namespace containers {
+
+/// trivial convenience wrapper: find element, if not found, throw exception
+template < typename K, typename V > const V& find_or_throw( const std::map< K, V >& m, const K& k, const std::string& message = std::string() );
+
+/// trivial convenience wrapper: find element, if not found, throw exception
+template < typename K, typename V > V& find_or_throw( std::map< K, V >& m, const K& k, const std::string& message = std::string() );
+
+/// trivial convenience wrapper: find element, if not found, throw exception
+template < typename K, typename V > const V& find_or_throw( const std::unordered_map< K, V >& m, const K& k, const std::string& message = std::string() );
+
+/// trivial convenience wrapper: find element, if not found, throw exception
+template < typename K, typename V > V& find_or_throw( std::unordered_map< K, V >& m, const K& k, const std::string& message = std::string() );
+
+
+namespace impl {
+
+template < typename M, typename K > inline const auto& find_or_throw( const M& m, const K& k, const std::string& message )
+{
+    auto it = m.find( k ); // M only needs find(), end() and iterators exposing ->second
+    COMMA_ASSERT( it != m.end(), ( message.empty() ? std::string() : ( message + ": " ) ) << "k '" << k << "' not found" ); // a non-empty message is prepended as "message: "
+    return it->second;
+}
+
+template < typename M, typename K > inline auto& find_or_throw( M& m, const K& k, const std::string& message )
+{
+    auto it = m.find( k ); // same lookup as the const overload, on a mutable container
+    COMMA_ASSERT( it != m.end(), ( message.empty() ? std::string() : ( message + ": " ) ) << "k '" << k << "' not found" );
+    return it->second; // mutable reference to the stored value
+}
+
+} // namespace impl {
+// definitions of the four find_or_throw overloads declared above: const/non-const std::map and std::unordered_map, each forwarding to impl::find_or_throw
+template < typename K, typename V > inline const V& find_or_throw( const std::map< K, V >& m, const K& k, const std::string& message ) { return impl::find_or_throw( m, k, message ); }
+
+template < typename K, typename V > inline V& find_or_throw( std::map< K, V >& m, const K& k, const std::string& message ) { return impl::find_or_throw( m, k, message ); }
+
+template < typename K, typename V > inline const V& find_or_throw( const std::unordered_map< K, V >& m, const K& k, const std::string& message ) { return impl::find_or_throw( m, k, message ); }
+
+template < typename K, typename V > inline V& find_or_throw( std::unordered_map< K, V >& m, const K& k, const std::string& message ) { return impl::find_or_throw( m, k, message ); }
+
+} } // namespace comma { namespace containers {
diff --git a/containers/multidimensional/array.h b/containers/multidimensional/array.h
new file mode 100644
index 000000000..5d08c17d4
--- /dev/null
+++ b/containers/multidimensional/array.h
@@ -0,0 +1,319 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <array>
+#include <cstring>
+#include "../../base/types.h"
+#include "array_traits.h"
+#include "index.h"
+
+namespace comma { namespace containers { namespace multidimensional {
+
+template < typename V, unsigned int D >
+class slice // non-owning D-dimensional view: stores a shape and a raw pointer to the first element, never allocates or frees
+{
+    public:
+        typedef multidimensional::index< D > index_type; // one entry per dimension; used both for shapes and for element positions
+
+        typedef V value_type;
+
+        static const unsigned int dimensions{D};
+
+        slice( const index_type& shape, V* data ): _shape( shape ), _size( _product( _shape ) ), _data( data ) {} // _size is the product of the shape entries; begin()/end() span that many elements from data
+
+        slice& operator=( const slice& rhs ) = default;
+
+        V& operator[]( const index_type& i ) { return _data[ _index( i ) ]; } // no bounds check
+
+        const V& operator[]( const index_type& i ) const { return _data[ _index( i ) ]; }
+
+        template < unsigned int I > // sub-slice over the trailing D - I dimensions at the leading coordinates i; it points into the same data
+        slice< V, D - I > at( const multidimensional::index< I >& i );
+
+        template < unsigned int I >
+        const slice< V, D - I > at( const multidimensional::index< I >& i ) const;
+
+        slice< V, D - 1 > at( std::size_t i ) { return at< 1 >( multidimensional::index< 1 >{i} ); } // shorthand for fixing the first dimension only
+
+        const slice< V, D - 1 > at( std::size_t i ) const { return at< 1 >( multidimensional::index< 1 >{i} ); }
+
+        V* data() { return _data; }
+        
+        const V* data() const { return _data; }
+
+        const index_type& shape() const { return _shape; }
+
+        class const_iterator;
+
+        class iterator // supports only pre-increment; carries the flat offset and the shape so that index() can recover the D-dimensional position
+        {
+            public:
+                iterator() = default;
+                V& operator*() { return *_it; }
+                const V& operator*() const { return *_it; }
+                iterator& operator++() { ++_it; ++_i; return *this; }
+                index_type index() const;
+                bool operator==( const iterator& rhs ) const { return _it == rhs._it; } // comparisons look at the element pointer only
+                bool operator==( const const_iterator& rhs ) const { return _it == rhs._it; }
+                bool operator!=( const iterator& rhs ) const { return !operator==( rhs ); }
+                bool operator!=( const const_iterator& rhs ) const { return !operator==( rhs ); }
+
+            private:
+                friend class slice< V, D >;
+                std::size_t _i{0};
+                V* _it{nullptr};
+                index_type _shape;
+                iterator( std::size_t i, V* it, const index_type& shape ): _i( i ), _it( it ), _shape( shape ) {}
+        };
+
+        class const_iterator // read-only counterpart of iterator
+        {
+            public:
+                const_iterator() = default;
+                const V& operator*() const { return *_it; }
+                const_iterator& operator++() { ++_it; ++_i; return *this; }
+                index_type index() const;
+                bool operator==( const iterator& rhs ) const { return _it == rhs._it; }
+                bool operator==( const const_iterator& rhs ) const { return _it == rhs._it; }
+                bool operator!=( const iterator& rhs ) const { return !operator==( rhs ); }
+                bool operator!=( const const_iterator& rhs ) const { return !operator==( rhs ); }
+
+            private:
+                friend class slice< V, D >;
+                std::size_t _i{0};
+                const V* _it{nullptr};
+                index_type _shape;
+                const_iterator( std::size_t i, V* it, const index_type& shape ): _i( i ), _it( it ), _shape( shape ) {}
+        };
+
+        iterator begin() { return iterator( 0, _data, _shape ); }
+
+        const_iterator begin() const { return const_iterator( 0, _data, _shape ); }
+
+        iterator end() { return iterator( _size, _data + _size, _shape ); }
+
+        const_iterator end() const { return const_iterator( _size, _data + _size, _shape ); }
+
+        std::size_t absolute_index( const index_type& i ) const { return _index( i ); } // the offset operator[] applies to data()
+
+    protected:
+        index_type _shape;
+        std::size_t _size;
+        V* _data;
+        std::size_t _index( const index_type& i ) const;
+        static std::size_t _product( const index_type& i );
+};
+
+
+template < typename V, unsigned int D, typename S = std::vector< V > >
+class array // D-dimensional array owning its elements in a storage S; element access goes through a slice over that storage
+{
+    public:
+        typedef slice< V, D > slice_type;
+        typedef typename slice_type::index_type index_type;
+        typedef V value_type;
+        typedef S storage_type;
+
+        const unsigned int dimensions{D};
+
+        array( const index_type& shape, const V& default_value = V() );
+
+        /// copy the elements and point the slice at the copy; a memberwise copy would leave _slice viewing rhs's storage
+        array( const array& rhs ): _data( rhs._data ), _slice( rhs._slice.shape(), &_data[0] ) {}
+        array( array&& rhs ) = default; // unchanged from the previously implicit move: storage is moved, the slice pointer is copied
+
+        V& operator[]( const index_type& i ) { return _slice[i]; }
+
+        const V& operator[]( const index_type& i ) const { return _slice[i]; }
+
+        template < unsigned int I >
+        multidimensional::slice< V, D - I > at( const multidimensional::index< I >& i ) { return _slice.template at< I >( i ); } // todo!
+
+        template < unsigned int I >
+        const multidimensional::slice< V, D - I > at( const multidimensional::index< I >& i ) const { return _slice.template at< I >( i ); } // todo!
+
+        multidimensional::slice< V, D - 1 > at( std::size_t i ) { return _slice.at( i ); }
+
+        const multidimensional::slice< V, D - 1 > at( std::size_t i ) const { return _slice.at( i ); }
+
+        storage_type& data() { return _data; } // NOTE(review): _slice keeps a raw pointer into _data, so resizing the storage through this reference would invalidate it
+
+        const storage_type& data() const { return _data; }
+
+        const index_type& shape() const { return _slice.shape(); }
+
+        std::size_t absolute_index( const index_type& i ) const { return _slice.absolute_index( i ); }
+
+        typedef typename slice_type::iterator iterator;
+        typedef typename slice_type::const_iterator const_iterator;
+
+        iterator begin() { return _slice.begin(); }
+
+        const_iterator begin() const { return _slice.begin(); }
+
+        iterator end() { return _slice.end(); }
+
+        const_iterator end() const { return _slice.end(); }
+
+    protected:
+        storage_type _data; // declared before _slice: the slice is constructed from the address of the first element
+        slice_type _slice;
+};
+
+template < typename V, unsigned int D, typename P = std::array< double, D >, typename Traits = impl::operations< D >, typename S = std::vector< V > >
+class grid: public array< V, D, S > // array whose cells are addressed by points of type P, given an origin and a per-dimension resolution
+{
+    public:
+        typedef P point_type;
+
+        typedef array< V, D, S > base_type;
+
+        typedef typename base_type::index_type index_type;
+
+        typedef typename base_type::value_type value_type;
+
+        grid( const P& origin, const P& resolution, const index_type& shape, const V& default_value = V() ): base_type( shape, default_value ), _origin( origin ), _resolution( resolution ) {}
+
+        index_type index_of( const point_type& point ) const { return Traits::template index_of< P, index_type >( point, _origin, _resolution ); } // index of the cell containing point; not checked against shape(), see has()
+
+        point_type lower_bound( const point_type& point ) const { return Traits::add( Traits::vmultiply( _resolution, index_of( point ) ), _origin ); } // origin of the cell containing point: resolution * index + origin, component-wise
+
+        V& operator()( const point_type& p ) { return this->operator[]( index_of( p ) ); }
+
+        const V& operator()( const point_type& p ) const { return this->operator[]( index_of( p ) ); }
+
+        const point_type& origin() const { return _origin; }
+
+        const point_type& resolution() const { return _resolution; }
+
+        V interpolated( const point_type& point ) const; // todo: flag/enum or alike for different interpolation types; currently linear only
+
+        index_type nearest_to( const point_type& point ) const; // index of the corner of point's cell that is closest to point
+
+        bool has( const point_type& point ) const; // true if index_of( point ) lies within shape()
+
+    private:
+        point_type _origin;
+        point_type _resolution;
+};
+
+namespace impl {
+
+template < unsigned int D, unsigned int I = D >
+struct index_traits // conversions between a D-dimensional index and a flat offset; I is the number of leading dimensions still to process
+{
+    typedef comma::containers::multidimensional::index< D > index_type;
+    static std::size_t value( const index_type& i, const index_type& shape ) { return i[ I - 1 ] + index_traits< D, I - 1 >::value( i, shape ) * shape[ I - 1 ]; } // flat offset with the last dimension varying fastest; std::size_t so that large offsets are not truncated
+    static void value( std::size_t j, index_type& i, const index_type& shape ) { i[ I - 1 ] = j % shape[ I - 1 ]; index_traits< D, I - 1 >::value( j / shape[ I - 1 ], i, shape ); } // inverse: flat offset j -> index i
+    static index_type value( std::size_t j, const index_type& shape ) { index_type i; value( j, i, shape ); return i; }
+    static std::size_t product( const index_type& i ) { return i[ I - 1 ] * index_traits< D, I - 1 >::product( i ); } // product of the first I entries
+    template < unsigned int J >
+    static std::pair< comma::containers::multidimensional::index< J >, comma::containers::multidimensional::index< D - J > > split( const index_type& i ) // todo: use metaprogramming, kinda same as product
+    {
+        std::pair< comma::containers::multidimensional::index< J >, comma::containers::multidimensional::index< D - J > > p;
+        unsigned int k = 0;
+        for( unsigned int n = 0; n < J; ++n, ++k ) { p.first[n] = i[k]; } // first J entries
+        for( unsigned int n = 0; n < D - J; ++n, ++k ) { p.second[n] = i[k]; } // remaining D - J entries
+        return p;
+    }
+};
+
+template < unsigned int D >
+struct index_traits< D, 1 > // end of the recursion: only the first dimension is left
+{
+    typedef comma::containers::multidimensional::index< D > index_type;
+    static std::size_t value( const index_type& i, const index_type& ) { return i[0]; }
+    static void value( std::size_t j, index_type& i, const index_type& ) { i[0] = j; }
+    static std::size_t product( const index_type& i ) { return i[0]; }
+};
+
+} // namespace impl {
+
+template < typename V, unsigned int D > // flat offset of i within _data for the current shape, computed by impl::index_traits
+inline std::size_t slice< V, D >::_index( const typename slice< V, D >::index_type& i ) const { return impl::index_traits< D >::value( i, _shape ); }
+
+template < typename V, unsigned int D > // product of all D entries of i; the constructor uses it to derive the element count from the shape
+inline std::size_t slice< V, D >::_product( const typename slice< V, D >::index_type& i ) { return impl::index_traits< D >::product( i ); }
+
+template < typename V, unsigned int D > // D-dimensional position of the iterator, recovered from its flat offset and the shape
+inline typename slice< V, D >::index_type slice< V, D >::iterator::index() const { return impl::index_traits< D >::value( _i, _shape ); }
+
+template < typename V, unsigned int D > // D-dimensional position of the iterator, recovered from its flat offset and the shape
+inline typename slice< V, D >::index_type slice< V, D >::const_iterator::index() const { return impl::index_traits< D >::value( _i, _shape ); }
+
+template < typename V, unsigned int D >
+template < unsigned int I >
+inline slice< V, D - I > slice< V, D >::at( const multidimensional::index< I >& i )
+{
+    const auto shapes = impl::index_traits< D >::template split< I >( _shape ); // first: extents of the leading I dimensions, second: extents of the remaining D - I
+    return slice< V, D - I >( shapes.second, _data + impl::index_traits< I >::value( i, shapes.first ) * impl::index_traits< D - I >::product( shapes.second ) );
+}
+
+template < typename V, unsigned int D >
+template < unsigned int I >
+inline const slice< V, D - I > slice< V, D >::at( const multidimensional::index< I >& i ) const
+{
+    const auto shapes = impl::index_traits< D >::template split< I >( _shape ); // first: extents of the leading I dimensions, second: extents of the remaining D - I
+    return slice< V, D - I >( shapes.second, _data + impl::index_traits< I >::value( i, shapes.first ) * impl::index_traits< D - I >::product( shapes.second ) );
+}
+
+template < typename V, unsigned int D, typename S > // allocates product-of-shape elements set to default_value, then lets the slice view them; _data is declared, hence initialised, before _slice
+inline array< V, D, S >::array( const typename array< V, D, S >::index_type& shape, const V& default_value ): _data( impl::index_traits< D >::product( shape ), default_value ), _slice( shape, &_data[0] ) {}
+
+template < typename V, unsigned int D, typename P, typename Traits, typename S >
+V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
+{
+    const index_type i = index_of( point ); // cell containing point
+    P element_origin = Traits::add( Traits::vmultiply( _resolution, i ), _origin ); // that cell's origin: resolution * i + origin, component-wise
+    const auto& weights = Traits::interpolation::linear::weights( point, element_origin, _resolution ); // one weight per cell corner
+    const auto& neighbours = impl::neighbours< index_type, D >; // corner offsets; NOTE(review): i + neighbours[j] is not checked against shape() here
+    V v = this->operator[]( i ) * weights[0]; // todo?! value traits?!
+    for( unsigned int j = 1; j < weights.size(); ++j ) { v += this->operator[]( Traits::add( i, neighbours[j] ) ) * weights[j]; } // todo?! value traits?!
+    return v;
+}
+
+// template < typename V, unsigned int D, typename P, typename Traits, typename S >
+// V grid< V, D, P, Traits, S >::interpolated( const P& point ) const
+// {
+//     const index_type i = index_of( point );
+//     const P p = Traits::subtract( point, Traits::add( Traits::vmultiply( _resolution, i ), _origin ) );
+//     //std::cerr << "==> a: point: " << point[0] << "," << point[1] << " p: " << p[0] << "," << p[1] << " _resolution: " << _resolution[0] << "," << _resolution[1] << std::endl;
+//     const auto& neighbours = impl::neighbours< index_type, D >;
+//     double s = 0;
+//     V v = this->operator[]( i ); // todo?! value traits?!
+//     for( unsigned int j = 0; j < neighbours.size(); ++j )
+//     {
+//         P d = Traits::subtract( p, Traits::vmultiply( _resolution, neighbours[j] ) );
+//         double n = Traits::dot( d, d ); //double n = std::sqrt( Traits::dot( d, d ) );
+//         index_type k = Traits::add( i, neighbours[j] );
+//         if( math::equal( n, 0 ) ) { return this->operator[]( k ); }
+//         double w = 1 / n;
+//         s += w;
+//         //std::cerr << "==> b: j: " << j << " k: " << k[0] << "," << k[1] << " n: " << n << " w: " << w << std::endl;
+//         if( j == 0 ) { v *= w; } else { v += this->operator[]( k ) * w; } // quick and dirty for now
+//     }
+//     //std::cerr << "==> c: s: " << s << std::endl;
+//     return v * ( 1 / s );
+// }
+
+template < typename V, unsigned int D, typename P, typename Traits, typename S >
+typename grid< V, D, P, Traits, S >::index_type grid< V, D, P, Traits, S >::nearest_to( const P& point ) const
+{
+    const index_type i = index_of( point ); // cell containing point
+    const P element_origin = Traits::add( Traits::vmultiply( _resolution, i ), _origin ); // that cell's origin: resolution * i + origin, component-wise
+    // nearest() is parametrised on the point type and the index type; the index type appears only in its return type, so both are spelled out
+    return Traits::add( Traits::template nearest< P, index_type >( point, element_origin, _resolution ), i ); // corner offset within the cell, shifted by the cell index
+}
+
+template < typename V, unsigned int D, typename P, typename Traits, typename S >
+inline bool grid< V, D, P, Traits, S >::has( const P& point ) const // quick and dirty for now
+{
+    const auto& i = index_of( point ); // the temporary index lives as long as this reference
+    for( unsigned int k = 0; k < D; ++k ) { if( i[k] < 0 || i[k] >= this->shape()[k] ) { return false; } } // NOTE(review): index entries default to std::size_t, so i[k] < 0 never holds; presumably points below the origin are rejected by the upper bound after wrap-around - confirm
+    return true;
+}
+
+} } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/multidimensional/array_traits.h b/containers/multidimensional/array_traits.h
new file mode 100644
index 000000000..59d9eec0e
--- /dev/null
+++ b/containers/multidimensional/array_traits.h
@@ -0,0 +1,153 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <array>
+#include <cmath>
+#include <type_traits>
+#include "../../math/compare.h"
+#include "index.h"
+
+template< typename T, std::size_t D, typename S > // multiplies every element of lhs by rhs in place and returns lhs
+inline std::array< T, D >& operator*=( std::array< T, D >& lhs, const S& rhs ) { for( T& element: lhs ) { element *= rhs; } return lhs; }
+
+template< typename T, std::size_t D, typename S > // copy of lhs with every element multiplied by rhs; lhs itself is not modified
+inline std::array< T, D > operator*( const std::array< T, D >& lhs, const S& rhs ) { std::array< T, D > scaled = lhs; scaled *= rhs; return scaled; }
+
+template< typename T, std::size_t D > // adds rhs to lhs element by element, in place, and returns lhs
+inline std::array< T, D >& operator+=( std::array< T, D >& lhs, const std::array< T, D >& rhs ) { std::size_t k = 0; for( T& element: lhs ) { element += rhs[k++]; } return lhs; }
+
+template< typename T, std::size_t D > // element-wise sum of lhs and rhs as a new array; neither operand is modified
+inline std::array< T, D > operator+( const std::array< T, D >& lhs, const std::array< T, D >& rhs ) { std::array< T, D > sum = lhs; sum += rhs; return sum; }
+
+namespace comma { namespace containers { namespace multidimensional { namespace impl {
+
+template < typename T > inline int index( T p, T origin, T resolution )
+{
+    // number of whole cells between origin and p, rounded towards negative infinity
+    // (plain conversion to int truncates towards zero, which is one cell too high for negative non-integers)
+    const double cells = ( p - origin ) / resolution;
+    const int truncated = static_cast< int >( cells );
+    const bool below = cells < 0 && cells != truncated;
+    return below ? truncated - 1 : truncated;
+}
+
+template < int Base, unsigned int Pow > static constexpr int pow = Base * pow< Base, Pow - 1 >; // compile-time integer power: Base multiplied by itself Pow times
+template < int Base > static constexpr int pow< Base, 0 >{1}; // end of the recursion: Base to the power 0 is 1
+template < typename I, std::size_t Size > static constexpr std::array< I, Size > neighbours; // quick and dirty, for now leaving it to the enthusiasts to implement it using metaprogramming
+template < typename I > static constexpr std::array< I, 2 > neighbours< I, 1 > = {{ I{ 0 }, I{ 1 } }}; // the specialisations list all 0/1 offset combinations per dimension count, last dimension varying fastest
+template < typename I > static std::array< I, 4 > neighbours< I, 2 > = {{ I{ 0, 0 }, I{ 0, 1 }, I{ 1, 0 }, I{ 1, 1 } }};
+template < typename I > static std::array< I, 8 > neighbours< I, 3 > = {{ I{ 0, 0, 0 }, I{ 0, 0, 1 }, I{ 0, 1, 0 }, I{ 0, 1, 1 }, I{ 1, 0, 0 }, I{ 1, 0, 1 }, I{ 1, 1, 0 }, I{ 1, 1, 1 } }};
+template < typename I > static std::array< I, 16 > neighbours< I, 4 > = {{ I{ 0, 0, 0, 0 }, I{ 0, 0, 0, 1 }, I{ 0, 0, 1, 0 }, I{ 0, 0, 1, 1 }, I{ 0, 1, 0, 0 }, I{ 0, 1, 0, 1 }, I{ 0, 1, 1, 0 }, I{ 0, 1, 1, 1 }, I{ 1, 0, 0, 0 }, I{ 1, 0, 0, 1 }, I{ 1, 0, 1, 0 }, I{ 1, 0, 1, 1 }, I{ 1, 1, 0, 0 }, I{ 1, 1, 0, 1 }, I{ 1, 1, 1, 0 }, I{ 1, 1, 1, 1 } }};
+// template < typename I > static constexpr std::array< I, 2 > neighbours< I, 1 > = {{ {{ 0 }}, {{ 1 }} }};
+// template < typename I > static constexpr std::array< I, 4 > neighbours< I, 2 > = {{ {{ 0, 0 }}, {{ 0, 1 }}, {{ 1, 0 }}, {{ 1, 1 }} }};
+// template < typename I > static constexpr std::array< I, 8 > neighbours< I, 3 > = {{ {{ 0, 0, 0 }}, {{ 0, 0, 1 }}, {{ 0, 1, 0 }}, {{ 0, 1, 1 }}, {{ 1, 0, 0 }}, {{ 1, 0, 1 }}, {{ 1, 1, 0 }}, {{ 1, 1, 1 }} }};
+// template < typename I > static constexpr std::array< I, 16 > neighbours< I, 4 > = {{ {{ 0, 0, 0, 0 }}, {{ 0, 0, 0, 1 }}, {{ 0, 0, 1, 0 }}, {{ 0, 0, 1, 1 }}, {{ 0, 1, 0, 0 }}, {{ 0, 1, 0, 1 }}, {{ 0, 1, 1, 0 }}, {{ 0, 1, 1, 1 }}, {{ 1, 0, 0, 0 }}, {{ 1, 0, 0, 1 }}, {{ 1, 0, 1, 0 }}, {{ 1, 0, 1, 1 }}, {{ 1, 1, 0, 0 }}, {{ 1, 1, 0, 1 }}, {{ 1, 1, 1, 0 }}, {{ 1, 1, 1, 1 }} }};
+// todo: add more dimensions as required or write that little metaprogramming piece
+
+template < std::size_t Size > struct operations // component-wise helpers for Size-dimensional points and indices; each one handles component Size - 1 and recurses down to operations< 1 >
+{
+    template < typename S, typename T > static S& add( S& s, const T& t ) { s[ Size - 1 ] += t[ Size - 1 ]; operations< Size - 1 >::add( s, t ); return s; }
+    template < typename S, typename T > static S& subtract( S& s, const T& t ) { s[ Size - 1 ] -= t[ Size - 1 ]; operations< Size - 1 >::subtract( s, t ); return s; }
+    template < typename S, typename T > static S& vdivide( S& s, const T& t ) { s[ Size - 1 ] /= t[ Size - 1 ]; operations< Size - 1 >::vdivide( s, t ); return s; }
+    template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[ Size - 1 ] *= t; operations< Size - 1 >::multiply( s, t ); return s; } // t is a scalar here; vmultiply is the component-wise variant
+    template < typename S, typename T > static S& vmultiply( S& s, const T& t ) { s[ Size - 1 ] *= t[ Size - 1 ]; operations< Size - 1 >::vmultiply( s, t ); return s; }
+    template < typename S, typename T > static double dot( S& s, const T& t ) { return s[ Size - 1 ] * t[ Size - 1 ] + operations< Size - 1 >::dot( s, t ); }
+    template < typename S, typename T > static S& mask( S& s, const T& t ) { s[ Size - 1 ] = t[ Size - 1 ] ? t[ Size - 1 ] : s[ Size - 1 ]; operations< Size - 1 >::mask( s, t ); return s; } // components where t is non-zero take t's value, the others keep s's
+    template < typename S, typename T > static S masked( const S& s, const T& t ) { S m = s; mask( m, t ); return m; }
+    template < typename S, typename T = void > static S& logical_not( S& s ) { s[ Size - 1 ] = !s[ Size - 1 ]; operations< Size - 1 >::logical_not( s ); return s; } // T is unused; it is defaulted so that it need not be given, while calls naming both arguments still compile
+    template < typename S > static S& fill( S&s, double value ) { s[ Size - 1 ] = value; operations< Size - 1 >::fill( s, value ); return s; }
+    template < typename S > static S filled( double value ) { S s; fill( s, value ); return s; }
+    template < typename S > static S zero() { S s; fill( s, 0 ); return s; }
+    template < typename S > static auto product( const S& s ) -> typename std::remove_reference< decltype( s[ Size - 1 ] ) >::type { return s[ Size - 1 ] * operations< Size - 1 >::product( s ); }
+    template < typename S, typename T, typename Diff > static bool near( const S& s, const T& t, const Diff& epsilon ) { return comma::math::equal( s[ Size - 1 ], t[ Size - 1 ], epsilon ) && operations< Size - 1 >::near( s, t, epsilon ); }
+    template < typename S, typename T > static S add( const S& s, const T& t ) { S r = s; add( r, t ); return r; } // the overloads taking const S& work on a copy and return it by value
+    template < typename S, typename T > static S subtract( const S& s, const T& t ) { S r = s; subtract( r, t ); return r; }
+    template < typename S, typename T > static S vdivide( const S& s, const T& t ) { S r = s; vdivide( r, t ); return r; }
+    template < typename S, typename T > static S multiply( const S& s, const T& t ) { S r = s; multiply( r, t ); return r; }
+    template < typename S, typename T > static S vmultiply( const S& s, const T& t ) { S r = s; vmultiply( r, t ); return r; }
+
+    template < typename S, typename I > static I& index_of( I& i, const S& p, const S& origin, const S& resolution )
+    {
+        i[ Size - 1 ] = index( p[ Size - 1 ], origin[ Size - 1 ], resolution[ Size - 1 ] );
+        operations< Size - 1 >::index_of( i, p, origin, resolution );
+        return i;
+    }
+
+    template < typename S, typename I > static I index_of( const S& p, const S& origin, const S& resolution ) { I i; index_of( i, p, origin, resolution ); return i; }
+
+    template < typename S, typename I > static I nearest( const S& p, const S& origin, const S& resolution ) // todo? metaprogram?
+    {
+        const S& s = subtract( p, origin );
+        double m = dot( s, s ); // squared distance to the corner at offset 0
+        unsigned int j = 0;
+        const auto& n = neighbours< I, Size >;
+        for( unsigned int i = 1; m > 0 && i < n.size(); ++i ) // stops early once a corner at distance 0 has been found
+        {
+            const S& r = subtract( vmultiply( resolution, n[i] ), s );
+            double d = dot( r, r );
+            if( d < m ) { m = d; j = i; }
+        }
+        return n[j];
+    }
+
+    template < typename S, typename I > static std::array< double, pow< 2, Size > > squared_norms( const S& p, const S& origin, const S& resolution ) // todo? metaprogram?
+    {
+        const S& s = subtract( p, origin );
+        std::array< double, pow< 2, Size > > d;
+        const auto& n = neighbours< I, Size >;
+        for( unsigned int i = 0; i < n.size(); ++i )
+        {
+            const S& r = subtract( vmultiply( resolution, n[i] ), s );
+            d[i] = dot( r, r );
+        }
+        return d;
+    }
+
+    template < typename S, typename I > static std::array< double, pow< 2, Size > > norms( const S& p, const S& origin, const S& resolution )
+    {
+        std::array< double, pow< 2, Size > > d = squared_norms< S, I >( p, origin, resolution ); // I cannot be deduced from the arguments, so both template arguments are passed on
+        for( auto& v: d ) { v = std::sqrt( v ); }
+        return d;
+    }
+
+    struct interpolation
+    {
+        struct linear
+        {
+            template < typename S > static std::array< double, pow< 2, Size > > weights( const S& s ) // s: position within the cell as a fraction of the resolution
+            {
+                S t;
+                subtract( fill( t, 1. ), s ); // t = 1 - s, component-wise
+                const auto& n = neighbours< std::array< unsigned int, Size >, Size >;
+                std::array< double, pow< 2, Size > > w;
+                for( unsigned int i = 0; i < pow< 2, Size >; ++i ) { w[i] = product( masked( s, n[ pow< 2, Size > - i - 1 ] ) ) * product( masked( t, n[i] ) ); } // per dimension: factor s where corner i has offset 1, factor 1 - s where it has offset 0
+                return w;
+            }
+
+            template < typename S > static std::array< double, pow< 2, Size > > weights( const S& p, const S& origin, const S& resolution ) { return weights( vdivide( subtract( p, origin ), resolution ) ); }
+        };
+    };
+};
+
+template <> struct operations< 1 > // end of the recursion: operates on component 0 only; NOTE(review): unlike the primary template it has no by-value add/subtract/vdivide/multiply/vmultiply overloads, no masked() and no filled()
+{
+    template < typename S, typename T > static S& add( S& s, const T& t ) { s[0] += t[0]; return s; }
+    template < typename S, typename T > static S& subtract( S& s, const T& t ) { s[0] -= t[0]; return s; }
+    template < typename S, typename T > static S& vdivide( S& s, const T& t ) { s[0] /= t[0]; return s; }
+    template < typename S, typename T > static S& multiply( S& s, const T& t ) { s[0] *= t; return s; }
+    template < typename S, typename T > static S& vmultiply( S& s, const T& t ) { s[0] *= t[0]; return s; }
+    template < typename S, typename T > static double dot( S& s, const T& t ) { return s[0] * t[0]; }
+    template < typename S, typename T = void > static S& logical_not( S& s ) { s[0] = !s[0]; return s; } // T is unused; it is defaulted so that it need not be given, while calls naming both arguments still compile
+    template < typename S, typename T > static S& mask( S& s, const T& t ) { s[0] = t[0] ? t[0] : s[0]; return s; }
+    template < typename S > static auto product( const S& s ) -> typename std::remove_reference< decltype( s[0] ) >::type { return s[0]; }
+    template < typename S, typename T, typename Diff > static bool near( const S& s, const T& t, const Diff& epsilon ) { return comma::math::equal( s[0], t[0], epsilon ); }
+    template < typename S > static S& fill( S&s, double value ) { s[0] = value; return s; }
+    template < typename S > static S zero() { S s; fill( s, 0 ); return s; }
+    template < typename S, typename I > static I& index_of( I& i, const S& p, const S& origin, const S& resolution ) { i[0] = index( p[0], origin[0], resolution[0] ); return i; }
+    template < typename S, typename I > static I nearest( const S& p, const S& origin, const S& resolution ) { return p[0] - origin[0] < resolution[0] / 2 ? I{ 0 } : I{ 1 }; }
+};
+
+} } } } // namespace comma { namespace containers { namespace multidimensional { namespace impl {
diff --git a/containers/multidimensional/index.h b/containers/multidimensional/index.h
new file mode 100644
index 000000000..6df4a3430
--- /dev/null
+++ b/containers/multidimensional/index.h
@@ -0,0 +1,108 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <array>
+#include <cstring>
+#include "../../base/types.h"
+
+namespace comma { namespace containers { namespace multidimensional {
+
+template < unsigned int D, typename T = std::size_t > // D: number of dimensions; T: element type
+struct index: public std::array< T, D >
+{
+    typedef T value_t;
+
+    typedef std::array< T, D > base_t;
+
+    index(): base_t{} {} // value-initialised: all elements are zero
+
+    index( const index& rhs ): base_t( static_cast< const base_t& >( rhs ) ) {}
+
+    template < typename... Args > index( T t, Args... args ); // quick and dirty for now to avoid compile warning // template < typename... Args > index( Args... args ): base_t( { args... } ) {}
+
+    bool operator<( const index& rhs ) const;
+
+    bool operator==( const index& rhs ) const;
+
+    bool operator!=( const index& rhs ) const { return !operator==( rhs ); }
+
+    index& operator=( const index& rhs ) = default;
+
+    index& operator=( const base_t& rhs ) { static_cast< base_t& >( *this ) = rhs; return *this; } // assigns the array part and returns *this, so that assignments can be chained
+
+    operator base_t() { return static_cast< base_t& >( *this ); }
+
+    operator base_t() const { return static_cast< const base_t& >( *this ); }
+
+    index& increment( const index& sizes ); // step to the next index within sizes; wraps around to all zeroes after the last one
+
+    class iterator // enumerates the indices of a shape, starting at all zeroes; element type follows the enclosing index
+    {
+        public:
+            iterator( const index& shape ): _shape( shape ) {}
+
+            iterator& operator++() { _valid = _index.increment( _shape ) != index{}; return *this; } // being back at all zeroes means the shape is exhausted
+
+            operator bool() const { return _valid; } // false once the iteration has wrapped around
+
+            const index& operator*() const { return _index; }
+
+        private:
+            index _index;
+            index _shape;
+            bool _valid{true};
+    };
+};
+
+namespace impl {
+
+/// stores the first of the I remaining values at position D - I, then recurses on the rest
+template < typename T, unsigned int D, unsigned int I > struct type_cast
+{
+    template < typename... Rest > static void assign( index< D, T >& target, T head, Rest... rest )
+    {
+        target[ D - I ] = head;
+        type_cast< T, D, I - 1 >::assign( target, rest... );
+    }
+};
+/// end of recursion: the single remaining value goes to the last position
+template < typename T, unsigned int D > struct type_cast< T, D, 1 >
+{
+    static void assign( index< D, T >& target, T last ) { target[ D - 1 ] = last; }
+};
+} // namespace impl {
+
+template < unsigned int D, typename T > 
+template < typename... Args > inline index< D, T >::index( T t, Args... args ) // element-wise constructor: t and args are written to elements 0, 1, ... in order
+{
+    impl::type_cast< T, D, D >::assign( *this, t, args... ); // the recursion consumes one value per element, so exactly D values are expected in total
+}
+
+template < unsigned int D, typename T > inline bool index< D, T >::operator<( const index& rhs ) const // lexicographic order: the first differing element decides; a strict weak ordering, so usable as a key comparison
+{
+    for( unsigned int i = 0; i < D; ++i )
+    {
+        if( ( *this )[i] != rhs[i] ) { return ( *this )[i] < rhs[i]; }
+    }
+    return false; // all elements are equal
+}
+
+template < unsigned int D, typename T > inline bool index< D, T >::operator==( const index& rhs ) const // bytewise comparison of the D elements of type T
+{
+    return std::memcmp( reinterpret_cast< const char* >( this ), reinterpret_cast< const char* >( &rhs ), sizeof( T ) * D ) == 0; // length is taken from T, not from std::size_t, so that other element types are neither over- nor under-read
+}
+
+template < unsigned int D, typename T > inline index< D, T >& index< D, T >::increment( const index< D, T >& sizes ) // odometer-style step: the last dimension runs fastest
+{
+    for( unsigned int k = D; k > 0; --k ) // k - 1 runs from the last dimension down to the first
+    {
+        T& element = ( *this )[ k - 1 ];
+        if( ++element < sizes[ k - 1 ] ) { return *this; } else { element = 0; } // on overflow reset this dimension and carry into the previous one
+    }
+    return *this; // every dimension has wrapped: back at all zeroes
+}
+
+} } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/multidimensional/map.h b/containers/multidimensional/map.h
new file mode 100644
index 000000000..b4347d7d8
--- /dev/null
+++ b/containers/multidimensional/map.h
@@ -0,0 +1,177 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <array>
+#include <functional>
+#include <unordered_map>
+#include <boost/functional/hash.hpp>
+#include "../../base/types.h"
+#include "array_traits.h"
+
+namespace comma { namespace containers { namespace multidimensional {
+
+/// hash functor for array-like keys (boost support for them is awkward):
+/// folds elements 0..Size-1 into a single value with boost::hash_combine, starting from 0
+template < typename Array, std::size_t Size >
+struct array_hash : public std::function< std::size_t( const Array& ) > // struct array_hash : public std::unary_function< Array, std::size_t >
+{
+    std::size_t operator()( Array const& array ) const
+    {
+        std::size_t combined = 0;
+        for( std::size_t k = 0; k != Size; ++k ) { boost::hash_combine( combined, array[k] ); }
+        return combined;
+    }
+};
+
+/// unordered map keyed by integer cell indices; points of type P are converted to keys using origin and resolution
+template < typename K, typename V, std::size_t Size, typename P = std::array< K, Size >, typename Traits = impl::operations< Size > >
+class map : public std::unordered_map< std::array< comma::int32, Size >, V, array_hash< std::array< comma::int32, Size >, Size > >
+{
+    public:
+        using base_type = std::unordered_map< std::array< comma::int32, Size >, V, array_hash< std::array< comma::int32, Size >, Size > >;
+
+        using map_type = base_type;
+
+        using as_map = base_type;
+
+        enum { dimensions = Size };
+
+        using point_type = P;
+
+        using index_type = typename base_type::key_type;
+
+        using key_type = typename base_type::key_type; // same type as index_type, for brevity
+
+        using mapped_type = typename base_type::mapped_type; // for brevity
+
+        using iterator = typename base_type::iterator; // otherwise it does not build on windows...
+
+        using const_iterator = typename base_type::const_iterator; // otherwise it does not build on windows...
+
+        /// construct an empty map with the given origin and resolution
+        map( const point_type& origin, const point_type& resolution );
+
+        /// construct an empty map with the given resolution and an all-zero origin
+        map( const point_type& resolution );
+
+        /// return the element at the index of the given point, default-constructing it first, if absent
+        iterator touch_at( const point_type& point );
+
+        /// insert value at the index of the given point, unless an element is already there
+        std::pair< iterator, bool > insert( const point_type& point, const mapped_type& value );
+
+        /// index of the given point; always rounds down (floor for the given resolution)
+        key_type index_of( const point_type& point ) const;
+
+        /// static flavour of index_of( point ) with explicit origin and resolution
+        static key_type index_of( const point_type& point, const point_type& origin, const point_type& resolution );
+
+        /// static flavour of index_of( point ) with explicit resolution and an all-zero origin
+        static key_type index_of( const point_type& point, const point_type& resolution );
+
+        /// look up the element at the index of the given point
+        iterator at( const point_type& point );
+
+        /// look up the element at the index of the given point
+        const_iterator at( const point_type& point ) const;
+
+        /// look up the element by its key
+        iterator find( const key_type& index );
+
+        /// look up the element by its key
+        const_iterator find( const key_type& index ) const;
+
+        /// origin as passed on construction
+        const point_type& origin() const;
+
+        /// resolution as passed on construction
+        const point_type& resolution() const;
+
+    private:
+        point_type _origin;
+        point_type _resolution;
+};
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline map< K, V, Size, P, Traits >::map( const point_type& origin, const point_type& resolution ) // both values are stored as given
+    : _origin( origin )
+    , _resolution( resolution )
+{
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline map< K, V, Size, P, Traits >::map( const point_type& resolution ) // origin is whatever Traits::zero< P >() returns
+    : _origin( Traits::template zero< P >() )
+    , _resolution( resolution )
+{
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::touch_at( const point_type& point ) -> iterator
+{
+    const key_type key = index_of( point );
+    const iterator found = this->base_type::find( key );
+    // a default mapped_type is constructed only if there is no element at this key yet
+    return found == this->end() ? this->base_type::insert( std::make_pair( key, mapped_type() ) ).first : found;
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::insert( const point_type& point, const mapped_type& value ) -> std::pair< iterator, bool >
+{
+    return this->base_type::insert( std::make_pair( index_of( point ), value ) ); // keyed by the index of the point, not by the point itself
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::index_of( const point_type& point, const point_type& origin, const point_type& resolution ) -> key_type
+{
+    return Traits::template index_of< P, key_type >( point, origin, resolution ); // the actual computation is delegated to Traits
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::index_of( const point_type& point, const point_type& resolution ) -> key_type
+{
+    return index_of( point, Traits::template zero< P >(), resolution ); // origin is whatever Traits::zero< P >() returns
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::index_of( const point_type& point ) const -> key_type
+{
+    return index_of( point, _origin, _resolution ); // origin and resolution of this map
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::at( const point_type& point ) -> iterator
+{
+    // end() is returned, if there is no element at the index of the point
+    return this->base_type::find( index_of( point ) );
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::at( const point_type& point ) const -> const_iterator
+{
+    // end() is returned, if there is no element at the index of the point
+    return this->base_type::find( index_of( point ) );
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::find( const key_type& index ) -> iterator
+{
+    return this->base_type::find( index ); // explicit forwarding to the base class: otherwise strange things happen... debug, when we have time
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::find( const key_type& index ) const -> const_iterator
+{
+    return this->base_type::find( index ); // explicit forwarding to the base class: otherwise strange things happen... debug, when we have time
+}
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::origin() const -> const point_type& { return _origin; }
+
+template < typename K, typename V, std::size_t Size, typename P, typename Traits >
+inline auto map< K, V, Size, P, Traits >::resolution() const -> const point_type& { return _resolution; }
+
+} } } // namespace comma { namespace containers { namespace multidimensional {
diff --git a/containers/multidimensional/traits.h b/containers/multidimensional/traits.h
new file mode 100644
index 000000000..1e32fbff1
--- /dev/null
+++ b/containers/multidimensional/traits.h
@@ -0,0 +1,25 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+#pragma once
+
+#include "../../visiting/traits.h"
+#include "index.h"
+
+namespace comma { namespace visiting {
+
+template < unsigned int D, typename T > struct traits< comma::containers::multidimensional::index< D, T > >
+{
+    typedef comma::containers::multidimensional::index< D, T > value_t;
+    /// visit a mutable index exactly as its underlying std::array
+    template < typename Key, class Visitor > static void visit( const Key& k, value_t& p, Visitor& v )
+    {
+        comma::visiting::traits< typename value_t::base_t >::visit( k, static_cast< typename value_t::base_t& >( p ), v );
+    }
+    /// visit a const index exactly as its underlying std::array
+    template < typename Key, class Visitor > static void visit( const Key& k, const value_t& p, Visitor& v )
+    {
+        comma::visiting::traits< typename value_t::base_t >::visit( k, static_cast< const typename value_t::base_t& >( p ), v );
+    }
+};
+
+} } // namespace comma { namespace visiting {
diff --git a/containers/ordered/queues.h b/containers/ordered/queues.h
new file mode 100644
index 000000000..27580392a
--- /dev/null
+++ b/containers/ordered/queues.h
@@ -0,0 +1,77 @@
+// Copyright (c) 2024 Mission Systems
+
+/// @authors aspen eyers, vsevolod vlaskine
+
+#pragma once
+
+#include <deque>
+#include <tuple>
+
+namespace comma { namespace containers { namespace ordered {
+
+/// @todo variadic types
+/// @todo don't use std::pair, use traits instead?
+/// @todo max_diff: greater or greater_equal? document it; unit test on ints; unit test on max_diff 0
+/// @todo pop_all will remove the first elements from both queues, but we may want to pop just one element and still keep the other one
+///       Use case: we want to get every (valid) element from both queues with its corresponding element from the other queue and process them
+///       independently. If we pop both elements, we may lose the correspondence between the elements from the two queues. 
+/// a pair of deques of ( key, value ) pairs, accessible through std::get< 0 > and std::get< 1 >;
+/// front elements are considered matching when their keys are at most max_diff apart
+template < typename K, typename T, typename S > // K: key type, needs operator< and operator-; T, S: value types of the first and second queue
+class queues: public std::tuple< std::deque< std::pair< K, T > >, std::deque< std::pair< K, S > > >
+{
+    public:
+        typedef std::tuple< std::deque< std::pair< K, T > >, std::deque< std::pair< K, S > > > queues_type;
+        typedef std::tuple< std::pair< K, T >, std::pair< K, S > > values_type;
+        typedef std::tuple< const std::pair< K, T >&, const std::pair< K, S >& > ref_type;
+        typedef decltype( K() - K() ) diff_type;
+        queues( diff_type max_diff ): _max_diff( max_diff ) {}
+        bool ready() const; // true, if both queues are non-empty and their front keys are at most max_diff apart
+        void purge(); // drop front elements that lag behind the front of the other queue by more than max_diff
+        void pop_all(); // pop the front element of both queues; precondition: both queues are non-empty
+        ref_type front() const; // references to the front elements of both queues; precondition: both queues are non-empty
+
+    private:
+        diff_type _max_diff;
+        static diff_type _abs_diff(K lhs, K rhs) { return lhs < rhs ? (rhs - lhs) : (lhs - rhs); }
+        // true, if behind is smaller than ahead by more than max_diff; the order is checked first, so that unsigned keys cannot wrap around
+        bool _lags( const K& behind, const K& ahead ) const { return behind < ahead && ahead - behind > _max_diff; }
+        template < unsigned int I, unsigned int J > bool _purge();
+};
+
+/// @return true, if there is a matching pair of front elements
+template < typename K, typename T, typename S >
+inline bool queues<K, T, S>::ready() const
+{
+    if( std::get<0>(*this).empty() || std::get<1>(*this).empty() ) { return false; }
+    return _abs_diff( std::get<1>(*this).front().first, std::get<0>(*this).front().first ) <= _max_diff;
+}
+
+/// remove stale front elements: first from the second queue, then from the first one; does nothing, if either queue is empty
+template < typename K, typename T, typename S >
+inline void queues<K, T, S>::purge()
+{
+    auto& first = std::get<0>(*this);
+    auto& second = std::get<1>(*this);
+    // emptiness is re-checked before every front(): popping may exhaust a queue and front() of an empty deque is undefined
+    while( !first.empty() && !second.empty() && _lags( second.front().first, first.front().first ) ) { second.pop_front(); }
+    while( !first.empty() && !second.empty() && _lags( first.front().first, second.front().first ) ) { first.pop_front(); }
+}
+
+/// remove the front element from both queues; the caller has to make sure that neither queue is empty
+template < typename K, typename T, typename S >
+inline void queues<K, T, S>::pop_all()
+{
+    std::get<0>(*this).pop_front();
+    std::get<1>(*this).pop_front();
+}
+
+/// @return tuple of const references to the front elements; the caller has to make sure that neither queue is empty
+template < typename K, typename T, typename S >
+inline typename queues<K, T, S>::ref_type queues<K, T, S>::front() const
+{
+    return { std::get<0>(*this).front(), std::get<1>(*this).front() };
+}
+
+} } } // namespace comma { namespace containers { namespace ordered {
diff --git a/containers/test/CMakeLists.txt b/containers/test/CMakeLists.txt
index bdfd90360..4442cc2c5 100644
--- a/containers/test/CMakeLists.txt
+++ b/containers/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT containers )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base ${GTEST_BOTH_LIBRARIES} )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# unit tests for the containers kit:
+# a single gtest executable built from all the *test.cpp files of this directory
+set( KIT containers )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} PRIVATE ${GTEST_BOTH_LIBRARIES} comma_base pthread )
+# COMMAND names the target, which add_test replaces with the location of the built executable
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# the test executable is installed only on request
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/containers/test/array_traits_test.cpp b/containers/test/array_traits_test.cpp
new file mode 100644
index 000000000..6be69a2f3
--- /dev/null
+++ b/containers/test/array_traits_test.cpp
@@ -0,0 +1,68 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include <array>
+#include <gtest/gtest.h>
+#include "../../math/compare.h"
+#include "../multidimensional/array_traits.h"
+
+namespace ccmi = comma::containers::multidimensional::impl; 
+
+TEST( array_traits, operations_nearest )
+{
+    { // one dimension: unit resolution at zero origin, then resolution 2 at origin 1
+        typedef std::array< double, 1 > point_t;
+        typedef std::array< int, 1 > index_t;
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0.3}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0.5}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{0.999}, point_t{0}, point_t{1} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{1}, point_t{1}, point_t{2} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{1.5}, point_t{1}, point_t{2} ); EXPECT_EQ( index_t{0}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{2}, point_t{1}, point_t{2} ); EXPECT_EQ( index_t{1}, i ); }
+        { index_t i = ccmi::operations< 1 >::nearest< point_t, index_t >( point_t{2.999}, point_t{1}, point_t{2} ); EXPECT_EQ( index_t{1}, i ); }
+    }
+    { // two dimensions
+        typedef std::array< double, 2 > point_t;
+        typedef std::array< int, 2 > index_t;
+        { index_t expected{0, 0}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0.1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0.2}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{0.1, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 1}; index_t actual = ccmi::operations< 2 >::nearest< point_t, index_t >( point_t{1, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+    }
+    { // three dimensions, integer indices
+        typedef std::array< double, 3 > point_t;
+        typedef std::array< int, 3 > index_t;
+        { index_t expected{0, 0, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 0, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0.7, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 1, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0.7, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+    }
+    { // three dimensions, floating point indices
+        typedef std::array< float, 3 > point_t;
+        typedef std::array< float, 3 > index_t;
+        { index_t expected{0, 0, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 0, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 1, 0}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0.7, 0}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{0, 0, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0, 0, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+        { index_t expected{1, 1, 1}; index_t actual = ccmi::operations< 3 >::nearest< point_t, index_t >( point_t{0.7, 0.7, 0.7}, point_t{0, 0, 0}, point_t{1, 1, 1} ); EXPECT_EQ( expected, actual ); }
+    }
+}
+
+TEST( array_traits, interpolation_linear_weights )
+{
+    {
+        typedef std::array< double, 2 > point_t;
+        typedef std::array< double, 4 > weights_t;
+        { weights_t expected{1, 0, 0, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{0, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { weights_t expected{0, 1, 0, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{0, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { weights_t expected{0, 0, 1, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{1, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { weights_t expected{0, 0, 0, 1}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{1, 1}, point_t{0, 0}, point_t{1, 1} ); EXPECT_EQ( expected, actual ); }
+        { weights_t expected{0.3, 0.7, 0, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{0, 0.7}, point_t{0, 0}, point_t{1, 1} ); EXPECT_TRUE( ccmi::operations< 4 >::near( expected, actual, 1e-6 ) ); } // operations< 4 >: the weights have four elements, all of them are to be compared
+        { weights_t expected{0.3, 0, 0.7, 0}; auto actual = ccmi::operations< 2 >::interpolation::linear::weights( point_t{0.7, 0}, point_t{0, 0}, point_t{1, 1} ); EXPECT_TRUE( ccmi::operations< 4 >::near( expected, actual, 1e-6 ) ); }
+        // todo: way more testing
+    }
+}
diff --git a/containers/test/cached_test.cpp b/containers/test/cached_test.cpp
new file mode 100644
index 000000000..68f4238b5
--- /dev/null
+++ b/containers/test/cached_test.cpp
@@ -0,0 +1,148 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All Rights Reserved
+
+#include <gtest/gtest.h>
+#include <vector>
+#include <boost/functional/hash.hpp>
+#include "../cached.h"
+
+struct square // helper type for the tests below: constructible from an int, which is also its key type
+{
+    typedef int key;
+
+    square( int x ): a( x ) {}
+
+    int calculate( int x ) const { return a * x; } // product of the constructor argument and x, i.e. a square when both are the same
+
+    int a{0};
+};
+
+TEST( cached, basics ) // repeated get() with the same argument must not grow values(); a new argument adds one entry
+{
+    comma::cached< square, int > c;
+    EXPECT_EQ( c.get( 5 ).calculate( 5 ), 25 );
+    EXPECT_EQ( c.values().size(), 1 );
+    EXPECT_EQ( c.get( 5 ).calculate( 5 ), 25 );
+    EXPECT_EQ( c.values().size(), 1 );
+    EXPECT_EQ( c.get( 10 ).calculate( 10 ), 100 );
+    EXPECT_EQ( c.values().size(), 2 );
+    EXPECT_EQ( c.get( 10 ).calculate( 10 ), 100 );
+    EXPECT_EQ( c.values().size(), 2 );
+    EXPECT_EQ( c.get( 20 ).calculate( 20 ), 400 );
+    EXPECT_EQ( c.values().size(), 3 );
+    EXPECT_EQ( c.get( 20 ).calculate( 20 ), 400 );
+    EXPECT_EQ( c.values().size(), 3 );
+    c.pop(); // removes one entry; NOTE(review): the assertions below imply that the entry for 20 survives - which entry is popped is defined in cached.h, confirm
+    EXPECT_EQ( c.values().size(), 2 );
+    EXPECT_EQ( c.values().size(), 2 );
+    EXPECT_EQ( c.get( 20 ).calculate( 20 ), 400 );
+    EXPECT_EQ( c.values().size(), 2 );
+}
+
+struct someclass // helper type with a composite key and its own hash functor
+{
+    typedef std::pair< int, int > key;
+
+    struct hash // combines both elements of the key with boost::hash_combine
+    {
+        std::size_t operator()( key const& p ) const
+        {
+            std::size_t seed = 0;
+            boost::hash_combine( seed, p.first );
+            boost::hash_combine( seed, p.second );
+            return seed;
+        }
+    };
+
+    someclass( const key& k ) {} // the key is not stored
+
+    void dummy( int x, int y ) const {} // does nothing: only there to be called on the cached value
+};
+
+TEST( cached, key ) // same as basics, but with a std::pair key and a user-provided hash; get() takes the two key elements as separate arguments
+{
+    comma::cached< someclass, someclass::key, someclass::hash > c;
+    c.get( 1, 2 ).dummy( 1, 2 );
+    EXPECT_EQ( c.values().size(), 1 );
+    c.get( 1, 2 ).dummy( 1, 2 );
+    EXPECT_EQ( c.values().size(), 1 );
+    c.get( 3, 1 ).dummy( 3, 1 );
+    EXPECT_EQ( c.values().size(), 2 );
+    c.get( 3, 1 ).dummy( 3, 1 );
+    EXPECT_EQ( c.values().size(), 2 );
+}
+
+struct plan // helper type: its key ( params ) is derived from the call arguments rather than passed in directly
+{
+    struct params // key: container size plus two flags
+    {
+        int size{0};
+        bool real{false};
+        bool inverse{false};
+
+        bool operator==( const params& rhs ) const { return size == rhs.size && real == rhs.real && inverse == rhs.inverse; }
+
+        params( const std::vector< int >& v, bool real, bool inverse ): size( v.size() ), real( real ), inverse( inverse ) {} // only the size of v goes into the key, not its contents
+
+        params( const std::set< int >& v, bool x ): size( v.size() ), real( x ), inverse( x ) {} // x sets both flags
+    };
+
+    plan( const params& ) {}
+
+    void operator()( const std::vector< int >&, bool, bool ) {} // no-op: same argument list as the three-argument params constructor
+
+    void operator()( const std::set< int >&, bool ) {} // no-op: same argument list as the two-argument params constructor
+
+    void size() {}
+};
+
+namespace std {
+
+template <> struct hash< plan::params > // non-intrusive hashing: std::hash specialised for the key type, no hash template argument needed in comma::cached
+{
+    std::size_t operator()( plan::params const& k ) const
+    {
+        std::size_t seed = 0; // all three fields compared by params::operator== go into the hash
+        boost::hash_combine( seed, k.size );
+        boost::hash_combine( seed, k.real );
+        boost::hash_combine( seed, k.inverse );
+        return seed;
+    }
+};
+
+} // namespace std {
+
+TEST( cached, hashing_non_intrusive ) // the key is built from the get() arguments and hashed through the std::hash specialisation
+{
+    comma::cached< plan, plan::params > c;
+    c.get( std::vector< int >{ 1, 2, 3 }, true, false )( std::vector< int >{ 1, 2, 3 }, true, false );
+    EXPECT_EQ( c.values().size(), 1 );
+    c.get( std::vector< int >{ 1, 2, 3 }, true, false )( std::vector< int >{ 1, 2, 3 }, true, false );
+    EXPECT_EQ( c.values().size(), 1 );
+    c.get( std::vector< int >{ 1, 2 }, true, false )( std::vector< int >{ 1, 2 }, true, false ); // different vector size, hence a different key
+    EXPECT_EQ( c.values().size(), 2 );
+    c.get( std::vector< int >{ 1, 2 }, true, false )( std::vector< int >{ 1, 2 }, true, false );
+    c.get( std::vector< int >{ 1, 2 }, true, false ).size();
+    EXPECT_EQ( c.values().size(), 2 );
+}
+
+TEST( cached, operators ) // same checks through operator() of comma::cached instead of get()
+{
+    comma::cached< plan, plan::params > plans;
+    plans( std::vector< int >{ 1, 2, 3 }, true, false );
+    EXPECT_EQ( plans.values().size(), 1 );
+    plans( std::vector< int >{ 1, 2, 3 }, true, false );
+    EXPECT_EQ( plans.values().size(), 1 );
+    plans( std::vector< int >{ 1, 2 }, true, false );
+    EXPECT_EQ( plans.values().size(), 2 );
+    plans( std::vector< int >{ 1, 2 }, true, false );
+    EXPECT_EQ( plans.values().size(), 2 );
+
+    plans( std::set< int >{ 1, 2 }, true ); // key is size 2 with both flags true: not seen before
+    EXPECT_EQ( plans.values().size(), 3 );
+    plans( std::set< int >{ 1, 2 }, true );
+    EXPECT_EQ( plans.values().size(), 3 );
+    plans( std::vector< int >{ 1, 2 }, true, true ); // yields the same key as the std::set calls above, so no new entry
+    EXPECT_EQ( plans.values().size(), 3 );
+}
+
diff --git a/containers/test/cyclic_buffer_test.cpp b/containers/test/cyclic_buffer_test.cpp
index 29eb69e8e..cc12f841d 100644
--- a/containers/test/cyclic_buffer_test.cpp
+++ b/containers/test/cyclic_buffer_test.cpp
@@ -29,6 +29,7 @@
 
 
 #include <gtest/gtest.h>
+#include "../../base/exception.h"
 #include "../cyclic_buffer.h"
 
 namespace comma {
@@ -82,8 +83,7 @@ TEST( cyclic_buffer, push_pop )
         EXPECT_EQ( b.size(), 4 - i );
     }
     EXPECT_TRUE( b.empty() );
-    EXPECT_EQ( b.size(), 0u );    
-    
+    EXPECT_EQ( b.size(), 0u );
     for( unsigned int i = 0; i < 5u; ++i )
     {
         b.push( i );
@@ -92,6 +92,28 @@ TEST( cyclic_buffer, push_pop )
     EXPECT_EQ( b.size(), 1u );    
 }
 
+TEST( cyclic_buffer, push_force ) // push on a full buffer throws, unless the second argument is true: then the oldest element is overwritten
+{
+    cyclic_buffer< unsigned int > b( 3 );
+    b.push( 0 );
+    b.push( 1 );
+    b.push( 2 );
+    EXPECT_EQ( b.front(), 0u ); // unsigned literals: the element type is unsigned int
+    EXPECT_EQ( b.back(), 2u );
+    EXPECT_THROW( b.push( 3 ), comma::exception );
+    b.push( 3, true );
+    EXPECT_EQ( b.front(), 1u );
+    EXPECT_EQ( b.back(), 3u );
+    EXPECT_THROW( b.push( 4 ), comma::exception );
+    b.push( 4, true );
+    EXPECT_EQ( b.front(), 2u );
+    EXPECT_EQ( b.back(), 4u );
+    EXPECT_THROW( b.push( 5 ), comma::exception );
+    b.push( 5, true );
+    EXPECT_EQ( b.front(), 3u );
+    EXPECT_EQ( b.back(), 5u );
+}
+
 TEST( cyclic_buffer, fixed_cyclic_buffer )
 {
     fixed_cyclic_buffer< unsigned int, 3 > b;
diff --git a/containers/test/multidimensional_array_test.cpp b/containers/test/multidimensional_array_test.cpp
new file mode 100644
index 000000000..8a48b321e
--- /dev/null
+++ b/containers/test/multidimensional_array_test.cpp
@@ -0,0 +1,285 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include <gtest/gtest.h>
+//#include <boost/date_time/posix_time/posix_time.hpp>
+#include "../multidimensional/array.h"
+
+namespace cmd = comma::containers::multidimensional; 
+
+TEST( multidimensional_array, impl_index_value )
+{
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {0, 0}, {1, 5} ), 0 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {0, 1}, {1, 5} ), 1 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {0, 4}, {1, 5} ), 4 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {1, 0}, {1, 5} ), 5 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {1, 1}, {2, 5} ), 6 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {1, 2}, {2, 5} ), 7 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {1, 2}, {3, 5} ), 7 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::value( {2, 2}, {3, 5} ), 12 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {0, 0, 0}, {2, 3, 4} ), 0 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {0, 0, 3}, {2, 3, 4} ), 3 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {0, 1, 3}, {2, 3, 4} ), 7 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {1, 2, 3}, {2, 3, 4} ), 3 + 4 * ( 2 + 3 * 1 ) );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::value( {1, 2, 4}, {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
+}
+
+TEST( multidimensional_array, impl_index_product )
+{
+    EXPECT_EQ( cmd::impl::index_traits< 1 >::product( {2} ), 2 );
+    EXPECT_EQ( cmd::impl::index_traits< 2 >::product( {2, 3} ), 6 );
+    EXPECT_EQ( cmd::impl::index_traits< 3 >::product( {2, 3, 4} ), 2 * 3 * 4 );
+    EXPECT_EQ( cmd::impl::index_traits< 4 >::product( {2, 3, 4, 5} ), 2 * 3 * 4 * 5 );
+}
+
+TEST( multidimensional_array, impl_index_inverted_value )
+{ // value( offset, shape ): maps a flat offset back to a 3-component index; per the cases below the last component varies fastest
+    typedef std::array< std::size_t, 3 > array_t;
+    { array_t a{0, 0, 0}; EXPECT_EQ( cmd::impl::index_traits< 3 >::value( 0, {2, 3, 4} ), a ); }
+    { array_t a{0, 0, 1}; EXPECT_EQ( cmd::impl::index_traits< 3 >::value( 1, {2, 3, 4} ), a ); }
+    { array_t a{2, 1, 3}; EXPECT_EQ( cmd::impl::index_traits< 3 >::value( 3 + 4 * ( 1 + 3 * 2 ), {2, 3, 4} ), a ); }
+    // todo: way more tests
+}
+
+TEST( multidimensional_array, index )
+{ // checks equality between array::index_type and cmd::index in both operand orders, then element lookup by index
+    {
+        cmd::array< int, 3 > a( {2, 3, 4}, 0 );
+        unsigned int i = 0;
+        for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; } // fill with 0, 1, 2, ... in iteration order
+        typedef cmd::array< int, 3 >::index_type array_index_t;
+        typedef cmd::index< 3 > index_t;
+        EXPECT_EQ( ( array_index_t{1, 2, 3} ), ( index_t{1, 2, 3} ) );
+        EXPECT_EQ( ( index_t{1, 2, 3} ), ( array_index_t{1, 2, 3} ) );
+        EXPECT_EQ( ( a[{1, 2, 3}]), 23 );
+        EXPECT_EQ( ( a[ index_t( {1, 2, 3} )] ), 23 );
+        EXPECT_EQ( ( a[ index_t( {0, 1, 0} )] ), 4 ); // a second, distinct element: 0 + 4 * ( 1 + 3 * 0 )
+    }
+}
+
+TEST( multidimensional_array, iteration )
+{
+    {
+        typedef std::array< std::size_t, 3 > array_t;
+        cmd::array< int, 3 > a( {2, 3, 4}, 0 );
+        { array_t s{2, 3, 4}; EXPECT_EQ( a.shape(), s ); EXPECT_EQ( a.data().size(), 2 * 3 * 4 ); }
+        unsigned int i = 0;
+        for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
+        i = 0;
+        for( auto it = a.data().begin(); it != a.data().end(); ++it ) { EXPECT_EQ( *it, i++ ); }
+        auto it = a.begin();
+        { array_t a{0, 0, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 0 ); ++it; }
+        { array_t a{0, 0, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 1 ); ++it; }
+        { array_t a{0, 0, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 2 ); ++it; }
+        { array_t a{0, 0, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 3 ); ++it; }
+        { array_t a{0, 1, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 4 ); ++it; }
+        { array_t a{0, 1, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 5 ); ++it; }
+        { array_t a{0, 1, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 6 ); ++it; }
+        { array_t a{0, 1, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 7 ); ++it; }
+        { array_t a{0, 2, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 8 ); ++it; }
+        { array_t a{0, 2, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 9 ); ++it; }
+        { array_t a{0, 2, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 10 ); ++it; }
+        { array_t a{0, 2, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 11 ); ++it; }
+        { array_t a{1, 0, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 12 ); ++it; }
+        { array_t a{1, 0, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 13 ); ++it; }
+        { array_t a{1, 0, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 14 ); ++it; }
+        { array_t a{1, 0, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 15 ); ++it; }
+        { array_t a{1, 1, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 16 ); ++it; }
+        { array_t a{1, 1, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 17 ); ++it; }
+        { array_t a{1, 1, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 18 ); ++it; }
+        { array_t a{1, 1, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 19 ); ++it; }
+        { array_t a{1, 2, 0}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 20 ); ++it; }
+        { array_t a{1, 2, 1}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 21 ); ++it; }
+        { array_t a{1, 2, 2}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 22 ); ++it; }
+        { array_t a{1, 2, 3}; EXPECT_EQ( it.index(), a ); EXPECT_EQ( *it, 23 ); ++it; }
+        EXPECT_TRUE( it == a.end() );
+    }
+}
+
+TEST( multidimensional_array, array )
+{
+    {
+        cmd::array< int, 3 > a( {2, 3, 4}, 0 );
+        unsigned int i = 0;
+        for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
+        EXPECT_EQ( ( a[{0, 0, 0}] ), 0 );
+        EXPECT_EQ( ( a[{0, 1, 0}] ), 4 );
+        EXPECT_EQ( ( a[{1, 2, 3}] ), 23 );
+        a[{0, 0, 0}] = 111; EXPECT_EQ( ( a[{0, 0, 0}] ), 111 );
+        a[{1, 1, 2}] = 222; EXPECT_EQ( ( a[{1, 1, 2}] ), 222 );
+        a[{1, 2, 3}] = 333; EXPECT_EQ( ( a[{1, 2, 3}] ), 333 );
+    }
+}
+
+TEST( multidimensional_array, slice )
+{
+    {
+        {
+            cmd::array< int, 3 > a( {2, 3, 4}, 0 );
+            unsigned int i = 0;
+            for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
+            typedef cmd::array< int, 2 >::index_type index_t;
+            cmd::slice< int, 2 > s = a.at( 0 );
+            { index_t i{0, 0}; EXPECT_EQ( s[i], 0 ); }
+            { index_t i{0, 1}; EXPECT_EQ( s[i], 1 ); }
+            { index_t i{0, 2}; EXPECT_EQ( s[i], 2 ); }
+            { index_t i{0, 3}; EXPECT_EQ( s[i], 3 ); }
+            { index_t i{1, 0}; EXPECT_EQ( s[i], 4 ); }
+            { index_t i{1, 1}; EXPECT_EQ( s[i], 5 ); }
+            { index_t i{1, 2}; EXPECT_EQ( s[i], 6 ); }
+            { index_t i{1, 3}; EXPECT_EQ( s[i], 7 ); }
+            { index_t i{2, 0}; EXPECT_EQ( s[i], 8 ); }
+            { index_t i{2, 1}; EXPECT_EQ( s[i], 9 ); }
+            { index_t i{2, 2}; EXPECT_EQ( s[i], 10 ); }
+            { index_t i{2, 3}; EXPECT_EQ( s[i], 11 ); }
+            {
+                auto t = s.at( 0 );
+                typedef cmd::array< int, 1 >::index_type index_t;
+                { index_t i{0}; EXPECT_EQ( t[i], 0 ); }
+                { index_t i{1}; EXPECT_EQ( t[i], 1 ); }
+                { index_t i{2}; EXPECT_EQ( t[i], 2 ); }
+                { index_t i{3}; EXPECT_EQ( t[i], 3 ); }
+                t = s.at( 1 );
+                { index_t i{0}; EXPECT_EQ( t[i], 4 ); }
+                { index_t i{1}; EXPECT_EQ( t[i], 5 ); }
+                { index_t i{2}; EXPECT_EQ( t[i], 6 ); }
+                { index_t i{3}; EXPECT_EQ( t[i], 7 ); }
+            }
+            s = a.at( 1 );
+            { index_t i{0, 0}; EXPECT_EQ( s[i], 12 ); }
+            { index_t i{0, 1}; EXPECT_EQ( s[i], 13 ); }
+            { index_t i{0, 2}; EXPECT_EQ( s[i], 14 ); }
+            { index_t i{0, 3}; EXPECT_EQ( s[i], 15 ); }
+            { index_t i{1, 0}; EXPECT_EQ( s[i], 16 ); }
+            { index_t i{1, 1}; EXPECT_EQ( s[i], 17 ); }
+            { index_t i{1, 2}; EXPECT_EQ( s[i], 18 ); }
+            { index_t i{1, 3}; EXPECT_EQ( s[i], 19 ); }
+            { index_t i{2, 0}; EXPECT_EQ( s[i], 20 ); }
+            { index_t i{2, 1}; EXPECT_EQ( s[i], 21 ); }
+            { index_t i{2, 2}; EXPECT_EQ( s[i], 22 ); }
+            { index_t i{2, 3}; EXPECT_EQ( s[i], 23 ); }
+            s[{1, 3}] = 111; EXPECT_EQ( ( a[{1, 1, 3}] ), 111 );
+        }
+        {
+            cmd::array< int, 3 > a( {2, 3, 4}, 0 );
+            unsigned int i = 0;
+            for( auto it = a.begin(); it != a.end(); ++it ) { *it = i++; }
+            typedef cmd::array< int, 1 >::index_type index_t;
+            {
+                cmd::slice< int, 1 > s = a.at< 2 >( {0, 0} ); // todo! super-ugly! improve templating!
+                { index_t i{0}; EXPECT_EQ( s[i], 0 ); } // todo: improve usage on 1-dimensional slices
+                { index_t i{1}; EXPECT_EQ( s[i], 1 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 2 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 3 ); }
+                s = a.at< 2 >( {0, 1} );
+                { index_t i{0}; EXPECT_EQ( s[i], 4 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 5 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 6 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 7 ); }
+                s = a.at< 2 >( {0, 2} );
+                { index_t i{0}; EXPECT_EQ( s[i], 8 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 9 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 10 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 11 ); }
+                s = a.at< 2 >( {1, 0} );
+                { index_t i{0}; EXPECT_EQ( s[i], 12 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 13 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 14 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 15 ); }
+                s = a.at< 2 >( {1, 1} );
+                { index_t i{0}; EXPECT_EQ( s[i], 16 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 17 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 18 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 19 ); }
+                s = a.at< 2 >( {1, 2} );
+                { index_t i{0}; EXPECT_EQ( s[i], 20 ); }
+                { index_t i{1}; EXPECT_EQ( s[i], 21 ); }
+                { index_t i{2}; EXPECT_EQ( s[i], 22 ); }
+                { index_t i{3}; EXPECT_EQ( s[i], 23 ); }
+            }
+        }
+    }
+}
+
+TEST( multidimensional_array, grid_index )
+{
+    {
+        cmd::grid< double, 2 > g( {0, 0}, {1, 1}, {2, 3}, 0 );
+        typedef std::array< std::size_t, 2 > index_t;
+        int i = 0;
+        for( auto it = g.begin(); it != g.end(); ++it ) { *it = i++; }
+        { index_t i = {0, 0}; EXPECT_EQ( g.index_of( {0, 0} ), i ); }
+        { index_t i = {0, 1}; EXPECT_EQ( g.index_of( {0, 1} ), i ); }
+        { index_t i = {1, 0}; EXPECT_EQ( g.index_of( {1, 0} ), i ); }
+        { index_t i = {1, 1}; EXPECT_EQ( g.index_of( {1, 1} ), i ); }
+        { index_t i = {0, 1}; EXPECT_EQ( g.index_of( {0, 1.01} ), i ); }
+        // todo: more tests
+    }
+}
+
+TEST( multidimensional_array, grid_interpolate )
+{ // interpolation on a 2x2 grid; floating-point results are compared with EXPECT_DOUBLE_EQ rather than exact equality
+    {
+        cmd::grid< double, 2 > g( {0, 0}, {1, 1}, {2, 2}, 0 );
+        g[{0, 0}] = 0; g[{0, 1}] = 1; g[{1, 0}] = 0; g[{1, 1}] = 1; // node value equals the second index
+        EXPECT_DOUBLE_EQ( g.interpolated( {0, 0} ), 0 );
+        EXPECT_DOUBLE_EQ( g.interpolated( {0, 0.5} ), 0.5 );
+        EXPECT_DOUBLE_EQ( g.interpolated( {0.5, 0.5} ), 0.5 );
+        //EXPECT_EQ( g.interpolated( {0.5, 0} ), 0.5 ); // NOTE(review): the disabled expectations look inconsistent with the node values set above - confirm before re-enabling
+        //EXPECT_EQ( g.interpolated( {1, 0} ), 2 );
+        //EXPECT_EQ( g.interpolated( {1, 1} ), 3 );
+    }
+}
+
+// TEST( vector_of_vectors, performance )
+// {
+//     //std::pair< unsigned int, unsigned int > size{ 10000000, 4 };
+//     std::pair< unsigned int, unsigned int > size{ 4096, 8 };
+//     std::vector< std::vector< float > > a( size.first, std::vector< float >( size.second, 0 ) );
+//     std::vector< float > b( size.first * size.second, 0 );
+//     {
+//         auto t0 = boost::posix_time::microsec_clock::universal_time();
+//         for( auto& c: a )
+//         {
+//             for( auto& d: c )
+//             {
+//                 d += 10;
+//             }
+//         }
+//         auto t1 = boost::posix_time::microsec_clock::universal_time();
+//         for( auto& d: b )
+//         {
+//             d += 10;
+//         }
+//         auto t2 = boost::posix_time::microsec_clock::universal_time();
+//         auto e0 = double( ( t1 - t0 ).total_microseconds() ) / 1e6;
+//         auto e1 = double( ( t2 - t1 ).total_microseconds() ) / 1e6;
+//         //std::cerr << "==> cache hits:\tspeedup: " << ( e0 / e1 ) << "\tvector of vectors: elapsed: " << e0 << "\tvector: elapsed: " << e1 << std::endl;
+//         std::cerr << "==> cache hits:\tspeedup: " << ( e0 / e1 ) << std::endl;
+//     }
+//     {
+//         std::vector< float > z( size.first * size.second, 0 );
+//         auto t0 = boost::posix_time::microsec_clock::universal_time();
+//         for( unsigned int i = 0; i < b.size(); ++i ) { z[i] = b[i]; }
+//         auto t1 = boost::posix_time::microsec_clock::universal_time();
+//         std::memcpy( reinterpret_cast< char* >( &z[0] ), reinterpret_cast< const char* >( &b[0] ), b.size() * sizeof( b[0] ) );
+//         auto t2 = boost::posix_time::microsec_clock::universal_time();
+//         auto e0 = double( ( t1 - t0 ).total_microseconds() ) / 1e6;
+//         auto e1 = double( ( t2 - t1 ).total_microseconds() ) / 1e6;
+//         //std::cerr << "==> memcpy:\tspeedup: " << ( e0 / e1 ) << "\tvector of vectors: elapsed: " << e0 << "\tvector: elapsed: " << e1 << std::endl;
+//         std::cerr << "==> memcpy vs element-wise assignment:\tspeedup: " << ( e0 / e1 ) << std::endl;
+//     }
+//     {
+//         std::vector< float > z( size.first * size.second, 0 );
+//         auto t0 = boost::posix_time::microsec_clock::universal_time();
+//         std::copy( b.begin(), b.end(), z.begin() );
+//         auto t1 = boost::posix_time::microsec_clock::universal_time();
+//         std::memcpy( reinterpret_cast< char* >( &z[0] ), reinterpret_cast< const char* >( &b[0] ), b.size() * sizeof( b[0] ) );
+//         auto t2 = boost::posix_time::microsec_clock::universal_time();
+//         auto e0 = double( ( t1 - t0 ).total_microseconds() ) / 1e6;
+//         auto e1 = double( ( t2 - t1 ).total_microseconds() ) / 1e6;
+//         //std::cerr << "==> memcpy:\tspeedup: " << ( e0 / e1 ) << "\tvector of vectors: elapsed: " << e0 << "\tvector: elapsed: " << e1 << std::endl;
+//         std::cerr << "==> memcpy vs std::copy:\tspeedup: " << ( e0 / e1 ) << std::endl;
+//     }
+//     // todo! multidimensional::array performance
+// }
diff --git a/containers/test/multidimensional_index_test.cpp b/containers/test/multidimensional_index_test.cpp
new file mode 100644
index 000000000..186ac816b
--- /dev/null
+++ b/containers/test/multidimensional_index_test.cpp
@@ -0,0 +1,80 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include <gtest/gtest.h>
+//#include <boost/date_time/posix_time/posix_time.hpp>
+#include "../multidimensional/index.h"
+
+namespace cmd = comma::containers::multidimensional; 
+
+TEST( multidimensional_index, basics )
+{
+    { // default construction: every component is expected to be zero
+        cmd::index< 4 > i;
+        EXPECT_EQ( i[0], 0 );
+        EXPECT_EQ( i[1], 0 );
+        EXPECT_EQ( i[2], 0 );
+        EXPECT_EQ( i[3], 0 );
+    }
+    { // empty-brace initialisation: same all-zero result
+        cmd::index< 4 > i{};
+        EXPECT_EQ( i[0], 0 );
+        EXPECT_EQ( i[1], 0 );
+        EXPECT_EQ( i[2], 0 );
+        EXPECT_EQ( i[3], 0 );
+    }
+    { // brace initialisation with explicit components
+        cmd::index< 4 > i{0, 1, 2, 3};
+        EXPECT_EQ( i[0], 0 );
+        EXPECT_EQ( i[1], 1 );
+        EXPECT_EQ( i[2], 2 );
+        EXPECT_EQ( i[3], 3 );
+    }
+    { // one-dimensional index: comparison and increment against the bound j
+        cmd::index< 1 > i;
+        cmd::index< 1 > j{5};
+        EXPECT_TRUE( i < j );
+        EXPECT_TRUE( i != j );
+        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{1} );
+        EXPECT_EQ( i.increment( j ), cmd::index< 1 >{2} );
+    }
+    { // two-dimensional index: increment( j ) advances the last component first and wraps to {0, 0} after {2, 1}
+        cmd::index< 2 > i;
+        cmd::index< 2 > j{3, 2};
+        EXPECT_EQ( i               , ( cmd::index< 2 >{0, 0} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0, 1} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1, 0} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{1, 1} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2, 0} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{2, 1} ) );
+        EXPECT_TRUE( i < j );
+        EXPECT_EQ( i.increment( j ), ( cmd::index< 2 >{0, 0} ) );
+        EXPECT_TRUE( i == cmd::index< 2 >{} );
+    }
+    { // iterator built from {3, 2}: converts to false once it has wrapped back to {0, 0}
+        cmd::index< 2 >::iterator i{{3u, 2u}};
+        EXPECT_TRUE( bool( i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 0u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 1u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{1u, 0u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{1u, 1u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{2u, 0u} ) );
+        EXPECT_TRUE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{2u, 1u} ) );
+        EXPECT_FALSE( bool( ++i ) );
+        EXPECT_EQ( *i, ( cmd::index< 2 >{0u, 0u} ) );
+    }
+    { // a full pass with the iterator is expected to visit 3 * 2 = 6 indices
+        unsigned int count{0};
+        for( cmd::index< 2 >::iterator i{{3u, 2u}}; i; ++i, ++count ); // empty body: only counting
+        EXPECT_EQ( count, 6 );
+    }
+}
diff --git a/containers/test/multidimensional_map_test.cpp b/containers/test/multidimensional_map_test.cpp
new file mode 100644
index 000000000..e0516f19d
--- /dev/null
+++ b/containers/test/multidimensional_map_test.cpp
@@ -0,0 +1,141 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#include <gtest/gtest.h>
+#include "../multidimensional/map.h"
+
+TEST( multikey_map, usage )
+{
+    comma::containers::multidimensional::map< double, int, 3 > m( { 0, 0, 0 }, { 1, 2, 3 } );
+    m.touch_at( { 1, 2, 3 } );
+    // todo
+}
+
+TEST( multikey_map, index )
+{
+    typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
+    {
+        map_type m( {1, 1, 1} );
+        {
+            map_type::index_type i = {{ 0, 0, 0 }};
+            EXPECT_EQ( i, m.index_of( {0., 0., 0.} ) );
+            EXPECT_EQ( i, m.index_of( {0.001, 0.001, 0.001} ) );
+            EXPECT_EQ( i, m.index_of( {0.999, 0.999, 0.999} ) );
+        }
+        {
+            map_type::index_type i = {{ 1, 1, 1 }};
+            EXPECT_EQ( i, m.index_of( {1.0, 1.0, 1.0} ) );
+            EXPECT_EQ( i, m.index_of( {1.001, 1.001, 1.001} ) );
+            EXPECT_EQ( i, m.index_of( {1.999, 1.999, 1.999} ) );
+        }
+        {
+            map_type::index_type i = {{ -1, -1, -1 }};
+            EXPECT_EQ( i, m.index_of( {-1.0, -1.0, -1.0} ) );
+            EXPECT_EQ( i, m.index_of( {-0.999, -0.999, -0.999} ) );
+            EXPECT_EQ( i, m.index_of( {-0.001, -0.001, -0.001} ) );
+        }
+    }
+    {
+        map_type m( {0.3, 0.3, 0.3} );
+        {
+            map_type::index_type i = {{ 0, 0, 0 }};
+            EXPECT_EQ( i, m.index_of( {0, 0, 0} ) );
+            EXPECT_EQ( i, m.index_of( {0.001, 0.001, 0.001} ) );
+            EXPECT_EQ( i, m.index_of( {0.299, 0.299, 0.299} ) );
+        }        
+        {
+            map_type::index_type i = {{ 1, 1, 1 }};
+            EXPECT_EQ( i, m.index_of( {0.3, 0.3, 0.3} ) );
+            EXPECT_EQ( i, m.index_of( {0.3001, 0.3001, 0.3001} ) );
+            EXPECT_EQ( i, m.index_of( {0.3999, 0.3999, 0.3999} ) );
+        }
+        {
+            map_type::index_type i = {{ -1, -1, -1 }};
+            EXPECT_EQ( i, m.index_of( {-0.3, -0.3, -0.3} ) );
+            EXPECT_EQ( i, m.index_of( {-0.299, -0.299, -0.299} ) );
+            EXPECT_EQ( i, m.index_of( {-0.001, -0.001, -0.001} ) );
+        }        
+    }
+}
+
+TEST( multikey_map, operations )
+{
+    typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
+    map_type m( {1, 1, 1} );
+    {
+        EXPECT_TRUE( ( m.at( map_type::point_type{1., 1., 1.} ) == m.end() ) );
+        EXPECT_TRUE( ( m.touch_at( map_type::point_type{1., 1., 1.} ) != m.end() ) );
+        EXPECT_EQ( 1, m.size() );
+        EXPECT_TRUE( ( m.at( map_type::point_type{1., 1., 1.} ) != m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{1., 1., 1.} ) == m.at( map_type::point_type{1.1, 1.1, 1.1} ) ) );
+        EXPECT_TRUE( ( m.touch_at( {1, 1, 1} ) != m.end() ) );
+        EXPECT_EQ( 1, m.size() );
+        EXPECT_TRUE( ( m.touch_at( {1.1, 1.1, 1.1} ) != m.end() ) );
+        EXPECT_EQ( 1, m.size() );
+    }
+    {
+        EXPECT_TRUE( ( m.at( map_type::point_type{-1., -1., -1.} ) == m.end() ) );
+        EXPECT_TRUE( ( m.touch_at( {-1., -1., -1.} ) != m.end() ) );
+        EXPECT_EQ( 2, m.size() );
+        EXPECT_TRUE( ( m.at( map_type::point_type{-1., -1., -1.} ) != m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{-1., -1., -1.} ) == m.at( map_type::point_type{-0.1, -0.1, -0.1} ) ) );
+        EXPECT_TRUE( ( m.touch_at( {-1., -1., -1.} ) != m.end() ) );
+        EXPECT_EQ( 2, m.size() );
+        EXPECT_TRUE( ( m.touch_at( {-0.1, -0.1, -0.1} ) != m.end() ) );
+        EXPECT_EQ( 2, m.size() );
+    }
+    {
+        EXPECT_TRUE( ( m.at( map_type::point_type{0., 0., 0.} ) == m.end() ) );
+        EXPECT_TRUE( ( m.touch_at( {0., 0., 0.} ) != m.end() ) );
+        EXPECT_EQ( 3, m.size() );
+        EXPECT_TRUE( ( m.at( map_type::point_type{0., 0, 0} ) != m.end() ) );
+        EXPECT_TRUE( ( m.at( map_type::point_type{0., 0, 0} ) == m.at( map_type::point_type{0.1, 0.1, 0.1} ) ) );
+        EXPECT_TRUE( ( m.touch_at( {0., 0, 0} ) != m.end() ) );
+        EXPECT_EQ( 3, m.size() );
+        EXPECT_TRUE( ( m.touch_at( {0.1, 0.1, 0.1} ) != m.end() ) );
+        EXPECT_EQ( 3, m.size() );
+    }
+}
+
+TEST( multikey_map, test )
+{ // a freshly constructed map is expected to report empty()
+    typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
+    map_type m( {1, 1, 1} );
+    EXPECT_TRUE( m.empty() );
+}
+
+TEST( multikey_map, neighbourhood )
+{
+    typedef comma::containers::multidimensional::map< double, int, 3 > map_type;
+    map_type m( {1, 1, 1} );
+    {
+        EXPECT_TRUE( ( m.at( map_type::point_type{1, 1, 1} ) == m.end() ) );
+        {
+            EXPECT_TRUE( ( m.touch_at( {1, 1, 1} ) != m.end() ) );
+            EXPECT_EQ( 1, m.size() );
+            m.touch_at( {1, 1, 1} )->second = 111;
+            EXPECT_EQ( 111, m.at( map_type::point_type{1, 1, 1} )->second );
+            map_type::index_type index = {{ 1, 1, 1 }};
+            EXPECT_EQ( 111, m.base_type::find( index )->second );
+        }
+        {
+            EXPECT_TRUE( ( m.touch_at( {2, 2, 2} ) != m.end() ) );
+            EXPECT_EQ( 2, m.size() );
+            m.touch_at( {2, 2, 2} )->second = 222;
+            EXPECT_EQ( 222, m.at( map_type::point_type{2, 2, 2} )->second );
+            map_type::index_type index = {{ 2, 2, 2 }};
+            EXPECT_EQ( 222, m.base_type::find( index )->second );
+        }
+        {
+            map_type::index_type index = {{ -1, 0, 0 }};
+            EXPECT_TRUE( m.base_type::find( index ) == m.end() );
+        }
+        {
+            map_type::index_type index = {{ 0, 0, 0 }};
+            EXPECT_TRUE( m.base_type::find( index ) == m.end() );
+        }
+        {
+            map_type::index_type index = {{ 2, 2, 3 }};
+            EXPECT_TRUE( m.base_type::find( index ) == m.end() );
+        }
+    }
+}
diff --git a/containers/test/ordered_queues_test.cpp b/containers/test/ordered_queues_test.cpp
new file mode 100644
index 000000000..923197ea7
--- /dev/null
+++ b/containers/test/ordered_queues_test.cpp
@@ -0,0 +1,202 @@
+// Copyright (c) 2023 Mission Systems Pty Ltd
+
+#include <gtest/gtest.h>
+#include <boost/date_time/posix_time/posix_time.hpp>
+#include "../ordered/queues.h"
+
+TEST( queues, usage )
+{
+    typedef comma::containers::ordered::queues< int, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/  };
+
+    EXPECT_EQ( std::get<0>(q).size(), 0 );
+    EXPECT_EQ( std::get<1>(q).size(), 0 );
+    EXPECT_EQ( q.ready(), false );
+
+    std::get<0>(q).push_back( std::make_pair( 0, 1 ) );
+    EXPECT_EQ( std::get<0>(q).front().second, 1 );
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 0 );
+    EXPECT_EQ( q.ready(), false );
+
+    std::get<1>(q).push_back( std::make_pair( 0, 1 ) );
+    EXPECT_EQ( std::get<1>(q).front().second, 1 );
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+
+    // Purge should only remove items if they are unsynced
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).front().second, 1 );
+    EXPECT_EQ( std::get<1>(q).front().second, 1 );
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+}
+
+TEST( queues, sync_first_to_second ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/  };
+
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {0, 0}, {2, 0}, {4, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    EXPECT_EQ( q.ready(), false );
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 4 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );    
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+
+}
+
+TEST( queues, sync_second_to_first ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/  };
+
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {1, 0}, {2, 0}, {4, 5} });
+    EXPECT_EQ( q.ready(), false );
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 5 );
+    EXPECT_EQ( std::get<1>(q).front().first, 4 );    
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+
+}
+
+TEST( queues, empty_list_before_sync ){ // purge() is expected to drain queue 0 completely, leaving the set not ready
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {0, 0}, {1, 0}, {2, 5} }); // keys 0, 1, 2: presumably dropped for being more than the timeout (2) away from key 5 - confirm against purge()
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 0 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), false );
+}
+
+TEST( queues, sync_and_pop ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 0.9 /*timeout*/ };
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {0, 1}, {1, 1}, {2, 1}, {3, 1}, {4, 1}, {5, 1} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {3, 2}, {5, 2}});
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 3 ); // {3, 1}, {4, 1}, {5, 1} });
+    EXPECT_EQ( std::get<1>(q).size(), 2 ); // {3, 2}, {5, 2}});
+    EXPECT_EQ( std::get<0>(q).front().first, 3 );
+    EXPECT_EQ( std::get<1>(q).front().first, 3 );
+    EXPECT_EQ( q.ready(), true );
+
+    auto data = q.front();
+    q.pop_all();
+    EXPECT_EQ( std::get<0>(data).first, 3 );
+    EXPECT_EQ( std::get<1>(data).first, 3 );
+    EXPECT_EQ( std::get<0>(q).size(), 2 ); // {4, 1}, {5, 1} });
+    EXPECT_EQ( std::get<1>(q).size(), 1 ); // {5, 2}});
+    EXPECT_EQ( std::get<0>(q).front().first, 4 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );
+
+    EXPECT_EQ( q.ready(), false );
+    q.purge();
+    EXPECT_EQ( q.ready(), true );
+
+    EXPECT_EQ( std::get<0>(q).size(), 1 ); // {5, 1} });
+    EXPECT_EQ( std::get<1>(q).size(), 1 ); // {5, 2}});
+    EXPECT_EQ( std::get<0>(q).front().first, 5 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );
+    EXPECT_EQ( q.ready(), true );
+}
+
+TEST( queues, max_time_offset ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {3, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 3 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );        
+    EXPECT_EQ( q.ready(), true );
+}
+
+TEST( queues, floating_point_error ){
+    typedef comma::containers::ordered::queues< float, int, int > queues_t;
+    {
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {3.000001, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_NEAR( std::get<0>(q).front().first, 3.000001, 1e-6 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );        
+    EXPECT_EQ( q.ready(), true );
+    }
+    {
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {2.999999, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 0 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().first, 5 );        
+    EXPECT_EQ( q.ready(), false );
+    }
+    {
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {3.000001, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<1>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 5 );
+    EXPECT_NEAR( std::get<1>(q).front().first, 3.000001, 1e-6 );
+    EXPECT_EQ( q.ready(), true );
+    }
+    {
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {5, 5} });
+    std::get<1>(q) = std::deque< std::pair< float, int > >({ {2.999999, 5} });
+    q.purge();
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 0 );
+    EXPECT_EQ( std::get<0>(q).front().second, 5 );
+    EXPECT_EQ( std::get<0>(q).front().first, 5 );
+    EXPECT_EQ( q.ready(), false );
+    }    
+}
+
+TEST( queues, type_difference )
+{ // no runtime expectations: only exercises building and assigning queues whose value types differ (int and double)
+    typedef comma::containers::ordered::queues< float, int, double > queues_t;
+    queues_t q{ 2 /*timeout*/ };
+    std::get<0>(q) = std::deque< std::pair< float, int > >({ {0, 1} });
+    std::get<1>(q) = std::deque< std::pair< float, double > >({ {0, 1.0} });
+}
+
+TEST( queues, boost_time )
+{ // queues keyed by boost::posix_time::ptime, constructed from a boost::posix_time::seconds value
+    typedef comma::containers::ordered::queues< boost::posix_time::ptime, double, double > queues_t;
+    queues_t q{boost::posix_time::seconds( 2 /*timeout*/  ) };
+
+    boost::posix_time::ptime t( boost::gregorian::date( 2023, 1, 1 ) );
+    std::get<0>(q) = std::deque< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} }); // both queues hold one entry with the same key t
+    std::get<1>(q) = std::deque< std::pair< boost::posix_time::ptime, double > >({ {t, 1.0} });
+    EXPECT_EQ( std::get<0>(q).size(), 1 );
+    EXPECT_EQ( std::get<1>(q).size(), 1 );
+    EXPECT_EQ( q.ready(), true );
+}
diff --git a/containers/vector.h b/containers/vector.h
index 342187fbb..091c550f0 100644
--- a/containers/vector.h
+++ b/containers/vector.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CONTAINERS_VECTOR_H_
-#define COMMA_CONTAINERS_VECTOR_H_
+#pragma once
 
 #include <cmath>
 #include <vector>
@@ -69,5 +40,3 @@ struct regular_vector : public std::vector< T >
 };
 
 } // namespace comma {
-
-#endif // COMMA_CONTAINERS_VECTOR_H_
diff --git a/csv/CMakeLists.txt b/csv/CMakeLists.txt
index 3de46ff97..ec9d76ec4 100644
--- a/csv/CMakeLists.txt
+++ b/csv/CMakeLists.txt
@@ -11,7 +11,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} ${impl_includes} )
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} ${impl_source} ${impl_includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
+target_link_libraries( ${TARGET_NAME} comma_application comma_timing comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
diff --git a/csv/applications/CMakeLists.txt b/csv/applications/CMakeLists.txt
index 7cd1fb6c4..9a3b6fa06 100644
--- a/csv/applications/CMakeLists.txt
+++ b/csv/applications/CMakeLists.txt
@@ -7,11 +7,17 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${play_source} ${play_includes} ${source} ${i
 
 add_executable( csv-quote csv-quote.cpp )
 target_link_libraries( csv-quote ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
+set_target_properties( csv-quote PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-quote RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-fields ${dir}/csv-fields.cpp )
+target_link_libraries ( csv-fields ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
+set_target_properties( csv-fields PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS csv-fields RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
 add_executable( csv-format ${dir}/csv-format.cpp )
 add_executable( csv-size ${dir}/csv-size.cpp )
+add_executable( csv-seek ${dir}/csv-seek.cpp )
 add_executable( csv-select ${dir}/csv-select.cpp )
 add_executable( csv-bin-cut ${dir}/csv-bin-cut.cpp )
 add_executable( csv-from-columns ${dir}/csv-from-columns.cpp )
@@ -28,39 +34,64 @@ add_executable( csv-from-bin ${dir}/csv-from-bin.cpp )
 add_executable( csv-calc ${dir}/csv-calc.cpp )
 add_executable( csv-calc-new ${dir}/csv-calc.new.cpp )
 add_executable( csv-crc ${dir}/csv-crc.cpp )
-add_executable( csv-play ${dir}/csv-play.cpp ${dir}/play/multiplay.cpp ${dir}/play/play.cpp )
+add_executable( csv-play ${dir}/csv-play.cpp ${dir}/play/multiplay.h ${dir}/play/multiplay.cpp ${dir}/play/play.h ${dir}/play/play.cpp )
 add_executable( csv-shape ${dir}/csv-shape.cpp )
 add_executable( csv-shuffle ${dir}/csv-shuffle.cpp )
 add_executable( csv-thin ${dir}/csv-thin.cpp )
 add_executable( csv-analyse ${dir}/csv-analyse.cpp )
 add_executable( csv-to-sql ${dir}/csv-to-sql.cpp )
 
-target_link_libraries ( csv-fields ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-format ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-size ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-bin-cut ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv comma_xpath )
-target_link_libraries ( csv-split comma_csv comma_application comma_io comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
+target_link_libraries ( csv-split comma_csv comma_application comma_io comma_string comma_xpath comma_name_value ${comma_ALL_EXTERNAL_LIBRARIES} )
 target_link_libraries ( csv-from-columns ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string )
-target_link_libraries ( csv-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
+target_link_libraries ( csv-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string comma_name_value )
 target_link_libraries ( csv-sort ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
-target_link_libraries ( csv-select ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_xpath comma_string )
-target_link_libraries ( csv-paste ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv comma_io )
-target_link_libraries ( csv-time ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
+target_link_libraries ( csv-seek ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_xpath comma_string comma_name_value )
+target_link_libraries ( csv-select ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_xpath comma_string comma_name_value )
+target_link_libraries ( csv-paste ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv comma_io comma_name_value )
+target_link_libraries ( csv-time ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string comma_timing )
 target_link_libraries ( csv-time-delay ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_string comma_xpath )
-target_link_libraries ( csv-time-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_string comma_xpath )
+target_link_libraries ( csv-time-join ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_string comma_xpath comma_name_value )
 target_link_libraries ( csv-time-stamp ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_string )
 target_link_libraries ( csv-to-bin ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application ) # profiler )
 target_link_libraries ( csv-from-bin ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application )
 target_link_libraries ( csv-calc ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_string )
 target_link_libraries ( csv-calc-new ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_string )
 target_link_libraries ( csv-crc ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_string )
-target_link_libraries ( csv-play ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_io )
+target_link_libraries ( csv-play ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_io comma_name_value )
 target_link_libraries ( csv-shape ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-shuffle ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 target_link_libraries ( csv-thin ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_application comma_io )
 target_link_libraries ( csv-analyse ${comma_ALL_EXTERNAL_LIBRARIES} comma_application )
 target_link_libraries ( csv-to-sql ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_csv )
 
+set_target_properties( csv-bin-cut PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-format PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-join PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-sort PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-from-columns PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-paste PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-split PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-time PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-time-delay PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-time-join PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-time-stamp PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-to-bin PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-from-bin PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-size PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-calc PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-play PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-shape PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-shuffle PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-crc PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-seek PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-select PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-thin PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-analyse PROPERTIES LINK_FLAGS_RELEASE -s )
+set_target_properties( csv-to-sql PROPERTIES LINK_FLAGS_RELEASE -s )
+
 install( TARGETS csv-bin-cut
                  csv-fields
                  csv-format
@@ -81,6 +112,7 @@ install( TARGETS csv-bin-cut
                  csv-shape
                  csv-shuffle
                  csv-crc
+                 csv-seek
                  csv-select
                  csv-thin
                  csv-analyse
@@ -92,34 +124,57 @@ install ( PROGRAMS csv-gate DESTINATION ${comma_INSTALL_BIN_DIR} )
 
 add_executable( csv-blocks ${dir}/csv-blocks.cpp )
 target_link_libraries ( csv-blocks ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-blocks PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-blocks RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-cast ${dir}/csv-cast.cpp )
 target_link_libraries ( csv-cast ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv )
+set_target_properties( csv-cast PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-cast RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( csv-enumerate ${dir}/csv-enumerate.cpp )
 target_link_libraries ( csv-enumerate ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-enumerate PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-enumerate RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
-add_executable( csv-interval ${dir}/csv-interval.cpp )
-target_link_libraries ( csv-interval ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath )
-install( TARGETS csv-interval RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+add_executable( csv-intervals ${dir}/csv-intervals.cpp )
+target_link_libraries ( csv-intervals ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_name_value )
+set_target_properties( csv-intervals PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS csv-intervals RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
          
 add_executable( csv-units ${dir}/csv-units.cpp )
 target_link_libraries ( csv-units ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_io comma_xpath comma_string )
+set_target_properties( csv-units PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-units RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
+add_executable( csv-random ${dir}/csv-random.cpp )
+target_link_libraries ( csv-random ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-random PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS csv-random RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
+add_executable( csv-strings ${dir}/csv-strings.cpp )
+target_link_libraries ( csv-strings ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-strings PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS csv-strings RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
 add_executable( csv-update ${dir}/csv-update.cpp )
 target_link_libraries ( csv-update ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_io comma_string comma_xpath comma_csv )
+set_target_properties( csv-update PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-update RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 if( NOT WIN32 )
     add_executable( csv-repeat ${dir}/csv-repeat.cpp )
     target_link_libraries ( csv-repeat comma_application comma_csv comma_io )
+    set_target_properties( csv-repeat PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS csv-repeat RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 endif()
 
 add_executable( csv-bin-reverse ${dir}/csv-bin-reverse.cpp )
 target_link_libraries ( csv-bin-reverse ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_string comma_xpath comma_csv )
+set_target_properties( csv-bin-reverse PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS csv-bin-reverse RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
+add_executable( csv-bits ${dir}/csv-bits.cpp )
+target_link_libraries ( csv-bits ${comma_ALL_EXTERNAL_LIBRARIES} comma_application comma_csv comma_string )
+set_target_properties( csv-bits PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS csv-bits RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
diff --git a/csv/applications/csv-analyse.cpp b/csv/applications/csv-analyse.cpp
index d07a38c4b..d86a9c760 100644
--- a/csv/applications/csv-analyse.cpp
+++ b/csv/applications/csv-analyse.cpp
@@ -37,7 +37,6 @@
 #include <iostream>
 #include <map>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 
 using namespace comma;
 
@@ -63,18 +62,15 @@ class histogram
         //sort, ugly
         std::multimap< std::size_t, std::size_t > sorted;
         std::size_t sum=0;
-        
         for(std::map< std::size_t, std::size_t >::const_iterator it=histogram_.begin(), end=histogram_.end(); it!=end; ++it )
         {
             sorted.insert( std::make_pair(it->second,it->first) );
             sum += it->second;
-        }
-        
+        }        
         for(std::multimap< std::size_t, std::size_t >::const_reverse_iterator it=sorted.rbegin(), end=sorted.rend(); it!=end; ++it )
         {
             os << it->second << "," << it->first << "," << (double)((double)(it->first)/(double)sum) << std::endl;
         }
-    
         return os;
     }
 
@@ -84,12 +80,9 @@ class histogram
     std::map< std::size_t, std::size_t > histogram_; //length, count
 };
 
-std::ostream& operator<<(std::ostream& os, const histogram & h)
-{
-    return h.print_sorted(os);
-}
+std::ostream& operator<<(std::ostream& os, const histogram & h) { return h.print_sorted(os); }
 
-static void usage()
+static void usage( bool )
 {
     std::cerr << std::endl;
     std::cerr << "Analyse binary data to guess message lengths in unknown binary stream: output candidate lengths, repeat counts and normalised probabilities" << std::endl;
@@ -121,7 +114,6 @@ static void usage()
     std::cerr << std::endl;
     std::cerr << "See also: \"csv-size\", \"csv-bin-cut\"" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( -1 );
 }
@@ -133,33 +125,22 @@ int main( int ac, char** av )
         #ifdef WIN32
             _setmode( _fileno( stdin ), _O_BINARY );
         #endif
-
-        command_line_options options( ac, av );
-        if( ac > 1 || options.exists( "--help" ) || options.exists( "-h" ) ) { usage(); } //could just say ac > 1... but leave for future args
-
-        histogram h;
-
-        const std::size_t read_size=65535; //todo: better way?
+        command_line_options options( ac, av, usage );
+        const std::size_t read_size = 65535; // todo? better way?
         std::vector< unsigned char > data( read_size );
-        std::size_t offset=0;
-
-        //read as many bytes as available on stdin
-        while( std::cin.good() && !std::cin.eof() )
+        std::size_t offset = 0;
+        histogram h;
+        while( std::cin.good() && !std::cin.eof() ) //read as many bytes as available on stdin
         {
             int bytes_read = ::read( 0, &data[0], read_size );
             if( bytes_read <= 0 ) { break; }
-                        
-            for( int i=0; i<bytes_read; ++i )
-            {
-                h.observe(data[i],offset+i);
-            }
-            offset+=bytes_read;
+            for( int i = 0; i < bytes_read; ++i ) { h.observe( data[i], offset + i ); }
+            offset += bytes_read;
         }
-       
         std::cout << h;
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << "csv-analyse: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-analyse: unknown exception" << std::endl; }
-    usage();
+    return 1;
 }
diff --git a/csv/applications/csv-bin-cut.cpp b/csv/applications/csv-bin-cut.cpp
index ce87a1067..3fbc2c9b1 100644
--- a/csv/applications/csv-bin-cut.cpp
+++ b/csv/applications/csv-bin-cut.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author dmitry mikhin
 
@@ -40,7 +13,6 @@
 #include <fstream>
 #include <numeric>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../csv/format.h"
 #include "../../csv/options.h"
 #include "../../string/string.h"
@@ -150,7 +122,6 @@ namespace {
             std::cerr << "Format specifications:" << std::endl;
             std::cerr << csv::format::usage() << std::endl;
         }
-        std::cerr << comma::contact_info << std::endl;
         std::cerr << std::endl;
         exit( 0 );
     }
@@ -291,7 +262,8 @@ namespace {
         // - check for read errors / end of input
         // - write the buffer to stdout
         std::streampos record_start = 0;
-        if ( skip_ ) {
+        if ( skip_ )
+        {
             ifs.seekg( 0, std::ios_base::end );
             std::streampos fsize = ifs.tellg();
             unsigned int nrecords = fsize / irecord_size_;
@@ -309,7 +281,8 @@ namespace {
                 std::streamoff off = fields_[i].input_offset - ( i == 0 ? 0 : fields_[i - 1].input_offset + fields_[i - 1].size );
                 ifs.seekg( off, std::ios_base::cur );
                 ifs.read( &obuf_[ fields_[i].offset ], fields_[i].size );
-                if ( ifs.eof() ) {
+                if ( ifs.eof() )
+                {
                     if ( i == 0 ) { break; }
                     std::cerr << "csv-bin-cut: encountered eof mid-record in '" << fname << "'" << std::endl; exit( 1 );
                 }
@@ -334,12 +307,16 @@ namespace {
     int seeker::process( const std::vector< std::string > & files )
     {
         if ( files.empty() ) { return read_all( std::cin ); }
-        for ( std::vector< std::string >::const_iterator ifile = files.begin(); ifile < files.end(); ++ifile ) {
-            if ( count_max_ >= 0 && count_ >= count_max_ ) { return 0; }
-            if ( *ifile == "-" ) {
+        for ( std::vector< std::string >::const_iterator ifile = files.begin(); ifile < files.end(); ++ifile )
+        {
+            if( count_max_ >= 0 && count_ >= count_max_ ) { return 0; }
+            if( *ifile == "-" )
+            {
                 int rv = read_all( std::cin );
                 if ( rv != 0 ) { return rv; }
-            } else {
+            }
+            else
+            {
                 std::ifstream ifs( &( *ifile )[0], std::ifstream::binary );
                 if ( !ifs.is_open() ) { std::cerr << "csv-bin-cut: cannot open '" << *ifile << "' for reading" << std::endl; exit( 1 ); }
                 int rv = ( force_read_ ? read_all( ifs ) : read_fields( ifs, *ifile ) );
@@ -361,31 +338,22 @@ int main( int ac, char** av )
     {
         command_line_options options( ac, av, usage );
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         std::vector< std::string > files = options.unnamed( "--help,-h,--verbose,-v,--flush,--read-all,--force-read", "--fields,-f,--output-fields,--output,-o,--binary,-b,--skip,--count" );
         if( !csv.binary() )
         {
             if( files.size() == 1 && files[0] != "-" ) // deprecated, left for backward compatibility
             {
-                try
-                {
-                    csv.format( comma::csv::format( files[0] ) );
-                    files.clear();
-                }
-                catch ( comma::exception & )
-                {
-                    // it's not a format string
-                }
+                try { csv.format( comma::csv::format( files[0] ) ); files.clear(); }
+                catch ( comma::exception & ) {} // it's not a format string
             }
         }
         if( !csv.binary() ) { std::cerr << "csv-bin-cut: please specify --binary" << std::endl; exit( 1 ); }
-
         const std::vector< field >& fields = setup_fields( options, csv );
-
         unsigned int skip = options.value< unsigned int >( "--skip", 0 );
         long int count_max = options.value< long int >( "--count", -1 );
         bool flush = options.exists( "--flush" );
         bool force_read = options.exists( "--read-all,--force-read" );
-
         seeker seek( fields, csv, skip, count_max, flush, force_read );
         return seek.process( files );
     }
diff --git a/csv/applications/csv-bits.cpp b/csv/applications/csv-bits.cpp
new file mode 100644
index 000000000..b4c7edebc
--- /dev/null
+++ b/csv/applications/csv-bits.cpp
@@ -0,0 +1,173 @@
+#include <endian.h>
+#include <array>
+#include <memory>
+#include <numeric>
+#include <vector>
+#include "../../application/command_line_options.h"
+#include "../../base/exception.h"
+#include "../../base/types.h"
+#include "../../string/string.h"
+#include "../stream.h"
+#include "../traits.h"
+
+void usage( bool verbose ) // prints help to stderr and exits with status 0; verbose is forwarded to comma::csv::options::usage()
+{
+    std::cerr << "converting between bits and csv and other bit operations" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: cat input.bin | csv-bits <operation> <options> > output.bin" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations: from-csv (pack), to-csv (unpack)" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations" << std::endl;
+    std::cerr << "    from-csv (pack): todo; convert input csv as to packed bits in big endian order" << std::endl;
+    std::cerr << "        options" << std::endl;
+    //std::cerr << "            --endian=<which>; default=big; todo: endianness of input: big or little" << std::endl;
+    std::cerr << "            --binary,-b=[<format>]; input is binary; see details below" << std::endl;
+    std::cerr << "            --flush; see below" << std::endl;
+    std::cerr << "            --sizes=<sizes>; comma-separated bit field sizes (todo: support multiplier)" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    to-csv (unpack): convert packed bits to integers as csv; input bits are expected in big endian order" << std::endl;
+    std::cerr << "        options" << std::endl;
+    //std::cerr << "            --endian=<which>; default=big; todo: endianness of output: big or little" << std::endl;
+    std::cerr << "            --binary,-b=[<format>]; output is binary; see details below" << std::endl;
+    std::cerr << "            --flush; see below" << std::endl;
+    std::cerr << "            --sizes=<sizes>; comma-separated bit field sizes (todo: support multiplier)" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << std::endl;
+    exit( 0 );
+}
+
+// todo
+//   - to-csv
+//     - sort out endianness: big endian vs transparent semantic use in the mainstream use case
+//     - unit test
+//     - support uint64
+//   - from-csv
+//   - use constexpr
+
+namespace comma { namespace csv_bits {
+
+struct unpacked // record of unsigned 32-bit values; visited under the name "values" by the traits specialisation in this file
+{
+    std::vector< comma::uint32 > values; // one element per requested value
+    unpacked( unsigned int size = 0 ): values( size, 0 ) {} // size: number of values; all are zero-initialised
+};
+
+struct field // position of one bit field inside a packed record, with precomputed extraction parameters
+{
+    unsigned int begin; // offset of the first bit of the field from the start of the record, in bits
+    unsigned int begin_byte; // index of the record byte that holds the first bit of the field
+    unsigned char begin_mask; // keeps only the bits of the first byte that belong to the field or follow it
+    unsigned int size; // field width in bits
+    unsigned int bytes; // number of record bytes the field touches, counted from begin_byte
+    unsigned int shift; // right shift that moves the field to the least significant bits of a 64-bit word
+    bool little_endian; // stored only; get() does not consult it yet (see todo in get())
+
+    static std::array< unsigned char, 8 > begin_masks;
+
+    field() = default;
+    field( unsigned int begin, unsigned int size, bool little_endian )
+        : begin( begin )
+        , begin_byte( begin / 8 )
+        , begin_mask( begin_masks[ begin % 8 ] )
+        , size( size )
+        , bytes( ( begin % 8 + size + 7 ) / 8 ) // count from the start of the first byte: an unaligned field can straddle one byte more than size / 8 rounded up
+        , shift( 64 - begin % 8 - size )
+        , little_endian( little_endian )
+    {
+        if( size > sizeof( comma::uint32 ) * 8 ) { COMMA_THROW( comma::exception, "expected size up to " << ( sizeof( comma::uint32 ) * 8 ) << " bits; got: " << size ); }
+    }
+
+    comma::uint32 get( const std::vector< char >& buf ) const // todo: quick and dirty, watch performance
+    {
+        comma::uint64 r = 0;
+        char* p = reinterpret_cast< char* >( &r );
+        std::memcpy( p, &buf[ begin_byte ], bytes ); // at most 5 bytes: up to 7 leading bits plus up to 32 field bits
+        p[0] &= begin_mask; // drop the bits that precede the field in its first byte
+        // todo: something like: r = little_endian ? le64toh( r ) : be64toh( r );
+        comma::uint64 s = htobe64( r ) >> shift; // first copied byte becomes the most significant one; the shift discards the bits after the field
+        return s;
+    }
+};
+
+std::array< unsigned char, 8 > field::begin_masks = { 255, 127, 63, 31, 15, 7, 3, 1 }; // todo: use constexpr
+
+} } // namespace comma { namespace csv_bits {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::csv_bits::unpacked > // visiting traits: exposes unpacked as a single field named "values"
+{
+    template < typename K, typename V > static void visit( const K&, const comma::csv_bits::unpacked& p, V& v ) { v.apply( "values", p.values ); } // const overload
+    template < typename K, typename V > static void visit( const K&, comma::csv_bits::unpacked& p, V& v ) { v.apply( "values", p.values ); } // non-const overload
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace csv_bits { namespace from_csv {
+
+int run( const comma::command_line_options& options ) // from-csv (pack) operation: not implemented yet, always reports "todo" and returns 1
+{
+    #ifdef WIN32
+        _setmode( _fileno( stdout ), _O_BINARY );
+    #endif
+    comma::csv::options csv( options ); // constructed from the command line, but not used further yet
+    std::cerr << "csv-bits: from-csv: todo" << std::endl;
+    return 1;
+}
+
+} } } // namespace comma { namespace csv_bits { namespace from_csv {
+
+namespace comma { namespace csv_bits { namespace to_csv {
+
+int run( const comma::command_line_options& options ) // to-csv (unpack) operation: reads fixed-size packed records from stdin, writes the field values to stdout; returns the exit code
+{
+    #ifdef WIN32
+        _setmode( _fileno( stdin ), _O_BINARY );
+    #endif
+    comma::csv::options csv( options );
+    if( !csv.flush ) { std::cin.tie( NULL ); }
+    const auto& sizes = comma::split_as< unsigned int >( options.value< std::string >( "--sizes" ), ',' );
+    unsigned int size = std::accumulate( sizes.begin(), sizes.end(), 0 ); // record size in bits at this point
+    if( size % 8 > 0 ) { std::cerr << "csv-bits: to-csv: expected input record size in bits divisible by 8; got: " << size << " (oddly-sized record support: todo)" << std::endl; return 1; }
+    size /= 8; // record size in bytes from here on
+    bool little_endian = options.value< std::string >( "--endian", "big" ) == "little";
+    if( size == 0 ) { std::cerr << "csv-bits: to-csv: expected positive input record size; got: 0" << std::endl; return 1; } // nothing to unpack; also keeps &buf[0] below valid
+    std::vector< comma::csv_bits::field > fields;
+    unsigned int begin = 0; // running bit offset of the next field within the record
+    for( auto s: sizes ) { fields.push_back( comma::csv_bits::field( begin, s, little_endian ) ); begin += s; }
+    std::vector< char > buf( size );
+    comma::csv_bits::unpacked output( sizes.size() );
+    comma::csv::output_stream< comma::csv_bits::unpacked > os( std::cout, csv, output );
+    while( std::cin.good() )
+    {
+        std::cin.read( &buf[0], size );
+        if( std::cin.gcount() <= 0 ) { break; } // clean end of input on a record boundary
+        if( std::cin.gcount() < std::streamsize( size ) ) { std::cerr << "csv-bits: to-csv: expected " << size << " byte(s); got: " << std::cin.gcount() << std::endl; return 1; }
+        for( unsigned int i = 0; i < sizes.size(); ++i ) { output.values[i] = fields[i].get( buf ); }
+        os.write( output );
+    }
+    return 0;
+}
+
+} } } // namespace comma { namespace csv_bits { namespace to_csv {
+
+int main( int ac, char** av ) // dispatches to the operation given as the single unnamed argument; returns 1 on any error
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        const auto& unnamed = options.unnamed( "--flush,--verbose,-v", "-.*" ); // no spaces in the list, as in other csv-* utilities, so that each name matches its option exactly
+        if( unnamed.empty() ) { std::cerr << "csv-bits: please specify operation" << std::endl; return 1; }
+        if( unnamed.size() > 1 ) { std::cerr << "csv-bits: expected operation; got: " << comma::join( unnamed, ',' ) << std::endl; return 1; }
+        const std::string& operation = unnamed[0];
+        if( operation == "to-csv" || operation == "unpack" ) { return comma::csv_bits::to_csv::run( options ); }
+        if( operation == "from-csv" || operation == "pack" ) { return comma::csv_bits::from_csv::run( options ); }
+        std::cerr << "csv-bits: expected operation; got: \"" << operation << "\"" << std::endl; // unknown operation: falls through to return 1
+    }
+    catch( std::exception& ex ) { std::cerr << "csv-bits: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-bits: unknown exception" << std::endl; }
+    return 1;
+}
diff --git a/csv/applications/csv-blocks.cpp b/csv/applications/csv-blocks.cpp
index 5e3c9b24a..ebcab1dd0 100644
--- a/csv/applications/csv-blocks.cpp
+++ b/csv/applications/csv-blocks.cpp
@@ -27,7 +27,7 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-/// @author dewey nguyen
+/// @authors dewey nguyen, vsevolod vlaskine
 
 #include <stdio.h>
 #include <stdlib.h>
@@ -41,7 +41,6 @@
 
 #include <boost/unordered_map.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../csv/impl/unstructured.h"
@@ -139,8 +138,20 @@ static void usage( bool more )
     std::cerr << "        attention: output does not preserve input order, since there is no reasonable tradeof there" << std::endl;
     std::cerr << "                   use csv-sort for post-processing, if required" << std::endl;
     std::cerr << "    group|make-blocks" << std::endl;
-    std::cerr << "        cat something.csv | csv-blocks group --fields=,id, " << std::endl;
+    std::cerr << "        usage: cat something.csv | csv-blocks group --fields=,id, " << std::endl;
     std::cerr << "            appends group's block field based on specified id key or keys" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --fields=<fields>" << std::endl;
+    std::cerr << "                id: any number of id fields to group by" << std::endl;
+    std::cerr << "                scalar: group by scalar, which can be integer, floating point number, or time" << std::endl;
+    std::cerr << "                        options" << std::endl;
+    std::cerr << "                            --block-gap,--gap=<value>; minimum gap in values between block" << std::endl;
+    std::cerr << "                                                       double (for time: seconds as double), see examples" << std::endl;
+    std::cerr << "                            --block-span,--span=<value>; maximum block span, double (for time: seconds as" << std::endl;
+    std::cerr << "                                                         double), see examples" << std::endl;
+    std::cerr << "                            --discard-out-of-range; discard input records with scalar out of range defined by --min and --max" << std::endl;
+    std::cerr << "                            --min=[<value>]; convenience option: min value for the scalar range, see examples" << std::endl;
+    std::cerr << "                            --max=[<value>]; convenience option: max value for the scalar range, see examples" << std::endl;
     std::cerr << "    head" << std::endl;
     std::cerr << "        reads records from first block to stdout, if --num-of-blocks=<num> specified, read more than one blocks" << std::endl;
     std::cerr << "        requires the index from 'index' mode in the inputs" << std::endl;
@@ -181,10 +192,16 @@ static void usage( bool more )
     std::cerr << "    ( echo \"a,1,2,3\"; echo \"a,4,2,3\"; echo \"b,5,5,6\"; echo \"c,7,5,6\"; echo \"c,7,8,9\"; echo \"c,7,8,9\" ) >$block_csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    group|make-blocks" << std::endl;
-    std::cerr << "        cat $block_csv | csv-blocks group --fields=id" << std::endl;
-    std::cerr << "            unique ascending block number are assigned based on one id field" << std::endl;
-    std::cerr << "        cat $block_csv | csv-blocks group --fields=id,,id" << std::endl;
-    std::cerr << "            unique ascending block number are assigned based on two id fields" << std::endl;
+    std::cerr << "        unique ascending block number are assigned based on one id field" << std::endl;
+    std::cerr << "            cat $block_csv | csv-blocks group --fields=id" << std::endl;
+    std::cerr << "        unique ascending block number are assigned based on two id fields" << std::endl;
+    std::cerr << "            cat $block_csv | csv-blocks group --fields=id,,id" << std::endl;
+    std::cerr << "        group by scalar span - try it" << std::endl;
+    std::cerr << "            seq 20 | csv-blocks group --fields=scalar --span 5" << std::endl;
+    std::cerr << "            seq 1 3 20 | csv-blocks group --fields scalar --span 4" << std::endl;
+    std::cerr << "        group by scalar gap - try it" << std::endl;
+    std::cerr << "            seq 20 | csv-blocks group --fields=scalar --gap 1" << std::endl;
+    std::cerr << "            seq 20 | csv-blocks group --fields=scalar --gap 2" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    index" << std::endl;
     std::cerr << "        cat $block_csv | csv-blocks group --fields=id | csv-blocks index --fields=,,,,block" << std::endl;
@@ -207,7 +224,6 @@ static void usage( bool more )
     std::cerr << "            After indexing the input in reverse order, the stream is read block-by-block, with the first line given the maximal" << std::endl;
     std::cerr << "            element id in the block, essentially, the block size" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "contact info: " << comma::contact_info <<std::endl;
     std::cerr << std::endl;
     exit(0);
 }
@@ -218,8 +234,6 @@ static comma::csv::options csv;
 static bool reverse_index = false;
 // All the data for this block
 static std::deque< std::string > block_records;
-static comma::csv::impl::unstructured keys;
-static comma::uint32 current_block = 1;
 static comma::int32 increment_step = 1;
 
 static void output_record_and_index( const std::string& input, comma::uint32 index, bool is_binary, char delimiter )
@@ -255,7 +269,27 @@ static bool empty_( const std::string& s ) // quick and dirty
     return true;
 }
 
-template < typename T > static void set_fields( const comma::command_line_options& options, std::string& first_line, T& default_input )
+static double to_double( const input_t& lhs ) // quick and dirty: returns the single-element longs or doubles key of lhs as double; throws comma::exception for any other key
+{
+    if( lhs.key.longs.size() == 1 ) { return lhs.key.longs[0]; } // converted to double on return
+    if( lhs.key.doubles.size() == 1 ) { return lhs.key.doubles[0]; }
+    if( lhs.key.time.size() == 1 ) { COMMA_THROW( comma::exception, "cannot convert time to double" ); } // time keys are rejected here, unlike in diff()
+    if( lhs.key.strings.size() == 1 ) { COMMA_THROW( comma::exception, "cannot convert strings to double" ); }
+    COMMA_THROW( comma::exception, "never here" ); // no key category holds exactly one element
+}
+
+static double diff( const input_t& lhs, const input_t& rhs ) // quick and dirty: absolute difference between the single-element keys of lhs and rhs; the key category is chosen by looking at lhs only
+{
+    if( lhs.key.longs.size() == 1 ) { return std::abs( double( lhs.key.longs[0] ) - rhs.key.longs[0] ); } // subtraction is done in double
+    if( lhs.key.doubles.size() == 1 ) { return std::abs( lhs.key.doubles[0] - rhs.key.doubles[0] ); }
+    if( lhs.key.time.size() == 1 ) { return std::abs( double( ( lhs.key.time[0] - rhs.key.time[0] ).total_microseconds() ) / 1000000 ); } // time difference expressed in seconds
+    if( lhs.key.strings.size() == 1 ) { COMMA_THROW( comma::exception, "difference for strings: not implemented" ); }
+    COMMA_THROW( comma::exception, "never here" ); // no key category of lhs holds exactly one element
+}
+
+struct how_t { enum values { none, by_id, by_scalar }; }; // how blocks are formed: by "id" field(s), by a single "scalar" field, or none if --fields has neither
+
+template < typename T > static how_t::values set_fields( const comma::command_line_options& options, std::string& first_line, T& default_input )
 {
     std::vector< std::string > v = comma::split( csv.fields, ',' );
     comma::csv::format f;
@@ -270,8 +304,29 @@ template < typename T > static void set_fields( const comma::command_line_option
     }
     // This is to load the keys into input_t structure
     unsigned int size = f.count();
-    for( std::size_t i = 0; i < size; ++i ) { if( i < v.size() ) { if( v[i] == "id" ) { v[i] = "key/" + default_input.key.append( f.offset( i ).type ); continue; } } }
+    how_t::values how = how_t::none;
+    for( std::size_t i = 0; i < size; ++i )
+    { 
+        if( i < v.size() )
+        { 
+            if( v[i] == "id" )
+            {
+                if( how == how_t::by_scalar ) { COMMA_THROW( comma::exception, "expected either id or scalar in --fields; got both in: \"" << csv.fields << "\"" ); }
+                how = how_t::by_id;
+                v[i] = "key/" + default_input.key.append( f.offset( i ).type );
+            }
+            else if( v[i] == "scalar" )
+            {
+                if( how == how_t::by_id ) { COMMA_THROW( comma::exception, "expected either id or scalar in --fields; got both in: \"" << csv.fields << "\"" ); }
+                if( how == how_t::by_scalar ) { COMMA_THROW( comma::exception, "expected not more than one scalar in --fields; got: \"" << csv.fields << "\"" ); }
+                how = how_t::by_scalar;
+                v[i] = "key/" + default_input.key.append( f.offset( i ).type );
+            }
+        }
+    }
+    if( how == how_t::none ) { COMMA_THROW( comma::exception, "please specify at least one id or scalar in --fields; got: \"" << csv.fields << "\"" ); }
     csv.fields = comma::join( v, ',' );
+    return how;
 }
 
 #ifndef WIN32
@@ -413,16 +468,14 @@ int main( int ac, char** av )
         verbose = options.exists( "--verbose,-v" );
         strict = options.exists( "--strict" );
         csv = comma::csv::options( options );
-        csv.full_xpath = true;
         csv.quote.reset();
         comma::csv::options csv_out;
+        csv_out.full_xpath = false;
         if( csv.binary() ) { csv_out.format( comma::csv::format("ui") ); }
-        std::vector< std::string > unnamed = options.unnamed( "--help,-h,--reverse,--verbose,-v", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--help,-h,--reverse,--verbose,-v,--discard-out-of-range", "-.*" );
         if( unnamed.empty() ) { std::cerr << name() << "please specify operation" << std::endl; return 1; }
         const std::string  operation = unnamed.front();
-        
         if( verbose ) { std::cerr << name() << "csv fields: " << csv.fields << std::endl; }
-        
         if( operation == "accumulate" )
         {
             std::string first_line;
@@ -471,38 +524,93 @@ int main( int ac, char** av )
         }
         if( operation == "group" || operation == "make-blocks" )
         {
-            current_block = options.value< comma::uint32 >( "--starting-block,--from", 0 ); // default is 0
-            
+            comma::uint32 current_block = options.value< comma::uint32 >( "--starting-block,--from", 0 );
             std::string first_line;
             input_t default_input;
-            set_fields( options, first_line, default_input );
-            if( verbose ) { std::cerr << name() << "csv fields: " << csv.fields << std::endl; }
-            if ( default_input.key.empty() ) { std::cerr << name() << "please specify at least one id field" << std::endl; return 1; }
-            
+            auto how = set_fields( options, first_line, default_input );
+            if( verbose ) { std::cerr << name() << "csv fields: " << csv.fields << "; making blocks by " << ( how == how_t::by_id ? "id" : "scalar" ) << std::endl; }
+            boost::optional< double > gap;
+            boost::optional< double > span;
+            boost::optional< double > min;
+            boost::optional< double > max;
+            if( how == how_t::by_scalar ) // these options apply to grouping by scalar only; when grouping by id they are not read
+            {
+                options.assert_mutually_exclusive( "--block-gap,--gap,--block-span,--span", "--min,--max" ); // for now; long aliases listed too, so that e.g. --block-gap with --min is rejected rather than --min being silently ignored
+                gap = options.optional< double >( "--block-gap,--gap" );
+                span = options.optional< double >( "--block-span,--span" );
+                min = options.optional< double >( "--min" );
+                max = options.optional< double >( "--max" );
+            }
             comma::csv::input_stream< input_t > istream( std::cin, csv, default_input );
             comma::csv::output_stream< appended_column > ostream( std::cout, csv_out );
             comma::csv::tied< input_t, appended_column > tied( istream, ostream );
-            
+            auto update_block = [&]( const input_t& p )->bool // updates current_block for record p; returns true if p should be output, false if it should be dropped
+            {
+                static input_t last = p; // previous record; initialised from the first record seen, so the first record never starts a new block by itself
+                switch( how )
+                {
+                    case how_t::by_id:
+                        if( !( last.key == p.key ) ) { ++current_block; } // key changed compared to the previous record: new block
+                        last = p;
+                        return true;
+                    case how_t::by_scalar:
+                    {
+                        static input_t first = p; // first record of the current block, used for the span check
+                        if( gap || span )
+                        {
+                            if( ( gap && diff( last, p ) >= *gap ) || ( span && diff( first, p ) >= *span ) ) { ++current_block; first = p; } // new block if far enough from the previous record (gap) or from the block start (span)
+                            last = p;
+                            return true;
+                        }
+                        else
+                        {
+                            static bool last_in_range = false; // whether the previous record was in range
+                            static bool discard_output_out_of_range = options.exists( "--discard-out-of-range" ); // evaluated once, on the first call reaching this branch
+                            double v = to_double( p ); // throws for time and string scalars
+                            bool in_range = ( !min || !comma::math::less( v, *min ) ) && ( !max || !comma::math::less( *max, v ) ); // presumably min <= v <= max, a missing bound being unbounded; verify comma::math::less semantics
+                            static bool first_record = true;
+                            if( !first_record ) // quick and dirty: the very first record never increments the block
+                            {
+                                if( discard_output_out_of_range )
+                                {
+                                    if( last_in_range && !in_range ) { ++current_block; } // when discarding: count only the transition from in range to out of range
+                                }
+                                else
+                                {
+                                    if( last_in_range != in_range ) { ++current_block; } // quick and dirty: any transition across the range boundary starts a new block
+                                }
+                            }
+                            last = p;
+                            last_in_range = in_range;
+                            first_record = false;
+                            return in_range || !discard_output_out_of_range; // false only for out-of-range records when discarding
+                        }
+                    }
+                    case how_t::none: // never here
+                        return true;
+                }
+                return true; // never here
+            };
             if( !first_line.empty() ) 
             { 
                 input_t p = comma::csv::ascii< input_t >( csv, default_input ).get( first_line ); 
-                if( !(keys == p.key) ) { ++current_block; }
-                keys = p.key;
-                // This is needed because the record wasnt read in by istream
-                // Write it out
-                if( istream.is_binary() ) { std::cout.write( (char*)&p, istream.binary().size() ); }
-                else { std::cout << first_line << istream.ascii().ascii().delimiter(); }
-                ostream.write( appended_column( current_block ) );
-                if( csv.flush ) { std::cout.flush(); }
+                if( update_block( p ) )
+                {
+                    if( istream.is_binary() ) { std::cout.write( (char*)&p, istream.binary().size() ); }
+                    else { std::cout << first_line << istream.ascii().ascii().delimiter(); }
+                    ostream.write( appended_column( current_block ) );
+                    if( csv.flush ) { std::cout.flush(); }
+                }
             }
             while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
             {
                 const input_t* p = istream.read();
                 if( !p ) { break; }
-                if( !(keys == p->key) ) { ++current_block; }
-                keys = p->key;
-                tied.append( appended_column( current_block ) );
-                if( csv.flush ) { std::cout.flush(); }
+                if( update_block( *p ) )
+                {
+                    tied.append( appended_column( current_block ) );
+                    if( csv.flush ) { std::cout.flush(); }
+                }
             }            
             return 0;
         }
@@ -546,60 +654,51 @@ int main( int ac, char** av )
         else if( operation == "index" )
         {
             reverse_index = options.exists("--reverse");
-            
             comma::csv::input_stream< input_with_block > istream( std::cin, csv );
-            
             char delimiter = istream.is_binary() ? ',' : istream.ascii().ascii().delimiter();
             comma::uint32 block = 0;
             comma::uint32 index = 0;
             std::string buffer;
             if( istream.is_binary() ) { buffer.resize( istream.binary().size() ); }
-            
             while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
             {
                 const input_with_block* p = istream.read();
                 if( !p ) { break; }
-                
                 if( block != p->block ) 
                 { 
                     if ( reverse_index ) { output_reverse_indexing( block_records, istream.is_binary(), delimiter  ); }
                     else { index = 0; }
                 }
                 block = p->block;
-                
                 if ( reverse_index )
                 {
-                    // Reverse index mode - accumulate whole block before indexing
                     if( istream.is_binary() )  
                     { 
                         ::memcpy( &buffer[0], istream.binary().last(),  istream.binary().size() ); 
                         block_records.push_back( buffer );
                     }
-                    else { block_records.push_back( comma::join( istream.ascii().last(), delimiter ) ); }
+                    else
+                    {
+                        block_records.push_back( comma::join( istream.ascii().last(), delimiter ) );
+                    }
                 }
                 else
                 {
-                    // Forward index mode - append index to each record
                     if( istream.is_binary() ) { ::memcpy( &buffer[0], istream.binary().last(),  istream.binary().size() ); }
                     else { buffer = comma::join( istream.ascii().last(), delimiter ); }
                     output_record_and_index( buffer, index, istream.is_binary(), delimiter );
                     index++;
                 }
             }
-            
-            // flushes the last block
             if ( reverse_index ) { output_reverse_indexing( block_records, istream.is_binary(), delimiter  ); }
-            
             return 0;
         }
         else if( operation == "increment" )    // operation is head
         {
             increment_step = options.value< comma::int32 >( "--step", 1 );
-            
             comma::csv::input_stream< input_with_block > istream( std::cin, csv );
             comma::csv::output_stream< appended_column > ostream( std::cout, csv_out );
             comma::csv::tied< input_with_block, appended_column > tied( istream, ostream );
-            
             appended_column incremented;
             while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
             {
@@ -609,7 +708,6 @@ int main( int ac, char** av )
                 tied.append( incremented );
                 if( csv.flush ) { std::cout.flush(); }
             }
-            
             return 0;
         }
         else if( operation == "read-until" )
diff --git a/csv/applications/csv-calc.cpp b/csv/applications/csv-calc.cpp
index 1670f4ac2..2d1208ab6 100644
--- a/csv/applications/csv-calc.cpp
+++ b/csv/applications/csv-calc.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2020 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
@@ -36,17 +9,21 @@
 #include <io.h>
 #endif
 
+#include <deque>
+#include <functional>
 #include <iostream>
-#include <boost/bind.hpp>
+#include <map>
+#include <type_traits>
+#include <unordered_set>
+#include <boost/bind/bind.hpp>
 #include <boost/function.hpp>
 #include <boost/optional.hpp>
 #include <boost/ptr_container/ptr_vector.hpp>
 #include <boost/scoped_ptr.hpp>
 #include <boost/unordered_map.hpp>
 #include <boost/date_time/posix_time/posix_time_types.hpp>
-#include "../../application/contact_info.h"
-#include "../../application/verbose.h"
 #include "../../base/exception.h"
+#include "../../base/none.h"
 #include "../../csv/format.h"
 #include "../../csv/options.h"
 #include "../../string/string.h"
@@ -72,7 +49,7 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "column-wise calculation, optionally by id and block" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "usage: cat data.csv | " << comma::verbose.app_name() << " <what> [<options>] > calc.csv" << std::endl;
+    std::cerr << "usage: cat data.csv | csv-calc <what> [<options>] > calc.csv" << std::endl;
     std::cerr << std::endl;
     std::cerr << "<what>: comma-separated list of operations" << std::endl;
     std::cerr << "        results will be output in the same order" << std::endl;
@@ -90,7 +67,7 @@ static void usage( bool verbose )
     std::cerr << "        <n> is the desired percentile (e.g. 0.9)" << std::endl;
     std::cerr << "        <method> is one of 'nearest' or 'interpolate' (default: nearest)" << std::endl;
     std::cerr << "        see --help --verbose for more details" << std::endl;
-    std::cerr << "    radius: size / 2" << std::endl;
+    std::cerr << "    radius: diameter / 2" << std::endl;
     std::cerr << "    size: number of values" << std::endl;
     std::cerr << "    skew[=sample]: skew" << std::endl;
     std::cerr << "         sample: use sample skew (default: population stddev)" << std::endl;
@@ -102,6 +79,7 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "<options>" << std::endl;
     std::cerr << "    --append: append statistics to each input line" << std::endl;
+    std::cerr << "    --append-once,--append-to-first: append statistics to first input line for each block and/or each id" << std::endl;
     std::cerr << "    --delimiter,-d <delimiter> : default ','" << std::endl;
     std::cerr << "    --fields,-f: field names for which the extents should be computed, default: all fields" << std::endl;
     std::cerr << "                 if 'block' field present, calculate block-wise" << std::endl;
@@ -137,14 +115,14 @@ static void usage( bool verbose )
         std::cerr << std::endl;
     }
     std::cerr << "examples" << std::endl;
-    std::cerr << "    seq 1 1000 | " << comma::verbose.app_name() << " percentile=0.9" << std::endl;
-    std::cerr << "    seq 1 1000 | " << comma::verbose.app_name() << " percentile=0.9:interpolate --verbose" << std::endl;
+    std::cerr << "    seq 1 1000 | csv-calc percentile=0.9" << std::endl;
+    std::cerr << "    seq 1 1000 | csv-calc percentile=0.1,percentile=0.9" << std::endl;
+    std::cerr << "    seq 1 1000 | csv-calc percentile=0.9:interpolate --verbose" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | " << comma::verbose.app_name() << " --fields=a,block percentile=0.9" << std::endl;
+    std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | csv-calc --fields=a,block percentile=0.9" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | " << comma::verbose.app_name() << " --fields=a,id percentile=0.9" << std::endl;
+    std::cerr << "    {(seq 1 500 | csv-paste \"-\" \"value=0\") ; (seq 1 100 | csv-paste \"-\" \"value=1\") ; (seq 501 1000 | csv-paste \"-\" \"value=0\")} | csv-calc --fields=a,id percentile=0.9" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( -1 );
 }
@@ -213,14 +191,14 @@ class Values
         std::vector< comma::csv::format::element > input_elements_;
         std::vector< comma::csv::format::element > elements_;
         std::vector< char > buffer_;
-        boost::optional< unsigned int > block_index_;
-        boost::optional< unsigned int > id_index_;
+        boost::optional< unsigned int > block_index_{ comma::silent_none< unsigned int >() };
+        boost::optional< unsigned int > id_index_{ comma::silent_none< unsigned int >() };
         comma::csv::format::element block_element_;
         comma::csv::format::element id_element_;
         unsigned int block_;
         unsigned int id_;
-        boost::function< comma::uint32( const char* ) > block_from_bin_;
-        boost::function< comma::uint32( const char* ) > id_from_bin_;
+        std::function< comma::uint32( const char* ) > block_from_bin_;
+        std::function< comma::uint32( const char* ) > id_from_bin_;
         template < typename T > static comma::uint32 from_bin_( const char* buf ) { return comma::csv::format::traits< T >::from_bin( buf ); }
 
         void init_indices_()
@@ -260,15 +238,15 @@ class Values
                 block_element_ = input_format_.offset( *block_index_ );
                 switch( block_element_.type )
                 {
-                    case comma::csv::format::char_t: block_from_bin_ = boost::bind( &Values::from_bin_< char >, _1 ); break;
-                    case comma::csv::format::int8: block_from_bin_ = boost::bind( &Values::from_bin_< char >, _1 ); break;
-                    case comma::csv::format::uint8: block_from_bin_ = boost::bind( &Values::from_bin_< unsigned char >, _1 ); break;
-                    case comma::csv::format::int16: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int16 >, _1 ); break;
-                    case comma::csv::format::uint16: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint16 >, _1 ); break;
-                    case comma::csv::format::int32: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int32 >, _1 ); break;
-                    case comma::csv::format::uint32: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint32 >, _1 ); break;
-                    case comma::csv::format::int64: block_from_bin_ = boost::bind( &Values::from_bin_< comma::int64 >, _1 ); break;
-                    case comma::csv::format::uint64: block_from_bin_ = boost::bind( &Values::from_bin_< comma::uint64 >, _1 ); break;
+                    case comma::csv::format::char_t: block_from_bin_ = std::bind( &Values::from_bin_< char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int8: block_from_bin_ = std::bind( &Values::from_bin_< char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint8: block_from_bin_ = std::bind( &Values::from_bin_< unsigned char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int16: block_from_bin_ = std::bind( &Values::from_bin_< comma::int16 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint16: block_from_bin_ = std::bind( &Values::from_bin_< comma::uint16 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int32: block_from_bin_ = std::bind( &Values::from_bin_< comma::int32 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint32: block_from_bin_ = std::bind( &Values::from_bin_< comma::uint32 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int64: block_from_bin_ = std::bind( &Values::from_bin_< comma::int64 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint64: block_from_bin_ = std::bind( &Values::from_bin_< comma::uint64 >, std::placeholders::_1 ); break;
                     default: COMMA_THROW( comma::exception, "expected integer for block id, got format " << input_format_.string() );
                 }
             }
@@ -277,15 +255,15 @@ class Values
                 id_element_ = input_format_.offset( *id_index_ );
                 switch( id_element_.type )
                 {
-                    case comma::csv::format::char_t: id_from_bin_ = boost::bind( &Values::from_bin_< char >, _1 ); break;
-                    case comma::csv::format::int8: id_from_bin_ = boost::bind( &Values::from_bin_< char >, _1 ); break;
-                    case comma::csv::format::uint8: id_from_bin_ = boost::bind( &Values::from_bin_< unsigned char >, _1 ); break;
-                    case comma::csv::format::int16: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int16 >, _1 ); break;
-                    case comma::csv::format::uint16: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint16 >, _1 ); break;
-                    case comma::csv::format::int32: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int32 >, _1 ); break;
-                    case comma::csv::format::uint32: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint32 >, _1 ); break;
-                    case comma::csv::format::int64: id_from_bin_ = boost::bind( &Values::from_bin_< comma::int64 >, _1 ); break;
-                    case comma::csv::format::uint64: id_from_bin_ = boost::bind( &Values::from_bin_< comma::uint64 >, _1 ); break;
+                    case comma::csv::format::char_t: id_from_bin_ = std::bind( &Values::from_bin_< char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int8: id_from_bin_ = std::bind( &Values::from_bin_< char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint8: id_from_bin_ = std::bind( &Values::from_bin_< unsigned char >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int16: id_from_bin_ = std::bind( &Values::from_bin_< comma::int16 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint16: id_from_bin_ = std::bind( &Values::from_bin_< comma::uint16 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int32: id_from_bin_ = std::bind( &Values::from_bin_< comma::int32 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint32: id_from_bin_ = std::bind( &Values::from_bin_< comma::uint32 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::int64: id_from_bin_ = std::bind( &Values::from_bin_< comma::int64 >, std::placeholders::_1 ); break;
+                    case comma::csv::format::uint64: id_from_bin_ = std::bind( &Values::from_bin_< comma::uint64 >, std::placeholders::_1 ); break;
                     default: COMMA_THROW( comma::exception, "expected integer for block id, got format " << input_format_.string() );
                 }
             }
@@ -309,7 +287,7 @@ class ascii_input
             return values_.get();
         }
 
-        const std::string line() { return line_; }
+        const std::string& line() const { return line_; }
         
     private:
         comma::csv::options csv_;
@@ -334,10 +312,15 @@ class binary_input
         {
             while( true )
             {
+                //std::cin.read( &buffer_[0], csv_.format().size() );
+                //if( std::cin.gcount() == 0 ) { return NULL; }
+                //if( std::cin.gcount() != int( csv_.format().size() ) ) { COMMA_THROW( comma::exception, "expected " << csv_.format().size() << " bytes; got " << std::cin.gcount() ); }
+                //values_.set( &buffer_[0] );
+                //return &values_;
                 if( offset_ >= csv_.format().size() )
                 {
                     values_.set( cur_ );
-                    line_ = std::string(cur_, csv_.format().size());
+                    line_ = std::string( cur_, csv_.format().size() );
                     cur_ += csv_.format().size();
                     offset_ -= csv_.format().size();
                     if( cur_ == end_ ) { cur_ = &buffer_[0]; offset_ = 0; }
@@ -348,7 +331,8 @@ class binary_input
                 offset_ += count;
             }
         }
-        const std::string line() { return line_; }
+        
+        const std::string& line() const { return line_; }
 
     private:
         comma::csv::options csv_;
@@ -369,11 +353,11 @@ template < typename T, typename V > struct map_traits
 
 template < typename V > struct map_traits< boost::posix_time::ptime, V >
 {
-    struct hash : public std::unary_function< boost::posix_time::ptime, std::size_t >
+    struct hash // plain functor: unordered containers only need operator(); the removed std::unary_function needs no replacement base (std::function< ptime( size_t ) > had the signature reversed)
     {
         std::size_t operator()( const boost::posix_time::ptime& t ) const
         {
-            BOOST_STATIC_ASSERT( sizeof( t ) == sizeof( comma::uint64 ) );
+            static_assert( sizeof( t ) == sizeof( comma::uint64 ), "expected 8-byte time" );
             std::size_t seed = 0;
             boost::hash_combine( seed, reinterpret_cast< const comma::uint64& >( t ) ); // quick and dirty
             return seed;
@@ -431,6 +415,7 @@ namespace Operations
     struct base
     {
         virtual ~base() {}
+        virtual void reset() = 0;
         virtual void push( const char* ) = 0;
         virtual void calculate( char* ) = 0;
         virtual base* clone() const = 0;
@@ -445,6 +430,7 @@ namespace Operations
     class Min : public base
     {
         public:
+            void reset() { min_ = comma::silent_none< T >(); }
             void push( const char* buf )
             {
                 const T& t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -456,13 +442,14 @@ namespace Operations
             friend class Centre< T, F >;
             friend class Diameter< T, F >;
             friend class Radius< T, F >;
-            boost::optional< T > min_;
+            boost::optional< T > min_{ comma::silent_none< T >() };
     };
 
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
     class Max : public base
     {
         public:
+            void reset() { max_ = comma::silent_none< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -474,13 +461,14 @@ namespace Operations
             friend class Centre< T, F >;
             friend class Diameter< T, F >;
             friend class Radius< T, F >;
-            boost::optional< T > max_;
+            boost::optional< T > max_{ comma::silent_none< T >() };
     };
 
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
     class Sum : public base
     {
         public:
+            void reset() { sum_ = comma::silent_none< T >(); }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -489,12 +477,13 @@ namespace Operations
             void calculate( char* buf ) { if( sum_ ) { comma::csv::format::traits< T, F >::to_bin( *sum_, buf ); } }
             base* clone() const { return new Sum< T, F >( *this ); }
         private:
-            boost::optional< T > sum_;
+            boost::optional< T > sum_{ comma::silent_none< T >() };
     };
 
     template < comma::csv::format::types_enum F >
     class Sum< boost::posix_time::ptime, F > : public base
     {
+        void reset() { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         void push( const char* ) { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         void calculate( char* ) { COMMA_THROW( comma::exception, "sum not defined for time" ); }
         base* clone() const { COMMA_THROW( comma::exception, "sum not defined for time" ); }
@@ -504,6 +493,7 @@ namespace Operations
     class Centre : public base
     {
         public:
+            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< T, F >::to_bin( *min_.min_ + ( *max_.max_ - *min_.min_ ) / 2, buf ); } }
             base* clone() const { return new Centre< T, F >( *this ); }
@@ -519,6 +509,7 @@ namespace Operations
     class Mode : public base
     {
         public:
+            void reset() { value_count_ = impl::value_count< T >(); }
             void push( const char* buf ) { value_count_.update( comma::csv::format::traits< T, F >::from_bin( buf ) ); }
             void calculate( char* buf ) { if( !value_count_.map().empty() ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( value_count_.mode().first ), buf ); } }
             base* clone() const { return new Mode< T, F >( *this ); }
@@ -531,6 +522,7 @@ namespace Operations
     {
         public:
             Mean() : count_( 0 ) {}
+            void reset() { mean_.reset(); count_ = 0; }
             void push( const char* buf )
             {
                 T t = comma::csv::format::traits< T, F >::from_bin( buf );
@@ -540,7 +532,7 @@ namespace Operations
             void calculate( char* buf ) { if( count_ > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( *mean_ ), buf ); } }
             base* clone() const { return new Mean< T, F >( *this ); }
         private:
-            boost::optional< typename result_traits< T >::type > mean_;
+            boost::optional< typename result_traits< T >::type > mean_{ comma::silent_none< typename result_traits< T >::type >() };
             std::size_t count_;
     };
 
@@ -552,89 +544,76 @@ namespace Operations
 
             Percentile() : percentile_( 0.0 ), method_( nearest ) {}
 
-            void push( const char* buf )
-            {
-                values_.insert( comma::csv::format::traits< T, F >::from_bin( buf ));
-            }
+            void push( const char* buf ) { values_.insert( comma::csv::format::traits< T, F >::from_bin( buf ) ); }
 
             void set_options( const std::vector< std::string >& options )
             {
-                if( options.size() == 0 ) {
-                    std::cerr << comma::verbose.app_name() << ": percentile operation requires a percentile" << std::endl;
-                    exit( 1 );
-                }
-
+                if( options.empty() ) { std::cerr << comma::verbose.app_name() << ": percentile operation requires a percentile" << std::endl; exit( 1 ); }
                 percentile_ = boost::lexical_cast< double >( options[0] );
-                if( percentile_ < 0.0 || percentile_ > 1.0 ) {
-                    std::cerr << comma::verbose.app_name() << ": percentile value should be between 0 and 1, got " << percentile_ << std::endl;
-                    exit( 1 );
-                }
-
-                if( options.size() == 2 ) {
-                    if( options[1] == "nearest" ) method_ = nearest;
-                    else if( options[1] == "interpolate" ) method_ = interpolate;
-                    else {
-                        std::cerr << comma::verbose.app_name() << ": expected percentile method, got " << options[1] << std::endl;
-                        exit( 1 );
-                    }
-                }
+                if( percentile_ < 0.0 || percentile_ > 1.0 ) { std::cerr << comma::verbose.app_name() << ": percentile value should be between 0 and 1, got " << percentile_ << std::endl; exit( 1 ); }
+                if( options.size() < 2 ) { return; }
+                if( options[1] == "nearest" ) { method_ = nearest; }
+                else if( options[1] == "interpolate" ) { method_ = interpolate; }
+                else { std::cerr << comma::verbose.app_name() << ": expected percentile method, got '" << options[1] << "'" << std::endl; exit( 1 ); }
             }
 
             void calculate( char* buf )
             {
+                if( values_.empty() ) { return; }
                 std::size_t count = values_.size();
-
-                if( count > 0 )
+                comma::verbose << "calculating " << percentile_*100 << "th percentile using ";
+                T value = comma::csv::format::traits< T, F >::zero();
+                typename std::multiset< T >::iterator it = values_.begin();
+                switch( method_ )
                 {
-                    comma::verbose << "calculating " << percentile_*100 << "th percentile using ";
-                    T value;
-                    typename std::multiset< T >::iterator it = values_.begin();
-                    switch( method_ )
-                    {
-                        std::size_t rank;
-                        
-                        case nearest:
-                            // https://en.wikipedia.org/wiki/Percentile#The_Nearest_Rank_method
-                            comma::verbose << "nearest rank method" << std::endl;
-                            comma::verbose << "see https://en.wikipedia.org/wiki/Percentile#The_Nearest_Rank_method" << std::endl;
-                            rank = ( percentile_ == 0.0 ? 1 : std::ceil( count * percentile_ ));
-                            comma::verbose << "n = " << rank << std::endl;
-                            std::advance( it, rank - 1 );
+                    std::size_t rank;
+                    
+                    case nearest:
+                        // https://en.wikipedia.org/wiki/Percentile#The_Nearest_Rank_method
+                        comma::verbose << "nearest rank method" << std::endl;
+                        comma::verbose << "see https://en.wikipedia.org/wiki/Percentile#The_Nearest_Rank_method" << std::endl;
+                        rank = ( percentile_ == 0.0 ? 1 : std::ceil( count * percentile_ ));
+                        comma::verbose << "n = " << rank << std::endl;
+                        std::advance( it, rank - 1 );
+                        value = *it;
+                        break;
+
+                    case interpolate:
+                        // https://en.wikipedia.org/wiki/Percentile#The_Linear_Interpolation_Between_Closest_Ranks_method
+                        // (third method in that section)
+                        comma::verbose << "NIST linear interpolation method" << std::endl;
+                        comma::verbose << "see http://www.itl.nist.gov/div898/handbook/prc/section2/prc262.htm" << std::endl;
+                        double x = percentile_ * ( count + 1 );
+                        comma::verbose << "p = " << percentile_ << "; N = " << count << "; p(N + 1) = " << x;
+                        if( x <= 1.0 )
+                        {
+                            comma::verbose << "; below 1 - choosing smallest value" << std::endl;
                             value = *it;
-                            break;
-
-                        case interpolate:
-                            // https://en.wikipedia.org/wiki/Percentile#The_Linear_Interpolation_Between_Closest_Ranks_method
-                            // (third method in that section)
-                            comma::verbose << "NIST linear interpolation method" << std::endl;
-                            comma::verbose << "see http://www.itl.nist.gov/div898/handbook/prc/section2/prc262.htm" << std::endl;
-                            double x = percentile_ * ( count + 1 );
-                            comma::verbose << "p = " << percentile_ << "; N = " << count
-                                           << "; p(N + 1) = " << x;
-                            if( x <= 1.0 ) {
-                                comma::verbose << "; below 1 - choosing smallest value" << std::endl;
-                                value = *it;
-                            } else if( x >= count ) {
-                                comma::verbose << "; above N - choosing largest value" << std::endl;
-                                value = *( values_.rbegin() );
-                            } else {
-                                rank = x;
-                                double remainder = x - rank;
-                                comma::verbose << "; k = " << rank << "; d = " << remainder << std::endl;
-                                std::advance( it, rank - 1 );
-                                double v1 = *it;
-                                double v2 = *++it;
-                                value = v1 + ( v2 - v1 ) * remainder;
-                                comma::verbose << "v1 = " << v1 << "; v2 = " << v2
-                                               << "; result = " << value << std::endl;
-                            }
-                            break;
-                    }
-                    comma::csv::format::traits< T, F >::to_bin( static_cast< T >( value ), buf );
+                        }
+                        else if( x >= count )
+                        {
+                            comma::verbose << "; above N - choosing largest value" << std::endl;
+                            value = *( values_.rbegin() );
+                        }
+                        else
+                        {
+                            rank = x;
+                            double remainder = x - rank;
+                            comma::verbose << "; k = " << rank << "; d = " << remainder << std::endl;
+                            std::advance( it, rank - 1 );
+                            double v1 = *it;
+                            double v2 = *++it;
+                            value = v1 + ( v2 - v1 ) * remainder;
+                            comma::verbose << "v1 = " << v1 << "; v2 = " << v2 << "; result = " << value << std::endl;
+                        }
+                        break;
                 }
+                comma::csv::format::traits< T, F >::to_bin( static_cast< T >( value ), buf );
             }
 
             base* clone() const { return new Percentile< T, F >( *this ); }
+            
+            void reset() { values_.clear(); }
 
         private:
             std::multiset< T > values_;
@@ -645,6 +624,7 @@ namespace Operations
     template < comma::csv::format::types_enum F >
     class Percentile< boost::posix_time::ptime, F > : public base
     {
+        void reset() { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         void push( const char* ) { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         void calculate( char* ) { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
         base* clone() const { COMMA_THROW( comma::exception, "percentile not implemented for time, todo" ); }
@@ -722,6 +702,8 @@ namespace Operations
             
             typename result_traits< T >::type mean() const { return previous_.mean(); }
             
+            void reset() { previous_.reset(); value_ = 0; count_ = 0; }
+            
         private:
             Moment< T, M - 1 > previous_;
             typename result_traits< T >::type value_;
@@ -733,6 +715,7 @@ namespace Operations
     {
         public:
             Moment() : value_( 0 ), count_( 0 ) {}
+            
             void update ( const T t )
             {   
                 ++count_;
@@ -741,6 +724,8 @@ namespace Operations
             
             typename result_traits< T >::type mean() const { return value_; }
             
+            void reset() { value_ = 0; count_ = 0; }
+            
         private:
             typename result_traits< T >::type value_;
             std::size_t count_;
@@ -762,9 +747,10 @@ namespace Operations
             void update( const T t ) { moments_.update(t); }
             void calculate( char* buf ) { if( moments_.count() > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( std::sqrt( static_cast< long double >( moments_.value() / ( sample_ ? moments_.count() - 1 : moments_.count() )  ) ) ), buf ); } }
             base* clone() const { return new Stddev< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_{ comma::silent_none< T >() };
             bool sample_;
     };
 
@@ -782,9 +768,10 @@ namespace Operations
             }
             void calculate( char* buf ) { stddev_.calculate(buf); }
             base* clone() const { return new Stddev< boost::posix_time::ptime, F >( *this ); }
+            void reset() { stddev_.reset(); first_ = boost::none; }
         private:
             Stddev< double, F > stddev_;
-            boost::optional<boost::posix_time::ptime> first_;
+            boost::optional< boost::posix_time::ptime > first_{ comma::silent_none< boost::posix_time::ptime >() };
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -803,9 +790,10 @@ namespace Operations
             void update( const T t ) { moments_.update(t); }
             void calculate( char* buf ) { if( moments_.count() > 0 ) { comma::csv::format::traits< T, F >::to_bin( static_cast< T >( moments_.value() / ( sample_ ? moments_.count() - 1 : moments_.count() ) ), buf ); } }
             base* clone() const { return new Variance< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 2 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_{ comma::silent_none< T >() };
             bool sample_;
     };
 
@@ -823,9 +811,10 @@ namespace Operations
             }
             void calculate( char* buf ) { variance_.calculate(buf); }
             base* clone() const { return new Variance< boost::posix_time::ptime, F >( *this ); }
+            void reset() { variance_.reset(); first_ = boost::none; }
         private:
-            Variance< double, F> variance_;
-            boost::optional<boost::posix_time::ptime> first_;
+            Variance< double, F > variance_;
+            boost::optional< boost::posix_time::ptime > first_{ comma::silent_none< boost::posix_time::ptime >() };
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -846,7 +835,6 @@ namespace Operations
                 if( moments_.count() > 0 ) 
                 { 
                     typename result_traits< T >::type n = moments_.count();
-                    
                     // corrected sample skew requires at least 3 samples
                     typename result_traits< T >::type correction = sample_ ? sqrt( n * ( n - 1 ) ) / ( n - 2 ) : 1 ;
                     typename result_traits< T >::type m2 = moments_.previous().value();
@@ -855,9 +843,10 @@ namespace Operations
                 } 
             }
             base* clone() const { return new Skew< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 3 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_{ comma::silent_none< T >() };
             bool sample_;
     };
 
@@ -875,9 +864,10 @@ namespace Operations
             }
             void calculate( char* buf ) { skew_.calculate(buf); }
             base* clone() const { return new Skew< boost::posix_time::ptime, F >( *this ); }
+            void reset() { skew_.reset(); first_ = boost::none; }
         private:
-            Skew< double, F> skew_;
-            boost::optional<boost::posix_time::ptime> first_;
+            Skew< double, F > skew_;
+            boost::optional< boost::posix_time::ptime > first_{ comma::silent_none< boost::posix_time::ptime >() };
     };
     
     template < typename T, comma::csv::format::types_enum F = comma::csv::format::type_to_enum< T >::value >
@@ -889,8 +879,8 @@ namespace Operations
             { 
                 for (std::size_t i = 0; i < options.size(); i++) 
                 {
-                    if ( options[i] == "sample" ) { sample_ = true; }
-                    else if ( options[i] == "excess" ) { excess_ = true; }
+                    if( options[i] == "sample" ) { sample_ = true; }
+                    else if( options[i] == "excess" ) { excess_ = true; }
                 }
             }
             void push( const char* buf ) 
@@ -917,9 +907,10 @@ namespace Operations
                 } 
             }
             base* clone() const { return new Kurtosis< T, F >( *this ); }
+            void reset() { moments_.reset(); first_ = boost::none; }
         private:
             Moment< T, 4 > moments_;
-            boost::optional<T> first_;
+            boost::optional< T > first_{ comma::silent_none< T >() };
             bool sample_;
             bool excess_;
     };
@@ -938,9 +929,10 @@ namespace Operations
             }
             void calculate( char* buf ) { kurtosis_.calculate(buf); }
             base* clone() const { return new Kurtosis< boost::posix_time::ptime, F >( *this ); }
+            void reset() { kurtosis_.reset(); first_ = boost::none; }
         private:
-            Kurtosis< double, F> kurtosis_;
-            boost::optional<boost::posix_time::ptime> first_;
+            Kurtosis< double, F > kurtosis_;
+            boost::optional< boost::posix_time::ptime > first_{ comma::silent_none< boost::posix_time::ptime >() };
     };
     
     template < typename T > struct Diff
@@ -962,6 +954,7 @@ namespace Operations
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< typename Diff< T >::Type >::to_bin( Diff< T >::subtract( *max_.max_, *min_.min_ ), buf ); } }
             base* clone() const { return new Diameter< T, F >( *this ); }
+            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
         private:
             Min< T, F > min_;
             Max< T, F > max_;
@@ -974,6 +967,7 @@ namespace Operations
             void push( const char* buf ) { min_.push( buf ); max_.push( buf ); }
             void calculate( char* buf ) { if( min_.min_ ) { comma::csv::format::traits< typename Diff< T >::Type >::to_bin( Diff< T >::subtract( *max_.max_, *min_.min_ ) / 2, buf ); } }
             base* clone() const { return new Radius< T, F >( *this ); }
+            void reset() { min_ = Min< T, F >(); max_ = Max< T, F >(); }
         private:
             Min< T, F > min_;
             Max< T, F > max_;
@@ -987,6 +981,7 @@ namespace Operations
             void push( const char* ) { ++count_; }
             void calculate( char* buf ) { comma::csv::format::traits< comma::uint32 >::to_bin( count_, buf ); }
             base* clone() const { return new Size< T, F >( *this ); }
+            void reset() { count_ = 0; }
         private:
             std::size_t count_;
     };
@@ -1035,13 +1030,14 @@ namespace Operations
     template <> struct traits< Enum::kurtosis > { template < typename T, comma::csv::format::types_enum F > struct FromEnum { typedef Kurtosis< T, F > Type; }; };
 } // namespace Operations
 
-class Operationbase
+class operation_base
 {
     public:
-        virtual ~Operationbase() {}
+        virtual ~operation_base() {}
         virtual void push( const char* buf ) = 0;
         virtual void calculate() = 0;
-        virtual Operationbase* clone() const = 0;
+        virtual operation_base* clone() const = 0;
+        virtual void reset() = 0;
         const comma::csv::format& output_format() const { return output_format_; }
         const char* buffer() const { return &buffer_[0]; }
 
@@ -1053,20 +1049,20 @@ class Operationbase
         std::vector< comma::csv::format::element > output_elements_;
         std::vector< char > buffer_;
 
-        Operationbase* deep_copy_to_( Operationbase* lhs ) const
+        operation_base* deep_copy_to_( operation_base* lhs ) const
         {
             lhs->input_format_ = input_format_;
             lhs->input_elements_ = input_elements_;
             lhs->output_format_ = output_format_;
             lhs->output_elements_ = output_elements_;
             lhs->buffer_ = buffer_;
-            for( std::size_t i = 0; i < operations_.size(); ++i ) { lhs->operations_.push_back( operations_[i].clone() ); }
+            for( auto& o: operations_ ) { lhs->operations_.push_back( o.clone() ); }
             return lhs;
         }
 };
 
 template < Operations::Enum::Values E >
-struct Operation : public Operationbase
+struct Operation : public operation_base
 {
     Operation() {}
     Operation( const comma::csv::format& format
@@ -1079,7 +1075,7 @@ struct Operation : public Operationbase
         for( std::size_t i = 0; i < input_elements_.size(); ++i )
         {
             comma::csv::format::types_enum output_type = input_elements_[i].type;
-            switch( E ) // quick and dirty, implement in operations::traits, just no time
+            switch( E ) // quick and dirty, operations::traits would be better, but likely to be optimized by compiler anyway
             {
                 case Operations::Enum::radius:
                 case Operations::Enum::diameter:
@@ -1131,57 +1127,84 @@ struct Operation : public Operationbase
     {
         for( std::size_t i = 0; i < operations_.size(); ++i ) { operations_[i].calculate( &buffer_[0] + output_elements_[i].offset ); }
     }
+    
+    void reset() { for( auto& o: operations_ ) { o.reset(); } }
 
-    Operationbase* clone() const { Operation< E >* op = new Operation< E >; return deep_copy_to_( op ); }
+    operation_base* clone() const { Operation< E >* op = new Operation< E >; return deep_copy_to_( op ); }
 };
 
-typedef boost::unordered_map< comma::uint32, boost::ptr_vector< Operationbase >* > OperationsMap;
-typedef boost::unordered_map< comma::uint32, std::string > ResultsMap;
-typedef std::vector< std::pair < comma::uint32, std::string > > Inputs;
+typedef boost::unordered_map< comma::uint32, std::vector< operation_base* >* > operations_map_t;
+typedef boost::unordered_map< comma::uint32, std::string > results_map_t;
+typedef std::deque< std::pair < comma::uint32, std::string > > inputs_t;
 
-static void init_operations( boost::ptr_vector< Operationbase >& operations
-                           , const std::vector< Operations::operation_parameters >& operations_parameters
-                           , const comma::csv::format& format )
+class operations_battery_farm_t // pool of reusable operation sets ("batteries"); all this pain is because operations polymorphism is too slow when there are a lot of ids
 {
-    static boost::ptr_vector< Operationbase > sample;
-    if( sample.empty() )
-    {
-        sample.reserve( operations_parameters.size() );
-        for( std::size_t i = 0; i < operations_parameters.size(); ++i )
+    public:
+        typedef std::vector< operation_base* > operations_t; // one battery; raw pointers are owned by the farm and deleted in its destructor
+        
+        operations_battery_farm_t(): end_( 0 ) {}
+        
+        ~operations_battery_farm_t()
+        { 
+            for( auto& operation: operations_ ) { for( auto& o: operation ) { delete o; } } // quick and dirty; shame on me
+        }
+        
+        operations_t& make( const std::vector< Operations::operation_parameters >& operations_parameters, const comma::csv::format& format ) // returns the next unused battery, reset; parameters are only read on the first call
         {
-            switch( operations_parameters[i].type )
+            if( operations_.empty() ) // first call: build battery 0 from operations_parameters
             {
-                case Operations::Enum::min: sample.push_back( new Operation< Operations::Enum::min >( format ) ); break;
-                case Operations::Enum::max: sample.push_back( new Operation< Operations::Enum::max >( format ) ); break;
-                case Operations::Enum::centre: sample.push_back( new Operation< Operations::Enum::centre >( format ) ); break;
-                case Operations::Enum::mean: sample.push_back( new Operation< Operations::Enum::mean >( format ) ); break;
-                case Operations::Enum::mode: sample.push_back( new Operation< Operations::Enum::mode >( format ) ); break;
-                case Operations::Enum::percentile: sample.push_back( new Operation< Operations::Enum::percentile >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::radius: sample.push_back( new Operation< Operations::Enum::radius >( format ) ); break;
-                case Operations::Enum::diameter: sample.push_back( new Operation< Operations::Enum::diameter >( format ) ); break;
-                case Operations::Enum::variance: sample.push_back( new Operation< Operations::Enum::variance >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::stddev: sample.push_back( new Operation< Operations::Enum::stddev >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::skew: sample.push_back( new Operation< Operations::Enum::skew >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::kurtosis: sample.push_back( new Operation< Operations::Enum::kurtosis >( format, operations_parameters[i].options ) ); break;
-                case Operations::Enum::sum: sample.push_back( new Operation< Operations::Enum::sum >( format ) ); break;
-                case Operations::Enum::size: sample.push_back( new Operation< Operations::Enum::size >( format ) ); break;
+                operations_.push_back( operations_t() );
+                operations_[0].reserve( operations_parameters.size() );
+                for( std::size_t i = 0; i < operations_parameters.size(); ++i )
+                {
+                    switch( operations_parameters[i].type ) // no default case: a type not listed here adds no operation
+                    {
+                        case Operations::Enum::min: operations_[0].push_back( new Operation< Operations::Enum::min >( format ) ); break;
+                        case Operations::Enum::max: operations_[0].push_back( new Operation< Operations::Enum::max >( format ) ); break;
+                        case Operations::Enum::centre: operations_[0].push_back( new Operation< Operations::Enum::centre >( format ) ); break;
+                        case Operations::Enum::mean: operations_[0].push_back( new Operation< Operations::Enum::mean >( format ) ); break;
+                        case Operations::Enum::mode: operations_[0].push_back( new Operation< Operations::Enum::mode >( format ) ); break;
+                        case Operations::Enum::percentile: operations_[0].push_back( new Operation< Operations::Enum::percentile >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::radius: operations_[0].push_back( new Operation< Operations::Enum::radius >( format ) ); break;
+                        case Operations::Enum::diameter: operations_[0].push_back( new Operation< Operations::Enum::diameter >( format ) ); break;
+                        case Operations::Enum::variance: operations_[0].push_back( new Operation< Operations::Enum::variance >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::stddev: operations_[0].push_back( new Operation< Operations::Enum::stddev >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::skew: operations_[0].push_back( new Operation< Operations::Enum::skew >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::kurtosis: operations_[0].push_back( new Operation< Operations::Enum::kurtosis >( format, operations_parameters[i].options ) ); break;
+                        case Operations::Enum::sum: operations_[0].push_back( new Operation< Operations::Enum::sum >( format ) ); break;
+                        case Operations::Enum::size: operations_[0].push_back( new Operation< Operations::Enum::size >( format ) ); break;
+                    }
+                }
             }
+            if( end_ == operations_.size() ) // every existing battery is handed out: grow the pool by cloning battery 0
+            {
+                operations_.push_back( operations_t( operations_[0].size() ) );
+                for( unsigned int i = 0; i < operations_[0].size(); ++i ) { operations_.back()[i] = operations_[0][i]->clone(); } // NOTE: battery 0 is itself handed out by make(), so the clone may copy accumulated state; it is reset just below
+            }
+            for( auto& s: operations_[end_] ) { s->reset(); } // reset whether the battery is new or reused
+            return operations_[ end_++ ];
         }
-    }
-    operations.clear();
-    for( std::size_t i = 0; i < sample.size(); ++i ) { operations.push_back( sample[i].clone() ); }
-}
+        
+        void reset() { end_ = 0; } // start handing out batteries from index 0 again; existing objects are kept, not freed
+        
+    private:
+        typedef std::deque< operations_t > operations_t_; // presumably a deque so that push_back keeps references returned by make() valid - confirm
+        operations_t_ operations_;
+        unsigned int end_; // index of the next battery make() will return
+};
 
-static void output( const comma::csv::options& csv, ResultsMap& results, boost::optional< comma::uint32 > block, bool has_block, bool has_id )
+static operations_battery_farm_t operations_battery_farm;
+        
+static void output( const comma::csv::options& csv, results_map_t& results, boost::optional< comma::uint32 > block, bool has_block, bool has_id )
 {
-    for( ResultsMap::iterator it = results.begin(); it != results.end(); ++it )
+    for( results_map_t::iterator it = results.begin(); it != results.end(); ++it )
     {
-        std::cout << it->second;
+        std::cout.write( &it->second[0], it->second.size() );
         if( csv.binary() )
         {
             if( has_id )  { std::cout.write( reinterpret_cast< const char* >( &it->first ), sizeof( comma::uint32 ) ); } // quick and dirty
             if( has_block ) { std::cout.write( reinterpret_cast< const char* >( &( *block ) ), sizeof( comma::uint32 ) ); } // quick and dirty
-            std::cout.flush();
+            if( csv.flush ) { std::cout.flush(); }
         }
         else
         {
@@ -1193,34 +1216,50 @@ static void output( const comma::csv::options& csv, ResultsMap& results, boost::
     results.clear();
 }
 
-static void append_and_output( const comma::csv::options& csv, Inputs& inputs, ResultsMap& results )
-{    
+static void append_and_output( const comma::csv::options& csv, inputs_t& inputs, results_map_t& results, std::unordered_set< comma::uint32 >& ids )
+{
     for ( size_t i = 0; i < inputs.size(); ++i )
     {
         std::cout << inputs[i].second;
-        if (!csv.binary()) { std::cout << csv.delimiter; }
-        std::cout << results.find(inputs[i].first)->second;
-        if (!csv.binary()) { std::cout << std::endl; }
+        if( !csv.binary() ) { std::cout << csv.delimiter; }
+        const auto& r = results.find( inputs[i].first )->second;
+        std::cout.write( &r[0], r.size() );
+        if( !csv.binary() ) { std::cout << std::endl; }
     }
+    if( csv.flush ) { std::cout.flush(); }
     results.clear();
     inputs.clear();
+    ids.clear();
 }
 
-static void calculate( const comma::csv::options& csv, OperationsMap& operations, ResultsMap& results )
+static void calculate( const comma::csv::options& csv, operations_map_t& operations, results_map_t& results )
 {
-    for( OperationsMap::iterator it = operations.begin(); it != operations.end(); ++it )
+    for( operations_map_t::iterator it = operations.begin(); it != operations.end(); ++it )
     {
         std::string r;
+        if( csv.binary() )
+        {
+            unsigned int size = 0;
+            for( std::size_t i = 0; i < it->second->size(); ++i ) { size += ( *it->second )[i]->output_format().size(); }
+            r.reserve( size );
+        }
         for( std::size_t i = 0; i < it->second->size(); ++i )
         {
-            ( *it->second )[i].calculate();
-            if( csv.binary() ) { r.append( ( *it->second )[i].buffer(), ( *it->second )[i].output_format().size() ); }
-            else { if( i > 0 ) { r += csv.delimiter; } r.append(( *it->second )[i].output_format().bin_to_csv( ( *it->second )[i].buffer(), csv.delimiter, 12 )); }
+            ( *it->second )[i]->calculate();
+            if( csv.binary() )
+            { 
+                r.append( ( *it->second )[i]->buffer(), ( *it->second )[i]->output_format().size() );
+            }
+            else
+            {
+                if( i > 0 ) { r += csv.delimiter; }
+                r.append( ( *it->second )[i]->output_format().bin_to_csv( ( *it->second )[i]->buffer(), csv.delimiter, csv.precision ) );
+            }
         }
-        results[it->first] = r;
+        results[ it->first ] = r;
     }
-    for( OperationsMap::iterator it = operations.begin(); it != operations.end(); ++it ) { delete it->second; } // quick and dirty
     operations.clear();
+    operations_battery_farm.reset();
 }
 
 int main( int ac, char** av )
@@ -1229,11 +1268,14 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
-        std::vector< std::string > unnamed = options.unnamed( "", "--binary,-b,--delimiter,-d,--format,--fields,-f,--output-fields" );
+        std::vector< std::string > unnamed = options.unnamed( "--append,--append-once,--append-to-first,--flush,--output-fields,--output-format", "--binary,-b,--delimiter,-d,--format,--fields,-f,--output-fields" );
         comma::csv::options csv( options );
+        csv.full_xpath = false;
+        std::cout.precision( csv.precision );
         #ifdef WIN32
         if( csv.binary() ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
+        if( !csv.flush && csv.binary() ) { std::cin.tie( NULL ); std::ios_base::sync_with_stdio( false ); } // todo? quick and dirty, redesign binary_input instead?
         if( unnamed.empty() ) { std::cerr << comma::verbose.app_name() << ": please specify operations" << std::endl; exit( 1 ); }
         std::vector< std::string > v = comma::split( unnamed[0], ',' );
         std::vector< Operations::operation_parameters > operations_parameters( v.size() );
@@ -1243,21 +1285,22 @@ int main( int ac, char** av )
             operations_parameters[i].type = Operations::from_name( p[0] );
             if( p.size() == 2 ){ operations_parameters[i].options = comma::split( p[1], ':' ); }
         }
-        boost::optional< comma::csv::format > format;
+        boost::optional< comma::csv::format > format = { comma::silent_none< comma::csv::format >() };
         if( csv.binary() ) { format = csv.format(); }
         else if( options.exists( "--format" ) ) { format = comma::csv::format( options.value< std::string >( "--format" ) ); }
         boost::scoped_ptr< ascii_input > ascii;
         boost::scoped_ptr< binary_input > binary;
         if( csv.binary() ) { binary.reset( new binary_input( csv ) ); }
         else { ascii.reset( new ascii_input( csv, format ) ); }
-        OperationsMap operations;
-        ResultsMap results;
-        Inputs inputs;
+        operations_map_t operations;
+        results_map_t results;
+        inputs_t inputs;
+        std::unordered_set< comma::uint32 > ids; // quick and dirty
         boost::optional< comma::uint32 > block = boost::make_optional< comma::uint32 >( false, 0 );
         bool has_block = csv.has_field( "block" );
         bool has_id = csv.has_field( "id" );
-        bool append = options.exists("--append");
-        
+        bool append_once = options.exists( "--append-once,--append-to-first" );
+        bool append = options.exists( "--append" ) || append_once;
         if( options.exists( "--output-fields" ) )
         {
             std::vector < std::string > fields = comma::split(csv.fields, ',');
@@ -1267,32 +1310,28 @@ int main( int ac, char** av )
                 std::replace(v[op].begin(), v[op].end(), '=', '_');
                 std::replace(v[op].begin(), v[op].end(), '.', '_');
                 std::replace(v[op].begin(), v[op].end(), ':', '_');
-                for (std::size_t f = 0; f < fields.size(); f++ )
+                for( std::size_t f = 0; f < fields.size(); f++ )
                 {
-                    if (fields[f] == "" || fields[f] == "id" || fields[f] == "block") { continue; }
-                    output_fields.push_back(fields[f] + "/" + v[op]);
+                    if( fields[f] == "" || fields[f] == "id" || fields[f] == "block" ) { continue; }
+                    output_fields.push_back( fields[f] + "/" + v[op] );
                 }
             }
-            if (has_id && !append) { output_fields.push_back("id"); }
-            if (has_block && !append ) { output_fields.push_back("block"); }
-            std::cout << comma::join(output_fields, ',') << std::endl;
+            if( has_id && !append ) { output_fields.push_back( "id" ); }
+            if( has_block && !append ) { output_fields.push_back( "block" ); }
+            std::cout << comma::join( output_fields, ',' ) << std::endl;
             return 0;
         }
-        if (options.exists("--output-format"))
+        if( options.exists( "--output-format" ) )
         {
             if ( !format ) { std::cerr << comma::verbose.app_name() << ": option --output-format requires input format to be specified, please use --format or --binary" << std::endl; return 1; }
-            boost::ptr_vector< Operationbase > ops;
-            init_operations(ops, operations_parameters, Values(csv, *format).format());
-            for ( std::size_t i = 0; i < ops.size(); ++i ) 
-            { 
-                if ( i > 0 ) { std::cout << csv.delimiter; }
-                std::cout << ops[i].output_format().string();
-            }
-            if (has_id && !append) { std::cout << csv.delimiter << "ui"; }
-            if (has_block && !append) { std::cout << csv.delimiter << "ui"; }
+            auto ops = operations_battery_farm.make( operations_parameters, Values( csv, *format ).format() );
+            std::cout << ops[0]->output_format().string();
+            for( std::size_t i = 1; i < ops.size(); ++i ) { std::cout << ',' << ops[i]->output_format().string(); }
+            if( has_id && !append ) { std::cout << ",ui"; }
+            if( has_block && !append ) { std::cout << ",ui"; }
             std::cout << std::endl;
             return 0;
-        } 
+        }
         while( std::cin.good() && !std::cin.eof() )
         {
             const Values* v = csv.binary() ? binary->read() : ascii->read();
@@ -1300,28 +1339,27 @@ int main( int ac, char** av )
             if( has_block )
             {
                 if( block && *block != v->block() ) 
-                { 
-                    calculate(csv, operations, results);
-                    if ( append ) { append_and_output(csv, inputs, results); inputs.clear(); }
-                    else { output( csv, results, block, has_block, has_id ); }
+                {
+                    calculate( csv, operations, results );
+                    if ( append ) { append_and_output( csv, inputs, results, ids ); } else { output( csv, results, block, has_block, has_id ); }
                 }
                 block = v->block();
             }
-            OperationsMap::iterator it = operations.find( v->id() );
-            if( it == operations.end() )
+            operations_map_t::iterator it = operations.find( v->id() );
+            if( it == operations.end() ) { it = operations.insert( std::make_pair( v->id(), &operations_battery_farm.make( operations_parameters, v->format() ) ) ).first; }
+            if( append )
             {
-                it = operations.insert( std::make_pair( v->id(), new boost::ptr_vector< Operationbase > ) ).first;
-                init_operations( *it->second, operations_parameters, v->format() );
+                if( !append_once || ids.find( v->id() ) == ids.end() ) { inputs.push_back( std::make_pair( v->id(), csv.binary() ? binary->line() : ascii->line() ) ); }
+                ids.insert( v->id() ); // quick and dirty
             }
-            if (append) { inputs.push_back( std::make_pair( v->id(), csv.binary() ? binary->line() : ascii->line() ) ); }
-            for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i].push( v->buffer() ); }
+            for( std::size_t i = 0; i < it->second->size(); ++i ) { ( *it->second )[i]->push( v->buffer() ); }
         }
-        calculate(csv, operations, results);
-        if ( append ) { append_and_output(csv, inputs, results); }
+        calculate( csv, operations, results );
+        if ( append ) { append_and_output( csv, inputs, results, ids ); }
         else { output( csv, results, block, has_block, has_id ); }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << comma::verbose.app_name() << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << comma::verbose.app_name() << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "csv-calc: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-calc: unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/applications/csv-calc.new.cpp b/csv/applications/csv-calc.new.cpp
index e9bf661d9..84642d4b4 100644
--- a/csv/applications/csv-calc.new.cpp
+++ b/csv/applications/csv-calc.new.cpp
@@ -1,32 +1,7 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+/// @author vsevolod vlaskine
 
 #include <string.h>
 #include <algorithm>
@@ -36,10 +11,9 @@
 #include <string>
 #include <vector>
 #include <boost/array.hpp>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include <boost/function.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../csv/impl/unstructured.h"
@@ -82,7 +56,6 @@ static void usage()
     std::cerr << "examples" << std::endl;
     std::cerr << "    todo" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 1 );
 }
@@ -182,7 +155,6 @@ static std::pair< entry_t, comma::csv::options > make_input_( const comma::csv::
         else { vf.push_back( "" ); }
     }
     p.second.fields = comma::join( vf, ',' );
-    p.second.full_xpath = true;
     return p;
 }
 
@@ -360,7 +332,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //             {
 //                 get_< R >( *result_ ).push_back( R() );
 //                 bound_functors< T > b( boost::bind( f.reset, boost::ref( get_< R >( *result_ ).back() ) )
-//                                      , boost::bind( f.update, boost::ref( get_< R >( *result_ ).back(), _1 ) )
+//                                      , boost::bind( f.update, boost::ref( get_< R >( *result_ ).back() ), boost::placeholders::_1 )
 //                                      , boost::bind( f.finalize, boost::ref( get_< R >( *result_ ).back() ) ) );
 //                 get_< T >().push_back( b );
 //             }
@@ -385,7 +357,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef T type;
 //     typedef T result_type;
 //     static void apply( result_type& lhs, const T& rhs ) { if( rhs < lhs ) { lhs = rhs; } }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &min::apply, _1, _2 ), std::numeric_limits< T >::max() ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &min::apply, boost::placeholders::_1, boost::placeholders::_2 ), std::numeric_limits< T >::max() ); }
 // };
 // 
 // template <> struct min< std::string >
@@ -393,7 +365,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef std::string type;
 //     typedef std::string result_type;
 //     static void apply( result_type&, const std::string& ) {}
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &min::apply, _1, _2 ) ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &min::apply, boost::placeholders::_1, boost::placeholders::_2 ) ); }
 // };
 // 
 // template <> struct min< boost::posix_time::ptime >
@@ -401,7 +373,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef boost::posix_time::ptime type;
 //     typedef boost::posix_time::ptime result_type;
 //     static void apply( boost::posix_time::ptime& lhs, const boost::posix_time::ptime& rhs ) { if( lhs.is_not_a_date_time() || rhs < lhs ) { lhs = rhs; } }
-//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &min::apply, _1, _2 ) ); }
+//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &min::apply, boost::placeholders::_1, boost::placeholders::_2 ) ); }
 // };
 // 
 // template < typename T > struct max
@@ -409,7 +381,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef T type;
 //     typedef T result_type;
 //     static void apply( result_type& lhs, const T& rhs ) { if( lhs < rhs ) { lhs = rhs; } }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &max::apply, _1, _2 ), std::numeric_limits< T >::min() ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &max::apply, boost::placeholders::_1, boost::placeholders::_2 ), std::numeric_limits< T >::min() ); }
 // };
 // 
 // template <> struct max< std::string >
@@ -417,7 +389,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef std::string type;
 //     typedef std::string result_type;
 //     static void apply( result_type& lhs, const std::string& rhs ) { if( lhs < rhs ) { lhs = rhs; } }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &max::apply, _1, _2 ) ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &max::apply, boost::placeholders::_1, boost::placeholders::_2 ) ); }
 // };
 // 
 // template <> struct min< boost::posix_time::ptime >
@@ -425,7 +397,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef boost::posix_time::ptime type;
 //     typedef boost::posix_time::ptime result_type;
 //     static void apply( boost::posix_time::ptime& lhs, const boost::posix_time::ptime& rhs ) { if( lhs.is_not_a_date_time() || rhs < lhs ) { lhs = rhs; } }
-//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &max::apply, _1, _2 ) ); }
+//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &max::apply, boost::placeholders::_1, boost::placeholders::_2 ) ); }
 // };
 // 
 // template < typename T > struct size
@@ -433,7 +405,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef T type;
 //     typedef double result_type;
 //     static void apply( result_type& lhs, const T& rhs ) { ++rhs; }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &size::apply, _1, _2 ), 0 ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &size::apply, boost::placeholders::_1, boost::placeholders::_2 ), 0 ); }
 // };
 // 
 // template < typename T > struct sum
@@ -441,7 +413,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef T type;
 //     typedef T result_type;
 //     static void apply( result_type& lhs, const T& rhs ) { lhs += rhs; }
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &sum::apply, _1, _2 ), 0 ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &sum::apply, boost::placeholders::_1, boost::placeholders::_2 ), 0 ); }
 // };
 // 
 // template <> struct sum< std::string >
@@ -449,7 +421,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef std::string type;
 //     typedef std::string result_type;
 //     static void apply( result_type&, const std::string& ) {}
-//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &sum::apply, _1, _2 ) ); }
+//     static operation::options< result_type, T > options() { return operation::options< result_type, T >( boost::bind( &sum::apply, boost::placeholders::_1, boost::placeholders::_2 ) ); }
 // };
 // 
 // template <> struct sum< boost::posix_time::ptime >
@@ -457,7 +429,7 @@ template <> struct bound_result_traits< boost::posix_time::ptime >
 //     typedef boost::posix_time::ptime type;
 //     typedef boost::posix_time::ptime result_type;
 //     static void apply( boost::posix_time::ptime&, const boost::posix_time::ptime& ) {}
-//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &sum::apply, _1, _2 ) ); }
+//     static operation::options< result_type, boost::posix_time::ptime > options() { return operation::options< result_type, boost::posix_time::ptime >( boost::bind( &sum::apply, boost::placeholders::_1, boost::placeholders::_2 ) ); }
 // };
 // 
 // } // namespace operations {
diff --git a/csv/applications/csv-cast.cpp b/csv/applications/csv-cast.cpp
index a1b1a83ac..bec891db7 100644
--- a/csv/applications/csv-cast.cpp
+++ b/csv/applications/csv-cast.cpp
@@ -39,13 +39,12 @@
 #include <cstring>
 #include <iostream>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/format.h"
 
 static const std::string app_name = "csv-cast";
 
-static void usage()
+static void usage( bool verbose = false )
 {
     std::cerr << "reads binary in the given input format and writes binary in the given output format" << std::endl;
     std::cerr << std::endl;
@@ -55,6 +54,7 @@ static void usage()
     std::cerr << std::endl;
     std::cerr << "    --binary,-b,--from: input binary format" << std::endl;
     std::cerr << "    --output-binary,--output,-o,--to: output binary format" << std::endl;
+    std::cerr << "    --flush: flush stdout after each record" << std::endl;
     std::cerr << "    --force: allow narrowing conversions" << std::endl;
     std::cerr << std::endl;
     std::cerr << comma::csv::format::usage() << std::endl;
@@ -75,8 +75,8 @@ static void usage()
     std::cerr << "    lexical cast, convert s[22],s[10],s[6] to t,2d (creates sample binary data)" << std::endl;
     std::cerr << "        echo {0..9}.2345789,3.1415 | fmt -1 | csv-time-stamp | csv-to-bin s[22],s[10],s[6] | csv-cast s[22],s[10],s[6] t,2d | csv-from-bin t,2d" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
+    exit(0);
 }
 
 static void check_conversions( const comma::csv::format& iformat, const comma::csv::format& oformat, const bool force )
@@ -256,21 +256,23 @@ int main( int ac, char** av )
 #endif
     try
     {
-        comma::command_line_options options( ac, av );
-        if( options.exists( "--help,-h" ) ) { usage(); return 0; }
+        comma::command_line_options options( ac, av, usage );
         if( ac < 3 ) { usage(); return 1; }
         comma::csv::format iformat( options.value< std::string >( "--binary,-b,--from", av[1] ) );
         comma::csv::format oformat( options.value< std::string >( "--output-binary,--output,-o,--to", av[2] ) );
         check_conversions( iformat, oformat, options.exists( "--force" ) );
+        bool flush = options.exists( "--flush" );
         std::vector< char > in( iformat.size() );
         std::vector< char > out( oformat.size() );
+        if( !flush ) { std::cin.tie( NULL ); }
         while( std::cin.good() )
         {
             std::cin.read( &in[0], iformat.size() );
             if( std::cin.gcount() == 0 ) { break; }
             if( std::cin.gcount() < static_cast< int >( iformat.size() ) ) { COMMA_THROW( comma::exception, "expected " << iformat.size() << " bytes, got only " << std::cin.gcount() ); }
             cast( iformat, in, oformat, out );
-            std::cout.write( &out[0], oformat.size() ).flush();
+            std::cout.write( &out[0], oformat.size() );
+            if( flush ) { std::cout.flush(); }
         }
         return 0;
     }
diff --git a/csv/applications/csv-crc.cpp b/csv/applications/csv-crc.cpp
index cdaabdc39..703bc14a2 100644
--- a/csv/applications/csv-crc.cpp
+++ b/csv/applications/csv-crc.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 /// @author james underwood
 
@@ -42,55 +41,56 @@
 #include <boost/crc.hpp>
 #include <boost/optional.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 
 static void usage( bool )
 {
-    std::cerr << std::endl;
-    std::cerr << "wrap/check crc on fixed-width input (ascii or binary)" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: csv-crc <commands> [<options>]" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<command>" << std::endl;
-    std::cerr << "    wrap: add crc" << std::endl;
-    std::cerr << "    check: check crc; exit, if check fails" << std::endl;
-    std::cerr << "    recover: recover with given parameters (see below)" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "data options" << std::endl;
-    std::cerr << "    --crc-size; output given crc size to stdout and exit" << std::endl;
-    std::cerr << "    --delimiter,-d=<delimiter>: ascii csv delimiter" << std::endl;
-    std::cerr << "    --size=<size>: binary data size; if absent, expect ascii csv" << std::endl;
-    std::cerr << "                   for wrap: payload size" << std::endl;
-    std::cerr << "                   for check/recover size including crc" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "crc options" << std::endl;
-    std::cerr << "    --crc=<which>:" << std::endl;
-    std::cerr << "        16: 16-bit, generator 0x8805" << std::endl;
-    std::cerr << "        ccitt: 16-bit, generator 0x1021" << std::endl;
-    std::cerr << "        xmodem: 16-bit, generator 0x1021" << std::endl;
-    std::cerr << "        32: 32-bit, generator 0x04C11DB7" << std::endl;
-    //std::cerr << "        checksum16: simple 16-bit checksum (todo)" << std::endl;
-    //std::cerr << "        checksum32: simple 32-bit checksum (todo)" << std::endl;
-    std::cerr << "        default: ccitt" << std::endl;
-    std::cerr << "    --big-endian,--net-byte-order: if binary, crc is big endian" << std::endl;
-    std::cerr << "    --verbose,-v: more output" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    For a definitive list of 16 bits CRC algorithms see:" << std::endl;
-    std::cerr << "    http://reveng.sourceforge.net/crc-catalogue/16.htm" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "recovery options" << std::endl;
-    std::cerr << "    --give-up-after=<n>: if check fails, give up after <n> bytes" << std::endl;
-    std::cerr << "                         if absent and no --recover-after: default 0" << std::endl;
-    std::cerr << "                         if absent and --recover-after: default infinity (don't give up)" << std::endl;
-    std::cerr << "    --recover-after=<n>: if check fails and then new valid crc found" << std::endl;
-    std::cerr << "                         make sure that at least <n> subsequent lines (ascii) or" << std::endl;
-    std::cerr << "                         packets (binary) are valid, before output; default 0, i.e. recover on the next valid" << std::endl;
-    std::cerr << "    --discard-on-recovery,--discard: discard those <n> packets accumulated during the recovery check" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    std::cerr << R"(
+wrap/check crc on fixed-width input (ascii or binary)
+
+usage: csv-crc <command> [<options>]
+
+<command>
+    wrap:    add crc
+    check:   check crc; exit if check fails
+    recover: recover with given parameters (see below)
+
+general options
+    --help,-h;    this help
+    --verbose,-v: more output
+
+data options
+    --crc-size;      output given crc size to stdout and exit
+    --delimiter,-d=[<char>]: ascii csv delimiter
+    --size=[<size>]: binary data size; if absent, expect ascii csv
+                     for wrap: payload size
+                     for check/recover: size including crc
+
+crc options
+    --crc=<which>:
+        16:     16-bit, generator 0x8805
+        ccitt:  16-bit, generator 0x1021
+        xmodem: 16-bit, generator 0x1021
+        32:     32-bit, generator 0x04C11DB7
+        default: ccitt
+    --big-endian,--net-byte-order: if binary, crc is big endian
+
+recover options
+    --give-up-after=<n>: if check fails, give up after <n> bytes
+                         default: infinity; don't give up
+    --recover-after=<n>: if check fails and then new valid crc found
+                         make sure that at least <n> subsequent lines (ascii)
+                         or packets (binary) are valid, before output;
+                         default: 0; recover on the next valid packet
+    --discard-on-recovery,--discard: discard packets accumulated when recovering
+
+    Note that the check command is equivalent to
+    csv-crc recover --give-up-after 0
+
+For a definitive list of 16 bit CRC algorithms see:
+http://reveng.sourceforge.net/crc-catalogue/16.htm
+)";
+    exit( 0 );
 }
 
 static bool verbose;
@@ -144,6 +144,7 @@ static bool run_()
         bool recovered = true;
         std::size_t recovered_count = 0;
         std::size_t recovered_byte_count = 0;
+        std::size_t current_recovered_byte_count = 0;
         std::vector< char > recovery_buffer( recover_after * size );
         while( std::cin.good() && !std::cin.eof() )
         {
@@ -165,35 +166,44 @@ static bool run_()
                     if( big_endian ) { expected = traits< typename Crc::value_type >::hton( expected ); }
                     if( crc == expected )
                     {
+                        bool output_input_buffer = true;
                         if( !recovered )
                         {
                             if( recovered_count == recover_after )
                             {
-                                std::cerr << "csv-crc: recovered after " << recovered_byte_count << " byte(s)" << std::endl;
+                                comma::say() << "recovered after " << recovered_byte_count << " byte(s)" << std::endl;
                                 if( !discard_on_recovery ) { std::cout.write( &recovery_buffer[0], recovery_buffer.size() ); }
                                 recovered = true;
                                 recovered_count = 0;
                                 recovered_byte_count = 0;
+                                current_recovered_byte_count = 0;
                             }
                             else
                             {
                                 ::memcpy( &recovery_buffer[ recovered_count * size ], p, size );
                                 ++recovered_count;
+                                output_input_buffer = false;        // we're just stashing them until we check
                             }
                         }
-                        std::cout.write( p, size );
+                        if( output_input_buffer ) { std::cout.write( p, size ); }
                         std::cout.flush();
                     }
                     else // quick and dirty: lots of code duplication, but just to make it working
                     {
-                        if( recovered ) { std::cerr << "csv-crc: crc check failed" << ( !give_up_after || *give_up_after > 0 ? "; recovering..." : "" ) << std::endl; }
+                        if( current_recovered_byte_count / size > recovered_count )
+                        {
+                            recovered_count = 0;
+                            current_recovered_byte_count = 0;
+                        }
+                        if( recovered ) { comma::say() << "crc check failed" << ( !give_up_after || *give_up_after > 0 ? "; recovering..." : "" ) << std::endl; }
                         recovered = false;
-                        ++recovered_byte_count;
+                        if( give_up_after && recovered_byte_count >= *give_up_after ) { break; }
                     }
                 }
                 unsigned int step = recovered ? size : 1;
                 p += step;
                 offset -= step;
+                if( !recovered ) { recovered_byte_count += step; current_recovered_byte_count += step; }
                 if( end - p < int( size ) )
                 {
                     ::memcpy( begin, p, offset ); // todo: quick and dirty, check if works in case of overlapping
@@ -205,7 +215,7 @@ static bool run_()
             if( r <= 0 ) { break; }
             offset += r;
         }
-        if( offset > 0 && offset < size ) { std::cerr << "csv-crc: expected at least " << size << " byte(s), got only " << offset << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( offset <= 0 || offset >= size, "expected at least " << size << " byte(s), got only " << offset );
     }
     else
     {
@@ -231,7 +241,7 @@ static bool run_()
                 }
                 else
                 {
-                    std::cerr << "csv-crc: check failed (recovery is not implemented for ascii mode, todo)" << std::endl;
+                    comma::say() << "check failed (recovery is not implemented for ascii mode, todo)" << std::endl;
                     return 1;
                 }
             }
@@ -253,10 +263,10 @@ int main( int ac, char** av )
             else if( crc == "ccitt" ) { std::cout << sizeof( boost::crc_ccitt_type::value_type ) << std::endl; }
             else if( crc == "xmodem" ) { std::cout << sizeof( boost::crc_xmodem_type::value_type ) << std::endl; }
             else if( crc == "xmodem-boost" ) { std::cout << sizeof( boost::crc_xmodem_type::value_type ) << std::endl; }
-            else { std::cerr << "csv-crc: expected crc type, got \"" << crc << "\"" << std::endl; return 1; }
+            else { comma::say() << "expected crc type, got \"" << crc << "\"" << std::endl; return 1; }
             return 0;
         }
-        if( wrap && recover ) { std::cerr << "csv-crc: if 'wrap', then no 'check' or 'recover'" << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( !wrap || !recover, "if 'wrap', then no 'check' or 'recover'" );
         verbose = options.exists( "--verbose,-v" );
         give_up_after = options.optional< unsigned int >( "--give-up-after" );
         recover_after = options.value( "--recover-after", 0 );
@@ -266,13 +276,13 @@ int main( int ac, char** av )
         big_endian = options.exists( "--big-endian,--net-byte-order" );
         delimiter = options.value< char >( "--delimiter,-d", ',' );
         std::vector< std::string > commands = options.unnamed( "--discard-on-recovery,--discard,--verbose,-v,--big-endian,--net-byte-order", "--size,--delimiter,-d,--crc,--give-up-after,--recover-after" );
-        if( commands.empty() ) { std::cerr << "csv-crc: specify a command" << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( !commands.empty(), "please specify a command" );
         for( std::size_t i = 0; i < commands.size(); ++i )
         {
             if( commands[i] == "wrap" ) { wrap = true; }
             else if( commands[i] == "check" ) { recover = true; give_up_after = 0; }
             else if( commands[i] == "recover" ) { recover = true; }
-            else { std::cerr << "csv-crc: expected command, got '" << commands[i] << "'" << std::endl; return 1; }
+            else { comma::say() << "expected command, got '" << commands[i] << "'" << std::endl; return 1; }
         }
         // The list of crc versions predefined by boost is given at
         //     http://www.boost.org/doc/libs/1_58_0/libs/crc/crc.html#crc_ex
@@ -288,16 +298,9 @@ int main( int ac, char** av )
         // the following is designated boost::crc_xmodem_t in the git repo for boost/crc.hpp
         else if( crc == "xmodem" ) { return run_< boost::crc_optimal< 16, 0x1021, 0, 0, false, false > >(); }
         else if( crc == "xmodem-boost" ) { return run_< boost::crc_xmodem_type >(); }
-        std::cerr << "csv-crc: expected crc type, got \"" << crc << "\"" << std::endl;
-        return 1;
-    }
-    catch( std::exception& ex )
-    {
-        std::cerr << "csv-crc: " << ex.what() << std::endl;
-    }
-    catch( ... )
-    {
-        std::cerr << "csv-crc: unknown exception" << std::endl;
+        comma::say() << "expected crc type, got '" << crc << "'" << std::endl;
     }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/applications/csv-enumerate.cpp b/csv/applications/csv-enumerate.cpp
index a58cfc4f7..10b15b6c7 100644
--- a/csv/applications/csv-enumerate.cpp
+++ b/csv/applications/csv-enumerate.cpp
@@ -29,7 +29,7 @@
 
 /// @author vsevolod vlaskine
 
-#include <boost/unordered_map.hpp>
+#include <unordered_map>
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
@@ -39,42 +39,58 @@
 
 static void usage( bool verbose )
 {
-    std::cerr << std::endl;
-    std::cerr << "append unique id to csv records with the same values; support integer, time, and string fields" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: cat data.csv | csv-enumerate <options>" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "todo: support floating point values as input keys" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --fields,-f=<fields>; fields of interest, actual field names do not matter; e.g: --fields ,,,a,,b,,,c" << std::endl;
-    std::cerr << "    --format=<binary format>; if input is ascii and deducing data types may be ambiguous, define field types explicitly, value as in --binary" << std::endl;
-    std::cerr << "    --output-map,--map: do not output input records, only an unsorted records" << std::endl;
-    std::cerr << "                        output fields" << std::endl;
-    std::cerr << "                            - list of input key values; in same binary as input" << std::endl;
-    std::cerr << "                            - corresponding enumeration index as ui" << std::endl;
-    std::cerr << "                            - number of values for this enumeration index as ui" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "csv options" << std::endl;
-    if( verbose ) { std::cerr << comma::csv::options::usage() << std::endl; } else { std::cerr << "    run csv-enumerate --help --verbose for more..." << std::endl; }
-    std::cerr << std::endl;
+    std::cerr << R"(
+append unique id to csv records with the same values; support integer, time, and string fields
+
+usage: cat data.csv | csv-enumerate <options>
+
+todo: support floating point values as input keys
+
+options
+    --fields,-f=<fields>; fields of interest, actual field names do not matter
+                          e.g: --fields ,,,a,,b,,,c
+    --format=<binary format>; if input is ascii and deducing data types may be ambiguous,
+                              define field types explicitly, value as in --binary
+    --output-map,--map: do not output input records, only an unsorted list of keys
+                        output fields
+                            - list of input key values; in same binary as input
+                            - corresponding enumeration index as ui
+                            - number of values for this enumeration index as ui
+    --verbose,-v: more output to stderr
+)" << std::endl;
+std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
     exit( 0 );
 }
 
+struct output // value appended to each input record via tied.append( output( cur ) ) in main()
+{
+    comma::uint32 id; // enumeration id assigned to the record's key
+    output( comma::uint32 id = 0 ): id( id ) {} // id defaults to 0
+};
+
+namespace comma { namespace visiting {
+
+template <> struct traits< output > // visiting traits for output: exposes its single field under the name "id"
+{
+    template < typename K, typename V > static void visit( const K&, const output& p, V& v ) { v.apply( "id", p.id ); } // const overload
+    template < typename K, typename V > static void visit( const K&, output& p, V& v ) { v.apply( "id", p.id ); } // non-const overload
+};
+
+} } // namespace comma { namespace visiting {
+
 int main( int ac, char** av )
 {
     typedef comma::csv::impl::unstructured input_t;
-    typedef boost::unordered_map< comma::csv::impl::unstructured, std::pair< comma::uint32, comma::uint32 >, comma::csv::impl::unstructured::hash >  map_t;
+    typedef std::unordered_map< comma::csv::impl::unstructured, std::pair< comma::uint32, comma::uint32 >, comma::csv::impl::unstructured::hash >  map_t;
     try
     {
         comma::command_line_options options( ac, av, usage );
-        bool verbose = options.exists( "--verbose,-v" );
         bool output_map = options.exists( "--output-map,--map" );
         comma::csv::options csv( options );
         bool has_non_empty_field = false;
         for( const auto& f: comma::split( csv.fields, ',' ) ) { if( !f.empty() ) { has_non_empty_field = true; break; } }
-        if( !has_non_empty_field ) { std::cerr << "csv-enumerate: please specify at least one key in fields" << std::endl; return 1; }
-        csv.full_xpath = true;
+        COMMA_ASSERT_BRIEF( has_non_empty_field, "please specify at least one key in fields" );
         std::string first_line;
         comma::csv::format f;
         if( csv.binary() ) { f = csv.format(); }
@@ -84,21 +100,22 @@ int main( int ac, char** av )
             while( std::cin.good() && first_line.empty() ) { std::getline( std::cin, first_line ); }
             if( first_line.empty() ) { return 0; }
             f = comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter );
-            if( verbose ) { std::cerr << "csv-enumerate: guessed format: " << f.string() << std::endl; }
+            comma::saymore() << "guessed format: " << f.string() << std::endl;
         }
         input_t default_input;
         std::vector< std::string > v = comma::split( csv.fields, ',' );
+        std::vector< std::string > format; // quick and dirty
+        std::vector< std::string > s;
+        if( csv.binary() ) { format = comma::split( csv.format().expanded_string(), ',' ); }
         for( unsigned int i = 0; i < v.size(); ++i )
         {
             if( v[i].empty() ) { continue; }
             v[i] = default_input.append( f.offset( i ).type );
+            if( csv.binary() ) { s.push_back( format[i] ); }
         }
-        if( verbose ) { std::cerr << "csv-enumerate: fields " << csv.fields << " interpreted as: " << comma::join( v, ',' ) << std::endl; }
+        std::string map_output_binary_format = comma::join( s, ',' );
+        comma::saymore() << "fields " << csv.fields << " interpreted as: " << comma::join( v, ',' ) << std::endl;
         csv.fields = comma::join( v, ',' );
-        comma::csv::input_stream< input_t > istream( std::cin, csv, default_input );
-        #ifdef WIN32
-        if( istream.is_binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
-        #endif
         static map_t map;
         comma::uint32 id = 0;
         if( !first_line.empty() )
@@ -107,6 +124,15 @@ int main( int ac, char** av )
             map[ comma::csv::ascii< input_t >( csv, default_input ).get( first_line ) ] = std::make_pair( id++, 1 );
             if( !output_map ) { std::cout << first_line << csv.delimiter << 0 << std::endl; }
         }
+        comma::csv::options output_csv;
+        output_csv.delimiter = csv.delimiter;
+        if( csv.binary() ) { output_csv.format( comma::csv::format::value< output >() ); }
+        comma::csv::input_stream< input_t > istream( std::cin, csv, default_input );
+        comma::csv::output_stream< output > ostream( std::cout, output_csv );
+        comma::csv::tied< input_t, output > tied( istream, ostream );
+        #ifdef WIN32
+        if( istream.is_binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        #endif
         while( istream.ready() || std::cin.good() )
         {
             const input_t* p = istream.read();
@@ -114,30 +140,21 @@ int main( int ac, char** av )
             map_t::iterator it = map.find( *p );
             comma::uint32 cur = id;
             if( it == map.end() ) { map[ *p ] = std::make_pair( id++, 1 ); } else { cur = it->second.first; ++( it->second.second ); }
-            if( !output_map )
-            {
-                if( csv.binary() )
-                {
-                    std::cout.write( istream.binary().last(), csv.format().size() );
-                    std::cout.write( reinterpret_cast< const char* >( &cur ), sizeof( comma::uint32 ) );
-                    if( csv.flush ) { std::cout.flush(); }
-                }
-                else
-                {
-                    std::cout << comma::join( istream.ascii().last(), csv.delimiter ) << csv.delimiter << cur << std::endl;
-                }
-            }
+            if( !output_map ) { tied.append( output( cur ) ); }
         }
         if( !output_map ) { return 0; }
-        comma::csv::options output_csv;
-        output_csv.delimiter = csv.delimiter;
-        output_csv.full_xpath = true;
-        if( csv.binary() ) { output_csv.format( comma::csv::format::value< input_t >( default_input ) + ",2ui" ); }
-        comma::csv::output_stream< map_t::value_type > ostream( std::cout, output_csv, std::make_pair( default_input, std::make_pair( 0, 0 ) ) );
-        for( map_t::const_iterator it = map.begin(); it != map.end(); ++it ) { ostream.write( *it ); }
+        comma::csv::options output_map_csv;
+        output_map_csv.delimiter = csv.delimiter;
+        if( csv.binary() )
+        { 
+            output_map_csv.format( map_output_binary_format + ",2ui" ); //output_map_csv.format( comma::csv::format::value< input_t >( default_input ) + ",2ui" );
+            comma::saymore() << "binary output format for map: '" << output_map_csv.format().string() << "'" << std::endl; // informational only: shown with --verbose, like the other format messages
+        }
+        comma::csv::output_stream< map_t::value_type > omstream( std::cout, output_map_csv, std::make_pair( default_input, std::make_pair( 0, 0 ) ) );
+        for( map_t::const_iterator it = map.begin(); it != map.end(); ++it ) { omstream.write( *it ); }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << "csv-enumerate: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-enumerate: unknown exception" << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/applications/csv-fields.cpp b/csv/applications/csv-fields.cpp
index 6cea12a13..f2f705901 100644
--- a/csv/applications/csv-fields.cpp
+++ b/csv/applications/csv-fields.cpp
@@ -29,16 +29,15 @@
 
 /// @author vsevolod vlaskine
 
+#include <functional>
 #include <iostream>
 #include <string>
 #include <set>
 #include <map>
-#include "../../application/contact_info.h"
+#include <unordered_map>
 #include "../../application/command_line_options.h"
 #include "../../string/string.h"
 
-using namespace comma;
-
 static void usage( bool )
 {
     std::cerr << std::endl;
@@ -53,6 +52,7 @@ static void usage( bool )
     std::cerr << "    numbers (default): convert comma-separated field names to field numbers" << std::endl;
     std::cerr << "                       e.g. for combining with cut or csv-bin-cut" << std::endl;
     std::cerr << "        --count,--size: output the total number of fields" << std::endl;
+    std::cerr << "        --fields=[<fields>]: number only fields with given names, same as csv-fields clear --except ... | csv-fields numbers" << std::endl;
     std::cerr << "        --fill: number even empty fields, e.g. try: echo ,, | csv-fields numbers --fill" << std::endl;
     std::cerr << "        --from=<value>: start field numbering from <value>; default=1" << std::endl;
     std::cerr << "                        to keep it consistent with linux cut utility" << std::endl;
@@ -95,6 +95,8 @@ static void usage( bool )
     std::cerr << "    make-fixed: normalise input to a fixed number of fields" << std::endl;
     std::cerr << "        --count,--size=<n>: number of output fields" << std::endl;
     std::cerr << "        --force: chop input to <n> fields if larger" << std::endl;
+    std::cerr << "        --values=[<values>]: fill missing fields with given values" << std::endl;
+    std::cerr << "                             if --count not specified, use number of <values> as desired number of fields" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    numbers" << std::endl;
@@ -155,29 +157,35 @@ static void usage( bool )
     std::cerr << "        a,b,c,d,," << std::endl;
     std::cerr << "        x,y,z,,," << std::endl;
     std::cerr << std::endl;
+    std::cerr << "    make-fixed" << std::endl;
+    std::cerr << "        { echo a,b; echo x,y,z; } | csv-fields make-fixed --count=6 --values=A,B,C,D,E,F" << std::endl;
+    std::cerr << "        a,b,C,D,E,F" << std::endl;
+    std::cerr << "        x,y,z,D,E,F" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "        { echo a,b,c,d; echo x,y,z; } | csv-fields make-fixed --count=3 --force" << std::endl;
     std::cerr << "        a,b,c" << std::endl;
     std::cerr << "        x,y,z" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 int main( int ac, char** av )
 {
     try
     {
-        command_line_options options( ac, av, usage );
+        comma::command_line_options options( ac, av, usage );
         std::string operation = "numbers";
         const std::vector< std::string > unnamed = options.unnamed( "--help,-h", "-.*" );
         char delimiter = options.value( "--delimiter,-d", ',' );
         if( !unnamed.empty() ) { operation = unnamed[0]; }
-        if( operation == "numbers" )
+        auto numbers = [&]()->int
         {
             int from = options.value( "--from", 1 );
             bool fill = options.exists( "--fill" );
-            std::string prefix = options.value< std::string >( "--prefix", "" );
+            options.assert_mutually_exclusive( "--fill,--fields" );
+            const auto& v = comma::split( options.value< std::string >( "--fields", "" ), ',', true );
+            std::set< std::string > fields( v.begin(), v.end() );
+            std::string prefix = options.value< std::string >( "--prefix", "" );            
             while( std::cin.good() )
             {
                 std::string line;
@@ -189,14 +197,15 @@ int main( int ac, char** av )
                 for( unsigned int i = 0; i < v.size(); ++i )
                 {
                     if( v[i].empty() && !fill ) { continue; }
+                    if( !fields.empty() && fields.find( v[i] ) == fields.end() ) { continue; }
                     std::cout << comma << prefix << ( i + from );
                     comma = ',';
                 }
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "clear" )
+        };
+        auto clear = [&]()->int
         {
             options.assert_mutually_exclusive( "--except,--keep,--mask,--remove,--inverted-mask,--complement-mask,--unmask,--unmasked" );
             std::string keep = options.value< std::string >( "--keep,--except", "" );
@@ -249,8 +258,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "default" )
+        };
+        auto default_operation = [&]()->int
         {
             options.assert_mutually_exclusive( "--value,--values" );
             std::vector< std::string > defaults;
@@ -276,8 +285,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "prefix" )
+        };
+        auto prefix = [&]()->int
         {
             options.assert_mutually_exclusive( "--fields,--except" );
             const std::string& e = options.value< std::string >( "--except", "" );
@@ -309,8 +318,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "rename" )
+        };
+        auto rename = [&]()->int
         {
             const std::vector< std::string >& fields = comma::split( options.value< std::string >( "--fields" ), ',' );
             const std::vector< std::string >& to = comma::split( options.value< std::string >( "--to" ), ',' );
@@ -334,8 +343,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "strip" )
+        };
+        auto strip = [&]()->int
         {
             options.assert_mutually_exclusive( "--fields,--except" );
             const std::string& e = options.value< std::string >( "--except", "" );
@@ -364,8 +373,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "cut" )
+        };
+        auto cut = [&]()->int
         {
             options.assert_mutually_exclusive( "--except,--fields", "--empty" );
             bool except = options.exists( "--except" );
@@ -394,8 +403,8 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        if( operation == "has" )
+        };
+        auto has = [&]()->int
         {
             const std::string& f = options.value< std::string >( "--fields" );
             const std::vector< std::string >& v = comma::split( f, delimiter );
@@ -411,10 +420,12 @@ int main( int ac, char** av )
             if( !matches ) { return 1; }
             if( any ) { return 0; }
             return matches == fields.size() ? 0 : 1;
-        }
-        if( operation == "make-fixed" )
+        };
+        auto make_fixed = [&]()->int
         {
-            const unsigned int count = options.value< unsigned int >( "--count,--size" );
+            const std::vector< std::string >& values = comma::split( options.value< std::string >( "--values", "" ), ',', true );
+            const unsigned int count = options.value< unsigned int >( "--count,--size", values.size() );
+            if( count == 0 ) { std::cerr << "csv-fields: make-fixed: please specify either --count or --values" << std::endl; return 1; } // no target field count: fail instead of carrying on with count 0
             bool force = options.exists( "--force" );
             while( std::cin.good() )
             {
@@ -425,7 +436,7 @@ int main( int ac, char** av )
                 if( v.size() <= count )
                 {
                     std::cout << line;
-                    for( unsigned int i = v.size(); i < count; i++ ) { std::cout << delimiter; }
+                    for( unsigned int i = v.size(); i < count; i++ ) { std::cout << delimiter << ( i < values.size() ? values[i] : std::string() ); }
                 }
                 else
                 {
@@ -436,8 +447,19 @@ int main( int ac, char** av )
                 std::cout << std::endl;
             }
             return 0;
-        }
-        std::cerr << "csv-fields: expected operation, got: \"" << operation << "\"" << std::endl;
+        };
+        std::unordered_map< std::string, std::function< int() > > operations = { { "clear", clear }
+                                                                               , { "cut", cut }
+                                                                               , { "default", default_operation }
+                                                                               , { "has", has }
+                                                                               , { "make-fixed", make_fixed }
+                                                                               , { "numbers", numbers }
+                                                                               , { "prefix", prefix }
+                                                                               , { "rename", rename }
+                                                                               , { "strip", strip } };
+        auto o = operations.find( operation );
+        if( o != operations.end() ) { return o->second(); }
+        std::cerr << "csv-fields: expected operation, got '" << operation << "'" << std::endl;
         return 1;
     }
     catch( std::exception& ex ) { std::cerr << "csv-fields: " << ex.what() << std::endl; }
diff --git a/csv/applications/csv-format.cpp b/csv/applications/csv-format.cpp
index ab0b7bff6..f9cbc8bd4 100644
--- a/csv/applications/csv-format.cpp
+++ b/csv/applications/csv-format.cpp
@@ -33,20 +33,15 @@
 #include <iostream>
 #include <sstream>
 #include <string>
-#include <set>
 #include <boost/lexical_cast.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../csv/format.h"
 #include "../../string/string.h"
 
-using namespace comma;
-static const char *app_name = "csv-format";
-
-static void usage()
+static void usage( bool verbose = false )
 {
     std::cerr << std::endl;
-    std::cerr << "usage: echo \"3f,2f,d\" | " << app_name << " [options] (expand|collapse|count|repeat)" << std::endl;
+    std::cerr << "usage: echo \"3f,2f,d\" | csv-format [options] (expand|collapse|count|repeat)" << std::endl;
     std::cerr << std::endl;
     std::cerr << "perform various operations on format strings" << std::endl;
     std::cerr << std::endl;
@@ -56,6 +51,7 @@ static void usage()
     std::cerr << "    guess: take a csv string, output (roughly) guessed format; e.g: echo 20170101T000000,1,2,3 | csv-format guess --format ,,ui" << std::endl;
     std::cerr << "    expand: output fully expand format, e.g. 2i,3f -> i,i,f,f,f" << std::endl;
     std::cerr << "    repeat: replicate the format n times, e.g. 2i,3f --count 2 -> 2i,3f,2i,3f" << std::endl;
+    std::cerr << "    size: output format size in bytes, e.g: echo 2i,3f | csv-format size would output 20" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    guess:" << std::endl;
@@ -64,9 +60,7 @@ static void usage()
     std::cerr << "    repeat:" << std::endl;
     std::cerr << "        --count=n: replicate the format n times" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 static std::string incomplete_expanded( const std::string& s ) // quick and dirty
@@ -116,19 +110,18 @@ int main( int ac, char** av )
 {
     try
     {
-        command_line_options options( ac, av );
-        if( options.exists( "--help,-h" ) ) { usage(); }
+        comma::command_line_options options( ac, av, usage );
         const std::vector< std::string > unnamed = options.unnamed( "--help,-h", "-.*" );
-        if( unnamed.empty() )
-        { std::cerr << app_name << ": expected an operation (e.g. \"expand\")" << std::endl; return 1; }
-        if( unnamed.size() != 1 ) { usage(); }
+        if( unnamed.empty() ) { std::cerr << "csv-format: please specify operation" << std::endl; return 1; }
+        if( unnamed.size() > 1 ) { std::cerr << "csv-format: please specify only one operation" << std::endl; return 1; }
         std::string operation = unnamed[0];
         std::string line;
         std::function< void( const std::string& ) > handle;
         if( operation == "expand" ) { handle = [&]( const std::string& s ) { std::cout << comma::csv::format( s ).expanded_string() << std::endl; }; }
         else if( operation == "collapse" ) { handle = [&]( const std::string& s ) { std::cout << comma::csv::format( s ).collapsed_string() << std::endl; }; }
         else if( operation == "count" ) { handle = [&]( const std::string& s ) { std::cout << comma::csv::format( s ).count() << std::endl; }; }
-        else if( operation == "guess" ) { handle = [&]( const std::string& s )  {
+        else if( operation == "size" ) { handle = [&]( const std::string& s ) { std::cout << comma::csv::format( s ).size() << std::endl; }; }
+        else if( operation == "guess" ) { handle = [&]( const std::string& s ) {
                                                                                     static const std::vector< std::string >& e = comma::split( incomplete_expanded( options.value< std::string >( "--format", "" ) ), ',' );
                                                                                     static char delimiter = options.value( "--delimiter,-d", ',' );
                                                                                     const std::vector< std::string >& v = comma::split( s, delimiter );
@@ -150,7 +143,7 @@ int main( int ac, char** av )
                                                                                         std::cout << std::endl;
                                                                                     }
                                                                                 }; }
-        else { std::cerr << app_name << ": expected operation; got: \"" << operation << "\"" << std::endl; return 1; }
+        else { std::cerr << "csv-format: expected operation; got: \"" << operation << "\"" << std::endl; return 1; }
         while( std::getline( std::cin, line ) )
         {
             const std::string& stripped = comma::strip( line );
@@ -158,7 +151,7 @@ int main( int ac, char** av )
         }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << app_name << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << app_name << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "csv-format: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-format: unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/applications/csv-from-bin.cpp b/csv/applications/csv-from-bin.cpp
index 644dc4524..f901114c7 100644
--- a/csv/applications/csv-from-bin.cpp
+++ b/csv/applications/csv-from-bin.cpp
@@ -39,7 +39,6 @@
 #include <stdlib.h>
 #include <iostream>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/format.h"
 #include "../../string/string.h"
@@ -54,7 +53,6 @@ static void usage()
     std::cerr << "--precision: set precision (number of mantissa digits) for floating point types" << std::endl;
     std::cerr << csv::format::usage() << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/csv/applications/csv-interval.cpp b/csv/applications/csv-intervals.cpp
similarity index 53%
rename from csv/applications/csv-interval.cpp
rename to csv/applications/csv-intervals.cpp
index 5fa81d6a2..0042e47c9 100644
--- a/csv/applications/csv-interval.cpp
+++ b/csv/applications/csv-intervals.cpp
@@ -27,26 +27,29 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author Vinny Do
 
+#include <fstream>
 #include <iostream>
 #include <limits>
 #include <set>
 #include <string>
+#include <tuple>
 #include <boost/icl/interval.hpp>
 #include <boost/icl/interval_map.hpp>
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
-#include "../../visiting/traits.h"
+#include "../../csv/traits.h"
 #include "../../csv/impl/unstructured.h"
-
-static const std::string app_name = "csv-interval";
+#include "../../io/stream.h"
+#include "../../name_value/map.h"
+#include "../../name_value/parser.h"
+#include "../../string/string.h"
+#include "../../visiting/traits.h"
 
 static bool verbose;
 static bool debug;
-static std::string first_line;
 static bool append;
 
 template < typename T > struct limits
@@ -91,21 +94,23 @@ static void usage( bool verbose = false )
 {
     std::cerr << "takes csv intervals and separates them at points of overlap if any" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "usage: cat intervals.csv | " << app_name << " [OPTIONS...]" << std::endl;
+    std::cerr << "usage: cat intervals.csv | csv-intervals <operation> [<options>]" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operations" << std::endl;
+    std::cerr << "    contain: given a set of intervals, take scalars on stdin, append 1 if contained in the intervals, 0 if not" << std::endl;
+    std::cerr << "    join: given a set of intervals, take scalars on stdin, append payloads of the intervals the scalars are contained in" << std::endl;
+    std::cerr << "    make: make intervals" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: show help; --help --verbose for more help" << std::endl;
     std::cerr << "    --verbose,-v: more info" << std::endl;
-    std::cerr << "    --append,-a: append output intervals instead of outputting them in place" << std::endl;
-    std::cerr << "    --debug: print debug" << std::endl;
+    std::cerr << "    --debug: more debug output" << std::endl;
     std::cerr << "    --input-fields: print input fields and exit" << std::endl;
     // std::cerr << "    --input-format: print input format and exit" << std::endl;
     std::cerr << "    --output-fields: print output fields and exit" << std::endl;
     // std::cerr << "    --output-format: print output format and exit" << std::endl;
-    std::cerr << "    --empty: empty value used to signify unbounded intervals" << std::endl;
+    std::cerr << "    --empty=[<empty-value>]: empty value used to signify unbounded intervals" << std::endl;
     std::cerr << "             default for time is \"not-a-date-time\"" << std::endl;
-    std::cerr << "    --format: input format (ascii only), also affects the --limits option; if not given the format is guessed" << std::endl;
-    std::cerr << "    --intervals-only: only output the intervals, ignore payload if any" << std::endl;
     std::cerr << "    --limits,-l: replace empty bounds with type limits" << std::endl;
     std::cerr << "                 b  : " << (int)limits< char >::lowest() << " " << (int)limits< char >::max() << std::endl;
     std::cerr << "                 ub : " << (int)limits< unsigned char >::lowest() << " " << (int)limits< unsigned char >::max() << std::endl;
@@ -121,14 +126,31 @@ static void usage( bool verbose = false )
     std::cerr << "                 s  : \"" << limits< std::string >::lowest() << "\" \"" << limits< std::string >::max() << "\"" << std::endl;
     std::cerr << "                 t  : " << limits< boost::posix_time::ptime >::lowest() << " " << limits< boost::posix_time::ptime >::max() << std::endl;
     std::cerr << "                 lt : " << limits< boost::posix_time::ptime >::lowest() << " " << limits< boost::posix_time::ptime >::max() << std::endl;
-    std::cerr << "    --overlap-count=[<count>]; output only intervals with <count> overlaps" << std::endl;
-    std::cerr << "    --overlap-count-min,--min-overlap-count=[<count>]; output only intervals with at least <count> overlaps" << std::endl;
-    std::cerr << "    --overlap-count-max,--max-overlap-count=[<count>]; output only intervals with not more than <count> overlaps" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "operation details" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    contain" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --intervals=<filename>: file or stream name" << std::endl;
+    std::cerr << "    join" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --intervals=<filename>: file or stream name" << std::endl;
+    std::cerr << "            --matching: output matching input records, do not append the intervals" << std::endl;
+    std::cerr << "            --not-matching: output not matching input records" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    make" << std::endl;
+    std::cerr << "        options" << std::endl;
+    std::cerr << "            --append,-a: append output intervals instead of outputting them in place" << std::endl;
+    std::cerr << "            --format=[<format>]: input format (ascii only), also affects the --limits option; if not given the format is guessed" << std::endl;
+    std::cerr << "            --intervals-only: only output the intervals, ignore payload if any" << std::endl;    
+    std::cerr << "            --overlap-count=[<count>]; output only intervals with <count> overlaps" << std::endl;
+    std::cerr << "            --overlap-count-min,--min-overlap-count=[<count>]; output only intervals with at least <count> overlaps" << std::endl;
+    std::cerr << "            --overlap-count-max,--max-overlap-count=[<count>]; output only intervals with not more than <count> overlaps" << std::endl;
     std::cerr << std::endl;
     std::cerr << "ascii notes" << std::endl;
     std::cerr << "    unbounded intervals may be indicated by no value (e.g. ,3 \u2261 -\u221e,3), both sides unbounded is also supported" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "for examples see verbose help: " << app_name << " --help --verbose" << std::endl;
+    std::cerr << "for examples see verbose help: csv-intervals --help --verbose" << std::endl;
     std::cerr << std::endl;
     if( verbose )
     {
@@ -143,7 +165,7 @@ static void usage( bool verbose = false )
         std::cerr << "        B:      [2      4]"           << std::endl;
         std::cerr << "        C:           [3           6]" << std::endl;
         std::cerr << std::endl;
-        std::cerr << "        echo -e '1,5,A\\n2,4,B\\n3,6,C' | " << app_name << std::endl;
+        std::cerr << "        echo -e '1,5,A\\n2,4,B\\n3,6,C' | csv-intervals make" << std::endl;
         std::cerr << std::endl;
         std::cerr << "        A: [1 2][2 3][3 4][4 5]"      << std::endl;
         std::cerr << "        B:      [2 3][3 4]"           << std::endl;
@@ -157,7 +179,7 @@ static void usage( bool verbose = false )
         std::cerr << "        D:            [3           8]"                    << std::endl;
         std::cerr << "        Z: [-\u221e                          +\u221e]"    << std::endl;
         std::cerr << std::endl;
-        std::cerr << "        echo -e ',4,A\\n2,4,B\\n3,6,C\\n3,8,D\\n,,Z' | " << app_name << " --format 2i" << std::endl;
+        std::cerr << "        echo -e ',4,A\\n2,4,B\\n3,6,C\\n3,8,D\\n,,Z' | csv-intervals make" << " --format 2i" << std::endl;
         std::cerr << std::endl;
         std::cerr << "        A: [-\u221e 2][2 3][3 4]"                         << std::endl;
         std::cerr << "        B:       [2 3][3 4]"                              << std::endl;
@@ -172,7 +194,7 @@ static void usage( bool verbose = false )
         std::cerr << "        C:                                                                                       [20140916T190000 +\u221e]" << std::endl;
         std::cerr << "        Z: [-\u221e                                                                                                    +\u221e]" << std::endl;
         std::cerr << std::endl;
-        std::cerr << "        echo -e ',20140916T030000.000000,A\\n20140916T010000.000000,20140916T190000.000000,B\\n20140916T190000.000000,,C\\n,,Z' | " << app_name << " --format 2t" << std::endl;
+        std::cerr << "        echo -e ',20140916T030000.000000,A\\n20140916T010000.000000,20140916T190000.000000,B\\n20140916T190000.000000,,C\\n,,Z' | csv-intervals make" << " --format 2t" << std::endl;
         std::cerr << std::endl;
         std::cerr << "        A: [-\u221e 20140916T010000][20140916T010000 20140916T030000]" << std::endl;
         std::cerr << "        B:                     [20140916T010000 20140916T030000][20140916T030000 20140916T190000]" << std::endl;
@@ -248,6 +270,18 @@ struct interval_t
     to_t< To > to;
 };
 
+
+template < typename T > struct scalar_traits { static T zero() { return 0; } }; // generic case: zero() is the literal 0 converted to T
+template <> struct scalar_traits< std::string > { static std::string zero() { return std::string(); } }; // strings start empty
+template <> struct scalar_traits< boost::posix_time::ptime > { static boost::posix_time::ptime zero() { return boost::posix_time::ptime(); } }; // default-constructed ptime
+
+template < typename T > struct scalar_t // record with a single field, scalar, pre-set to scalar_traits< T >::zero()
+{
+    scalar_t() {}
+    scalar_t( const T& value ): scalar( value ) {}
+    T scalar{ scalar_traits< T >::zero() };
+};
+
 namespace comma { namespace visiting {
 
 template < typename T > struct traits< from_t< T > >
@@ -268,6 +302,12 @@ template < typename From, typename To > struct traits< interval_t< From, To > >
     template < typename K, typename V > static void visit( const K&, const interval_t< From, To >& p, V& v ) { v.apply( "", p.from ); v.apply( "", p.to ); }
 };
 
+template < typename T > struct traits< scalar_t< T > > // presents scalar_t< T > to visitors as one field named "scalar"
+{
+    template < typename Key, typename Visitor > static void visit( const Key&, const scalar_t< T >& s, Visitor& visitor ) { visitor.apply( "scalar", s.scalar ); }
+    template < typename Key, typename Visitor > static void visit( const Key&, scalar_t< T >& s, Visitor& visitor ) { visitor.apply( "scalar", s.scalar ); }
+};
+
 } } // namespace comma { namespace visiting {
 
 template < typename From, typename To = From >
@@ -287,14 +327,16 @@ struct intervals
     unsigned int min_overlap_count;
     unsigned int max_overlap_count;
 
-    intervals( const comma::command_line_options& options ) : options( options )
-                                                            , csv( options )
-                                                            , ocsv( options )
-                                                            , ascii_csv( options )
-                                                            , empty( traits< bound_type >::cast( options.optional< std::string >( "--empty" ) ) )
-                                                            , intervals_only( options.exists( "--intervals-only" ) )
-                                                            , use_limits( options.exists( "--limits,-l" ) )
+    intervals( const comma::command_line_options& options, const comma::csv::options& csv_ ) 
+        : options( options )
+        , csv( csv_ )
+        , ocsv( csv )
+        , ascii_csv( csv )
+        , empty( traits< bound_type >::cast( options.optional< std::string >( "--empty" ) ) )
+        , intervals_only( options.exists( "--intervals-only" ) )
+        , use_limits( options.exists( "--limits,-l" ) )
     {
+        csv.full_xpath = false;
         if( csv.fields.empty() ) { csv.fields = comma::join( comma::csv::names< interval_t< From, To > >(), ',' ); }
         if( ocsv.fields.empty() || intervals_only )
         {
@@ -303,7 +345,7 @@ struct intervals
         }
         ascii_csv.fields = ocsv.fields;
         ascii_csv.quote = boost::none;
-        if( verbose ) { std::cerr << app_name << ": empty: "; empty ? std::cerr << *empty : std::cerr << "<none>"; std::cerr << std::endl; }
+        if( verbose ) { std::cerr << "csv-intervals: empty: "; empty ? std::cerr << *empty : std::cerr << "<none>"; std::cerr << std::endl; }
         options.assert_mutually_exclusive( "overlap-count-min,overlap-count-max", "overlap-count" );
         if( options.exists( "--overlap-count" ) )
         {
@@ -394,9 +436,9 @@ struct intervals
         }
     }
 
-    void run()
+    void read( std::istream& is, const std::string& first_line ) // preparing for adding operations
     {
-        comma::csv::input_stream< interval_t< From, To > > istream( std::cin, csv );
+        comma::csv::input_stream< interval_t< From, To > > istream( is, csv );
         comma::csv::ascii< interval_t< std::string > > ascii( csv.fields );
         if( !first_line.empty() )
         {
@@ -410,10 +452,10 @@ struct intervals
             if( !first.to.value.empty() && ( !empty || interval.to.value != *empty  ) ) { to.value = interval.to.value; }
             payload = first_line;
             if( !intervals_only && !append ) { ascii.put( interval_t< std::string >(), payload ); } // blank out interval from payload
-            if( verbose ) { std::cerr << app_name << ": from: " << from << " to: " << to << " payload: " << payload << std::endl; }
+            if( verbose ) { std::cerr << "csv-intervals: from: " << from << " to: " << to << " payload: " << payload << std::endl; }
             add( from, to, payload );
         }
-        while( istream.ready() || std::cin.good()  )
+        while( istream.ready() || is.good()  )
         {
             const interval_t< From, To >* interval = istream.read();
             if( !interval ) { break; }
@@ -438,108 +480,239 @@ struct intervals
                 if( !intervals_only && !append ) { ascii.put( interval_t< std::string >(), buf ); } // blank out interval from payload
                 payload = comma::join( buf, csv.delimiter );
             }
-            if( verbose ) { std::cerr << app_name << ": from: " << from << " to: " << to << " payload: " << ( csv.binary() ? "<binary>" : payload ) << std::endl; }
+            if( verbose ) { std::cerr << "csv-intervals: from: " << from << " to: " << to << " payload: " << ( csv.binary() ? "<binary>" : payload ) << std::endl; }
             add( from, to, payload );
         }
-        write();
+    }
+
+    int contain( std::istream& is, const std::string& first_line ) // loads intervals from is, then appends a boolean to each stdin record: is its scalar inside any interval?
+    {
+        comma::csv::options icsv( options );
+        icsv.full_xpath = false;
+        comma::csv::input_stream< scalar_t< From > > istream( std::cin, icsv );
+        comma::csv::output_stream< scalar_t< bool > > ostream( std::cout, icsv.binary() );
+        auto tied = comma::csv::make_tied( istream, ostream );
+        this->read( is, first_line ); // todo: support block
+        while( istream.ready() || std::cin.good() )
+        {
+            const auto record = istream.read();
+            if( !record ) { break; }
+            bool contained = false;
+            for( typename map_t::iterator entry = map.begin(); !contained && entry != map.end(); ++entry ) // todo! quadratic complexity; how the heck to query icl map? use boost::...::query?
+            {
+                const bound_t< bound_type >& lower = entry->first.lower();
+                const bound_t< bound_type >& upper = entry->first.upper();
+                contained = ( !lower.value || record->scalar >= *lower.value ) && ( !upper.value || record->scalar < *upper.value ); // lower bound inclusive, upper exclusive
+            }
+            tied.append( scalar_t< bool >( contained ) );
+            if( icsv.flush ) { std::cout.flush(); }
+        }
+        return 0;
+    }
+    
+    int join( std::istream& is, const std::string& first_line ) // reads intervals from is, then for each stdin record looks up the first interval containing its scalar
+    {
+        options.assert_mutually_exclusive( "--matching,--not-matching" );
+        bool matching = options.exists( "--matching" );
+        bool not_matching = options.exists( "--not-matching" );
+        bool output_joined = !matching && !not_matching; // neither flag given: output records with interval payloads appended
+        comma::csv::options icsv( options ); // csv options of the scalar stream on stdin; the csv member describes the intervals stream
+        if( output_joined && csv.binary() != icsv.binary() ) { std::cerr << "csv-intervals: join: expected both inputs ascii or both binary; got stdin " << ( icsv.binary() ? "binary" : "ascii" ) << " while --intervals " << ( csv.binary() ? "binary" : "ascii" ) << std::endl; return 1; }
+        icsv.full_xpath = false;
+        comma::csv::input_stream< scalar_t< From > > istream( std::cin, icsv );
+        append = true; // file-level flag checked by read(): when set, the interval fields are not blanked out of the stored payload
+        this->read( is, first_line ); // todo: support block
+        while( istream.ready() || std::cin.good() )
+        {
+            auto p = istream.read();
+            if( !p ) { break; }
+            bool found = false;
+            typename map_t::iterator it; // declared outside the loop: still refers to the matching entry after the break below
+            for( it = map.begin(); it != map.end(); ++it ) // todo! quadratic complexity; how the heck to query icl map? use boost::...::query?
+            {
+                const bound_t< bound_type >& from = it->first.lower();
+                const bound_t< bound_type >& to = it->first.upper();
+                found = ( !from.value || p->scalar >= *from.value ) && ( !to.value || p->scalar < *to.value ); // lower bound inclusive, upper exclusive; a bound without value does not restrict
+                if( found ) { break; }
+            }
+            if( output_joined )
+            {
+                if( found )
+                {
+                    std::string joined = csv.binary() ? "" : comma::join( istream.ascii().last(), icsv.delimiter );
+                    for( const auto& s: it->second ) // one output record per payload stored for the matching interval
+                    {
+                        if( csv.binary() )
+                        {
+                            std::cout.write( istream.binary().last(), icsv.format().size() );
+                            std::cout.write( &s[0], s.size() );
+                        }
+                        else
+                        {
+                            std::cout << joined << icsv.delimiter << s << std::endl;
+                        }
+                    }
+                }
+            }
+            else if( matching == found ) // --matching passes found records; --not-matching (matching is false) passes the records not found
+            {
+                if( icsv.binary() ) { std::cout.write( istream.binary().last(), icsv.format().size() ); }
+                else { std::cout << comma::join( istream.ascii().last(), icsv.delimiter ) << std::endl; }
+            }
+            if( icsv.flush ) { std::cout.flush(); }
+        }
+        return 0;
+    }
+    
+    int make( const std::string& first_line ) // reads intervals from stdin, then writes out the result; always returns 0
+    {
+        read( std::cin, first_line );
+        write();
+        return 0;
+    }
 };
 
-// template < typename From > static void run( const comma::command_line_options& options, const comma::csv::format::types_enum to_type )
-// {
-//     switch( to_type )
-//     {
-//         case comma::csv::format::int8:          intervals< From, char >( options ).run(); break;
-//         case comma::csv::format::uint8:         intervals< From, unsigned char >( options ).run(); break;
-//         case comma::csv::format::int16:         intervals< From, comma::int16 >( options ).run(); break;
-//         case comma::csv::format::uint16:        intervals< From, comma::uint16 >( options ).run(); break;
-//         case comma::csv::format::int32:         intervals< From, comma::int32 >( options ).run(); break;
-//         case comma::csv::format::uint32:        intervals< From, comma::uint32 >( options ).run(); break;
-//         case comma::csv::format::int64:         intervals< From, comma::int64 >( options ).run(); break;
-//         case comma::csv::format::uint64:        intervals< From, comma::uint64 >( options ).run(); break;
-//         case comma::csv::format::char_t:        intervals< From, char >( options ).run(); break;
-//         case comma::csv::format::float_t:       intervals< From, float >( options ).run(); break;
-//         case comma::csv::format::double_t:      intervals< From, double >( options ).run(); break;
-//         default:                                COMMA_THROW( comma::exception, "from/to type mismatch" ); break;
-//     }
-// }
+// determines the common type of the from and to fields of an interval stream described by csv
+// ascii without explicit format: consumes lines from is up to the first non-empty one to guess the format and returns that line; exits with 0 if there is none
+// returns ( type of the to field, consumed first line or empty string ); raises via COMMA_THROW or exits with 1 on missing fields or from/to type mismatch
+static std::tuple< comma::csv::format::types_enum, std::string > interval_type( std::istream& is, comma::csv::options csv, const std::string& format )
+{
+    if( csv.fields.empty() ) { csv.fields = comma::join( comma::csv::names< interval_t< double > >(), ',' ); }
+    if( !csv.has_field( "from,to" ) ) { COMMA_THROW( comma::exception, "expected from and to fields" ); }
+    std::string first_line;
+    csv.full_xpath = false;
+    if( !csv.binary() )
+    {
+        if( format.empty() )
+        {
+            while( is.good() && first_line.empty() ) { std::getline( is, first_line ); }
+            if( first_line.empty() ) { exit( 0 ); } // quick and dirty
+            csv.format( comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter ) );
+            if( verbose ) { std::cerr << "csv-intervals: guessed format: " << csv.format().string() << std::endl; }
+        }
+        else { csv.format( format ); }
+    }
+    const std::vector< std::string >& fields = comma::split( csv.fields, ',' );
+    unsigned int from_index = 0;
+    unsigned int to_index = 1;
+    for( unsigned int i = 0; i < fields.size(); ++i ) { if( fields[i] == "from" ) { from_index = i; break; } }
+    for( unsigned int i = 0; i < fields.size(); ++i ) { if( fields[i] == "to" ) { to_index = i; break; } }
+    const comma::csv::format::types_enum from_type = csv.format().offset( from_index ).type;
+    const comma::csv::format::types_enum to_type = csv.format().offset( to_index ).type;
+    if( ( ( from_type == comma::csv::format::time || from_type == comma::csv::format::long_time ) && ( to_type != comma::csv::format::time && to_type != comma::csv::format::long_time ) ) ||
+        ( ( ( from_type != comma::csv::format::time && from_type != comma::csv::format::long_time ) && ( to_type == comma::csv::format::time || to_type == comma::csv::format::long_time ) ) ) )
+        { COMMA_THROW( comma::exception, "from/to type mismatch; time" ); }
+    if( ( from_type == comma::csv::format::fixed_string || to_type == comma::csv::format::fixed_string ) && from_type != to_type )
+        { COMMA_THROW( comma::exception, "from/to type mismatch; string" ); }
+    if( from_type != to_type ) { std::cerr << "csv-intervals: support only from and to of the same type, got from: " << comma::csv::format::to_format( from_type ) << ", to: " << comma::csv::format::to_format( to_type ) << std::endl; exit( 1 ); }
+    return std::make_tuple( to_type, first_line ); // by value: make_tuple copies the locals rather than going through a tuple of references to them
+}
 
 int main( int ac, char** av )
 {
     try
     {
-        comma::command_line_options options( ac, av );
+        comma::command_line_options options( ac, av, usage );
         verbose = options.exists( "--verbose,-v" );
         debug = options.exists( "--debug" );
-        append = options.exists( "--append,-a" );
-        if( options.exists( "--help,-h" ) ) { usage( verbose ); }
-        if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
-        if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
-        comma::csv::options csv( options );
-        if( csv.fields.empty() ) { csv.fields = comma::join( comma::csv::names< interval_t< double > >(), ',' ); }
-        if( !csv.has_field( "from,to" ) ) { COMMA_THROW( comma::exception, "expected from and to fields" ); }
         options.assert_mutually_exclusive( "--binary,--format" );
-        if( options.exists( "--binary,-b" ) ) {}
-        else if( options.exists( "--format" ) ) { csv.format( options.value< std::string >( "--format" ) ); }
-        else
+        const auto& unnamed = options.unnamed( "--append,-a,--debug,--flush,--input-fields,--matching,--not-matching,--output-fields,--intervals-only,--limits,-l,--verbose,-v", "-.*" ); // --verbose,-v is a flag (see options.exists above): listed as valueless so that it does not take the operation name as its value
+        if( unnamed.empty() ) { std::cerr << "csv-intervals: please specify operation" << std::endl; return 1; }
+        std::string operation = unnamed[0];
+        if( operation == "make" )
         {
-            while( std::cin.good() && first_line.empty() ) { std::getline( std::cin, first_line ); }
-            if( first_line.empty() ) { return 0; }
-            csv.format( comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter ) );
-            if( verbose ) { std::cerr << app_name << ": guessed format: " << csv.format().string() << std::endl;; }
+            append = options.exists( "--append,-a" );
+            if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
+            if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< interval_t< double > >(), ',' ) << std::endl; return 0; }
+            comma::csv::options csv( options );
+            auto t = interval_type( std::cin, comma::csv::options( options ), options.value< std::string >( "--format", "" ) ); // only --format, as in usage and the --binary/--format check; NOTE(review): -f presumably belongs to csv --fields - confirm
+            const comma::csv::format::types_enum to_type = std::get< 0 >( t );
+            std::string first_line = std::get< 1 >( t );
+            switch( to_type )
+            {
+                case comma::csv::format::int8:          intervals< char >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::char_t:        intervals< char >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::float_t:       intervals< float >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::double_t:      intervals< double >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::time:
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options, csv ).make( first_line ); return 0;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options, csv ).make( first_line ); return 0;            
+                default:                                COMMA_THROW( comma::exception, "invalid type" ); return 0; // never here
+            }
+            return 0;
         }
-        const std::vector< std::string >& fields = comma::split( csv.fields, ',' );
-        unsigned int from_index = 0;
-        unsigned int to_index = 1;
-        for( unsigned int i = 0; i < fields.size(); ++i ) { if( fields[i] == "from" ) { from_index = i; break; } }
-        for( unsigned int i = 0; i < fields.size(); ++i ) { if( fields[i] == "to" ) { to_index = i; break; } }
-        const comma::csv::format::types_enum from_type = csv.format().offset( from_index ).type;
-        const comma::csv::format::types_enum to_type = csv.format().offset( to_index ).type;
-        if( ( ( from_type == comma::csv::format::time || from_type == comma::csv::format::long_time ) && ( to_type != comma::csv::format::time && to_type != comma::csv::format::long_time ) ) ||
-          ( ( ( from_type != comma::csv::format::time && from_type != comma::csv::format::long_time ) && ( to_type == comma::csv::format::time || to_type == comma::csv::format::long_time ) ) ) )
-        { COMMA_THROW( comma::exception, "from/to type mismatch; time" ); }
-        if( ( from_type == comma::csv::format::fixed_string || to_type == comma::csv::format::fixed_string ) && from_type != to_type )
-        { COMMA_THROW( comma::exception, "from/to type mismatch; string" ); }
-//         switch( from_type )
-//         {
-//             case comma::csv::format::int8:          run< char >( options, to_type ); break;
-//             case comma::csv::format::uint8:         run< unsigned char >( options, to_type ); break;
-//             case comma::csv::format::int16:         run< comma::int16 >( options, to_type ); break;
-//             case comma::csv::format::uint16:        run< comma::uint16 >( options, to_type ); break;
-//             case comma::csv::format::int32:         run< comma::int32 >( options, to_type ); break;
-//             case comma::csv::format::uint32:        run< comma::uint32 >( options, to_type ); break;
-//             case comma::csv::format::int64:         run< comma::int64 >( options, to_type ); break;
-//             case comma::csv::format::uint64:        run< comma::uint64 >( options, to_type ); break;
-//             case comma::csv::format::char_t:        run< char >( options, to_type ); break;
-//             case comma::csv::format::float_t:       run< float >( options, to_type ); break;
-//             case comma::csv::format::double_t:      run< double >( options, to_type ); break;
-//             case comma::csv::format::time:
-//             case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).run(); break;
-//             case comma::csv::format::fixed_string:  intervals< std::string >( options ).run(); break;
-//             default:                                COMMA_THROW( comma::exception, "unknown type" ); break;
-//         }
-        if( from_type != to_type ) { std::cerr << app_name << ": support only from and to of the same type, got from: " << comma::csv::format::to_format( from_type ) << ", to: " << comma::csv::format::to_format( to_type ) << std::endl; return 1; }
-        switch( to_type )
+        if( operation == "contain" )
         {
-            case comma::csv::format::int8:          intervals< char >( options ).run(); break;
-            case comma::csv::format::uint8:         intervals< unsigned char >( options ).run(); break;
-            case comma::csv::format::int16:         intervals< comma::int16 >( options ).run(); break;
-            case comma::csv::format::uint16:        intervals< comma::uint16 >( options ).run(); break;
-            case comma::csv::format::int32:         intervals< comma::int32 >( options ).run(); break;
-            case comma::csv::format::uint32:        intervals< comma::uint32 >( options ).run(); break;
-            case comma::csv::format::int64:         intervals< comma::int64 >( options ).run(); break;
-            case comma::csv::format::uint64:        intervals< comma::uint64 >( options ).run(); break;
-            case comma::csv::format::char_t:        intervals< char >( options ).run(); break;
-            case comma::csv::format::float_t:       intervals< float >( options ).run(); break;
-            case comma::csv::format::double_t:      intervals< double >( options ).run(); break;
-            case comma::csv::format::time:
-            case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options ).run(); break;
-            case comma::csv::format::fixed_string:  intervals< std::string >( options ).run(); break;            
-            default:                                COMMA_THROW( comma::exception, "from/to type mismatch" ); break;
+            if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< scalar_t< double > >(), ',' ) << std::endl; return 0; }
+            if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< scalar_t< double > >(), ',' ) << std::endl; return 0; }
+            auto i = options.value< std::string >( "--intervals" );
+            comma::csv::options csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( i );
+            std::string format = comma::name_value::map( i ).value< std::string >( "format", "" );
+            comma::io::istream is( csv.filename );
+            auto t = interval_type( *is, csv, format );
+            const comma::csv::format::types_enum to_type = std::get< 0 >( t );
+            std::string first_line = std::get< 1 >( t );
+            switch( to_type )
+            {
+                case comma::csv::format::int8:          intervals< char >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::char_t:        intervals< char >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::float_t:       intervals< float >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::double_t:      intervals< double >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::time:
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options, csv ).contain( *is, first_line ); return 0;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options, csv ).contain( *is, first_line ); return 0;            
+                default:                                COMMA_THROW( comma::exception, "invalid type" ); // never here
+            }
+            return 0;
         }
-        return 0;
+        if( operation == "join" )
+        {
+            if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< scalar_t< double > >(), ',' ) << std::endl; return 0; }
+            if( options.exists( "--output-fields" ) ) { std::cerr << "csv-intervals join: does not have --output-fields" << std::endl; return 1; }
+            auto i = options.value< std::string >( "--intervals" );
+            comma::csv::options csv = comma::name_value::parser( "filename" ).get< comma::csv::options >( i );
+            std::string format = comma::name_value::map( i ).value< std::string >( "format", "" );
+            comma::io::istream is( csv.filename );
+            auto t = interval_type( *is, csv, format );
+            const comma::csv::format::types_enum to_type = std::get< 0 >( t );
+            std::string first_line = std::get< 1 >( t );
+            switch( to_type )
+            {
+                case comma::csv::format::int8:          intervals< char >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::uint8:         intervals< unsigned char >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::int16:         intervals< comma::int16 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::uint16:        intervals< comma::uint16 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::int32:         intervals< comma::int32 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::uint32:        intervals< comma::uint32 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::int64:         intervals< comma::int64 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::uint64:        intervals< comma::uint64 >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::char_t:        intervals< char >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::float_t:       intervals< float >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::double_t:      intervals< double >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::time:
+                case comma::csv::format::long_time:     intervals< boost::posix_time::ptime >( options, csv ).join( *is, first_line ); return 0;
+                case comma::csv::format::fixed_string:  intervals< std::string >( options, csv ).join( *is, first_line ); return 0;            
+                default:                                COMMA_THROW( comma::exception, "invalid type" ); // never here
+            }
+            return 0;
+        }
+        std::cerr << "csv-intervals: expected operation, got: '" << operation << "'" << std::endl;
     }
-    catch( std::exception& ex ) { std::cerr << app_name << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << app_name << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "csv-intervals: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-intervals: unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/applications/csv-join.cpp b/csv/applications/csv-join.cpp
index 161a7df33..39fab1839 100644
--- a/csv/applications/csv-join.cpp
+++ b/csv/applications/csv-join.cpp
@@ -1,49 +1,21 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
 #include <string.h>
+#include <functional>
 #include <iostream>
 #include <map>
 #include <sstream>
 #include <string>
+#include <type_traits>
+#include <unordered_map>
 #include <vector>
-#include <boost/array.hpp>
 #include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/functional/hash.hpp>
-#include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
-#include <boost/static_assert.hpp>
-#include <boost/unordered_map.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
@@ -68,14 +40,17 @@ static void usage( bool more )
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
+    std::cerr << "    --block-less; todo! better option name! input and filter block ids expected sorted" << std::endl;
+    std::cerr << "                  todo! document" << std::endl;
+    std::cerr << "    --drop-id-fields,--drop-id; remove id and block fields from filter output (same as if you did csv-join|csv-shuffle)" << std::endl;
     std::cerr << "    --first-matching: output only the first matching record (a bit of hack for now, but we needed it)" << std::endl;
     std::cerr << "    --flag-matching: output all records, with 1 appended to matching records and 0 appended to not-matching records" << std::endl;
     std::cerr << "    --matching: output only matching records from stdin" << std::endl;
     std::cerr << "    --nearest: if --radius specified, output only nearest record" << std::endl;
     std::cerr << "    --not-matching: not matching records as read from stdin, no join performed" << std::endl;
-    std::cerr << "    --strict: fail, if id on stdin is not found, or there are multiple filter keys on --unique, etc" << std::endl;
+    std::cerr << "    --output-swap,--swap-output,--swap; output filter records first with the stdin record appended, a convenience option" << std::endl;
     std::cerr << "    --radius,--epsilon=<value>; compare keys in given radius; the keys will be interpreted as floating point numbers" << std::endl;
-    std::cerr << "    --swap-output,--swap; output filter records first with the stdin record appended, a convenience option" << std::endl;
+    std::cerr << "    --strict: fail, if id on stdin is not found, or there are multiple filter keys on --unique, etc" << std::endl;
     std::cerr << "    --unique,--unique-matches: expect only unique matches, exit with error otherwise" << std::endl;
     std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
     std::cerr << std::endl;
@@ -105,40 +80,59 @@ static void usage( bool more )
         std::cerr << "        any other field name: key" << std::endl;
         std::cerr << std::endl;
         std::cerr << "        block acts as a key but stream processing occurs at the end of each" << std::endl;
-        std::cerr << "        block. If no block field is given the entire input is considered to be" << std::endl;
-        std::cerr << "        one block. Blocks are required to be contiguous in the input stream." << std::endl;
+        std::cerr << "        block; if no block field is given the entire input is considered to be" << std::endl;
+        std::cerr << "        one block; blocks are required to be contiguous in the input stream" << std::endl;
+    }
+    else
+    {
+        std::cerr << "    run csv-join --help --verbose for more..." << std::endl;
     }
     std::cerr << std::endl;
-    std::cerr << "Examples (try them):" << std::endl;
-    std::cerr << "    on the following data file:" << std::endl;
-    std::cerr << "        echo 1,1,2,hello > data.csv" << std::endl;
-    std::cerr << "        echo 1,2,3,hello >> data.csv" << std::endl;
-    std::cerr << "        echo 3,3,4,world >> data.csv" << std::endl;
-    std::cerr << "        echo 3,4,3,world >> data.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    join with a matching record" << std::endl;
-    std::cerr << "        echo 1,blah | csv-join --fields=id \"data.csv;fields=id\"" << std::endl;
-    std::cerr << "        echo 3,blah | csv-join --fields=id \"data.csv;fields=,,id\"" << std::endl;
-    std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\"" << std::endl;
-    std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\" --not-matching" << std::endl;
-    std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\" --strict" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    join by key which is a string" << std::endl;
-    std::cerr << "        echo 1,hello | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
-    std::cerr << "        echo 1,world | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
-    std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
-    std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string --not-matching" << std::endl;
-    std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string --strict" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    finite state machine" << std::endl;
-    std::cerr << "        csv-join --fields=event \"data.csv;fields=event,state,next_state\" --initial-state 1" << std::endl;
-    std::cerr << "        <input:1>" << std::endl;
-    std::cerr << "        <input:1>" << std::endl;
-    std::cerr << "        <input:3>" << std::endl;
-    std::cerr << "        <input:3>" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
+    if( more )
+    {
+        std::cerr << "examples (try them)" << std::endl;
+        std::cerr << "    on the following data file:" << std::endl;
+        std::cerr << "        echo 1,1,2,hello > data.csv" << std::endl;
+        std::cerr << "        echo 1,2,3,hello >> data.csv" << std::endl;
+        std::cerr << "        echo 3,3,4,world >> data.csv" << std::endl;
+        std::cerr << "        echo 3,4,3,world >> data.csv" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    join with a matching record" << std::endl;
+        std::cerr << "        echo 1,blah | csv-join --fields=id \"data.csv;fields=id\"" << std::endl;
+        std::cerr << "        echo 3,blah | csv-join --fields=id \"data.csv;fields=,,id\"" << std::endl;
+        std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\"" << std::endl;
+        std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\" --not-matching" << std::endl;
+        std::cerr << "        echo 5,blah | csv-join --fields=id \"data.csv;fields=,,id\" --strict" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    join by key which is a string" << std::endl;
+        std::cerr << "        echo 1,hello | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
+        std::cerr << "        echo 1,world | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
+        std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string" << std::endl;
+        std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string --not-matching" << std::endl;
+        std::cerr << "        echo 1,blah | csv-join --fields=,id \"data.csv;fields=,,,id\" --string --strict" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    block id ordered, gaps in filter blocks allowed" << std::endl;
+        std::cerr << "        csv-paste line-number value=0 | head \\" << std::endl;
+        std::cerr << "            | csv-join --fields block,id <( echo 3,0; echo 6,0 )';fields=block,id' --block-less" << std::endl;
+        std::cerr << "    finite state machine" << std::endl;
+        std::cerr << "        csv-join --fields=event \"data.csv;fields=event,state,next_state\" --initial-state 1" << std::endl;
+        std::cerr << "        <input:1>" << std::endl;
+        std::cerr << "        <input:1>" << std::endl;
+        std::cerr << "        <input:3>" << std::endl;
+        std::cerr << "        <input:3>" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    --drop-id (same would work in binary as well)" << std::endl;
+        std::cerr << "        > echo 0,1,2,3 | csv-join --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y'" << std::endl;
+        std::cerr << "        0,1,2,3,1,A,B,3" << std::endl;
+        std::cerr << "        > echo 0,1,2,3 | csv-join --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y' --drop-id" << std::endl;
+        std::cerr << "        0,1,2,3,A,B" << std::endl;
+        std::cerr << std::endl;
+    }
+    else
+    {
+        std::cerr << "examples" << std::endl;
+        std::cerr << "    run csv-join --help --verbose for more..." << std::endl;
+    }
     exit( 0 );
 }
 
@@ -153,14 +147,18 @@ static bool flag_matching;
 static bool swap_output;
 static comma::csv::options stdin_csv;
 static comma::csv::options filter_csv;
+static bool filter_id_fields_discard; // todo: super-quick and dirty, put in a separate class
+static std::vector< unsigned int > filter_id_fields_flags; // todo: super-quick and dirty, put in a separate class
+static std::vector< std::pair< unsigned int, unsigned int > > filter_id_fields_offsets; // todo: super-quick and dirty, put in a separate class
+static unsigned int filter_id_fields_size{0}; // todo: super-quick and dirty, put in a separate class
 boost::scoped_ptr< comma::io::istream > filter_transport;
 static comma::uint32 block = 0;
 static boost::optional< double > radius;
 
 static void hash_combine_( std::size_t& seed, boost::posix_time::ptime key )
 {
-    BOOST_STATIC_ASSERT( sizeof( boost::posix_time::ptime ) == 8 );
-    boost::hash_combine( seed, *reinterpret_cast< const long long* >( &key ) );
+    static_assert( sizeof( boost::posix_time::ptime ) == 8, "expected time of size 8" );
+    boost::hash_combine( seed, *reinterpret_cast< const comma::uint64* >( &key ) );
 }
 
 template < typename K > static void hash_combine_( std::size_t& seed, K key ) { boost::hash_combine( seed, key ); }
@@ -189,7 +187,7 @@ struct input
         return comma::math::less( keys[0], rhs.keys[0] ); //, *radius );
     }
 
-    struct hash : public std::unary_function< input, std::size_t >
+    struct hash // plain function object: std::unordered_map only requires a callable hasher, so no base class is needed
     {
         std::size_t operator()( input const& p ) const
         {
@@ -199,7 +197,7 @@ struct input
         }
     };
 
-    typedef boost::unordered_map< input, std::vector< std::string >, hash > unordered_map;
+    typedef std::unordered_map< input, std::vector< std::string >, hash > unordered_map;
     typedef std::map< input, std::vector< std::string > > map;
 };
 
@@ -295,6 +293,7 @@ template < typename T > static std::string keys_as_string( const input< T >& i )
 {
     std::ostringstream oss;
     comma::csv::options csv;
+    csv.full_xpath = false;
     csv.fields = "keys";
     comma::csv::ascii_output_stream< input< T > > os( oss, csv, i );
     os.write( i );
@@ -306,49 +305,79 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
     static typename traits< K, Strict >::map filter_map;
     static input< K > default_input;
 
-    static void read_filter_block()
+    static std::string make_output( const std::vector< std::string >& values ) // todo? implement something like comma::join( values, drop )?
+    { // joins ascii filter fields with the stdin delimiter, leaving out the fields flagged in filter_id_fields_flags
+        if( filter_id_fields_flags.empty() ) { return comma::join( values, stdin_csv.delimiter ); } // nothing flagged: plain join
+        const std::string separator( 1, stdin_csv.delimiter );
+        std::string joined; bool first = true;
+        for( std::size_t k = 0; k < values.size(); ++k ) // fields past the end of the flags are always kept
+        {
+            if( k < filter_id_fields_flags.size() && filter_id_fields_flags[k] != 0 ) { continue; } // flagged field: leave it out
+            if( first ) { first = false; } else { joined += separator; } // separator only between kept fields
+            joined += values[k];
+        }
+        return joined;
+    }
+
+    // copy a binary filter record into a string, skipping the byte ranges listed in filter_id_fields_offsets (--drop-id)
+    static std::string make_output( const char* values ) // todo? quick and dirty for now; use csv::binary? or implement something like csv::format::drop_fields...?
+    {
+        const std::size_t record_size = filter_csv.format().size();
+        std::string s( record_size - filter_id_fields_size, '\0' );
+        if( filter_id_fields_flags.empty() ) // nothing to drop: copy the record verbatim
+        {
+            ::memcpy( &s[0], values, record_size );
+            return s;
+        }
+        char* p = &s[0]; // write position in s
+        unsigned int t = 0; // read position in values, just past the last dropped range
+        for( const auto& e: filter_id_fields_offsets ) // e: ( offset, size ) of a dropped field, pushed in field order by run()
+        {
+            unsigned int c = e.first - t; // bytes kept between the previous dropped range and this one
+            ::memcpy( p, values + t, c ); // global ::memcpy throughout: the file includes <string.h>
+            p += c;
+            t = e.first + e.second;
+        }
+        ::memcpy( p, values + t, record_size - t ); // tail after the last dropped range
+        return s;
+    }
+
+    static const input< K >* read_filter_block()
     {
         static comma::csv::input_stream< input< K > > filter_stream( **filter_transport, filter_csv, default_input );
         static const input< K >* last = filter_stream.read();
         filter_map.clear();
-        if( !last ) { return; }
+        if( !last ) { return last; }
         block = last->block;
         comma::uint64 count = 0;
         static comma::signal_flag is_shutdown( comma::signal_flag::hard );
         while( last->block == block && !is_shutdown )
         {
-            typename traits< K, Strict >::map::mapped_type& d = filter_map[ *last ];
-            if( filter_stream.is_binary() )
-            {
-                typename traits< K, Strict >::map::mapped_type& d = filter_map[ *last ];
-                d.push_back( std::string() );
-                d.back().resize( filter_csv.format().size() );
-                ::memcpy( &d.back()[0], filter_stream.binary().last(), filter_csv.format().size() );
-            }
-            else
-            {
-                d.push_back( comma::join( filter_stream.ascii().last(), stdin_csv.delimiter ) );
-            }
+            filter_map[ *last ].push_back( filter_stream.is_binary() ? make_output( filter_stream.binary().last() ) : make_output( filter_stream.ascii().last() ) );
             if( verbose ) { ++count; if( count % 10000 == 0 ) { std::cerr << "csv-join: reading block " << block << "; loaded " << count << " point" << ( count == 1 ? "" : "s" ) << "; hash map size: " << filter_map.size() << std::endl; } }
             //if( ( *filter_transport )->good() && !( *filter_transport )->eof() ) { break; }
             last = filter_stream.read();
             if( !last ) { break; }
         }
         if( verbose ) { std::cerr << "csv-join: read block " << block << " of " << count << " point" << ( count == 1 ? "" : "s" ) << "; hash map size: " << filter_map.size() << std::endl; }
+        return last;
     }
 
     static int run( const comma::command_line_options& options )
     {
+        bool block_less = options.exists( "--block-less" );
         std::vector< std::string > v = comma::split( stdin_csv.fields, ',' );
         std::vector< std::string > w = comma::split( filter_csv.fields, ',' );
+        if( filter_id_fields_discard ) { filter_id_fields_flags.resize( w.size(), 0 ); }
         bool got_state = false;
         bool got_next_state = false;
-        std::size_t filter_state_index;
+        std::size_t filter_state_index{0};
         for( std::size_t k = 0; k < w.size() && ( !got_state || !got_next_state ); ++k ) 
         {
             if( w[k] == "state" ) { got_state = true; filter_state_index = k; continue; }
             if( w[k] == "next_state" ) { got_next_state = true; continue; }
         }
+        if( ( got_state || got_next_state ) && filter_id_fields_discard ) { std::cerr << "csv-join: --drop-id and 'state' or 'next_state' are mutually exclusive" << std::endl; return 1; }
         bool is_state_machine = got_state && got_next_state;
         std::size_t default_input_keys_count = 0;
         bool no_stdin_key_fields = true;
@@ -361,12 +390,26 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
             {
                 if( is_state_machine && ( w[k] == "state" || w[k] == "next_state" ) ) { no_filter_key_fields = false; continue; }
                 if( !w[k].empty() && w[k] != "block" ) { no_filter_key_fields = false; }
+                if( filter_id_fields_discard && w[k] == "block" ) { filter_id_fields_flags[k] = 1; }
                 if( v[i] != w[k] ) { continue; }
-                v[i] = "keys[" + boost::lexical_cast< std::string >( default_input_keys_count ) + "]";
-                w[k] = "keys[" + boost::lexical_cast< std::string >( default_input_keys_count ) + "]";
+                v[i] = "keys[" + std::to_string( default_input_keys_count ) + "]";
+                w[k] = "keys[" + std::to_string( default_input_keys_count ) + "]";
+                if( filter_id_fields_discard ) { filter_id_fields_flags[k] = 1; }
                 ++default_input_keys_count;
             }
         }
+        if( filter_csv.binary() ) // todo: super-quick and dirty; move all the --drop-id stuff to a class
+        {
+            for( unsigned int i = 0; i < filter_id_fields_flags.size(); ++i )
+            {
+                if( filter_id_fields_flags[i] )
+                { 
+                    const auto& e = filter_csv.format().offset( i );
+                    filter_id_fields_offsets.push_back( { e.offset, e.size } );
+                    filter_id_fields_size += e.size;
+                }
+            }
+        }
         bool do_full_join = no_stdin_key_fields && no_filter_key_fields;
         if( default_input_keys_count == 0 && !do_full_join ) { std::cerr << "csv-join: please specify at least one common key; fields: " << stdin_csv.fields << "; filter fields: " << filter_csv.fields << std::endl; return 1; }
         //if( default_input_keys_count == 0 ) { std::cerr << "csv-join: please specify at least one common key; fields: " << stdin_csv.fields << "; filter fields: " << filter_csv.fields << std::endl; return 1; }
@@ -375,7 +418,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         if( is_state_machine )
         {
             state_index = default_input_keys_count;
-            w[filter_state_index] = "keys[" + boost::lexical_cast< std::string >( state_index ) + "]";
+            w[filter_state_index] = "keys[" + std::to_string( state_index ) + "]";
             ++default_input_keys_count;
         }
         default_input.keys.resize( default_input_keys_count );
@@ -390,7 +433,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         filter_transport.reset( new comma::io::istream( filter_csv.filename, filter_csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii ) );
         if( filter_transport->fd() == comma::io::invalid_file_descriptor ) { std::cerr << "csv-join: failed to open \"" << filter_csv.filename << "\"" << std::endl; return 1; }
         std::size_t discarded = 0;
-        read_filter_block();
+        auto last = read_filter_block();
         #ifdef WIN32
         if( stdin_stream.is_binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
@@ -398,7 +441,18 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
         {
             const input< K >* p = stdin_stream.read();
             if( !p ) { break; }
-            if( block != p->block ) { read_filter_block(); }
+            if( block_less )
+            {
+                if( p->block < block ) { continue; }
+                while( last && p->block >= last->block )
+                {
+                    last = read_filter_block();
+                }
+            }
+            else
+            {
+                if( p->block != block ) { last = read_filter_block(); }
+            }
             typename traits< K, Strict >::pair pair;
             if( is_state_machine )
             {
@@ -430,6 +484,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
                 if( !strict ) { ++discarded; continue; }
                 std::string s;
                 comma::csv::options c;
+                c.full_xpath = false;
                 c.fields = "keys";
                 std::cerr << "csv-join: match not found for key(s): " << comma::csv::ascii< input< K > >( c, default_input ).put( *p, s ) << ", block: " << block << std::endl;
                 return 1;
@@ -451,7 +506,7 @@ template < typename K, bool Strict = true > struct join_impl_ // quick and dirty
                         if( is_state_machine ) { state = it->first.next_state; }
                         if( flag_matching ) { char match = 1; std::cout.write( &match, 1 ); break; }
                         if( matching ) { break; }
-                        std::cout.write( &( it->second[i][0] ), filter_csv.format().size() );
+                        std::cout.write( &( it->second[i][0] ), it->second[i].size() );
                         if( swap_output ) { std::cout.write( stdin_stream.binary().last(), stdin_csv.format().size() ); }
                         std::cout.flush();
                     }
@@ -499,13 +554,15 @@ int main( int ac, char** av )
         flag_matching = options.exists( "--flag-matching" );
         radius = options.optional< double >( "--radius,--epsilon" );
         nearest = options.exists( "--nearest" );
-        swap_output = options.exists( "--swap-output,--swap" );
+        swap_output = options.exists( "--output-swap,--swap-output,--swap" );
+        filter_id_fields_discard = options.exists( "--drop-id-fields,--drop-id" );
         if( nearest && !radius ) { std::cerr << "csv-join: if using --nearest, please specify --radius" << std::endl; return 1; }
-        options.assert_mutually_exclusive( "--matching,--not-matching,--flag-matching,--swap-output,--swap" );
+        options.assert_mutually_exclusive( "--matching,--not-matching,--flag-matching,--swap-output,--swap,--output-swap" );
         options.assert_mutually_exclusive( "--radius,--epsilon,--first-matching" );
         options.assert_mutually_exclusive( "--radius,--epsilon,--string,-s,--double,--time" );
+        options.assert_mutually_exclusive( "--matching,--not-matching", "--drop-id-fields,--drop-id" );
         stdin_csv = comma::csv::options( options );
-        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--verbose,-v,--block-less,--first-matching,--matching,--not-matching,--string,-s,--time,--double,--strict,--swap-output,--swap,--output-swap,--nearest,--drop-id-fields,--drop-id", "-.*" );
         if( unnamed.empty() ) { std::cerr << "csv-join: please specify the second source" << std::endl; return 1; }
         if( unnamed.size() > 1 ) { std::cerr << "csv-join: expected one file or stream to join, got " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
         comma::name_value::parser parser( "filename", ';', '=', false );
diff --git a/csv/applications/csv-paste.cpp b/csv/applications/csv-paste.cpp
index ef711b9da..ec660a6ea 100644
--- a/csv/applications/csv-paste.cpp
+++ b/csv/applications/csv-paste.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -37,7 +9,6 @@
 #include <boost/lexical_cast.hpp>
 #include <boost/ptr_container/ptr_vector.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/format.h"
 #include "../../io/stream.h"
@@ -71,18 +42,32 @@ static void usage( bool verbose )
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --delimiter,-d <delimiter> : default ','" << std::endl;
+    std::cerr << "    --flush; flush stdout on every record" << std::endl;
+    std::cerr << "    --head=[<n>]; output first <n> records and exit; convenience option, e.g. try:" << std::endl;
+    std::cerr << "        csv-paste 'line-number;size=4' 'line-number;size=4;index' --head=16" << std::endl;
     std::cerr << "    --help,-h : help, --help --verbose for more help" << std::endl;
     std::cerr << "    --verbose,-v; more debug output" << std::endl;
     std::cerr << std::endl;
     std::cerr << "inputs" << std::endl;
-    std::cerr << "    <file> : <filename>[;size=<size>|binary=<format>]: file name or \"-\" for stdin; specify size or format, if binary" << std::endl;
+    std::cerr << "    <file> : <filename>[;<properties>]: file name or \"-\" for stdin; specify size or format, if binary" << std::endl;
+    std::cerr << "        properties" << std::endl;
+    std::cerr << "            binary=<format>: if input is binary, record binary format; or use 'size'" << std::endl;
+    std::cerr << "            block-size=<block-size>; repeat each record <block-size> times" << std::endl;
+    std::cerr << "            size=<size>; if input is binary, record size in bytes; or use 'binary'" << std::endl;
     std::cerr << "    value : value=<csv values>[;binary=<format>]; specify size or format, if binary" << std::endl;
     std::cerr << "    line-number[;<options>] : add the line number; as ui, if binary (quick and dirty, will override the file named \"line-number\")" << std::endl;
     std::cerr << "        options" << std::endl;
-    std::cerr << "            --begin <index>: start line number count at <index>; default: 0" << std::endl;
+    std::cerr << "            --begin <index>: start line number count at <index>, can be negative; default: 0" << std::endl;
+    std::cerr << "            --block-size,--size=<size>: number of records with the same line number; default: 1" << std::endl;
+    std::cerr << "                 WARNING: --size: deprecated, since it is confusing for files" << std::endl;
     std::cerr << "            --index; instead of block number output record index in the block" << std::endl;
+    std::cerr << "            --repeat=[<n>]; repeat a given pattern <n> times" << std::endl;
+    std::cerr << "                no --size: same as --head" << std::endl;
+    std::cerr << "                --size: repeat block of a given size <n> times" << std::endl;
+    std::cerr << "                --shape: repeat a given shape <n> times, e.g. 'line-number;shape=4,3,5;repeat=2'" << std::endl;
     std::cerr << "            --reverse; if --index, output index in descending order" << std::endl;
-    std::cerr << "            --size,--block-size <size>: number of records with the same line number; default: 1" << std::endl;
+    std::cerr << "            --shape=<shape>; iterate through indices of a given shape; <shape>: same meaning as in numpy, e.g. 'line-number;shape=10,5,4'" << std::endl;
+    std::cerr << "            --step=<value>; default=1; line number increment/decrement step" << std::endl;        
     std::cerr << "        examples (try them)" << std::endl;
     std::cerr << "            line number" << std::endl;
     std::cerr << "                seq 0 20 | csv-paste - line-number --begin 5 --size 3" << std::endl;
@@ -94,7 +79,6 @@ static void usage( bool verbose )
     std::cerr << "csv format parameters" << std::endl;
     if( verbose ) { std::cerr << comma::csv::format::usage() << std::endl; } else { std::cerr << "    run csv-paste --help --verbose for more..." << std::endl; }
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
@@ -102,19 +86,20 @@ static void usage( bool verbose )
 class source
 {
     public:
-        source( const std::string& properties = "" ) : properties_( properties )
+        source( const std::string& properties = "" ) : properties_( properties ), block_count_( 0 ), buf_( nullptr )
         {
             comma::name_value::map map( properties, ';', '=' );
             format_ = comma::csv::format( map.value< std::string >( "binary", "" ) );
             unsigned int size = map.value< unsigned int >( "size", format_.size() );
             binary_ = size > 0;
             value_ = std::string( size, 0 );
+            block_size_ = map.value< unsigned int >( "block-size", 1 ); if( block_size_ == 0 ) { COMMA_THROW( comma::exception, "expected positive block-size in '" << properties << "'; got: 0" ); } // with block-size=0 the repeat counter would never match and the first record would keep being repeated
         }
         virtual ~source() {}
         virtual const std::string* read() = 0;
         virtual const char* read( char* buf ) = 0;
         bool binary() const { return binary_; }
-        virtual const bool is_stream() const { return false; }
+        virtual bool is_stream() const { return false; }
         const std::string& properties() const { return properties_; }
         std::size_t size() const { return value_.size(); }
         
@@ -123,6 +108,9 @@ class source
         bool binary_;
         comma::csv::format format_;
         std::string properties_;
+        unsigned int block_size_;
+        unsigned int block_count_;
+        const char* buf_;
 };
 
 class stream : public source
@@ -136,22 +124,35 @@ class stream : public source
         
         const std::string* read()
         {
-            while( stream_->good() && !stream_->eof() )
+            if( block_count_ == block_size_ || value_.empty() ) // cached line has been handed out block_size_ times, or there is no cached line: fetch the next one
             {
-                std::getline( *stream_, value_ );
-                if( !value_.empty() && *value_.rbegin() == '\r' ) { value_ = value_.substr( 0, value_.length() - 1 ); } // windows... sigh...
-                if( !value_.empty() ) { return &value_; }
+                block_count_ = 1;
+                while( stream_->good() && !stream_->eof() )
+                {
+                    std::getline( *stream_, value_ );
+                    if( !value_.empty() && *value_.rbegin() == '\r' ) { value_ = value_.substr( 0, value_.length() - 1 ); } // windows... sigh...
+                    if( !value_.empty() ) { return &value_; }
+                }
+                return nullptr;
             }
-            return NULL;
+            ++block_count_; // still inside the current block: repeat the cached line
+            return &value_;
         }
 
         const char* read( char* buf )
         {
-            stream_->read( buf, value_.size() );
-            return stream_->gcount() == int( value_.size() ) ? buf : NULL;
+            if( block_count_ == block_size_ || buf_ == nullptr )
+            {
+                block_count_ = 1;
+                buf_ = buf; // quick and dirty: remember the caller's buffer so the same record can be returned for the rest of the block without re-reading
+                stream_->read( buf, value_.size() );
+                return stream_->gcount() == int( value_.size() ) ? buf : nullptr;
+            }
+            ++block_count_;
+            return buf_;
         }
         
-        const bool is_stream() { return true; }
+        bool is_stream() const { return true; }
         
     private:
         comma::io::istream stream_;
@@ -176,79 +177,120 @@ class line_number : public source
         class options
         {
             public:
-                comma::uint32 size;
-                bool index;
-                bool reverse;
-                comma::uint32 begin;
+                comma::uint32 size{0};
+                bool index{false};
+                bool reverse{false};
+                comma::int32 step{0};
+                comma::int32 begin{0};
+                std::vector< comma::uint32 > shape;
+                std::string format;
+                comma::uint32 repeat{0};
                 
-                options( boost::optional< comma::uint32 > b = boost::optional< comma::uint32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false )
+                options( const boost::optional< comma::int32 >& b = boost::optional< comma::int32 >(), comma::uint32 size = 1, bool index = false, bool reverse = false, int s = 1, unsigned int repeat = 0 )
                     : size( size )
                     , index( index )
                     , reverse( reverse )
+                    , step( s )
                     , begin( begin_( b ) )
+                    , repeat( repeat )
                 {
                 }
                 
                 options( const std::string& properties, const comma::command_line_options& o ) // quick and dirty: use visiting instead
                 {
-                    options defaults( boost::optional< comma::uint32 >(), o.value< comma::uint32 >( "--size,--block-size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ) );
+                    o.assert_mutually_exclusive( "--shape", "--block-size,--size,--reverse,--begin" );
+                    options defaults( boost::optional< comma::int32 >(), o.value< comma::uint32 >( "--block-size,--size", 1 ), o.exists( "--index" ), o.exists( "--reverse" ), o.value< comma::int32 >( "--step", 1 ), o.value< comma::uint32 >( "--repeat", 0 ) );
                     comma::name_value::map map( properties, ';', '=' );
-                    size = map.value< comma::uint32 >( "size", defaults.size );
-                    index = map.value< bool >( "index", defaults.index );
-                    reverse = map.value< bool >( "reverse", defaults.reverse );
-                    auto b = map.optional< comma::uint32 >( "begin" );
-                    if( !b ) { b = o.optional< comma::uint32 >( "--begin" ); }
-                    begin = begin_( b );
+                    map.assert_mutually_exclusive( "shape", "block-size,size,reverse,begin,step" );
+                    std::string s = map.value< std::string >( "shape", o.value< std::string >( "--shape", "" ) );
+                    format = map.value< std::string >( "binary", "" );
+                    if( s.empty() )
+                    {
+                        size = map.value< comma::uint32 >( map.get().find( "block-size" ) != map.get().end() ? "block-size" : "size", defaults.size ); // quick and dirty
+                        index = map.value< bool >( "index", defaults.index );
+                        reverse = map.value< bool >( "reverse", defaults.reverse );
+                        step = map.value< comma::int32 >( "step", defaults.step );
+                        auto b = map.optional< comma::int32 >( "begin" );
+                        if( !b ) { b = o.optional< comma::int32 >( "--begin" ); }
+                        begin = begin_( b );
+                        if( !format.empty() && format != "ui" ) { std::cerr << "csv-paste: currently only ui supported for line-number; got: '" << format << "'" << std::endl; exit( 1 ); } // quick and dirty for now
+                    }
+                    else
+                    {
+                        auto v = comma::split( s, ',' );
+                        shape.resize( v.size() );
+                        for( unsigned int i = 0; i < v.size(); ++i ) { shape[i] = boost::lexical_cast< unsigned int >( v[i] ); }
+                    }
+                    repeat = map.value< comma::uint32 >( "repeat", defaults.repeat ); // unsigned, same as the member and as --repeat on the command line
                 }
                 
             private:
-                comma::uint32 begin_( const boost::optional< comma::uint32 >& b )
+                comma::int32 begin_( const boost::optional< comma::int32 >& b ) // todo! handle size correctly for negative values for begin and step
                 {
-                    if( index && reverse && b && ( *b + 1 ) < size ) { COMMA_THROW( comma::exception, "for --reverse --index, for --size " << size << " expected --begin not less than " << ( size - 1 ) << "; got: " << *b ); }
-                    return b ? *b : reverse ? size - 1 : 0;
+                    if( index && reverse && b && ( *b + step ) < int( size ) * step ) { COMMA_THROW( comma::exception, "for --reverse --index, for --size " << size << " expected --begin not less than " << ( size - 1 ) << "; got: " << *b ); }
+                    return b ? *b : reverse ? ( size - 1 ) * step : 0;
                 }
         };
         
         line_number( bool is_binary, const options& options )
-            : source( is_binary ? "binary=ui" : "" )
+            : source( options.format.empty() ? ( is_binary ? options.shape.empty() ? std::string ( "binary=ui" ) : "binary=" + boost::lexical_cast< std::string >( options.shape.size() ) + "ui" : std::string() ) : "binary=" + options.format ) // quick and dirty
             , options_( options )
             , count_( 0 )
             , value_( options_.begin )
+            , values_( options_.shape.size(), 0 )
         {
         }
         
         const std::string* read()
         { 
-            serialized_ = boost::lexical_cast< std::string >( value_ );
-            update_();
-            return &serialized_;
+            serialized_ = values_.empty() ? boost::lexical_cast< std::string >( value_ ) : comma::join( values_, ',' );
+            return update_() ? &serialized_ : nullptr;
         }
         
         const char* read( char* buf ) // quick and dirty
         {
-            comma::csv::format::traits< comma::uint32 >::to_bin( value_, buf );
-            update_();
-            return buf;
+            if( values_.empty() ) { comma::csv::format::traits< comma::int32 >::to_bin( value_, buf ); }
+            else { char* p = buf; for( unsigned int i = 0; i < values_.size(); ++i, p += sizeof( comma::uint32 ) ) { comma::csv::format::traits< comma::uint32 >::to_bin( values_[i], p ); } } // write through a cursor so that buf still points at the start of the record when returned
+            return update_() ? buf : nullptr;
         }
         
     private:
         options options_;
-        comma::uint32 count_;
-        comma::uint32 value_;
+        comma::uint32 count_{0};
+        comma::int32 value_{0};
+        comma::uint32 _repeats{0};
+        std::vector< comma::uint32 > values_;
         std::string serialized_;
+        bool _done{false};
         
-        void update_()
+        bool update_()
         {
-            ++count_;
-            if( count_ < options_.size )
+            if( _done ) { return false; }
+            if( values_.empty() )
             {
-                if( options_.index ) { value_ += options_.reverse ? -1 : 1; }
+                ++count_; //count_ += options_.step;
+                if( count_ < options_.size )
+                {
+                    if( options_.index ) { value_ += options_.reverse ? -options_.step : options_.step; }
+                }
+                else
+                {
+                    value_ = options_.index ? options_.begin : ( value_ + options_.step );
+                    count_ = 0;
+                    if( options_.repeat > 0 ) { ++_repeats; if( _repeats == options_.repeat ) { _done = true; } }
+                }
             }
             else
             {
-                value_ = options_.index ? options_.begin : ( value_ + 1 );
-                count_ = 0;
+                for( int i = values_.size() - 1; i >= 0; --i )
+                {
+                    ++values_[i];
+                    if( values_[i] < options_.shape[i] ) { break; }
+                    if( i == 0 && options_.repeat > 0 ) { ++_repeats; if( _repeats == options_.repeat ) { _done = true; } }
+                    values_[i] = 0;
+                }
             }
+            return true;
         }
 };
 
@@ -258,14 +300,16 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         char delimiter = options.value( "--delimiter,-d", ',' );
-        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--block-size" );
+        std::vector< std::string > unnamed = options.unnamed( "--flush,--index,--reverse", "--delimiter,-d,--begin,--size,--step,--block-size,--head,--repeat,--shape" ); // --shape takes a value, too: list it so that its value is not taken for an input
+        bool flush = options.exists( "--flush" );
         boost::ptr_vector< source > sources;
         bool is_binary = false;
-        for( unsigned int i = 0; i < unnamed.size(); ++i ) // quick and dirty
+        boost::optional< comma::uint32 > head = options.optional< comma::uint32 >( "--head" );
+        for( unsigned int i = 0; i < unnamed.size(); ++i ) // quick and dirty; really lousy code duplication
         {
             if( unnamed[i].substr( 0, 6 ) == "value=" ) { if( value( unnamed[i] ).binary() ) { is_binary = true; } }
-            else if( unnamed[i] == "line-number" || unnamed[i].substr( 0, 12 ) == "line-number;" ) { continue; } // quick and dirty
-            if( stream( unnamed[i] ).binary() ) { is_binary = true; }
+            else if( unnamed[i] == "line-number" || unnamed[i].substr( 0, 12 ) == "line-number;" ) { if( line_number( is_binary, line_number::options( unnamed[i], options ) ).binary() ) { is_binary = true; } } // quick and dirty
+            else if( stream( unnamed[i] ).binary() ) { is_binary = true; }
         }
         for( unsigned int i = 0; i < unnamed.size(); ++i )
         {
@@ -295,13 +339,13 @@ int main( int ac, char** av )
             std::size_t size = 0;
             for( unsigned int i = 0; i < sources.size(); ++i ) { size += sources[i].size(); }
             std::vector< char > buffer( size );
-            while( true )
+            while( !head || ( *head )-- )
             {
                 unsigned int streams = 0;
                 char* p = &buffer[0];
                 for( unsigned int i = 0; i < sources.size(); p += sources[i].size(), ++i )
                 {
-                    if( sources[i].read( p ) == NULL )
+                    if( sources[i].read( p ) == nullptr )
                     {
                         if( streams == 0 ) { return 0; }
                         std::cerr << "csv-paste: unexpected end of file in " << unnamed[i] << std::endl;
@@ -310,29 +354,28 @@ int main( int ac, char** av )
                     if( sources[i].is_stream() ) { ++streams; }
                 }
                 std::cout.write( &buffer[0], buffer.size() );
-                std::cout.flush();
+                if( flush ) { std::cout.flush(); }
             }
+            return 0;
         }
-        else
+        while( !head || ( *head )-- )
         {
-            while( true )
+            std::ostringstream oss;
+            unsigned int streams = 0;
+            for( unsigned int i = 0; i < sources.size(); ++i )
             {
-                std::ostringstream oss;
-                unsigned int streams = 0;
-                for( unsigned int i = 0; i < sources.size(); ++i )
+                const std::string* s = sources[i].read();
+                if( s == nullptr )
                 {
-                    const std::string* s = sources[i].read();
-                    if( s == NULL )
-                    {
-                        if( streams == 0 ) { return 0; }
-                        std::cerr << "csv-paste: unexpected end of file in " << unnamed[i] << std::endl; return 1;
-                    }
-                    if (sources[i].is_stream()) ++streams;
-                    if( i > 0 ) { oss << delimiter; }
-                    oss << *s;
+                    if( streams == 0 ) { return 0; }
+                    std::cerr << "csv-paste: unexpected end of file in " << unnamed[i] << std::endl;
+                    return 1;
                 }
-                std::cout << oss.str() << std::endl;
+                if( sources[i].is_stream() ) { ++streams; }
+                if( i > 0 ) { oss << delimiter; }
+                oss << *s;
             }
+            std::cout << oss.str() << std::endl;
         }
         return 0;
     }
@@ -340,124 +383,3 @@ int main( int ac, char** av )
     catch( ... ) { std::cerr << "csv-paste: unknown exception" << std::endl; }
     return 1;
 }
-
-
-// int main( int ac, char** av )
-// {
-//     bool show_usage = true;
-//     try
-//     {
-//         comma::command_line_options options( ac, av );
-//         if( options.exists( "--help,-h" ) ) { usage(); }
-//         char delimiter = options.value( "--delimiter,-d", ',' );
-//         std::vector< std::string > unnamed = options.unnamed( "", "--delimiter,-d" );
-//         boost::ptr_vector< std::istream > files;
-//         std::vector< std::pair< std::istream*, std::size_t > > sources;
-//         bool binary = false;
-//         for( unsigned int i = 0; i < unnamed.size(); ++i )
-//         {
-//             std::string filename = unnamed[i];
-//             std::size_t size = 0;
-//             std::vector< std::string > v = comma::split( unnamed[i], ';' );
-//             filename = v[0];
-//             for( std::size_t j = 1; j < v.size(); ++j )
-//             {
-//                 std::vector< std::string > w = comma::split( v[j], '=' );
-//                 if( w.size() != 2 ) { COMMA_THROW( comma::exception, "expected filename and options, got \"" << unnamed[i] << "\"" ); }
-//                 if( w[0] == "binary" )
-//                 {
-//                     if( i == 0 ) { binary = true; }
-//                     else if( !binary ) { COMMA_THROW( comma::exception, unnamed[0] << " is ascii, but " << filename << " is binary" ); }
-//                     size = comma::csv::format( w[1] ).size();
-//                 }
-//                 else if( w[0] == "size" )
-//                 {
-//                     if( i == 0 ) { binary = true; }
-//                     else if( !binary ) { COMMA_THROW( comma::exception, unnamed[0] << " is ascii, but " << filename << " is binary" ); }
-//                     size = boost::lexical_cast< std::size_t >( w[1] );
-//                 }
-//             }
-//             if( binary && size == 0 ) { COMMA_THROW( comma::exception, "in binary mode, please specify size or format for \"" << filename << "\"" ); }
-//             if( filename == "-" )
-//             {
-//                 sources.push_back( std::make_pair( &std::cin, size ) );
-//             }
-//             else
-//             {
-//                 files.push_back( new std::ifstream( filename.c_str() ) );
-//                 if( !files.back().good() || files.back().eof() ) { COMMA_THROW( comma::exception, "failed to open " << unnamed[i] ); }
-//                 sources.push_back( std::make_pair( &files.back(), size ) );
-//             }
-//         }
-//         if( sources.empty() ) { usage(); }
-//         #ifdef WIN32
-//         if( binary ) { _setmode( _fileno( stdin ), _O_BINARY ); }
-//         #endif
-//         show_usage = false;
-//         if( binary )
-//         {
-//             std::size_t size = 0;
-//             for( unsigned int i = 0; i < sources.size(); ++i ) { size += sources[i].second; }
-//             while( true )
-//             {
-//                 for( unsigned int i = 0; i < sources.size(); ++i )
-//                 {
-//                     std::string s( sources[i].second, 0 );
-//                     char* buf = &s[0];
-//                     sources[i].first->read( buf, sources[i].second );
-//                     int count = sources[i].first->gcount();
-//                     if( count != 0 && (unsigned int)count != sources[i].second ) { COMMA_THROW( comma::exception, unnamed[i] << ": expected " << sources[i].second << " bytes, got " << count ); }
-//                     if( !sources[i].first->good() || sources[i].first->eof() )
-//                     {
-//                         bool ok = true;
-//                         for( unsigned int j = 0; j < sources.size() && ok; ++j )
-//                         {
-//                             if( j > i ) { sources[j].first->peek(); }
-//                             ok = !sources[j].first->good() || sources[j].first->eof();
-//                         }
-//                         if( ok ) { return 0; }
-//                         else { COMMA_THROW( comma::exception, unnamed[i] << ": unexpected end of file" ); }
-//                     }
-//                     std::cout << s;
-//                 }
-//             }
-//         }
-//         else
-//         {
-//             while( true )
-//             {
-//                 bool first = true;
-//                 for( unsigned int i = 0; i < sources.size(); ++i )
-//                 {
-//                     std::string s;
-//                     std::getline( *sources[i].first, s );
-//                     if( !sources[i].first->good() || sources[i].first->eof() )
-//                     {
-//                         bool ok = true;
-//                         for( unsigned int j = 0; j < sources.size() && ok; ++j )
-//                         {
-//                             if( j > i ) { sources[j].first->peek(); }
-//                             ok = !sources[j].first->good() || sources[j].first->eof();
-//                         }
-//                         if( ok ) { return 0; }
-//                         else { COMMA_THROW( comma::exception, unnamed[i] << ": unexpected end of file" ); }
-//                     }
-//                     if( !s.empty() && *s.rbegin() == '\r' ) { s = s.substr( 0, s.length() - 1 ); } // windows... sigh...
-//                     if( s.empty() ) { continue; }
-//                     if( !first ) { std::cout << delimiter; } else { first = false; }
-//                     std::cout << s;
-//                 }
-//                 std::cout << std::endl;
-//             }
-//         }
-//     }
-//     catch( std::exception& ex )
-//     {
-//         std::cerr << "csv-paste: " << ex.what() << std::endl;
-//     }
-//     catch( ... )
-//     {
-//         std::cerr << "csv-paste: unknown exception" << std::endl;
-//     }
-//     if( show_usage ) { usage(); }
-// }
diff --git a/csv/applications/csv-play.cpp b/csv/applications/csv-play.cpp
index 3d9eb2a69..66e513089 100644
--- a/csv/applications/csv-play.cpp
+++ b/csv/applications/csv-play.cpp
@@ -27,169 +27,223 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
 #include <fcntl.h>
 #include <stdio.h>
 #ifdef WIN32
-#include <stdio.h>
 #include <io.h>
 #else
 #include <errno.h>
 #include <sys/ioctl.h>
 #include <sys/types.h>
-#include <termios.h>
 #include <unistd.h>
-#include <sys/types.h>
 #include <sys/stat.h>
 #endif
 #include <termios.h>
 
 #include <iostream>
-#include <fstream>
+#include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/thread.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../base/exception.h"
 #include "../../csv/options.h"
-#include "../../csv/stream.h"
 #include "../../csv/traits.h"
 #include "../../name_value/parser.h"
-#include "../../csv/applications/play/play.h"
 #include "../../csv/applications/play/multiplay.h"
 
-static void usage()
+static void bash_completion( unsigned const ac, char const* const* av )
 {
-    std::cerr << std::endl;
-    std::cerr << "play back timestamped data from standard input in a real time manner" << std::endl;
-    std::cerr << "to standard output or optionally into given files/pipes" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: csv-play [<options>]" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --speed: speed-up playback by a factor, default is 1 (inverse to --slowdown)" << std::endl;
-    std::cerr << "    --slowdown,--slow: slow-down playback by a factor, default is 1 (inverse to --speed)" << std::endl;
-    std::cerr << "    --quiet: don't print warnings when lagging behind" << std::endl;
-    std::cerr << "    --fields <fields> : specify where timestamp is" << std::endl;
-    std::cerr << "                        e.g., if timestamp is the 4th field: --fields=\",,,t\"" << std::endl;
-    std::cerr << "                        default: the timestamp is the first field" << std::endl;
-    std::cerr << "    --binary <format> : use binary format" << std::endl;
-    std::cerr << "    --clients: minimum number of clients to connect to each stream" << std::endl;
-    std::cerr << "               before playback starts; default 0" << std::endl;
-    std::cerr << "               can be specified individually for each client, e.g." << std::endl;
-    std::cerr << "               csv-play file1;pipe;clients=1 file2;tcp:1234;clients=3" << std::endl;
-    std::cerr << "    --interactive,-i: react to key presses:" << std::endl;
-    std::cerr << "                      <whitespace>: pause, resume" << std::endl;
-    std::cerr << "                      left or down arrow key: output one record at a time" << std::endl;
-    std::cerr << "                      shift left or down arrow key: TODO: output one block at a time" << std::endl;
-    std::cerr << "    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )" << std::endl;
-    std::cerr << "    --paused-at-start,--paused; if --interactive, then start playback as paused" << std::endl;
-    std::cerr << "    --resolution=<second>: timestamp resolution; timestamps closer than this value will be" << std::endl;
-    std::cerr << "                           played without delay; the rationale is that microsleep used in csv-play" << std::endl;
-    std::cerr << "                           (boost::this_thread::sleep()) is essentially imprecise and may create" << std::endl;
-    std::cerr << "                           unnecessary delays in the data" << std::endl;
-    std::cerr << "                           default 0.01" << std::endl;
-    std::cerr << "    --from <timestamp> : play back data starting at <timestamp> ( iso format )" << std::endl;
-    std::cerr << "    --to <timestamp> : play back data up to <timestamp> ( iso format )" << std::endl;
-    std::cerr << comma::csv::format::usage();
-    std::cerr << std::endl;
-    std::cerr << "output" << std::endl;
-    std::cerr << "    -: write to stdout (default)" << std::endl;
-    std::cerr << "    offset=<offset>: add <offset> seconds to the timestamp of this source" << std::endl;
-    std::cerr << "    <filename>: write to file or named pipe, e.g. csv-play \"points.csv;pipe\"" << std::endl;
-    std::cerr << "    tcp:<port>: open tcp server socket on given port and write to the tcp clients" << std::endl;
-    std::cerr << "    local:<name>: same as tcp, but use unix/linux domain sockets" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << "    output timestamped 3d points in real time manner to stdout (e.g. for visualisation)" << std::endl;
-    std::cerr << "        cat points.csv | csv-play | view-points --fields=,x,y,z" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    play back several files and output to, say, named pipes:" << std::endl;
-    std::cerr << "        mkfifo file1.pipe file2.pipe" << std::endl;
-    std::cerr << "        csv-play \"file1.csv;pipe1\" \"file2.csv;pipe2\" &" << std::endl;
-    std::cerr << "        view-points pipe1 pipe2 --fields=,x,y,z" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    same as above, but block, until all the pipes are connected:" << std::endl;
-    std::cerr << "        csv-play \"file1.csv;pipe1\" \"file2.csv;pipe2\" --clients=1 &" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    output multiple inputs of the same format to stdout:" << std::endl;
-    std::cerr << "        csv-play \"file1.csv;-\" \"file2.csv;-\" &" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( -1 );
+    // every option accepted by main(), space-separated; keep in sync with usage() and options.unnamed()
+    static const char* completion_options =
+        " --help -h --verbose -v"
+        " --speed --slowdown --slow"
+        " --quiet"
+        " --fields --binary"
+        " --clients"
+        " --interactive -i"
+        " --no-flush"
+        " --paused-at-start --paused --pause-at"
+        " --resolution"
+        " --from --to";
+    std::cout << completion_options << std::endl;
+    exit( 0 );
 }
 
+static void interactive_help( std::string prefix )
+{
+    const std::string indent( prefix.size(), ' ' ); // only the width of prefix is used: key bindings are indented by it
+    std::cerr << indent << "<space>: pause or resume" << std::endl
+              << indent << "right or down arrow key: output one record at a time" << std::endl
+              << indent << "<t>: output current timestamp to stderr" << std::endl
+              << indent << "<q>: quit" << std::endl;
+}
+
+static void usage( bool verbose ) // print csv-play help to stderr, then exit( 0 ); verbose is forwarded to comma::csv::options::usage()
+{
+    std::cerr << R"(
+play back timestamped data from standard input in a real time manner
+to standard output or optionally into given files/pipes
+
+usage: csv-play [<options>]
+
+options
+    --speed: speed-up playback by a factor, default is 1 (inverse to --slowdown)
+    --slowdown,--slow: slow-down playback by a factor, default is 1 (inverse to --speed)
+    --quiet: don't print warnings when lagging behind
+    --fields <fields> : specify where timestamp is
+                        e.g., if timestamp is the 4th field: --fields=',,,t'
+                        default: the timestamp is the first field
+    --binary <format> : use binary format
+    --clients: minimum number of clients to connect to each stream
+               before playback starts; default 0
+               can be specified individually for each client, e.g.
+               csv-play file1;pipe;clients=1 file2;tcp:1234;clients=3
+    --interactive,-i: react to key presses:
+)";
+    interactive_help( "    --interactive,-i: " );
+    std::cerr << R"(    --no-flush : if present, do not flush the output stream ( use on high bandwidth sources )
+    --paused-at-start,--paused: start playback as paused, implies --interactive
+    --pause-at=[<timestamp>]; pause when timestamp reached, implies --interactive
+    --resolution=<second>: timestamp resolution; timestamps closer than this value will be
+                           played without delay; the rationale is that microsleep used in csv-play
+                           (boost::this_thread::sleep()) is essentially imprecise and may create
+                           unnecessary delays in the data
+                           default 0.01
+    --from <timestamp> : play back data starting at <timestamp> ( iso format )
+    --to <timestamp> : play back data up to <timestamp> ( iso format )
+)" << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose );
+    std::cerr << R"(
+output
+    -: write to stdout (default)
+    offset=<offset>: add <offset> seconds to the timestamp of this source
+    <filename>: write to file or named pipe, e.g. csv-play 'points.csv;pipe'
+    tcp:<port>: open tcp server socket on given port and write to the tcp clients
+    local:<name>: same as tcp, but use unix/linux domain sockets
+
+examples
+    output timestamped 3d points in real time manner to stdout (e.g. for visualisation)
+        cat points.csv | csv-play | view-points --fields=,x,y,z
+
+    play back several files and output to, say, named pipes:
+        mkfifo file1.pipe file2.pipe
+        csv-play 'file1.csv;pipe1' 'file2.csv;pipe2' &
+        view-points pipe1 pipe2 --fields=,x,y,z
+
+    same as above, but block, until all the pipes are connected:
+        csv-play 'file1.csv;pipe1' 'file2.csv;pipe2' --clients=1 &
+
+    output multiple inputs of the same format to stdout:
+        csv-play 'file1.csv;-' 'file2.csv;-' &
+
+    use binary data (try it)
+        > csv-play <( csv-paste line-number | csv-repeat --pace --period 1 | csv-time-stamp | csv-to-bin t,ui --flush )';-;binary=t,ui' \
+                   <( csv-paste line-number value=0 | csv-repeat --pace --period 1 | csv-time-stamp | csv-to-bin t,2ui --flush )';tcp:8888;binary=t,2ui' \
+            | csv-from-bin t,ui
+        > #in another shell, run
+        > socat tcp:localhost:8888 - | csv-from-bin t,2ui
+
+    pause and step through output:
+        echo 0 | csv-repeat --period 0.1 --yes | csv-paste - line-number | csv-time-stamp | csv-play --interactive
+
+)" << std::endl;
+    exit( 0 );
+}
+
+static boost::scoped_ptr< comma::csv::applications::play::Multiplay > multiplay; // created in main(); file-scope so that playback_state_t::unpause() can reach it
+static bool quit = false; // set when 'q' is pressed in interactive mode; checked by the main playback loop
+
+class playback_state_t // tracks whether playback is running, paused, or single-stepping
+{
+public:
+    playback_state_t() : state_( state::running ) {}
+    // state queries; note that while single-stepping (read_once) both return false
+    bool is_running() const { return state_ == state::running; }
+
+    bool is_paused() const { return state_ == state::paused; }
+    // enter paused state and remember the wall-clock time of pausing; no-op if already paused
+    void pause( const boost::posix_time::ptime& t = boost::posix_time::not_a_date_time )
+    {
+        if( state_ == state::paused ) { return; }
+        state_ = state::paused;
+        paused_time_ = boost::posix_time::microsec_clock::universal_time();
+        if( ! t.is_not_a_date_time() ) { std::cerr << "csv-play: paused at " << boost::posix_time::to_iso_string( t ) << std::endl; } // t is only used for reporting
+    }
+    // pass the wall-clock time elapsed since pause() to multiplay->paused_for(); does not change state_
+    void unpause()
+    {
+        multiplay->paused_for( boost::posix_time::microsec_clock::universal_time() - paused_time_ );
+    }
+    // switch to continuous playback; no-op if already running
+    void run()
+    {
+        if( state_ == state::running ) { return; }
+        if( state_ == state::paused ) { unpause(); }
+        state_ = state::running;
+        std::cerr << "csv-play: resumed" << std::endl;
+    }
+    // request a single step: leave paused state (if in it) and mark the state as read_once
+    void read_once()
+    {
+        if( state_ == state::paused ) { unpause(); }
+        state_ = state::read_once;
+    }
+    // called by main() after each successful read: if a single step was requested, pause again
+    void has_read_once() { if( state_ == state::read_once ) { pause(); } }
+
+private:
+    enum class state { running, paused, read_once, read_block }; // read_block is never assigned in this class
+    state state_;
+    boost::posix_time::ptime paused_time_; // wall-clock time of the latest pause()
+};
+
+static playback_state_t playback; // single playback state shared by key_press_handler_t::update() and main()
+
 class key_press_handler_t
 {
 public:
-    enum states { running, paused, read_once, read_block };
-    
-    key_press_handler_t( bool interactive, bool paused_at_start ): key_press_( interactive ), paused_( paused_at_start ), state_( paused_ ? paused : running ) { if( paused_at_start ) { std::cerr << "csv-play: paused at start" << std::endl; } }
-    
+    key_press_handler_t( bool interactive ) : key_press_( interactive ) {}
+
     void update( boost::posix_time::ptime t )
+    { // t: current playback timestamp, used only for reporting on stderr
+        key k = get_key(); // key::none when no key press is available
+        switch( k )
+        {
+            case key::space: if( playback.is_running() ) { playback.pause( t ); } else { playback.run(); } break; // toggle: pause when running, otherwise resume
+            case key::down_arrow: case key::right_arrow: playback.read_once(); break; // single step
+            case key::q: quit = true; break; // main loop checks the quit flag
+            case key::t: std::cerr << boost::posix_time::to_iso_string( t ) << std::endl; break;
+            case key::none: case key::other: break; // nothing pressed or unhandled key: ignore
+        }
+    }
+    
+private:
+    enum class key { none, space, right_arrow, down_arrow, q, t, other };
+
+    key get_key()
     {
         boost::optional< char > c = key_press_.read();
-        if( !c ) { return; }
+        if( !c ) { return key::none; }
         switch( *c )
         {
-            case 10:
-            case ' ':
-                switch( state_ )
-                {
-                    case running:
-                        std::cerr << "csv-play: paused at " << boost::posix_time::to_iso_string( t ) << std::endl;
-                        state_ = paused;
-                        break;
-                    case paused:
-                        std::cerr << "csv-play: resumed" << std::endl;
-                        state_ = running;
-                        break;
-                    case read_block:
-                        return; // never here, todo
-                    case read_once:
-                        std::cerr << "csv-play: resumed" << std::endl;
-                        state_ = running;
-                        break;
-                };
-                break;
-            case 27:
+            case ' ': return key::space;
+            case 'q': return key::q;
+            case 't': return key::t;
+            case 27:                    // escape sequence for arrows: ESC-[
                 c = key_press_.read();
-                if( !c || *c != 91 ) { return; }
+                if( !c || *c != 91 ) { break; }
                 c = key_press_.read();
-                if( !c ) { return; }
-                switch( *c )
-                {
-                    case 66:
-                    case 67:
-                        state_ = read_once;
-                        break;  
-                    default:
-                        return;
-                }
-            default:
+                if( !c ) { break; }
+                if( *c == 66 ) { return key::down_arrow; }
+                if( *c == 67 ) { return key::right_arrow; }
                 break;
         }
+        return key::other;
     }
-    
-    states state() const { return state_; }
-    
-    void has_read_once() 
-    {
-        switch( state_ )
-        {
-            case running:
-            case paused:
-            case read_block:
-                return;
-            case read_once:
-                state_ = paused;
-        };
-    }
-    
-private:
+
     class key_press_t_
     {
     public:
@@ -206,8 +260,7 @@ class key_press_handler_t
             new_termios.c_iflag &= ~( BRKINT | ICRNL | INPCK | ISTRIP | IXON );
             if( ::tcsetattr( fd_, TCSANOW, &new_termios ) < 0 ) { COMMA_THROW( comma::exception, "failed to set '" << tty << "'" ); }
             std::cerr << "csv-play: running in interactive mode" << std::endl;
-            std::cerr << "          press <whitespace> to pause or resume" << std::endl;
-            std::cerr << "          press left or down arrow key: output one record at a time" << std::endl;
+            interactive_help( "csv-play: " );
         }
         
         ~key_press_t_()
@@ -231,20 +284,18 @@ class key_press_handler_t
         int fd_;
         struct termios old_termios_;
     };
+
     key_press_t_ key_press_;
-    bool paused_;
-    states state_;
 };
 
 int main( int argc, char** argv )
 {
-    boost::scoped_ptr< comma::Multiplay > multiplay;
     try
     {
         const boost::array< comma::signal_flag::signals, 2 > signals = { { comma::signal_flag::sigint, comma::signal_flag::sigterm } };
         comma::signal_flag shutdown_flag( signals );
-        comma::command_line_options options( argc, argv );
-        if( options.exists( "--help,-h" ) ) { usage(); }
+        comma::command_line_options options( argc, argv, usage );
+        if( options.exists( "--bash-completion" ) ) bash_completion( argc, argv );
         options.assert_mutually_exclusive( "--speed,--slow,--slowdown" );
         double speed = options.value( "--speed", 1.0 / options.value< double >( "--slow,--slowdown", 1.0 ) );
         double resolution = options.value< double >( "--resolution", 0.01 );
@@ -252,25 +303,34 @@ int main( int argc, char** argv )
         std::string to = options.value< std::string>( "--to", "" );
         bool quiet =  options.exists( "--quiet" );
         bool flush =  !options.exists( "--no-flush" );
-        std::vector< std::string > configstrings = options.unnamed("--interactive,-i,--paused,--paused-at-start,--quiet,--flush,--no-flush","--slow,--slowdown,--speed,--resolution,--binary,--fields,--clients,--from,--to");
+        std::vector< std::string > configstrings = options.unnamed( "--verbose,-v,--interactive,-i,--paused,--paused-at-start,--quiet,--flush,--no-flush","--pause-at,--slow,--slowdown,--speed,--resolution,--binary,--fields,--clients,--from,--to" );
         if( configstrings.empty() ) { configstrings.push_back( "-;-" ); }
-        comma::csv::options csvoptions( argc, argv );
+        comma::csv::options csv( argc, argv );
+        csv.full_xpath = false;
         comma::name_value::parser name_value("filename,output", ';', '=', false );
-        std::vector< comma::Multiplay::SourceConfig > sourceConfigs( configstrings.size() );
-        comma::Multiplay::SourceConfig defaultConfig( "-", options.value( "--clients", 0 ), csvoptions );
-        for( unsigned int i = 0U; i < configstrings.size(); ++i ) { sourceConfigs[i] = name_value.get< comma::Multiplay::SourceConfig >( configstrings[i], defaultConfig ); }
+        std::vector< comma::csv::applications::play::Multiplay::SourceConfig > source_configs( configstrings.size() );
+        comma::csv::applications::play::Multiplay::SourceConfig defaultConfig( "-", options.value( "--clients", 0 ), csv );
+        for( unsigned int i = 0U; i < configstrings.size(); ++i ) { source_configs[i] = name_value.get< comma::csv::applications::play::Multiplay::SourceConfig >( configstrings[i], defaultConfig ); }
         boost::posix_time::ptime fromtime;
         if( !from.empty() ) { fromtime = boost::posix_time::from_iso_string( from ); }
         boost::posix_time::ptime totime;
         if( !to.empty() ) { totime = boost::posix_time::from_iso_string( to ); }
-        multiplay.reset( new comma::Multiplay( sourceConfigs, 1.0 / speed, quiet, boost::posix_time::microseconds( static_cast<unsigned int> (resolution * 1000000) ), fromtime, totime, flush ) );
-        key_press_handler_t key_press_handler( options.exists( "--interactive,-i" ), options.exists( "--paused,--paused-at-start" ) );
-        while( !shutdown_flag && std::cout.good() && !std::cout.bad() && !std::cout.eof() )
+        multiplay.reset( new comma::csv::applications::play::Multiplay( source_configs, speed, quiet, boost::posix_time::microseconds( static_cast< unsigned int >( resolution * 1000000 )), fromtime, totime, flush ));
+        if( options.exists( "--paused,--paused-at-start" )) { playback.pause(); }
+        boost::optional< std::string > pause_at_option = options.optional< std::string >( "--pause-at" );
+        boost::optional< boost::posix_time::ptime > pause_at_timestamp = boost::make_optional< boost::posix_time::ptime >( false, boost::posix_time::not_a_date_time );
+        if( pause_at_option ) { pause_at_timestamp = boost::posix_time::from_iso_string( *pause_at_option ); }
+        key_press_handler_t key_press_handler(  options.exists( "--interactive,-i" )
+                                             || options.exists( "--paused,--paused-at-start" )
+                                             || options.exists( "--pause-at" ));
+        while( !shutdown_flag && !quit && std::cout.good() )
         {
-            key_press_handler.update( multiplay->now() );
-            if( key_press_handler.state() == key_press_handler_t::paused ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); continue; }
+            boost::posix_time::ptime now = multiplay->now();
+            key_press_handler.update( now );
+            if( pause_at_timestamp && !now.is_not_a_date_time() && *pause_at_timestamp < now ) { playback.pause( now ); pause_at_timestamp = boost::none; }
+            if( playback.is_paused() ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); continue; }
             if( !multiplay->read() ) { break; }
-            key_press_handler.has_read_once();
+            playback.has_read_once();
         }
         multiplay->close();
         multiplay.reset();
diff --git a/csv/applications/csv-random.cpp b/csv/applications/csv-random.cpp
new file mode 100644
index 000000000..745b0c2e8
--- /dev/null
+++ b/csv/applications/csv-random.cpp
@@ -0,0 +1,531 @@
+// Copyright (c) 2018 Vsevolod Vlaskine
+
+/// @authors vsevolod vlaskine, kent hu
+
+#include <algorithm>
+#include <cstring>
+#include <deque>
+#include <iostream>
+#include <random>
+#include <string>
+#include <vector>
+
+#include "../../application/command_line_options.h"
+#include "../../base/exception.h"
+#include "../../base/none.h"
+#include "../../base/types.h"
+#include "../../csv/stream.h"
+#include "../../string/string.h"
+
+// todo
+// - seed=true-random
+// - make, true-random: --head=<n>
+// - sample, shuffle
+//   - examples
+// - regression test!
+// - --help vs --help --verbose
+// ? wiki: tutorials
+//   - csv-random
+//   - csv-repeat: --pace etc
+//   - make tutorials searchable
+
+static void usage( bool verbose ) // print csv-random help to stderr, then exit( 0 ); verbose is forwarded to comma::csv::options::usage()
+{
+    std::cerr << "\nrandom operations on input stream";
+    std::cerr << '\n';
+    std::cerr << "\nusage: csv-random <operation> [<options>]";
+    std::cerr << "\n";
+    std::cerr << "\n    where <operation> is one of:";
+    std::cerr << "\n        pseudo-random, make: output pseudo-random numbers";
+    std::cerr << "\n        true-random: output non-deterministic uniformly distributed numbers";
+    std::cerr << "\n        sample: output a uniformly distributed sample of input records";
+    std::cerr << "\n        shuffle: output input records in pseudo-random order";
+    std::cerr << '\n';
+    std::cerr << "\noptions";
+    std::cerr << "\n    --seed=[<unsigned int>]; random seed:";
+    std::cerr << "\n        <n>: integer seed for pseudo-random generator";
+    std::cerr << "\n        'true-random': todo: true random number to use as seed";
+    std::cerr << '\n';
+    std::cerr << "\noperations";
+    std::cerr << "\n    pseudo-random, make: output pseudo-random numbers";
+    std::cerr << '\n';
+    std::cerr << "\n        usage: csv-random make [<options>] > random.csv";
+    std::cerr << "\n               cat input.csv | csv-random make --append [<options>]";
+    std::cerr << '\n';
+    std::cerr << "\n        options";
+    std::cerr << "\n            --append; append random numbers to stdin input";
+    std::cerr << "\n            --distribution=<distribution>[;<options>]";
+    std::cerr << "\n                where <distribution> is one of:";
+    std::cerr << "\n                    uniform[;<min>;<max>] (default)";
+    std::cerr << "\n                        if <min>, <max> not present, --range values will be used";
+    std::cerr << "\n                    gaussian[;<mean>;<sigma>]";
+    std::cerr << "\n                    normal: alias for gaussian";
+    std::cerr << "\n                todo: more distributions to plug in, just ask";
+    std::cerr << "\n            --engine=<engine>";
+    std::cerr << "\n                where <engine> is one of: minstd_rand0, minstd_rand, mt19937,";
+    std::cerr << "\n                    mt19937_64 (default), ranlux24_base, ranlux48_base,";
+    std::cerr << "\n                    ranlux24, ranlux48, knuth_b, default_random_engine";
+    std::cerr << "\n            --output-binary; output random numbers as binary";
+    std::cerr << "\n                    specify --binary=<format> for stdin input";
+    std::cerr << "\n            --range=[<min>,<max>]; desired value range";
+    std::cerr << "\n                attention! will pick value until gets something in range";
+    std::cerr << "\n            --type=<type>; default=ui; supported values: b,ub,w,uw,i,ui,l,ul,f,d";
+    std::cerr << "\n                can have more than one <type> i.e. 3ui";
+    std::cerr << '\n';
+    std::cerr << "\n    true-random: output non-deterministic uniformly distributed unsigned int";
+    std::cerr << "\n                 random numbers; if a non-deterministic source, e.g. a hardware";
+    std::cerr << "\n                 device, is not available, output will be pseudo-random";
+    std::cerr << '\n';
+    std::cerr << "\n        usage: csv-random true-random [<options>]";
+    std::cerr << "\n               cat input.csv | csv-random true-random --append [<options>]";
+    std::cerr << '\n';
+    std::cerr << "\n        options";
+    std::cerr << "\n            --append; append random number to stdin input";
+    std::cerr << "\n            --once; output random number only once";
+    std::cerr << "\n            --output-binary; output random numbers as binary";
+    std::cerr << "\n                specify --binary=<format> for stdin input";
+    std::cerr << "\n            --range=[<min>,<max>]; desired value range";
+    std::cerr << "\n                if multiple output values, e.g: --type=f,ui,ub";
+    std::cerr << "\n                --range will be applied to all output values";
+    std::cerr << "\n            --type=<type>; default=ui; todo: supported values: ui;";
+    std::cerr << "\n                e.g: --type=3ui; --type=ui,ui,ui; etc";
+    std::cerr << '\n';
+    std::cerr << "\n        example";
+    std::cerr << "\n            > csv-random make --seed=$( csv-random true-random --once )";
+    std::cerr << '\n';
+    std::cerr << "\n    sample: output uniformly distributed sample of input records of a given size";
+    std::cerr << "\n            record order preserved";
+    std::cerr << "\n            limitation: current implementation accumulates input records before";
+    std::cerr << "\n            outputting, if records are large, it may be memory-inefficient;";
+    std::cerr << "\n            can be improved, just ask";
+    std::cerr << '\n';
+    std::cerr << "\n        usage: cat records.csv | csv-random sample [<options>] > sample.csv";
+    std::cerr << '\n';
+    std::cerr << "\n        options";
+    std::cerr << "\n            --engine=<engine>";
+    std::cerr << "\n                where <engine> is one of: minstd_rand0, minstd_rand, mt19937,";
+    std::cerr << "\n                    mt19937_64 (default), ranlux24_base, ranlux48_base,";
+    std::cerr << "\n                    ranlux24, ranlux48, knuth_b, default_random_engine";
+    std::cerr << "\n            --fields=[<fields>]; if 'block' field present, sample each block,";
+    std::cerr << "\n                    otherwise read whole input and then sample";
+    std::cerr << "\n            --ratio=[<ratio>]; portion of each block to output,";
+    std::cerr << "\n                    if block is too small, nothing will be output for it";
+    std::cerr << "\n            --size=<n>; default=1; number of records to output in each block,";
+    std::cerr << "\n                    if smaller than block size, output the whole block";
+    std::cerr << "\n            --sliding-window,--window=[<size>]; todo: sample on sliding window";
+    std::cerr << "\n                    of <size> records";
+    std::cerr << '\n';
+    std::cerr << "\n    shuffle: output input records in pseudo-random order";
+    std::cerr << '\n';
+    std::cerr << "\n        usage: cat records.csv | csv-random shuffle [<options>] > shuffled.csv";
+    std::cerr << '\n';
+    std::cerr << "\n        options";
+    std::cerr << "\n            --engine=<engine>";
+    std::cerr << "\n                where <engine> is one of: minstd_rand0, minstd_rand, mt19937,";
+    std::cerr << "\n                    mt19937_64 (default), ranlux24_base, ranlux48_base,";
+    std::cerr << "\n                    ranlux24, ranlux48, knuth_b, default_random_engine";
+    std::cerr << "\n            --fields=[<fields>]; if 'block' field present, shuffle each block,";
+    std::cerr << "\n                    otherwise read whole input and then shuffle";
+    std::cerr << "\n            --ratio=[<ratio>]; portion of each block to output,";
+    std::cerr << "\n                    same as for \"sample\" operation, but shuffled";
+    std::cerr << "\n            --size=<n>; default=1; number of records to output in each block,";
+    std::cerr << "\n                    same as for \"sample\" operation, but shuffled";
+    std::cerr << "\n            --sliding-window,--window=[<size>]; todo: shuffle on sliding window";
+    std::cerr << "\n                    of <size> records";
+    std::cerr << '\n';
+    std::cerr << "\ncsv options:";
+    std::cerr << comma::csv::options::usage( "", verbose ) << std::endl;
+    std::cerr << "\nexamples";
+    std::cerr << "\n    generate three floating point random samples from gaussian distribution";
+    std::cerr << "\n        csv-random make --distribution gaussian 0,10 --type 3f";
+    std::cerr << "\n        csv-random make --distribution gaussian 0,10 --type 3f \\";
+    std::cerr << "\n            | csv-paste line-number - \\";
+    std::cerr << "\n            | csv-blocks group --fields scalar --span 1000 \\";
+    std::cerr << "\n            | csv-shuffle --fields=id,x,y,z,block --output-fields=id,block,x,y,z";
+    std::cerr << "\n\n";
+    exit( 0 );
+}
+
+static bool verbose; // NOTE(review): not assigned in the code visible here; presumably set in main() - confirm
+static comma::csv::options csv; // csv options shared by all operations; make::run_impl() reads flush, binary(), format() and delimiter from it
+static boost::optional< int > seed; // if set, seeds the random engine in make::run_impl(); otherwise the engine is default-constructed
+
+namespace comma { namespace applications { namespace random { namespace shuffle {
+
+struct input // input record as seen by this application: only the block field is extracted
+{
+    comma::uint32 block{0}; // block id, visited under the field name "block"; defaults to 0
+};
+
+} } } } // namespace comma { namespace applications { namespace random { namespace shuffle {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::applications::random::shuffle::input > // exposes input::block to visitors under the name "block"
+{
+    template < typename K, typename V > static void visit( const K&, const comma::applications::random::shuffle::input& p, V& v ) { v.apply( "block", p.block ); } // const overload
+    template < typename K, typename V > static void visit( const K&, comma::applications::random::shuffle::input& p, V& v ) { v.apply( "block", p.block ); } // non-const overload
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace applications { namespace random {
+
+template < typename T > struct type_traits { static T cast( const T t ) { return t; } }; // cast() yields the value in the type it is written to ascii output as; identity by default
+template <> struct type_traits< char > { static int cast( const char t ) { return static_cast< int >( t ); } }; // widen so that operator<< prints a number, not a character
+template <> struct type_traits< unsigned char > { static unsigned int cast( const unsigned char t ) { return static_cast< unsigned int >( t ); } }; // same, unsigned
+
+namespace make {
+
+template < typename T, template < typename > class Distribution, typename Engine >
+static int run_impl( Distribution< T >& distribution, bool append, bool binary, std::size_t count, const boost::optional< std::pair< T, T > >& range ) // outputs count values of type T per record, drawn from distribution using Engine; returns the exit code
+{
+    Engine engine = ::seed ? Engine( *::seed ) : Engine(); // seeded from --seed if it was given, default-constructed otherwise
+    auto _pick = [&]() -> T // draws one value; if range is set, redraws until the value lies within [range->first, range->second]
+    {
+        if( !range ) { return distribution( engine ); }
+        while( true ) // todo? parametrise? while( true ) is quite cruel
+        {
+            T r = distribution( engine );
+            if( r >= range->first && r <= range->second ) { return r; }
+        }
+    };
+    if( !::csv.flush ) { std::cin.tie( nullptr ); }
+    if( append ) // append mode: copy each stdin record to stdout followed by count generated values; note: the binary argument is not consulted here, only ::csv.binary()
+    {
+        if( ::csv.binary() )
+        {
+            std::vector< char > buf( ::csv.format().size() ); // holds exactly one binary input record
+            while( std::cin.good() )
+            {
+                std::cin.read( &buf[0], buf.size() );
+                if( std::cin.gcount() == 0 ) { break; } // nothing more to read
+                if( std::cin.gcount() != static_cast< int >( buf.size() ) ) { std::cerr << "csv-random make: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; } // incomplete record
+                std::cout.write( &buf[0], buf.size() );
+                for( std::size_t i = 0; i < count; ++i )
+                {
+                    T r = _pick();
+                    std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) ); // raw bytes of the value as laid out in memory
+                }
+                if( ::csv.flush ) { std::cout.flush(); }
+            }
+            return 0;
+        }
+        while( std::cin.good() ) // ascii input: one record per line
+        {
+            std::string s;
+            std::getline( std::cin, s );
+            if( s.empty() ) { continue; } // empty lines are skipped, not echoed
+            std::cout << s;
+            for( std::size_t i = 0; i < count; ++i ) { std::cout << ::csv.delimiter << type_traits< T >::cast( _pick() ); }
+            std::cout << std::endl;
+            if( ::csv.flush ) { std::cout.flush(); }
+        }
+        return 0;
+    }
+    if( binary ) // no input: keep writing binary records of count values for as long as stdout is good
+    {
+        while( std::cout.good() )
+        {
+            for( std::size_t i = 0; i < count; ++i )
+            {
+                T r = _pick();
+                std::cout.write( reinterpret_cast< char* >( &r ), sizeof( T ) );
+            }
+            if( ::csv.flush ) { std::cout.flush(); }
+        }
+        return 0;
+    }
+    while( std::cout.good() ) // no input, ascii: keep writing lines of count delimited values for as long as stdout is good
+    {
+        std::string comma; // empty before the first value on the line, the delimiter afterwards
+        for( std::size_t i = 0; i < count; ++i )
+        {
+            std::cout << comma << type_traits< T >::cast( _pick() );
+            comma = ::csv.delimiter;
+        }
+        std::cout << std::endl;
+        if( ::csv.flush ) { std::cout.flush(); } // todo? remove? std::endl flushes anyway?
+    }
+    return 0;
+}
+
+template < typename T > struct cast_traits { using type = T; }; // type that a textual value is converted to before it is stored as T
+template <> struct cast_traits< char > { using type = int; }; // 8-bit values go through int
+template <> struct cast_traits< unsigned char > { using type = unsigned int; }; // 8-bit unsigned values go through unsigned int
+
+template < typename T > static std::vector< T > _as( const std::vector< std::string >& v, unsigned int begin ) // converts v[begin], v[begin+1], ... to T; todo? move to library?
+{
+    std::vector< T > converted( v.size() - begin );
+    for( std::size_t k = 0; k < converted.size(); ++k ) { converted[k] = boost::lexical_cast< typename cast_traits< T >::type >( v[ begin + k ] ); }
+    return converted;
+}
+
+template < typename T, template < typename > class Distribution, unsigned int Size > struct distribution_traits { static Distribution< T > make( const std::vector< T >& p ); }; // quick and dirty: the primary template only declares make(); the specialisations below define it for Size = 0, 1, 2
+template < typename T, template < typename > class Distribution > struct distribution_traits< T, Distribution, 0 > { static Distribution< T > make( const std::vector< T >& p ) { return Distribution< T >(); } }; // no parameters: default-constructed distribution; p is not used
+template < typename T, template < typename > class Distribution > struct distribution_traits< T, Distribution, 1 > { static Distribution< T > make( const std::vector< T >& p ) { return Distribution< T >( p[0] ); } }; // one constructor parameter
+template < typename T, template < typename > class Distribution > struct distribution_traits< T, Distribution, 2 > { static Distribution< T > make( const std::vector< T >& p ) { return Distribution< T >( p[0], p[1] ); } }; // two constructor parameters
+
+template < typename T, template < typename > class Distribution > static Distribution< T > make_distribution( const std::vector< std::string >& params ) // quick and dirty
+{
+    // params[0] is skipped; whatever follows is converted to T and handed to the distribution constructor
+    const std::vector< T > values = _as< T >( params, 1 );
+    // quick and dirty; does not scale, but for now just to make it working
+    if( values.size() == 0 ) { return distribution_traits< T, Distribution, 0 >::make( values ); }
+    if( values.size() == 1 ) { return distribution_traits< T, Distribution, 1 >::make( values ); }
+    if( values.size() == 2 ) { return distribution_traits< T, Distribution, 2 >::make( values ); }
+    // any other number of parameters is not supported
+    COMMA_THROW( comma::exception, "distribution traits for " << values.size() << " parameters: not implemented; just ask" );
+}
+
+template < typename T, template < typename > class Distribution >
+static int run_impl( const std::vector< std::string >& params, const comma::command_line_options& options ) // builds the distribution from params and runs the generator with the engine named by --engine; returns the exit code
+{
+    const bool append = options.exists( "--append" );
+    const bool binary = options.exists( "--output-binary" ) || ::csv.binary();
+    const std::string engine_name = options.value< std::string >( "--engine", "mt19937_64" );
+    const auto count = comma::csv::format( options.value< std::string >( "--type", "ui" ) ).count();
+    boost::optional< std::pair< T, T > > range;
+    if( params[0] != "uniform" && options.exists( "--range" ) ) { range = comma::csv::ascii< std::pair< T, T > >().get( options.value< std::string >( "--range" ) ); } // quick and dirty
+    auto distribution = make_distribution< T, Distribution >( params );
+    if( engine_name == "minstd_rand0" ) { return run_impl< T, Distribution, std::minstd_rand0 >( distribution, append, binary, count, range ); }
+    if( engine_name == "minstd_rand" ) { return run_impl< T, Distribution, std::minstd_rand >( distribution, append, binary, count, range ); }
+    if( engine_name == "mt19937" ) { return run_impl< T, Distribution, std::mt19937 >( distribution, append, binary, count, range ); }
+    if( engine_name == "mt19937_64" ) { return run_impl< T, Distribution, std::mt19937_64 >( distribution, append, binary, count, range ); }
+    if( engine_name == "ranlux24_base" ) { return run_impl< T, Distribution, std::ranlux24_base >( distribution, append, binary, count, range ); }
+    if( engine_name == "ranlux48_base" ) { return run_impl< T, Distribution, std::ranlux48_base >( distribution, append, binary, count, range ); }
+    if( engine_name == "ranlux24" ) { return run_impl< T, Distribution, std::ranlux24 >( distribution, append, binary, count, range ); }
+    if( engine_name == "ranlux48" ) { return run_impl< T, Distribution, std::ranlux48 >( distribution, append, binary, count, range ); }
+    if( engine_name == "knuth_b" ) { return run_impl< T, Distribution, std::knuth_b >( distribution, append, binary, count, range ); }
+    if( engine_name == "default_random_engine" ) { return run_impl< T, Distribution, std::default_random_engine >( distribution, append, binary, count, range ); }
+    std::cerr << "csv-random make: expected engine; got: '" << engine_name << "'" << std::endl;
+    return 1;
+}
+
+static int run( const comma::command_line_options& options ) // quick and dirty: parses --distribution and --type and dispatches to run_impl for the matching value type; returns the exit code
+{
+    auto params = comma::split( options.value< std::string >( "--distribution", "uniform" ), ',' );
+    const std::string distribution = params[0]; // a copy on purpose: params may be reassigned below, which would leave a reference dangling
+    const auto& format = comma::csv::format( options.value< std::string >( "--type", "ui" ) );
+    if ( format.collapsed_string().find( ',' ) != std::string::npos ) { std::cerr << "csv-random make: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl; return 1; }
+    if( distribution == "uniform" )
+    {
+        if( options.exists( "--range" ) ) // super-quick and dirty to preserve backward compatibility
+        {
+            if( params.size() > 1 ) { std::cerr << "csv-random make: uniform: either use --range or uniform[,<min>,<max>], not both" << std::endl; return 1; }
+            params = comma::split( "uniform," + options.value< std::string >( "--range" ), ',' ); // rewrite --range=<min>,<max> as uniform,<min>,<max>
+            if( params.size() != 3 ) { std::cerr << "csv-random make: uniform: expected --range=<min>,<max>; got: \"" << options.value< std::string >( "--range" ) << "\"" << std::endl; return 1; } // exactly two values are required
+        }
+        if( params.size() != 1 && params.size() != 3 ) { std::cerr << "csv-random make: uniform: expected uniform[,<min>,<max>]; got: \"" << options.value< std::string >( "--distribution" ) << "\"" << std::endl; return 1; }
+        switch( format.offset( 0 ).type ) // integer types use uniform_int_distribution, floating point types uniform_real_distribution
+        {
+            case csv::format::int8: return run_impl< char, std::uniform_int_distribution >( params, options );
+            case csv::format::uint8: return run_impl< unsigned char, std::uniform_int_distribution >( params, options );
+            case csv::format::int16: return run_impl< comma::int16, std::uniform_int_distribution >( params, options );
+            case csv::format::uint16: return run_impl< comma::uint16, std::uniform_int_distribution >( params, options );
+            case csv::format::int32: return run_impl< comma::int32, std::uniform_int_distribution >( params, options );
+            case csv::format::uint32: return run_impl< comma::uint32, std::uniform_int_distribution >( params, options );
+            case csv::format::int64: return run_impl< comma::int64, std::uniform_int_distribution >( params, options );
+            case csv::format::uint64: return run_impl< comma::uint64, std::uniform_int_distribution >( params, options );
+            case csv::format::float_t: return run_impl< float, std::uniform_real_distribution >( params, options );
+            case csv::format::double_t: return run_impl< double, std::uniform_real_distribution >( params, options );
+            default: std::cerr << "csv-random make: uniform distribution: expected type; got: '" << format.string() << "'" << std::endl; return 1;
+        }
+    }
+    if( distribution == "gaussian" || distribution == "normal" )
+    {
+        if( params.size() != 1 && params.size() != 3 ) { std::cerr << "csv-random make: gaussian: expected gaussian[,<mean>,<stddev>]; got: \"" << options.value< std::string >( "--distribution" ) << "\"" << std::endl; return 1; }
+        switch( format.offset( 0 ).type ) // only floating point types are accepted here
+        {
+            case csv::format::float_t: return run_impl< float, std::normal_distribution >( params, options );
+            case csv::format::double_t: return run_impl< double, std::normal_distribution >( params, options );
+            default: std::cerr << "csv-random make: normal distribution: expected floating point --type; got unsupported type: '" << format.string() << "'" << std::endl; return 1;
+        }
+    }
+    std::cerr << "csv-random make: expected distribution; got: '" << distribution << "'" << std::endl;
+    return 1;
+}
+
+} // namespace make {
+
+namespace shuffle {
+
+template < typename Engine > static int run_impl( const comma::command_line_options& options, bool sample = false ) // reads stdin block by block; outputs each block shuffled or, if sample is true, a random subset of it in input order; returns the exit code
+{
+    auto engine = ::seed ? Engine( *::seed ) : Engine(); // seeded from --seed if it was given, default-constructed otherwise
+    std::deque< std::string > records; // records of the current block, each stored ready to be written verbatim
+    std::vector< unsigned int > indices; // quick and dirty
+    unsigned int size = options.value( "--size", 1 ); // quick and dirty
+    auto ratio = options.optional< float >( "--ratio" ); // quick and dirty
+    auto sliding_window = options.optional< unsigned int >( "--sliding-window,--window" );
+    if( sliding_window ) { std::cerr << "csv-random shuffle: --sliding-window: todo" << std::endl; return 1; } // todo: once implemented, reject the block field and --sliding-window given together
+    comma::csv::input_stream< input > is( std::cin, ::csv );
+    bool has_block = ::csv.has_field( "block" );
+    comma::uint32 block{0};
+    while( is.ready() || std::cin.good() )
+    {
+        const input* p = is.read();
+        if( !p || ( has_block && p->block != block ) ) // end of input or of the current block: output what has been collected so far
+        {
+            if( !records.empty() )
+            {
+                //std::uniform_int_distribution< int > distribution( 0, records.size() - 1 ); // quick and dirty
+                indices.resize( records.size() ); // quick and dirty
+                for( unsigned int i = 0; i < indices.size(); ++i ) { indices[i] = i; }
+                // deprecated: std::random_shuffle( indices.begin(), indices.end(), [&]( int ) -> int { return distribution( engine ); } ); // quick and dirty, watch performance
+                std::shuffle( indices.begin(), indices.end(), engine );
+                std::size_t s = sample ? ( ratio ? static_cast< std::size_t >( std::max( 0.f, records.size() * *ratio ) ) : size ) : records.size(); // number of records to output; a negative ratio yields none
+                if( s > records.size() ) { s = records.size(); } // block smaller than requested (--size too large or --ratio above 1): output all of it rather than run past the end of indices
+                if( sample ) { std::sort( indices.begin(), indices.begin() + s ); } // quick and dirty
+                for( std::size_t i = 0; i < s; ++i ) { std::cout.write( &records[indices[i]][0], records[indices[i]].size() ); }
+                records.clear();
+                if( ::csv.flush ) { std::cout.flush(); }
+            }
+            if( p ) { block = p->block; }
+        }
+        if( !p ) { break; }
+        if( ::csv.binary() )
+        {
+            records.emplace_back();
+            records.back().resize( ::csv.format().size() );
+            std::memcpy( &records.back()[0], is.binary().last(), ::csv.format().size() );
+        }
+        else
+        {
+            records.push_back( comma::join( is.ascii().last(), ::csv.delimiter ) + "\n" );
+        }
+    }
+    return 0;
+}
+
+static int run( const comma::command_line_options& options, bool sample = false ) // picks the random engine named by --engine and runs shuffle or, if sample is true, sample with it
+{
+    const std::string name = options.value< std::string >( "--engine", "mt19937_64" );
+    if( name == "minstd_rand0" ) { return run_impl< std::minstd_rand0 >( options, sample ); }
+    if( name == "minstd_rand" ) { return run_impl< std::minstd_rand >( options, sample ); }
+    if( name == "mt19937" ) { return run_impl< std::mt19937 >( options, sample ); }
+    if( name == "mt19937_64" ) { return run_impl< std::mt19937_64 >( options, sample ); }
+    if( name == "ranlux24_base" ) { return run_impl< std::ranlux24_base >( options, sample ); }
+    if( name == "ranlux48_base" ) { return run_impl< std::ranlux48_base >( options, sample ); }
+    if( name == "ranlux24" ) { return run_impl< std::ranlux24 >( options, sample ); }
+    if( name == "ranlux48" ) { return run_impl< std::ranlux48 >( options, sample ); }
+    if( name == "knuth_b" ) { return run_impl< std::knuth_b >( options, sample ); }
+    if( name == "default_random_engine" ) { return run_impl< std::default_random_engine >( options, sample ); }
+    std::cerr << "csv-random " << ( sample ? "sample" : "shuffle" ) << ": expected engine; got: '" << name << "'" << std::endl;
+    return 1;
+}
+
+} // namespace shuffle {
+
+namespace sample {
+
+static int run( const comma::command_line_options& options ) { return shuffle::run( options, true ); } // sample is implemented by the shuffle code, run with its sample flag set; quick and relatively dirty for now
+
+} // namespace sample {
+
+namespace true_random {
+
+template < typename T >
+static int run_impl( const comma::command_line_options& options, std::size_t count ) // outputs records of count values of type T taken from std::random_device, optionally scaled into --range; returns the exit code
+{
+    std::random_device rd;
+    const bool binary = options.exists( "--output-binary" ) || ::csv.binary();
+    const bool flush = options.exists( "--flush" ) || ::csv.flush;
+    typedef std::pair< double, double > pair_t;
+    boost::optional< pair_t > range = comma::silent_none< pair_t >();
+    double factor{1}; // maps the span of the random device onto the span of --range
+    if( options.exists( "--range" ) )
+    {
+        range = comma::csv::ascii< pair_t >().get( options.value< std::string >( "--range" ) );
+        factor = ( range->second - range->first ) / ( rd.max() - rd.min() );
+    }
+    auto output_line_to_stdout = [&]( std::string&& initial_delimiter ) // writes one record of count values; initial_delimiter precedes the first ascii value
+    {
+        for( std::size_t i = 0; i < count; ++i )
+        {
+            const auto raw = rd(); // keep the full-width sample: narrowing it to T before scaling would collapse 8- and 16-bit outputs onto range->first
+            T r = range ? static_cast< T >( range->first + ( raw - rd.min() ) * factor ) : static_cast< T >( raw );
+            if( binary ) { std::cout.write( reinterpret_cast< const char* >( &r ), sizeof( T ) ); }
+            else { std::cout << initial_delimiter << type_traits< T >::cast( r ); initial_delimiter = ::csv.delimiter; }
+        }
+        if( !binary ) { std::cout << std::endl; }
+        if( flush ) { std::cout << std::flush; }
+    };
+    if( options.exists( "--append" ) ) // append mode: echo each stdin record followed by the generated values
+    {
+        while( std::cin.good() )
+        {
+            auto buf = ::csv.binary() ? std::string( ::csv.format().size(), {} ) : std::string{}; // binary: sized for exactly one record; ascii: filled by getline
+            if( ::csv.binary() )
+            {
+                std::cin.read( &buf[0], buf.size() );
+                if( std::cin.gcount() == 0 ) { return 0; } // nothing more to read
+                if( std::cin.gcount() != static_cast< int >( buf.size() ) ) { std::cerr << "csv-random true-random: expected " << buf.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
+            }
+            else
+            {
+                std::getline( std::cin, buf );
+                if( buf.empty() ) { continue; } // empty lines are skipped, not echoed
+            }
+            std::cout.write( &buf[0], buf.size() );
+            output_line_to_stdout( { ::csv.delimiter } );
+        }
+    }
+    else
+    {
+        while( std::cout.good() ) // no input: keep generating for as long as stdout is good, or just one record with --once
+        {
+            output_line_to_stdout( {} );
+            if( options.exists( "--once" ) ) { break; }
+        }
+    }
+    return 0;
+}
+
+static int run( const comma::command_line_options& options ) // parses --type and dispatches to run_impl for the matching value type; returns the exit code
+{
+    const comma::csv::format fmt( options.value< std::string >( "--type", "ui" ) );
+    if( fmt.collapsed_string().find( ',' ) != std::string::npos ) { std::cerr << "csv-random true-random: --type must be homogeneous i.e. ui or 2ui or 3ui" << std::endl; return 1; }
+    switch( fmt.offset( 0 ).type )
+    {
+        case csv::format::int8: return run_impl< char >( options, fmt.count() );
+        case csv::format::uint8: return run_impl< unsigned char >( options, fmt.count() );
+        case csv::format::int16: return run_impl< comma::int16 >( options, fmt.count() );
+        case csv::format::uint16: return run_impl< comma::uint16 >( options, fmt.count() );
+        case csv::format::int32: return run_impl< comma::int32 >( options, fmt.count() );
+        case csv::format::uint32: return run_impl< comma::uint32 >( options, fmt.count() );
+        case csv::format::int64: return run_impl< comma::int64 >( options, fmt.count() );
+        case csv::format::uint64: return run_impl< comma::uint64 >( options, fmt.count() );
+        case csv::format::float_t: return run_impl< float >( options, fmt.count() );
+        case csv::format::double_t: return run_impl< double >( options, fmt.count() );
+        default: std::cerr << "csv-random true-random: expected type; got: '" << fmt.string() << "'" << std::endl; return 1;
+    }
+}
+
+} // namespace true_random {
+
+} } } // namespace comma { namespace applications { namespace random {
+
+int main( int ac, char** av ) // parses the command line and dispatches to the requested operation; returns the operation's exit code, or 1 on a usage error or an exception
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        const auto& unnamed = options.unnamed( "--append,--flush,--verbose,-v", "-.*" ); // the first unnamed argument is taken as the operation below
+        if( unnamed.empty() ) { std::cerr << "csv-random: please specify operation" << std::endl; return 1; }
+        ::csv = comma::csv::options( options );
+        std::cout.precision( ::csv.precision );
+        ::seed = options.optional< comma::uint32 >( "--seed" );
+        ::verbose = options.exists( "--verbose,-v" );
+        std::string operation = unnamed[0];
+        if( operation == "make" || operation == "pseudo-random" ) { return comma::applications::random::make::run( options ); } // pseudo-random is accepted as another name for make
+        if( operation == "sample" ) { return comma::applications::random::sample::run( options ); }
+        if( operation == "shuffle" ) { return comma::applications::random::shuffle::run( options ); }
+        if( operation == "true-random" ) { return comma::applications::random::true_random::run( options ); }
+        std::cerr << "csv-random: expected operation; got: '" << operation << "'" << std::endl;
+        return 1;
+    }
+    catch( std::exception& ex ) { std::cerr << "csv-random: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-random: unknown exception" << std::endl; }
+    return 1; // reached only after an exception has been reported
+}
diff --git a/csv/applications/csv-repeat.cpp b/csv/applications/csv-repeat.cpp
index a6fe24e6d..5401c1173 100644
--- a/csv/applications/csv-repeat.cpp
+++ b/csv/applications/csv-repeat.cpp
@@ -29,11 +29,11 @@
 
 /// @author dave jennings
 
+#include <functional>
 #include <iostream>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/thread/thread.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../csv/options.h"
 #include "../../csv/stream.h"
@@ -73,6 +73,11 @@ void usage( bool verbose = false )
     std::cerr << "            warning: currently is very simplistic; see todo comments in the code to make it more robust" << std::endl;
     std::cerr << "    --period=[<seconds>]: period of repeated record" << std::endl;
     std::cerr << "    --timeout,-t=[<seconds>]: timeout before repeating the last record; if not specified, timeout is set to --period" << std::endl;
+    std::cerr << "    --timestamped: use input timestamp for repeating; currently, would do blocking read" << std::endl;
+    std::cerr << "                   convenient for filling holes in data in offline processing" << std::endl;
+    std::cerr << "      --timestamped options" << std::endl;
+    std::cerr << "          --at-least-from,--from=[<time>]; if first timestamp greater than <time>, fill the hole with the first record" << std::endl;
+    std::cerr << "          --at-least-to,--to=[<time>]; if last timestamp less than <time>, fill the hole with the last record" << std::endl;
     std::cerr << "    --verbose,-v: more output" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    if --period is not set, --timeout acts as a watchdog. If no input is seen" << std::endl;
@@ -81,6 +86,7 @@ void usage( bool verbose = false )
     std::cerr << "    --append fields are appended to output; supported fields are:" << std::endl;
     std::cerr << "        time: append timestamp" << std::endl;
     std::cerr << "        repeating: 1 if currently repeating" << std::endl;
+    std::cerr << "        count: counts up from zero for consecutive repeating records" << std::endl;
     std::cerr << std::endl;
     if( verbose )
     {
@@ -102,32 +108,45 @@ void usage( bool verbose = false )
     std::cerr << std::endl;
     std::cerr << "    { echo -e \"1\\n2\\n3\"; sleep 10; } | csv-repeat --timeout=3" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
 
+struct input_t // what --timestamped mode parses from each input record
+{
+    boost::posix_time::ptime time; // visited as csv field "t"
+};
+
 struct output_t
 {
     boost::posix_time::ptime time;
     bool repeating;
-    output_t() : repeating( false ) {}
-    output_t( const boost::posix_time::ptime& time, bool repeating ) : time( time ), repeating( repeating ) {}
+    unsigned count;
+    output_t() : repeating( false ), count( 0 ) {}
+    output_t( const boost::posix_time::ptime& time, bool repeating, unsigned count=0 ) : time( time ), repeating( repeating ), count( count ) {}
 };
 
 namespace comma { namespace visiting {
 
+template <> struct traits< input_t > // visiting traits: expose input_t::time to visitors under the name "t"
+{
+    template < typename K, typename V > static void visit( const K&, input_t& p, V& v ) { v.apply( "t", p.time ); } // non-const overload
+    template < typename K, typename V > static void visit( const K&, const input_t& p, V& v ) { v.apply( "t", p.time ); } // const overload
+};
+
 template <> struct traits< output_t >
 {
     template < typename K, typename V > static void visit( const K&, const output_t& p, V& v )
     {
         v.apply( "time", p.time );
         v.apply( "repeating", p.repeating );
+        v.apply( "count", p.count );
     }
     template < typename K, typename V > static void visit( const K&, output_t& p, V& v )
     {
         v.apply( "time", p.time );
         v.apply( "repeating", p.repeating );
+        v.apply( "count", p.count );
     }
 };
     
@@ -140,20 +159,13 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
         bool ignore_eof = options.exists( "--ignore-eof,--ignoreeof,--yes" );
+        options.assert_mutually_exclusive( "--pace", "--ignore-eof,--ignoreeof,--yes" );
+        options.assert_mutually_exclusive( "--timestamped,--pace" ); // option names need the leading dashes: a bare "pace" would never match --pace
         if( ignore_eof && !options.exists( "--period" ) ) { std::cerr << "csv-repeat: got --ignore-oef, thus please specify --period" << std::endl; return 1; }
         comma::csv::options csv = comma::csv::options( options );
-        std::size_t record_size = csv.binary() ? csv.format().size() : 0;
-        std::vector< char > buffer( csv.binary() ? ( 65536ul / record_size + 1 ) * record_size : 0 );
-        char* buffer_begin = &buffer[0];
-        const char* buffer_end = &buffer[0] + buffer.size();
-        char* read_position = buffer_begin;
-        char* write_position = buffer_begin;
-        char* last_record = NULL;
-        comma::io::select select;
-        select.read().add( comma::io::stdin_fd );
-        comma::io::istream is( "-", comma::io::mode::binary );
         boost::scoped_ptr< comma::csv::output_stream< output_t > > ostream;
         comma::csv::options output_csv;
+        output_csv.full_xpath = false;
         if( options.exists( "--append-fields,--append,-a" ) )
         {
             output_csv.fields = options.value< std::string >( "--append-fields,--append,-a", "" );
@@ -172,6 +184,7 @@ int main( int ac, char** av )
                     {
                         if( v[i] == "repeating" ) { format += comma + 'b'; }
                         else if( v[i] == "time" ) { format += comma + 't'; }
+                        else if( v[i] == "count" ) { format += comma + "ui"; }
                         else { std::cerr << "csv-repeat: expected one of: " << comma::join( comma::csv::names< output_t >( false ), ',' ) << "; got: \"" << v[i] << "\"" << std::endl; return 1; }
                         comma = ",";
                     }
@@ -204,12 +217,116 @@ int main( int ac, char** av )
         boost::optional< double > timeout_seconds = options.optional< double >( "--timeout,-t" );
         if( !period && !timeout_seconds ) { std::cerr << "csv-repeat: please specify either --period, or --timeout, or both" << std::endl; return 1; }
         timeout = timeout_seconds ? boost::posix_time::microseconds( static_cast<unsigned int>(*timeout_seconds * 1000000 )) : *period;
+        std::cin.tie( NULL );
+        if( options.exists( "--timestamped" ) ) // offline mode: fill holes in timestamped input by repeating the previous record every --period
+        {
+            if( !period ) { std::cerr << "csv-repeat: for --timestamped, please specify --period" << std::endl; return 1; }
+            if( options.exists( "--timeout,-t" ) ) { std::cerr << "csv-repeat: for --timestamped: --timeout not supported" << std::endl; return 1; }
+            comma::csv::input_stream< input_t > istream( std::cin, csv );
+            boost::posix_time::ptime last; // timestamp of the last record seen; starts at --from, if given
+            if( options.exists( "--at-least-from,--from" ) ) { last = boost::posix_time::from_iso_string( options.value< std::string >( "--at-least-from,--from" ) ); }
+            boost::posix_time::ptime to;
+            if( options.exists( "--at-least-to,--to" ) ) { to = boost::posix_time::from_iso_string( options.value< std::string >( "--at-least-to,--to" ) ); }
+            // last_record stays empty until the first input record has been read, in binary mode, too: empty means there is nothing to repeat yet
+            std::string last_record;
+            auto pass = [&]( const output_t& ) // output the current input record as is
+            {
+                static comma::csv::passed< input_t > passed( istream, std::cout, csv.flush );
+                passed.write();
+            };
+            auto append = [&]( const output_t& o ) // output the current input record with the --append fields attached
+            {
+                static comma::csv::tied< input_t, output_t > tied( istream, *ostream );
+                tied.append( o );
+            };
+            std::function< void( const output_t& p ) > write;
+            if( ostream ) { write = append; } else { write = pass; }
+            auto write_last = [&]( boost::posix_time::ptime t ) // output the last seen record as a repeated record; t goes only into the appended fields
+            {
+                std::cout.write( &last_record[0], last_record.size() );
+                if( ostream && !csv.binary() ) { std::cout << csv.delimiter; } // delimiter only if appended fields follow; otherwise the line would end with a dangling delimiter
+                if( ostream ) { ostream->write( output_t( t, true ) ); }
+                else if( !csv.binary() ) { std::cout << std::endl; }
+            };
+            auto repeat = [&]( boost::posix_time::ptime now ) // repeat the last record every period after last, up to and including now
+            {
+                if( last_record.empty() || now.is_not_a_date_time() || last.is_not_a_date_time() ) { return; } // no record seen yet or no interval to fill
+                for( boost::posix_time::ptime t = last + *period; t <= now; )
+                {
+                    write_last( t );
+                    if( t == now ) { break; }
+                    t += *period;
+                    if( t > now ) { t = now; }
+                }
+            };
+            auto set_last_record = [&]() // remember the current input record for later repetition
+            {
+                if( csv.binary() ) { last_record.resize( csv.format().size() ); std::memcpy( &last_record[0], istream.binary().last(), last_record.size() ); } // todo! quick and dirty, watch performance! we don't need to copy each record, but that would make the code more complex
+                else { last_record = comma::join( istream.ascii().last(), csv.delimiter ); }
+            };
+            while( istream.ready() || std::cin.good() )
+            {
+                const input_t* p = istream.read();
+                if( !p ) { break; }
+                if( p->time.is_not_a_date_time() ) { std::cerr << "csv-repeat: expected timestamp, got not a date/time" << std::endl; return 1; }
+                if( last_record.empty() && !last.is_not_a_date_time() ) { set_last_record(); write_last( last ); } // quick and dirty: first record with --from given, so the hole before it is filled with the first record
+                repeat( p->time );
+                write( output_t( p->time, false ) );
+                last = p->time;
+                set_last_record();
+            }
+            repeat( to ); // fill up to --to, if given, with the last record
+            return 0;
+        }
+        if( options.exists( "--pace" ) ) // pace mode: pass records through one at a time, sleeping for --period after each
+        {
+            if( !period ) { std::cerr << "csv-repeat: for --pace, please specify --period" << std::endl; return 1; }
+            std::size_t record_size = csv.binary() ? csv.format().size() : 0; // 0 stands for ascii input
+            if( record_size == 0 )
+            {
+                while( std::cin.good() && !std::cin.eof() )
+                {
+                    std::string line;
+                    std::getline( std::cin, line );
+                    if( line.empty() ) { break; } // note: an empty line stops processing, same as the end of input
+                    std::cout << line;
+                    if( ostream ) { std::cout << csv.delimiter; ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), false ) ); } // appended fields: current time, not repeating
+                    else { std::cout << std::endl; }
+                    boost::this_thread::sleep( *period );
+                }
+            }
+            else
+            {
+                std::vector< char > buf( record_size ); // holds exactly one binary record
+                while( std::cin.good() && !std::cin.eof() ) // todo? quick and dirty; improve reading performance
+                {
+                    std::cin.read( &buf[0], record_size );
+                    if( std::cin.gcount() <= 0 ) { break; } // nothing more to read
+                    if( std::cin.gcount() < int( record_size ) ) { std::cerr << "csv-repeat: expected " << record_size << " byte(s); got only: " << std::cin.gcount() << std::endl; return 1; }
+                    std::cout.write( &buf[0], record_size );
+                    if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), false ) ); }
+                    std::cout.flush(); // each record is pushed out before sleeping
+                    boost::this_thread::sleep( *period );
+                }
+            }
+            return 0;
+        }
+        std::size_t record_size = csv.binary() ? csv.format().size() : 0;
+        std::vector< char > buffer( csv.binary() ? ( 65536ul / record_size + 1 ) * record_size : 0 );
+        char* buffer_begin = &buffer[0];
+        const char* buffer_end = &buffer[0] + buffer.size();
+        char* read_position = buffer_begin;
+        char* write_position = buffer_begin;
+        char* last_record = NULL;
+        comma::io::select select;
+        select.read().add( comma::io::stdin_fd );
+        comma::io::istream is( "-", comma::io::mode::binary );
         bool end_of_stream = false;
         std::string line;
         std::string last_line;
         std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
-        std::cin.tie( NULL ); // std::cin is tied to std::cout by default
         bool repeating = false;
+        unsigned int count = 0;
         bool pace = options.exists( "--pace" );
         if( pace && !period ) { std::cerr << "csv-repeat: for --pace, please specify --period" << std::endl; return 1; }
         while( is->good() && !end_of_stream )
@@ -253,12 +370,14 @@ int main( int ac, char** av )
                     else { std::cout << std::endl; }
                 }
                 end_of_stream = repeating = false;
+                count = 0;
                 if( pace ) { boost::this_thread::sleep( *period ); } // todo: quick and dirty; fix it properly for --pace, to make sure sleep happens after each record only once
             }
             if( !is->good() || end_of_stream ) { break; }
             if( repeating )
             {
                 if( !period ) { std::cerr << "csv-repeat: input data timed out" << std::endl; return 1; }
+                count++;
                 if( csv.binary() )
                 {
                     if( last_record )
@@ -266,7 +385,7 @@ int main( int ac, char** av )
                         std::cout.write( last_record, record_size );
                         /// do not do it! see the note inside csv::stream.h, search for passed<> class template
                         /// ::write( 1, last_record, record_size );
-                        if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true ) ); }
+                        if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, count ) ); }
                     }
                 }
                 else
@@ -277,7 +396,7 @@ int main( int ac, char** av )
                         if( ostream )
                         {
                             std::cout << csv.delimiter;
-                            ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true ) );
+                            ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, count ) );
                         }
                         else { std::cout << std::endl; }
                     }
@@ -292,19 +411,20 @@ int main( int ac, char** av )
             {
                 boost::this_thread::sleep( *period ); // quick and dirty
                 if( is_shutdown ) { break; }
+                count++;
                 if( csv.binary() )
                 {
                     if( !last_record ) { break; }
                     std::cout.write( last_record, record_size );
                     /// do not do it! see the note inside csv::stream.h, search for passed<> class template
                     /// ::write( 1, last_record, record_size );
-                    if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true ) ); }
+                    if( ostream ) { ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, count ) ); }
                 }
                 else
                 {
                     if( last_line.empty() ) { break; }
                     std::cout << last_line;
-                    if( ostream ) { std::cout << csv.delimiter; ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true ) ); }
+                    if( ostream ) { std::cout << csv.delimiter; ostream->write( output_t( boost::posix_time::microsec_clock::universal_time(), true, count ) ); }
                     else { std::cout << std::endl; }
                 }
                 std::cout.flush();
diff --git a/csv/applications/csv-seek.cpp b/csv/applications/csv-seek.cpp
new file mode 100644
index 000000000..916770d35
--- /dev/null
+++ b/csv/applications/csv-seek.cpp
@@ -0,0 +1,176 @@
+// Copyright (c) 2024 Mission Systems
+
+/// @author Aspen Eyers
+
+#include <cstdint>
+#include <iostream>
+#include <fstream>
+#include "../../application/command_line_options.h"
+#include "../../csv/traits.h"
+#include "../../name_value/parser.h"
+#include "../../visiting/traits.h"
+#include "../../csv/stream.h"
+#include "../../csv/traits.h"
+
+
+/// print csv-seek help to stderr and exit with status 0
+/// @param verbose if true, it is passed on to the csv options help and the worked examples are printed
+static void usage( bool verbose = false )
+{
+    std::cerr << R"(
+seek through a stream to grab selected records
+usage: csv-seek <options> [<stream>]
+options
+    --permissive,-p:       permissive mode: skip requests that are out of bounds instead of exiting with error
+
+    --size,-s=<size>:      [todo] data is packets of fixed size, otherwise data is expected
+                           line-wise. Alternatively use --binary
+csv options
+)";
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << "examples" << std::endl;
+    // worked examples are long, hence they are shown in verbose mode only
+    if( verbose ) { std::cerr << R"(    examples setup
+        basics
+            make data file
+                csv-paste 'line-number;binary=ui' --head 100 > data.bin
+
+            sample the records at 50% and 10% through the data:
+                ( echo 0.5; echo 0.1 ) | csv-seek --fields=ratio "data.bin;binary=ui" | csv-from-bin ui
+
+            sample the record at index 10 (indices are zero-based)
+                echo 10 | csv-seek "data.bin;binary=ui" | csv-from-bin ui
+
+        colour hue (you would need snark installed with graphics and imaging enabled)
+            make data file
+                ( csv-paste value=255 value=0 line-number --head 256; \
+                  csv-paste 'line-number;begin=255;step=-1' line-number value=255 --head 256; \
+                  csv-paste value=0 value=255 'line-number;begin=255;step=-1' --head 256; \
+                  csv-paste line-number value=255 value=0 --head 256; \
+                  csv-paste value=255 'line-number;begin=255;step=-1' value=0 --head 256 ) \
+                      | csv-to-bin 3ub \
+                      > colour-wheel.bin
+            sample colour hue
+                csv-sliders 'hue;min=0;max=1;step=0.0001' \
+                            --frequency 10 \
+                            --window-geometry=0,0,400,60 \
+                            --title='examples: hue selection' \
+                    | csv-seek --permissive --fields ratio 'colour-wheel.bin;binary=3ub' --flush \
+                    | cv-cat --input 'rows=1;cols=1;no-header;type=3ub' \
+                             'resize=400;view=,examples: hue selection,,0,130;null'
+)";
+    }
+    else { std::cerr << "    see --help --verbose for more help" << std::endl; }
+    exit( 0 );
+}
+
+namespace comma { namespace csv {
+struct config_t { std::string filename; std::string format; }; // file name and format, as parsed from the <stream> command line argument
+
+/// seek request: position of the wanted record, given either as ratio or as index
+struct input_t
+{
+    double ratio = 0; // position as a fraction of the file size
+    std::uint32_t index = 0; // record number; index 0 maps to byte offset 0
+    std::uint32_t block = 0; // todo in some vague future
+    /// @return byte offset of the request: filesize * ratio, if use_ratio is set; index * record_size otherwise
+    std::uint64_t get_index( std::size_t filesize, std::size_t record_size, bool use_ratio ) const
+    {
+        if( !use_ratio ) { return index * record_size; }
+        return static_cast< std::uint64_t >( filesize * ratio );
+    }
+};
+}} // namespace comma { namespace csv {
+
+namespace comma { namespace visiting {
+
+/// visiting traits of the file description: fields are visited as "filename" and "format"
+template <> struct traits< comma::csv::config_t >
+{
+    /// visit fields of a mutable instance
+    template < typename Key, typename Visitor > static void visit( const Key&, comma::csv::config_t& config, Visitor& visitor ) { visitor.apply( "filename", config.filename ); visitor.apply( "format", config.format ); }
+
+    /// visit fields of a const instance
+    template < typename Key, typename Visitor > static void visit( const Key&, const comma::csv::config_t& config, Visitor& visitor ) { visitor.apply( "filename", config.filename ); visitor.apply( "format", config.format ); }
+};
+
+/// visiting traits of a seek request: fields are visited as "ratio", "index", and "block"
+template <> struct traits< comma::csv::input_t >
+{
+    /// visit fields of a mutable instance
+    template < typename Key, typename Visitor >
+    static void visit( const Key&, comma::csv::input_t& request, Visitor& visitor )
+    {
+        visitor.apply( "ratio", request.ratio );
+        visitor.apply( "index", request.index );
+        visitor.apply( "block", request.block );
+    }
+
+    /// visit fields of a const instance
+    template < typename Key, typename Visitor >
+    static void visit( const Key&, const comma::csv::input_t& request, Visitor& visitor )
+    {
+        visitor.apply( "ratio", request.ratio );
+        visitor.apply( "index", request.index );
+        visitor.apply( "block", request.block );
+    }
+};
+
+} } // namespace comma { namespace visiting {
+
+/// for each request read from stdin (record index or ratio of the file size), write
+/// the matching fixed-size record of the given binary file to stdout
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        std::vector< std::string > unnamed = options.unnamed( "--flush,-v,--verbose,--permissive,-p,--size", "-.*" );
+        comma::csv::options csv( options, "index" );
+        const bool permissive = options.exists( "--permissive,-p" );
+        const bool use_ratio = csv.has_field( "ratio" ); // does not change between requests, hence checked once
+        COMMA_ASSERT_BRIEF( use_ratio != csv.has_field( "index" ), "please specify either 'ratio' or 'index' (but not both) in --fields" );
+        COMMA_ASSERT_BRIEF( unnamed.size() > 0, "expected file (or stream, todo)" );
+        COMMA_ASSERT_BRIEF( unnamed.size() < 2, "Does not work on multiple streams (yet (shouuld it?))" );
+
+        comma::name_value::parser csv_options_parser( "filename", ';', '=', false );
+        auto stream = csv_options_parser.get< comma::csv::config_t >( unnamed[0] );
+        auto stream_csv = csv_options_parser.get< comma::csv::options >( unnamed[0] );
+        std::string filename = stream.filename;
+        COMMA_ASSERT_BRIEF( filename!="-", "expected filename. file scrubbing does not work on streams." );
+        COMMA_ASSERT_BRIEF( stream_csv.binary(), "expected binary file" );
+
+        std::ifstream file( filename, std::ios::binary | std::ios::ate ); // positioned at the end, so that tellg() below returns the file size
+        COMMA_ASSERT_BRIEF( file.is_open(), "unable to open file" );
+        const std::streamoff file_size = file.tellg();
+        const std::streamoff record_size = stream_csv.format().size();
+        COMMA_ASSERT_BRIEF( record_size > 0, "expected non-empty binary format" ); // record_size is used as a divisor below
+        std::vector< char > record( record_size ); // allocated once, reused for every request
+
+        comma::csv::input_stream< comma::csv::input_t > istream( std::cin, csv );
+        while( std::cin.good() && !std::cin.eof() )
+        {
+            const comma::csv::input_t* p = istream.read();
+            if( !p ) { break; }
+            // negative or nan ratio cannot be converted to an unsigned offset (undefined behaviour), hence it is rejected before get_index() is called
+            bool in_bounds = !use_ratio || ( p->ratio >= 0 && p->ratio <= 1 );
+            std::streamoff offset = 0;
+            if( in_bounds )
+            {
+                offset = static_cast< std::streamoff >( p->get_index( file_size, record_size, use_ratio ) );
+                offset = ( offset / record_size ) * record_size; // align to the beginning of a record
+                in_bounds = offset >= 0 && offset <= file_size - record_size; // the whole record, not only its first byte, has to be inside of the file
+            }
+            if( !in_bounds ) { comma::saymore() <<  "index out of bounds" << std::endl; if( permissive ) { continue; } return 1; }
+            file.clear(); // a failed read leaves failbit set, which would turn all subsequent seekg() and read() calls into no-ops
+            file.seekg( offset );
+            if( !file.read( record.data(), record_size ) ) { comma::saymore() << "failed to read record" << std::endl; if( permissive ) { continue; } return 1; }
+            std::cout.write( record.data(), record.size() );
+            if( csv.flush ) { std::cout.flush(); }
+        }
+        return 0; // file is closed by the std::ifstream destructor
+    }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
+    return 1;
+}
diff --git a/csv/applications/csv-select.cpp b/csv/applications/csv-select.cpp
index 0ccadd3a9..dea184bac 100644
--- a/csv/applications/csv-select.cpp
+++ b/csv/applications/csv-select.cpp
@@ -1,45 +1,17 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
 #include <iostream>
-#include <sstream>
 #include <map>
+#include <sstream>
+#include <unordered_set>
 #include <vector>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
 #include <boost/regex.hpp>
 #include <boost/scoped_ptr.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
 #include "../../csv/impl/unstructured.h"
@@ -48,7 +20,7 @@
 #include "../../string/string.h"
 #include "../../visiting/traits.h"
 
-void usage()
+void usage( bool verbose )
 {
     std::cerr << std::endl;
     std::cerr << "find in a file or stream by constraints on a given key" << std::endl;
@@ -82,7 +54,7 @@ void usage()
     std::cerr << "fields: any non-empty fields will be treated as keys" << std::endl;
     std::cerr << std::endl;
     std::cerr << "csv options" << std::endl;
-    std::cerr << comma::csv::options::usage() << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    cat a.csv | csv-select --fields=,,t --from=20120101T000000" << std::endl;
@@ -91,9 +63,7 @@ void usage()
     std::cerr << "    cat a.csv | csv-select --fields=t,scalar \"t;from=20120101T000000;sorted\" \"scalar;from=-10;to=20.5\"" << std::endl;
     std::cerr << "    echo hello,world | csv-select --fields=h,w \"h;regex=he.*\"" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 bool matches( const std::string& value, const boost::regex& r ) { return boost::regex_match( value, r ); }
@@ -138,19 +108,22 @@ struct constraints
 
     constraints( const std::string& options )
     {
-        comma::name_value::map m( options, ';', '=' ); // quick and dirty, since optional is not well-supported (euphymism for 'buggy') in comma::name_value::parser
-        if( m.exists( "equals" ) ) { equals = m.value< T >( "equals" ); }
-        if( m.exists( "not-equal" ) ) { not_equal = m.value< T >( "not-equal" ); }
-        if( m.exists( "less" ) ) { less = m.value< T >( "less" ); }
-        if( m.exists( "greater" ) ) { greater = m.value< T >( "greater" ); } // it was: { equal = m.value< T >( "greater" ); }
-        if( m.exists( "from" ) ) { from = m.value< T >( "from" ); }
-        if( m.exists( "greater-or-equal" ) ) { from = m.value< T >( "greater-or-equal" ); }
-        if( m.exists( "ge" ) ) { from = m.value< T >( "ge" ); }
-        if( m.exists( "to" ) ) { to = m.value< T >( "to" ); }
-        if( m.exists( "less-or-equal" ) ) { to = m.value< T >( "less-or-equal" ); }
-        if( m.exists( "le" ) ) { to = m.value< T >( "le" ); }
-        if( m.exists( "regex" ) ) { regex = boost::regex( m.value< std::string >( "regex" ) ); }
-        sorted = m.exists( "sorted" );
+        comma::name_value::map m( options.substr( options.find_first_of( ';' ) + 1 ), ';', '=', true, "equals,not-equal,less,greater,from,greater-or-equal,ge,to,less-or-equal,le,regex,sorted,fields,f,binary,b,delimiter,d,format" ); // quick and dirty, since optional is not well-supported (euphymism for 'buggy') in comma::name_value::parser
+        for( const auto& v: m.get() ) // super quick and dirty, suboptimal
+        {
+            if( v.first == "equals" ) { equals = m.value< T >( "equals" ); }
+            else if( v.first == "not-equal" ) { not_equal = m.value< T >( "not-equal" ); }
+            else if( v.first == "less" ) { less = m.value< T >( "less" ); }
+            else if( v.first == "greater" ) { greater = m.value< T >( "greater" ); } // it was: { equal = m.value< T >( "greater" ); }
+            else if( v.first == "from" ) { from = m.value< T >( "from" ); }
+            else if( v.first == "greater-or-equal" ) { from = m.value< T >( "greater-or-equal" ); }
+            else if( v.first == "ge" ) { from = m.value< T >( "ge" ); }
+            else if( v.first == "to" ) { to = m.value< T >( "to" ); }
+            else if( v.first == "less-or-equal" ) { to = m.value< T >( "less-or-equal" ); }
+            else if( v.first == "le" ) { to = m.value< T >( "le" ); }
+            else if( v.first == "regex" ) { regex = boost::regex( m.value< std::string >( "regex" ) ); }
+            else if( v.first == "sorted" ) { sorted = true; }
+        }
     }
 
     bool is_a_match( const T& t ) const // quick and dirty, implement a proper expression parser
@@ -219,15 +192,11 @@ struct input_t
 
     bool is_a_match( bool is_or ) const
     {
-//         std::cerr << "==> is_a_match: doubles: ";
-//         for( unsigned int i = 0; i < doubles.size(); ++i ) { std::cerr << doubles[i].value << " "; }
-//         std::cerr << std::endl;
         if( is_or )
         {
             for( unsigned int i = 0; i < time.size(); ++i ) { if( time[i].is_a_match( is_or ) ) { return true; } }
             for( unsigned int i = 0; i < doubles.size(); ++i ) { if( doubles[i].is_a_match( is_or ) ) { return true; } }
             for( unsigned int i = 0; i < strings.size(); ++i ) { if( strings[i].is_a_match( is_or ) ) { return true; } }
-    //        std::cerr << "==> is_a_match: done" << std::endl << std::endl;
             return false;
         }
         else
@@ -235,7 +204,6 @@ struct input_t
             for( unsigned int i = 0; i < time.size(); ++i ) { if( !time[i].is_a_match() ) { return false; } }
             for( unsigned int i = 0; i < doubles.size(); ++i ) { if( !doubles[i].is_a_match() ) { return false; } }
             for( unsigned int i = 0; i < strings.size(); ++i ) { if( !strings[i].is_a_match() ) { return false; } }
-    //        std::cerr << "==> is_a_match: done" << std::endl << std::endl;
             return true;
         }
     }
@@ -263,15 +231,8 @@ namespace comma { namespace visiting {
 
 template < typename T > struct traits< constrained< T > >
 {
-    template < typename K, typename V > static void visit( const K&, const constrained< T >& p, V& v )
-    {
-        v.apply( "value", p.value );
-    }
-
-    template < typename K, typename V > static void visit( const K&, constrained< T >& p, V& v )
-    {
-        v.apply( "value", p.value );
-    }
+    template < typename K, typename V > static void visit( const K&, const constrained< T >& p, V& v ) { v.apply( "value", p.value ); }
+    template < typename K, typename V > static void visit( const K&, constrained< T >& p, V& v ) { v.apply( "value", p.value ); }
 };
 
 template <> struct traits< input_t >
@@ -293,22 +254,17 @@ template <> struct traits< input_t >
 
 } } // namespace comma { namespace visiting {
 
-static bool verbose;
 static comma::csv::options csv;
 static input_t input;
 static std::vector< std::string > fields;
 typedef std::multimap< std::string, std::string > constraints_map_t;
 static constraints_map_t constraints_map;
 
-template < typename T >
-static constrained< T > make_value( unsigned int i, const comma::command_line_options& options )
+template < typename T > static constrained< T > make_value( unsigned int i, const comma::command_line_options& options )
 {
     constrained< T > v;
-    for( std::pair< constraints_map_t::const_iterator, constraints_map_t::const_iterator > r = constraints_map.equal_range( fields[i] ); r.first != r.second; ++r.first )
-    {
-        v.constraints.push_back( constraints< T >( r.first->second ) );
-    }
-    static constraints< T > common_constraints( options );
+    for( auto r = constraints_map.equal_range( fields[i] ); r.first != r.second; ++r.first ) { v.constraints.push_back( constraints< T >( r.first->second ) ); }
+    static constraints< T > common_constraints( options ); // quick and dirty
     if( !common_constraints.empty() ) { v.constraints.push_back( common_constraints ); }
     return v;
 }
@@ -338,21 +294,19 @@ static void init_input( const comma::csv::format& format, const comma::command_l
         }
     }
     csv.fields = comma::join( fields, ',' );
-    csv.full_xpath = true;
 }
 
 int main( int ac, char** av )
 {
-        comma::command_line_options options( ac, av );
     try
     {
-        if( options.exists( "--help,-h" ) ) { usage(); }
-        verbose = options.exists( "--verbose,-v" );
+        comma::command_line_options options( ac, av, usage );
         bool is_or = options.exists( "--or" );
         csv = comma::csv::options( options );
         fields = comma::split( csv.fields, ',' );
         if( fields.size() == 1 && fields[0].empty() ) { fields.clear(); }
-        std::vector< std::string > unnamed = options.unnamed( "--first-matching,--or,--sorted,--input-sorted,--not-matching,--output-all,--all,--strict,--verbose,-v", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--first-matching,--or,--sorted,--input-sorted,--not-matching,--output-all,--all,--strict,--verbose,-v,--flush"
+                                                            , "--equals,--not-equal,--less,--greater,--from,--greater-or-equal,--ge,--to,--less-or-equal,--le,--regex,--fields,-f,--binary,-b,--format,--delimiter,-d,--precision" );
         //for( unsigned int i = 0; i < unnamed.size(); constraints_map.insert( std::make_pair( comma::split( unnamed[i], ';' )[0], unnamed[i] ) ), ++i );
         bool strict = options.exists( "--strict" );
         bool first_matching = options.exists( "--first-matching" );
@@ -363,13 +317,9 @@ int main( int ac, char** av )
             std::string field = comma::split( unnamed[i], ';' )[0];
             bool found = false;
             for( unsigned int j = 0; j < fields.size() && !found; found = field == fields[j], ++j );
-            if( !found )
-            {
-                if( strict ) { std::cerr << "csv-select: on constraint: \"" << unnamed[i] << "\" field \"" << field << "\" not found in fields: " << csv.fields << std::endl; return 1; }
-                std::cerr << "csv-select: warning: on constraint: \"" << unnamed[i] << "\" field \"" << field << "\" not found in fields: " << csv.fields << std::endl;
-                continue;
-            }
-            constraints_map.insert( std::make_pair( field, unnamed[i] ) );
+            if( found ) { constraints_map.insert( std::make_pair( field, unnamed[i] ) ); continue; }
+            if( strict ) { std::cerr << "csv-select: on constraint: \"" << unnamed[i] << "\" field \"" << field << "\" not found in fields: " << csv.fields << std::endl; return 1; }
+            std::cerr << "csv-select: warning: on constraint: \"" << unnamed[i] << "\" field \"" << field << "\" not found in fields: " << csv.fields << std::endl;
         }
         if( csv.binary() )
         {
diff --git a/csv/applications/csv-shape.cpp b/csv/applications/csv-shape.cpp
index 024b6456e..46fc29289 100644
--- a/csv/applications/csv-shape.cpp
+++ b/csv/applications/csv-shape.cpp
@@ -1,37 +1,12 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2023-2024 Vsevolod Vlaskine
 
 /// @author dewey nguyen
 
+#include <cstdint>
+#include <deque>
 #include <iostream>
 #include <vector>
-#include <deque>
 #include "../../base/types.h"
 #include "../../application/command_line_options.h"
 #include "../options.h"
@@ -40,80 +15,100 @@
 
 using namespace comma;
 
+namespace comma { namespace csv { namespace applications { namespace shape { namespace operations { namespace sliding_window { static std::string usage( bool verbose ); } } } } } }
+
 static void usage( bool verbose=false )
 {
     std::cerr << "Perform reshaping operations on input data" << std::endl;
     std::cerr << std::endl;
     std::cerr << "operations" << std::endl;
-    std::cerr << "    concatenate: group input records for concatenation into output records." << std::endl;
-    std::cerr << "                 the user can choose non-overlapping or overlapping grouping (sliding window) mode." << std::endl;
-    std::cerr << "    loop:        same as concatenate, but with an additional last record:" << std::endl;
-    std::cerr << "                 last input record concatenated with the first record (hence, 'loop')" << std::endl;
-    std::cerr << "                 this mode always uses the sliding window for overlapping groups" << std::endl;
+    std::cerr << "    concatenate:    group input records for concatenation into output records." << std::endl;
+    std::cerr << "                    the user can choose non-overlapping or overlapping grouping (sliding window) mode." << std::endl;
+    std::cerr << "    loop:           same as concatenate, but with an additional last record:" << std::endl;
+    std::cerr << "                    last input record concatenated with the first record (hence, 'loop')" << std::endl;
+    std::cerr << "                    this mode always uses the sliding window for overlapping groups" << std::endl;
+    std::cerr << "    repeat:         repeat input given number of times, e.g. csv-shape repeat --size 5" << std::endl;
+    std::cerr << "    sliding-window: todo" << std::endl;
+    std::cerr << "    split:          csv-only: split line at n-th field, e.g. csv-shape split --size 4" << std::endl;
     std::cerr << std::endl;
     std::cerr << "Usage: cat data.csv | csv-shape <operation> [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
-    std::cerr << "    --binary,-b=[<format>]: in binary mode: format string of the input csv data types" << std::endl;
-    std::cerr << "    --delimiter,-d=[<char>]; default=','; in ascii mode, field separating character." << std::endl;
-    std::cerr << "    --help,-h;  see this usage message" << std::endl;
+    std::cerr << "    --expected-records; output the expected records for given --size and --step, and exit" << std::endl;
+    std::cerr << "    --size,-n=<num>; number of input records in each grouping, range: 2 and above" << std::endl;
+    std::cerr << "    --step=<num>; default=1; relative offset of the records to be concatenated" << std::endl;
     std::cerr << "    --verbose,-v: more output to stderr, shows examples with --help,-h" << std::endl;
     std::cerr << std::endl;
-    if( verbose ) { std::cerr << comma::csv::format::usage() << std::endl; }
     std::cerr << "operations options" << std::endl;
+    std::cerr << "    concatenate" << std::endl;
+    std::cerr << "       --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
+    std::cerr << "       --reverse; output records in reverse order (e.g. b,a)" << std::endl;
+    std::cerr << "       --sliding-window,-w; use a sliding window to group input records, see examples" << std::endl;
+    std::cerr << "    loop" << std::endl;
+    std::cerr << "       --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
+    std::cerr << "       --reverse; output records in reverse order (e.g. b,a)" << std::endl;
+    std::cerr << "    split" << std::endl;
+    std::cerr << "       --repeat; e.g: echo 0,1,2,3,4,5 | csv-shape split -n 2 will output: 0,1 and 2,3,4,5" << std::endl;
+    std::cerr << "                      echo 0,1,2,3,4,5 | csv-shape split -n 2 --repeat will output: 0,1, then 2,3, then 4,5" << std::endl;
+    std::cerr << "       --size,-n=<n>; e.g. echo 0,1,2,3,4,5| csv-shape split -n 3 will output" << std::endl;
+    std::cerr << "                      two lines: 0,1,2 and 3,4,5" << std::endl;
+    std::cerr << comma::csv::applications::shape::operations::sliding_window::usage( verbose ) << std::endl;
     std::cerr << std::endl;
-    std::cerr << "   common options" << std::endl;
-    std::cerr << "      --size,-n=<num>; number of input records in each grouping, range: 2 and above" << std::endl;
-    std::cerr << "      --step=<num>; default=1; relative offset of the records to be concatenated" << std::endl;
-    std::cerr << "      --expected-records; output the expected records for given --size and --step, and exit" << std::endl;
-    std::cerr << "   concatenate" << std::endl;
-    std::cerr << "      --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
-    std::cerr << "      --reverse; output records in reverse order (e.g. b,a)" << std::endl;
-    std::cerr << "      --sliding-window,-w; use a sliding window to group input records, see examples" << std::endl;
-    std::cerr << "   loop" << std::endl;
-    std::cerr << "      --bidirectional; output records in both directions (e.g. a,b; b,a)" << std::endl;
-    std::cerr << "      --reverse; output records in reverse order (e.g. b,a)" << std::endl;
-    std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << "examples" << std::endl;
     if( verbose )
     {
-        std::cerr << "examples" << std::endl;   
-        std::cerr << "   concatenate" << std::endl;
-        std::cerr << "      non overlaping groups:" << std::endl;
-        std::cerr << "          concatenate each group of 5 input records into one output record." << std::endl;
-        std::cerr << "          input records 1 to 5 create the first output record, input records 6-10 create the second output record, and so forth." << std::endl;
-        std::cerr << "              seq 1 15 | csv-shape concatenate -n 5" << std::endl;
-        std::cerr << "      overlapping groups:" << std::endl;
-        std::cerr << "          move a sliding window of size 5 along the input records, every time the sliding window moves, make an output record from window" << std::endl;
-        std::cerr << "          input records 1 to 5 create the first output record, input records 2 to 6 create the second record, input records 3 to 7 create the third record, and so forth" << std::endl;
-        std::cerr << "              seq 1 10 | csv-shape concatenate -n 5 --sliding-window" << std::endl;
+        std::cerr << R"(examples
+    concatenate
+        non-overlapping groups
+            concatenate each group of 5 input records into one output record.
+            input records 1 to 5 create the first output record, input records 6-10 create the second output record, and so forth.
+                seq 1 15 | csv-shape concatenate -n 5
+        overlapping groups
+            move a sliding window of size 5 along the input records, every time the sliding window moves, make an output record from window
+            input records 1 to 5 create the first output record, input records 2 to 6 create the second record, input records 3 to 7 create the third record, and so forth
+                seq 1 10 | csv-shape concatenate -n 5 --sliding-window
+    sliding-window
+        basics
+            for x in a b c d e f g h; do echo $x; done | csv-shape sliding-window --size 4
+            for x in a b c d e f g h; do echo $x; done | csv-shape sliding-window --size 4 --step 2
+        enumerate blocks of records
+            for x in a b c d e f g h; do echo $x; done | csv-shape sliding-window --size 4 --block
+            for x in a b c d e f g h; do echo $x; done | csv-shape sliding-window --size 4 --step 2 --block
+        incrementally output of the records 
+            for x in a b c d e f; do echo $x; done | csv-shape sliding-window --size 4 --incremental --block
+            for x in a b c d e f; do echo $x; done | csv-shape sliding-window --size 4 --incremental --block --step 2
+)";
     }
     else
     {
-        std::cerr << "examples: run csv-shape --help --verbose for more..." << std::endl;
+        std::cerr << "    run csv-shape --help --verbose for more..." << std::endl;
     }
+    std::cerr << std::endl;
     exit( 0 );
 }
 
 // There is nothing to do in this case - binary data
-static void simple_binary_pass_through(const comma::csv::format& f, bool flush=false)
+static void _binary_pass_through(const comma::csv::format& f, bool flush=false)
 {
     std::vector< char > buffer( f.size(), '\0' );
     while( std::cin.good() && !std::cin.eof() )
     {
-        if( std::cin.read( &buffer[0], buffer.size() ) ) {
+        if( std::cin.read( &buffer[0], buffer.size() ) )
+        {
             std::cout.write( &buffer[0], buffer.size() );
             if( flush ) { std::cout.flush(); }
         }
     }
 }
 
-bool is_binary;
+static bool is_binary;
 
-class concatenate_impl_
+class _concatenate
 {
 public:
-
-    concatenate_impl_() 
+    _concatenate()
         : use_sliding_window_(false)
         , bidirectional_(false)
         , reverse_(false)
@@ -133,13 +128,13 @@ class concatenate_impl_
         use_sliding_window_ = ( looping_ || options.exists("--sliding-window,-w") );
         reverse_ = options.exists("--reverse");
         bidirectional_ = options.exists("--bidirectional");
-        if( !use_sliding_window_ && is_binary ) { simple_binary_pass_through(csv.format(), csv.flush); return 0; };
+        if( !use_sliding_window_ && is_binary ) { _binary_pass_through( csv.format(), csv.flush ); return 0; };
         size_ = looping_ ? options.value("--size,-n", 2) : options.value< comma::uint32 >("--size,-n");
         step_ = options.value( "--step",1 );
         if( size_ < 2 ) { std::cerr <<  comma::verbose.app_name() << ": expected --size,-n= value to be greater than 1" << std::endl; return 1; }
         expected_records_ = step_ * ( size_ - 1 ) + 1;
         if( options.exists("--expected-records") ) { std::cout << expected_records_ << std::endl; return 0; };
-        comma::csv::input_stream< input_t > istream(std::cin, csv);
+        comma::csv::input_stream< input_t > istream( std::cin, csv );
         std::deque< std::string > deque;
         std::deque< std::string > first;
         bool has_block_ = csv.has_field( "block" );
@@ -152,7 +147,7 @@ class concatenate_impl_
                 if (!verify(deque)) { return 1; }
                 count_ = 0;
                 if ( looping_ ) { output_loop(deque, first, csv); }
-                deque.clear();  
+                deque.clear();
             }
             block_ = p->block;
             deque.push_back( istream.last() );
@@ -169,12 +164,9 @@ class concatenate_impl_
         return 0;
     }
 
-    struct input_t {
-        comma::uint32 block = 0;
-    };
+    struct input_t { comma::uint32 block = 0; };
 
 private:
-
     bool use_sliding_window_;
     bool bidirectional_;
     bool reverse_;
@@ -186,17 +178,17 @@ class concatenate_impl_
     comma::uint32 expected_records_;
 
     bool verify( const std::deque<std::string>& deque )
-    { 
+    {
         if( use_sliding_window_ && count_ < step_ * ( size_ - 1 ) + 1 )
-        { 
+        {
             std::cerr << comma::verbose.app_name() << ": --size,-n=" << size_ << ", --step=" << step_ << ", expected records count (" << step_ * ( size_ - 1 ) + 1
-                      << ") is bigger than total number of input records: " << count_ << std::endl; 
-            return false; 
+                      << ") is bigger than total number of input records: " << count_ << std::endl;
+            return false;
         }
-        if ( !use_sliding_window_ && !deque.empty() ) 
-        { 
-            std::cerr << comma::verbose.app_name() << ": error, leftover tail input record found: " << deque.size() << " lines." << std::endl; 
-            return false; 
+        if ( !use_sliding_window_ && !deque.empty() )
+        {
+            std::cerr << comma::verbose.app_name() << ": error, leftover tail input record found: " << deque.size() << " lines." << std::endl;
+            return false;
         }
         return true;
     }
@@ -211,7 +203,7 @@ class concatenate_impl_
             if(!is_binary){ std::cout << std::endl; }
             if (csv.flush) { std::cout.flush(); }
         }
-        if (bidirectional_ || reverse_ ) 
+        if (bidirectional_ || reverse_ )
         {
             std::cout.write( &( deque.back()[0] ), deque.back().size() );
             auto is = deque.crbegin(); while( ( is + 1 ) != deque.crend() ) { if(!is_binary){ std::cout << csv.delimiter; } is += step_; std::cout.write( &(*is)[0], is->size() ); }
@@ -234,31 +226,168 @@ class concatenate_impl_
 
 namespace comma { namespace visiting {
 
-template <> struct traits< concatenate_impl_::input_t >
+template <> struct traits< _concatenate::input_t > // visiting traits: expose input_t::block to visitors under the name "block"
 {
-    template < typename K, typename V > static void visit( const K&, const concatenate_impl_::input_t& p, V& v ) { v.apply("block", p.block); }
-    template < typename K, typename V > static void visit( const K&, concatenate_impl_::input_t& p, V& v ) { v.apply("block", p.block); }
+    template < typename K, typename V > static void visit( const K&, const _concatenate::input_t& p, V& v ) { v.apply("block", p.block); }
+    template < typename K, typename V > static void visit( const K&, _concatenate::input_t& p, V& v ) { v.apply("block", p.block); }
 };
 
 } } // namespace comma { namespace visiting {
 
+// repeat operation: write every input record --size,-n times to stdout; always returns 0
+static int _repeat( const comma::command_line_options& options, const comma::csv::options& csv )
+{
+    const unsigned int copies = options.value< unsigned int >( "--size,-n" );
+    if( !csv.binary() )
+    {
+        // ascii: line by line; lines that are empty after comma::strip() are skipped
+        while( std::cin.good() && !std::cin.eof() )
+        {
+            std::string line;
+            std::getline( std::cin, line );
+            if( comma::strip( line ).empty() ) { continue; }
+            for( unsigned int k = copies; k > 0; --k ) { std::cout << line << std::endl; }
+        }
+        return 0;
+    }
+    // binary: the stream is read as _concatenate::input_t only to get hold of the raw record buffer
+    comma::csv::input_stream< _concatenate::input_t > records( std::cin, csv );
+    while( records.ready() || ( std::cin.good() && !std::cin.eof() ) )
+    {
+        if( records.read() == nullptr ) { break; }
+        const auto raw = records.binary().last();
+        for( unsigned int k = copies; k > 0; --k ) { std::cout.write( raw, csv.format().size() ); }
+        if( csv.flush ) { std::cout.flush(); }
+    }
+    return 0;
+}
+
+// split operation: cut each ascii line after every --size,-n fields (first cut only unless --repeat); binary is passed through
+static int _split( const comma::command_line_options& options, const comma::csv::options& csv )
+{
+    if( csv.binary() ) { _binary_pass_through( csv.format(), csv.flush ); return 0; }
+    const unsigned int fields_per_chunk = options.value< unsigned int >( "--size,-n" );
+    const bool keep_splitting = options.exists( "--repeat" );
+    while( std::cin.good() && !std::cin.eof() )
+    {
+        std::string line;
+        std::getline( std::cin, line );
+        const auto& stripped = comma::strip( line );
+        if( stripped.empty() ) { continue; }
+        unsigned int begin = 0, seen = 0; // start of the current chunk; delimiters met since then
+        for( unsigned int i = 0; i < stripped.size(); ++i )
+        {
+            if( stripped[i] == csv.delimiter ) { ++seen; }
+            if( seen < fields_per_chunk ) { continue; }
+            std::cout << stripped.substr( begin, i - begin ) << std::endl;
+            begin = i + 1; seen = 0;
+            if( !keep_splitting ) { break; }
+        }
+        if( begin < stripped.size() ) { std::cout << stripped.substr( begin ) << std::endl; } // whatever is left after the last cut
+    }
+    return 0;
+}
+
+namespace comma { namespace csv { namespace applications { namespace shape { namespace operations {
+
+namespace sliding_window {
+
+std::string usage( bool ) // help text for the sliding-window operation; the verbosity flag is ignored
+{
+    return R"(    sliding-window
+        --incremental; output first block incrementally: first record, then first and second, etc
+        --prepend-block,--block; prepend each record with block number, ui if binary output
+        --size=<n>; number of input records in each grouping
+        --step,--stride=<n>; default=1; sliding window step; cannot be greater than --size)";
+}
+
+// sliding-window: group input records into windows of --size records, advancing by --step,--stride records;
+// the first window is output record by record (or cumulatively with --incremental), later windows in full;
+// with --prepend-block,--block every output record is prefixed with the current block counter; returns 0
+static int run( const comma::command_line_options& options, comma::csv::options& csv )
+{
+    const unsigned int size = options.value< unsigned int >( "--size" );
+    const unsigned int stride = options.value< unsigned int >( "--step,--stride", 1 );
+    COMMA_ASSERT( size > 0 && stride > 0, "expected positive size and stride; got: size: " << size << " stride: " << stride ); // stride 0 would make 'deque.size() % stride' below a division by zero
+    COMMA_ASSERT( stride <= size, "stride greater than size currently not supported, just ask; got: size: " << size << " stride: " << stride );
+    std::deque< std::string > deque;
+    std::string record = csv.binary() ? std::string( csv.format().size(), 0 ) : std::string();
+    bool incremental = options.exists( "--incremental" );
+    bool prepend_block = options.exists( "--prepend-block,--block" );
+    std::uint32_t block = 0;
+    auto output_record = [&]( const std::string& record )
+    {
+        if( prepend_block )
+        {
+            if( csv.binary() ) { std::cout.write( reinterpret_cast< const char* >( &block ), sizeof( std::uint32_t ) ); }
+            else { std::cout << block << csv.delimiter; }
+        }
+        std::cout.write( &record[0], record.size() );
+        if( !csv.binary() ) { std::cout << std::endl; }
+    };
+    auto output_all = [&]() // output the whole window, then move on to the next block number
+    {
+        for( const auto& r: deque ) { output_record( r ); }
+        ++block;
+    };
+    while( std::cin.good() && !std::cin.eof() )
+    {
+        if( csv.binary() )
+        {
+            std::cin.read( &record[0], record.size() );
+            if( std::cin.gcount() == 0 ) { break; }
+            COMMA_ASSERT( std::cin.gcount() == int( record.size() ), "expected " << record.size() << " bytes; got only: " << std::cin.gcount() );
+        }
+        else
+        {
+            std::getline( std::cin, record );
+            if( comma::strip( record ).empty() ) { continue; }
+        }
+        deque.push_back( record );
+        if( deque.size() < ( size + stride ) )
+        {
+            if( deque.size() > size ) { continue; } // past the current window, but not enough records yet for the next one
+            if( incremental )
+            {
+                if( deque.size() % stride == 0 ) { output_all(); }
+            }
+            else
+            {
+                output_record( record );
+                if( deque.size() == size ) { ++block; } // quick and dirty
+            }
+        }
+        else
+        {
+            while( deque.size() > size ) { deque.pop_front(); } // quick and dirty
+            output_all();
+        }
+        if( csv.flush ) { std::cout.flush(); }
+    }
+    return 0;
+}
+
+} // namespace sliding_window {
+
+} } } } } // namespace comma { namespace csv { namespace applications { namespace shape { namespace operations {
+
 int main( int ac, char** av )
 {
     try
     {
         comma::command_line_options options( ac, av, usage );
-        std::vector< std::string > unnamed = options.unnamed( "--size,-n,--sliding-window,-w,--step,--verbose,-v", "-.*" );
+        std::vector< std::string > unnamed = options.unnamed( "--prepend-block,--block,--expected-records,--incremental,--repeat,--sliding-window,-w,--verbose,-v", "-.*" );
         comma::csv::options csv( options );
-        if (csv.fields.empty()) { csv.fields="a"; }
+        csv.full_xpath = false;
+        if( csv.fields.empty() ) { csv.fields="a"; }
         is_binary = csv.binary();
         if( unnamed.empty() ) { std::cerr << comma::verbose.app_name() << ": please specify operations" << std::endl; exit( 1 ); }
         std::string operation = unnamed[0];
-        if( operation == "concatenate" || operation == "loop" )
-        {
-            return concatenate_impl_().run(options, csv);
-        }
-        std::cerr << comma::verbose.app_name() << ": operation not supported or unknown: '" << operation << '\'' << std::endl;
-        return 1;
+        if( operation == "concatenate" || operation == "loop" ) { return _concatenate().run( options, csv ); }
+        if( operation == "repeat" ) { return _repeat( options, csv ); }
+        if( operation == "sliding-window" ) { return comma::csv::applications::shape::operations::sliding_window::run( options, csv ); }
+        if( operation == "split" ) { return _split( options, csv ); }
+        comma::say() << ": expected operation; got: '" << operation << "'" << std::endl;
     }
     catch( std::exception& ex ) { std::cerr << "csv-shape: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-shape: unknown exception" << std::endl; }
diff --git a/csv/applications/csv-shuffle.cpp b/csv/applications/csv-shuffle.cpp
index 556514099..5589ab800 100644
--- a/csv/applications/csv-shuffle.cpp
+++ b/csv/applications/csv-shuffle.cpp
@@ -1,31 +1,7 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2020 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
 
 #ifdef WIN32
 #include <fcntl.h>
@@ -35,169 +11,108 @@
 #include <iostream>
 #include <vector>
 #include "../../application/command_line_options.h"
+#include "../../base/exception.h"
 #include "../../csv/options.h"
 #include "../../string/string.h"
 
 static void usage( bool verbose )
 {
-    std::cerr << "perform operations on csv columns" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: cat data.csv | csv-shuffle <options> > shuffled.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
-    std::cerr << "    --fields,-f,--input-fields <fields>: input fields" << std::endl;
-    std::cerr << "    --output-fields,--output,-o <fields>: output fields" << std::endl;
-    std::cerr << "        semantics of outputting trailing fields:" << std::endl;
-    std::cerr << "            \"--output-fields=x,y\": do not output trailing fields" << std::endl;
-    std::cerr << "            \"--output-fields=x,y...\": output trailing fields" << std::endl;
-    std::cerr << "            see example below" << std::endl;
-    std::cerr << "    --verbose,-v: more output" << std::endl;
-    if( verbose ) { std::cerr << std::endl << comma::csv::options::usage() << std::endl; }
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << "    operations (for now): append, remove, swap" << std::endl;
-    std::cerr << "    semantics:" << std::endl;
-    std::cerr << "        remove:" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=x,z" << std::endl;
-    std::cerr << "        append:" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=x,y,z,x" << std::endl;
-    std::cerr << "        swap:" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=y,z,x" << std::endl;
-    std::cerr << "        remove x, swap y,z, append z two times:" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y,z --output-fields=z,y,z,z" << std::endl;
-    std::cerr << "        do not output trailing fields: swap x and y, do not output z" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y --output-fields=y,x" << std::endl;
-    std::cerr << "        output trailing fields: swap x and y, output z" << std::endl;
-    std::cerr << "            cat xyz.csv | csv-shuffle --fields=x,y --output-fields=y,x,..." << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
-}
+    std::cerr << R"(
+swap, remove, or duplicate csv fields
 
-struct field
-{
-    std::string name;
-    unsigned int index;
-    unsigned int offset;
-    boost::optional< unsigned int > input_index;
-    unsigned int input_offset;
-    unsigned int size;
-    field( const std::string& name, unsigned int index ) : name( name ), index( index ) {}
-};
+usage: cat data.csv | csv-shuffle <options> > shuffled.csv
+
+options
+    --drop-empty,-e; e.g. two following commands are equivalent
+                     csv-shuffle --fields a,b,,,c --drop-empty
+                     csv-shuffle --fields a,b,,,c --output-fields a,b,c
+    --fields,-f,--input-fields=<fields>; input fields
+    --output-fields,--output,-o=<fields>; output fields, if not specified,
+                                          will be set to --input-fields,
+                                          which would chop off trailing
+                                          input fields see also --drop-empty
+    --verbose,-v: more verbose output
+)" << std::endl;
+    std::cerr << "csv options" << std::endl; // generic csv options come from the library, more of them if verbose
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << R"(examples
+    remove
+        echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=x,z
+    append
+        echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=x,y,z,x
+    swap
+        echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=y,z,x
+    remove x, swap y,z, append z two times
+        echo 0,1,2 | csv-shuffle --fields=x,y,z --output-fields=z,y,z,z
+)" << std::endl;
+    exit( 0 ); // asking for help is not an error
+}
 
 int main( int ac, char** av )
 {
     try
     {
-        comma::command_line_options options( ac, av );
-        bool verbose = options.exists( "--verbose,-v" );
-        if( options.exists( "--help,-h" ) ) { usage( verbose ); }
-        comma::csv::options csv( options );
-        std::string f = options.value< std::string >( "--input-fields", "" );
-        if( !f.empty() ) { csv.fields = f; }
-        std::vector< std::string > input_fields = comma::split( csv.fields, ',' );
-        std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o" ), ',' );
-        bool output_trailing_fields = output_fields.back() == "...";
-        if( output_fields.back() == "..." ) { output_fields.erase( output_fields.end() - 1 ); }
-        std::vector< field > fields;
-        for( unsigned int i = 0; i < output_fields.size(); ++i )
+        comma::command_line_options options( ac, av, usage );
+        comma::csv::options csv( options, options.value< std::string >( "--fields,-f,--input-fields" ) );
+        std::vector< std::string > input_fields = comma::split( csv.fields, ',', true );
+        std::vector< std::string > output_fields = comma::split( options.value< std::string >( "--output-fields,--output,-o", csv.fields ), ',', true );
+        if( options.exists( "--drop-empty,-e" ) )
         {
-            if( output_fields[i].empty() ) { continue; }
-            fields.push_back( field( output_fields[i], i ) );
+            std::vector< std::string > v;
+            for( auto s: output_fields ) { if( !s.empty() ) { v.push_back( s ); } }
+            output_fields = v;
         }
-        if( fields.empty() ) { std::cerr << "csv-shuffle: please define at least one output field" << std::endl; return 1; }
-        for( unsigned int i = 0; i < input_fields.size(); ++i )
+        COMMA_ASSERT_BRIEF( !output_fields.empty(), "please specify --output-fields or --drop-empty" );
+        COMMA_ASSERT_BRIEF( output_fields.back() != "...", "support for trailing fields has been removed for now; please specify input/output fields explicitly" );
+        auto find_ = [&]( const std::string& n )->unsigned int
         {
-            for( unsigned int j = 0; j < fields.size(); ++j )
-            {
-                if( fields[j].name != input_fields[i] ) { continue; }
-                fields[j].input_index = i;
-                if( csv.binary() )
-                {
-                    fields[j].input_offset = csv.format().offset( i ).offset;
-                    fields[j].size = csv.format().offset( i ).size;
-                }
-            }
-        }
-        for( unsigned int i = 0; i < fields.size(); ++i )
-        {
-            if( !fields[i].input_index ) { std::cerr << "csv-shuffle: \"" << fields[i].name << "\" not found in input fields " << csv.fields << std::endl; return 1; }
-        }
+            COMMA_ASSERT_BRIEF( !n.empty(), "got empty fields in output fields '" << comma::join( output_fields, ',' ) << "'; you may need to use --drop-empty" );
+            unsigned int j = 0;
+            for( ; j < input_fields.size(); ++j ) { if( input_fields[j] == n ) { return j; } }
+            COMMA_THROW( comma::exception, "output field '" << n << "' not found in input fields '" << csv.fields << "'" );
+        };
         if( csv.binary() )
         {
+            std::vector< std::pair< unsigned int, unsigned int > > offsets;
+            for( unsigned int i = 0; i < output_fields.size(); )
+            {
+                unsigned int j = find_( output_fields[i] );
+                offsets.push_back( std::make_pair( csv.format().offset( j ).offset, 0 ) );
+                for( ; i < output_fields.size() && j < input_fields.size() && input_fields[j] == output_fields[i]; ++i, ++j ) { offsets.back().second += csv.format().offset( j ).size; }
+            }
             #ifdef WIN32
             _setmode( _fileno( stdin ), _O_BINARY );
             _setmode( _fileno( stdout ), _O_BINARY );
             #endif
             std::vector< char > buf( csv.format().size() );
-            std::vector< comma::csv::format::element > elements;
-            elements.reserve( csv.format().count() ); // quick and dirty, can be really wasteful on large things like images
-            for( unsigned int i = 0; i < elements.capacity(); ++i ) { elements.push_back( csv.format().offset( i ) ); }
+            if( !csv.flush ) { std::cin.tie( NULL ); } // quick and dirty; std::cin is tied to std::cout by default, which is thread-unsafe now
             while( std::cin.good() && !std::cin.eof() )
             {
-                // todo: quick and dirty; if performance is an issue, you could read more than
-                // one record every time see comma::csv::binary_input_stream::read() for reference
                 std::cin.read( &buf[0], csv.format().size() );
                 if( std::cin.gcount() == 0 ) { continue; }
-                if( std::cin.gcount() < int( csv.format().size() ) ) { std::cerr << "csv-shuffle: expected " << csv.format().size() << " bytes, got only " << std::cin.gcount() << std::endl; return 1; }
-                unsigned int previous_index = 0;
-                for( unsigned int i = 0; i < fields.size(); ++i ) // quick and dirty
-                {
-                    for( unsigned int k = previous_index; k < fields[i].index && k < elements.size(); ++k )
-                    {
-                        std::cout.write( &buf[ elements[k].offset ], elements[k].size );
-                    }
-                    std::cout.write( &buf[ fields[i].input_offset ], fields[i].size );
-                    previous_index = fields[i].index + 1;
-                }
-                //std::cerr << "--> previous_index: " << previous_index << " elements.size(): " << elements.size() << std::endl;
-                for( unsigned int k = previous_index; output_trailing_fields && k < elements.size(); ++k )
-                {
-                    std::cout.write( &buf[ elements[k].offset ], elements[k].size );
-                }
-                std::cout.flush(); // todo: flushing too often?
+                COMMA_ASSERT_BRIEF( std::cin.gcount() >= int( csv.format().size() ), "expected " << csv.format().size() << " bytes, got only " << std::cin.gcount() );
+                for( const auto& offset: offsets ) { std::cout.write( &buf[ offset.first ], offset.second ); }
+                if( csv.flush ) { std::cout.flush(); }
             }
+            return 0;
         }
-        else
+        std::vector< unsigned int > indices;
+        for( const auto& field: output_fields ) { indices.push_back( find_( field ) ); }
+        while( std::cin.good() && !std::cin.eof() )
         {
-            while( std::cin.good() && !std::cin.eof() )
-            {
-                std::string line;
-                std::getline( std::cin, line );
-                if( !line.empty() && *line.rbegin() == '\r' ) { line = line.substr( 0, line.length() - 1 ); } // windows... sigh...
-                if( line.empty() ) { continue; }
-                std::vector< std::string > v = comma::split( line, csv.delimiter );
-                std::string delimiter;
-                unsigned int previous_index = 0;
-                for( unsigned int i = 0; i < fields.size(); ++i ) // quick and dirty
-                {
-                    for( unsigned int k = previous_index; k < fields[i].index && k < v.size(); ++k )
-                    {
-                        std::cout << delimiter << v[k];
-                        delimiter = csv.delimiter;
-                    }
-                    previous_index = fields[i].index + 1;
-                    std::cout << delimiter;
-                    if ( *fields[i].input_index < v.size() ) { std::cout << v[ *fields[i].input_index ]; }
-                    delimiter = csv.delimiter;
-                }
-                for( unsigned int k = previous_index; output_trailing_fields && k < v.size(); ++k )
-                {
-                    std::cout << delimiter << v[k];
-                    delimiter = csv.delimiter;
-                }
-                std::cout << std::endl;
-            }
+            std::string line;
+            std::getline( std::cin, line );
+            if( !line.empty() && *line.rbegin() == '\r' ) { line = line.substr( 0, line.length() - 1 ); } // windows... sigh...
+            if( line.empty() ) { continue; }
+            const auto& v = comma::split( line, csv.delimiter );
+            COMMA_ASSERT_BRIEF( v.size() >= input_fields.size(), "expected at least " << input_fields.size() << " fields, got only " << v.size() << " in record \"" << line << "\"" );
+            std::string delimiter;
+            for( auto index: indices ) { std::cout << delimiter << v[index]; delimiter = csv.delimiter; }
+            std::cout << std::endl;
         }
         return 0;
     }
-    catch( std::exception& ex )
-    {
-        std::cerr << "csv-shuffle: " << ex.what() << std::endl;
-    }
-    catch( ... )
-    {
-        std::cerr << "csv-shuffle: unknown exception" << std::endl;
-    }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }
diff --git a/csv/applications/csv-size.cpp b/csv/applications/csv-size.cpp
index 13ef66590..d37a6cb32 100644
--- a/csv/applications/csv-size.cpp
+++ b/csv/applications/csv-size.cpp
@@ -27,21 +27,21 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #include <iostream>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../csv/format.h"
 
 using namespace comma;
 
-static void usage()
+static void usage( bool verbose = false )
 {
     std::cerr << std::endl;
     std::cerr << "a convenience utility: output to stdout size of given binary format" << std::endl;
     std::cerr << std::endl;
+    std::cerr << "DEPRECATED: use csv-format size" << std::endl;
+    std::cerr << std::endl;
     std::cerr << "Usage: csv-size <format> [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
@@ -52,22 +52,21 @@ static void usage()
     std::cerr << "      csv-size 2d will output 16" << std::endl;
     std::cerr << "      csv-size 2d --count will output 2" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( -1 );
+    exit( 0 );
 }
 
 int main( int ac, char** av )
 {
     try
     {
-        command_line_options options( ac, av );
-        if( ac < 2 || options.exists( "--help" ) || options.exists( "-h" ) ) { usage(); }
+        std::cerr << "csv-size: DEPRECATED, use echo <format> | csv-format size" << std::endl;
+        command_line_options options( ac, av, usage );
+        if( options.unnamed( "--count,-c", "" ).empty() ) { usage(); } // no <format> given (e.g. 'csv-size --count'): show help rather than index an empty vector below
         comma::csv::format format( options.unnamed( "--count,-c", "" )[0] );
         std::cout << ( options.exists( "--count,-c" ) ? format.count() : format.size() ) << std::endl;
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << "csv-size: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-size: unknown exception" << std::endl; }
-    usage();
+    return 1;
 }
diff --git a/csv/applications/csv-sort.cpp b/csv/applications/csv-sort.cpp
index 18cfffbec..727f29de5 100644
--- a/csv/applications/csv-sort.cpp
+++ b/csv/applications/csv-sort.cpp
@@ -1,38 +1,14 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @authors matthew imhoff, dewey nguyen, vsevolod vlaskine
 
+#include <algorithm>
 #include <string.h>
 #include <deque>
 #include <iostream>
 #include <map>
+#include <memory>
+#include <random>
 #include <sstream>
 #include <string>
 #include <vector>
@@ -40,9 +16,9 @@
 #include <boost/unordered_set.hpp>
 #include <boost/lexical_cast.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
+#include "../../csv/block.h"
 #include "../../csv/stream.h"
 #include "../../csv/traits.h"
 #include "../../io/stream.h"
@@ -61,19 +37,23 @@ static void usage( bool more )
     std::cerr << std::endl;
     std::cerr << "Options:" << std::endl;
     std::cerr << "    --help,-h: help; --help --verbose: more help" << std::endl;
+    std::cerr << "    --block-size,--size=<n>; number of input records in the block assuming all blocks are of the same size" << std::endl;
     std::cerr << "    --discard-out-of-order,--discard-unsorted: instead of sorting, discard records out of order" << std::endl;
     std::cerr << "    --first: first line matching given keys; first line in the block, if block field present; no sorting will be done; if sorting required, use unique instead" << std::endl;
     std::cerr << "           fields" << std::endl;
     std::cerr << "               id: if present, multiple id fields accepted; output first record for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;
     std::cerr << "               block: if present; output minimum for each contiguous block" << std::endl;
-    std::cerr << "    --min: output only record(s) with minimum value for a given field." << std::endl;
+    std::cerr << "    --last: to be implemented: last line matching given keys; last line in the block, if block field present; no sorting will be done; if sorting required, use unique instead" << std::endl;
+    std::cerr << "    --min: output only record(s) with minimum value for a given field" << std::endl;
     std::cerr << "           fields" << std::endl;
     std::cerr << "               id: if present, multiple id fields accepted; output minimum for each set of ids in a given block; e.g. --fields=id,a,,id" << std::endl;
     std::cerr << "               block: if present; output minimum for each contiguous block" << std::endl;
     std::cerr << "    --max: output record(s) with maximum value, same semantics as --min" << std::endl;
     std::cerr << "           --min and --max may be used together." << std::endl;
     std::cerr << "    --numeric-keys-are-floats,--floats; in ascii, if --format not present, assume that numeric fields are floating point numbers" << std::endl;
-    std::cerr << "    --order <fields>: order in which to sort fields; default is input field order" << std::endl;
+    std::cerr << "    --order=<fields>: order in which to sort fields; default is input field order" << std::endl;
+    std::cerr << "    --random: output input records in pseudo-random order" << std::endl;
+    std::cerr << "    --random-seed,--seed=[<int>]; random seed for --random" << std::endl;
     std::cerr << "    --reverse,--descending,-r: sort in reverse order" << std::endl;
     std::cerr << "    --sliding-window,--window=<size>: sort last <size> entries" << std::endl;
     std::cerr << "    --string,-s: keys are strings; a quick and dirty option to support strings" << std::endl;
@@ -105,7 +85,6 @@ static void usage( bool more )
     std::cerr << "        using id" << std::endl;
     std::cerr << "            ( echo 1,a,2; echo 2,a,2; echo 3,b,3; echo 5,b,7; echo 3,b,9 ) | csv-sort --max --min --fields=,id,a" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     if( more )
     {
@@ -120,21 +99,17 @@ static bool verbose;
 static comma::csv::options csv;
 static bool is_min = false;
 static bool is_max = false;
+static comma::csv::block_counter block;
 
 struct ordering_t
 {
-    enum types {
-        str_type,
-        long_type,
-        double_type,
-        time_type
-    };
+    enum types { str_type, long_type, double_type, time_type };
     
-    types type;
-    int   index;
+    types type{double_type};
+    int index{0};
 };
 
-std::vector< ordering_t > ordering;
+static std::vector< ordering_t > ordering;
 
 struct input_t
 {
@@ -144,20 +119,12 @@ struct input_t
     {
         for( std::size_t i = 0; i < ordering.size(); ++i )
         { 
-            switch (ordering[i].type)
+            switch( ordering[i].type )
             {
-                case ordering_t::str_type:
-                    if (keys.strings[ordering[i].index] != rhs.keys.strings[ ordering[i].index ]) { return false; }
-                    break;
-                case ordering_t::long_type:
-                    if (keys.longs[ordering[i].index] != rhs.keys.longs[ ordering[i].index ]) { return false; }
-                    break;
-                case ordering_t::double_type:
-                    if (keys.doubles[ordering[i].index] != rhs.keys.doubles[ ordering[i].index ]) { return false; }
-                    break;
-                case ordering_t::time_type:
-                    if (keys.time[ordering[i].index] != rhs.keys.time[ ordering[i].index ]) { return false; }
-                    break;
+                case ordering_t::str_type: if (keys.strings[ordering[i].index] != rhs.keys.strings[ ordering[i].index ]) { return false; } break;
+                case ordering_t::long_type: if (keys.longs[ordering[i].index] != rhs.keys.longs[ ordering[i].index ]) { return false; } break;
+                case ordering_t::double_type: if (keys.doubles[ordering[i].index] != rhs.keys.doubles[ ordering[i].index ]) { return false; } break;
+                case ordering_t::time_type: if (keys.time[ordering[i].index] != rhs.keys.time[ ordering[i].index ]) { return false; } break;
             }
         }
         return true;
@@ -191,20 +158,17 @@ struct input_t
     }
     
     typedef std::map< input_t, std::vector< std::string > > map;
-    
 };
 
 struct input_with_block : public input_t
 {
-    comma::uint32 block;
-    input_with_block() : block( 0 ) {}
+    comma::uint32 block{0};
 };
 
 struct input_with_ids_t : public input_t
 {
     comma::csv::impl::unstructured ids;
-    comma::uint32 block;
-    input_with_ids_t() : block( 0 ) {}
+    comma::uint32 block{0};
 };
 
 namespace comma { namespace visiting {
@@ -278,8 +242,9 @@ static int handle_discard_out_of_order( comma::csv::input_stream< input_with_blo
     {
         const input_with_block* p = istream.read();
         if( !p ) { break; }
-        if( last && p->block == last->block && ( ( reverse && *last < *p ) || ( !reverse && *p < *last ) ) ) { continue; }
+        if( last && block == *p && ( reverse ? *last < *p : *p < *last ) ) { continue; }
         last = *p;
+        block.update( *p );
         output_last_( istream );
     }
     return 0;
@@ -290,11 +255,10 @@ static int handle_first( comma::csv::input_stream< input_with_ids_t >& istream,
     typedef boost::unordered_set< comma::csv::impl::unstructured, comma::csv::impl::unstructured::hash > set_t;
     typedef boost::unordered_map< comma::csv::impl::unstructured, set_t, comma::csv::impl::unstructured::hash > map_t;
     map_t keys;
-    comma::uint32 block = 0;
     if( !first_line.empty() )
     { 
         input_with_ids_t input = comma::csv::ascii< input_with_ids_t >( csv, default_input ).get( first_line );
-        block = input.block;
+        block.update( input );
         keys[ input.ids ].insert( input.keys );
         std::cout << first_line << std::endl;
     }
@@ -302,23 +266,45 @@ static int handle_first( comma::csv::input_stream< input_with_ids_t >& istream,
     {
         const input_with_ids_t* p = istream.read();
         if( !p ) { break; }
-        if( p->block != block ) { block = p->block; keys.clear(); }
+        if( block.ready( *p ) ) { block.update( *p ); keys.clear(); }
         if( keys[ p->ids ].insert( p->keys ).second ) { output_last_( istream ); }
     }
     return 0;
 }
 
+// todo?
+// static int handle_last( comma::csv::input_stream< input_with_ids_t >& istream, const std::string& first_line, const input_with_ids_t& default_input )
+// {
+//     typedef boost::unordered_set< comma::csv::impl::unstructured, comma::csv::impl::unstructured::hash > set_t;
+//     typedef boost::unordered_map< comma::csv::impl::unstructured, set_t, comma::csv::impl::unstructured::hash > map_t;
+//     map_t keys;
+//     if( !first_line.empty() )
+//     { 
+//         input_with_ids_t input = comma::csv::ascii< input_with_ids_t >( csv, default_input ).get( first_line );
+//         block.update( input );
+//         keys[ input.ids ].insert( input.keys );
+//         //std::cout << first_line << std::endl;
+//     }
+//     while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
+//     {
+//         const input_with_ids_t* p = istream.read();
+//         if( !p ) { break; }
+//         if( block != *p ) { block.update( *p ); keys.clear(); }
+//         if( keys[ p->ids ].insert( p->keys ).second ) { output_last_( istream ); }
+//     }
+//     return 0;
+// }
+
 static int handle_sliding_window( comma::csv::input_stream< input_with_block >& istream, const std::string& first_line, const input_with_block& default_input, bool reverse, unsigned int sliding_window )
 {
     if( sliding_window < 2 ) { std::cerr << "csv-sort: expected sliding window greater than 1, got: " << sliding_window << std::endl; return 1; }
-    comma::uint32 block = 0;
     unsigned int count = 0;
     typedef std::map< input_t, std::deque< std::string > > map_t;
     map_t map;
     if( !first_line.empty() )
     { 
         input_with_block input = comma::csv::ascii< input_with_block >( csv, default_input ).get( first_line );
-        block = input.block;
+        block.update( input );
         map_t::mapped_type& d = map[ input ];
         d.push_back( first_line );
         ++count;
@@ -326,14 +312,14 @@ static int handle_sliding_window( comma::csv::input_stream< input_with_block >&
     while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) || !map.empty() )
     {
         const input_with_block* p = istream.read();
-        if( !p || p->block != block )
+        if( !p || block != *p )
         {
             if( reverse ) { output_( map.rbegin(), map.rend() ); } else { output_( map.begin(), map.end() ); }
             map.clear();
             count = 0;
         }
         if( !p ) { break; }
-        block = p->block;
+        block.update( *p );
         map_t::mapped_type& d = map[ *p ];
         if( istream.is_binary() )
         {
@@ -391,28 +377,20 @@ std::vector< comma::csv::impl::unstructured > input_order;
 
 void output_current_block( const limit_map_t& min, const limit_map_t& max )
 {
-    for( std::size_t i=0; i<input_order.size(); ++i )
+    for( std::size_t i = 0; i < input_order.size(); ++i )
     {
         const comma::csv::impl::unstructured& ids = input_order[i];
-        
         if( is_min )
         {
-            const limit_data_t& data = min.at(ids);
-            for ( std::size_t i=0; i<data.records.size(); ++i) {
-                std::cout.write( &( data.records[i][0] ), csv.binary() ? csv.format().size() : data.records[i].length() );
-            }
+            const limit_data_t& data = min.at( ids );
+            for( std::size_t i = 0; i < data.records.size(); ++i ) { std::cout.write( &( data.records[i][0] ), csv.binary() ? csv.format().size() : data.records[i].length() ); }
         }
-        
-        if( is_min && is_max && is_same_map[ ids ] ) { continue; }
-        
+        if( is_min && is_max && is_same_map[ids] ) { continue; }
         if( is_max )
         {
-            const limit_data_t& data = max.at(ids);
-            for ( std::size_t i=0; i<data.records.size(); ++i) {
-                std::cout.write( &( data.records[i][0] ), csv.binary() ? csv.format().size() : data.records[i].length() );
-            }
+            const limit_data_t& data = max.at( ids );
+            for( std::size_t i = 0; i < data.records.size(); ++i ) { std::cout.write( &( data.records[i][0] ), csv.binary() ? csv.format().size() : data.records[i].length() ); }
         }
-        
         if( csv.flush ) { std::cout.flush(); }
     }
 }
@@ -464,10 +442,8 @@ int handle_operations_with_ids( const comma::command_line_options& options )
     is_max = options.exists( "--max" );
     if( keys_size != 1 ) { std::cerr << "csv-sort: error, please specify exactly one field for --min/--max operation." << std::endl; return 1; }
     if ( verbose ) { std::cerr << "csv-sort: minimum mode: " << ( is_min ) << ", maximum mode: " << is_max  << std::endl; }
-    comma::uint32 block = 0;    // previous block number, use default of 0
     limit_map_t min_map;
     limit_map_t max_map;
-    
     bool first = true;
     if (!first_line.empty()) 
     { 
@@ -479,7 +455,7 @@ int handle_operations_with_ids( const comma::command_line_options& options )
         max_map[input.ids] = data;
         is_same_map[input.ids] = true;
         input_order.push_back( input.ids );
-        block = input.block;
+        block.update( input );
         first = false;
     }
     while( stdin_stream.ready() || ( std::cin.good() && !std::cin.eof() ) )
@@ -487,38 +463,32 @@ int handle_operations_with_ids( const comma::command_line_options& options )
         const input_with_ids_t* p = stdin_stream.read();
         if( !p ) { break; }
 //         std::cerr  << "p: " << comma::join( stdin_stream.ascii().last(), csv.delimiter ) << " - " << p->keys.longs[0] << std::endl;
-        
         if( first )
         {
             limit_data_t& data = min_map[p->ids];
             data.keys = *p;
             data.add_current_record( stdin_stream );
-            
             max_map[p->ids] = data;
             is_same_map[p->ids] = true;
             input_order.push_back( p->ids );
-            
-            block = p->block;
+            block.update( *p );
             first = false;
         }
-        else if( p->block != block )
+        else if( block != *p )
         {
             // Dump and clear previous
             output_current_block( min_map, max_map );
             min_map.clear();
             max_map.clear();
             input_order.clear();
-            
             // Set the same record for both min and max, it's a new block, new IDs
             limit_data_t& data = min_map[p->ids];
             data.keys = *p;
             data.add_current_record( stdin_stream );
-            
             max_map[p->ids] = data;
             is_same_map[p->ids] = true;
             input_order.push_back( p->ids );
-            
-            block = p->block;
+            block.update( *p );
         }
         else    /// The same block and not first record
         {
@@ -560,13 +530,11 @@ int handle_operations_with_ids( const comma::command_line_options& options )
                 }
                 else
                 {
-//                     std::cerr  << "found ids: " << p->ids.strings[0] << std::endl;
                     limit_data_t& data = iter->second;
                     if( *p < data.keys ) {}
                     else if( data.keys == *p ) { data.add_current_record( stdin_stream ); } //  std::cerr  << "equals " << std::endl; } // Else If equals then append
                     else
                     {
-//                         std::cerr  << "new max: " << p->ids.strings[0] << " " << p->keys.longs[0] << " " << data.keys.keys.longs[0] << std::endl;
                         data.keys = *p;
                         data.records.clear();
                         data.add_current_record( stdin_stream );
@@ -577,24 +545,94 @@ int handle_operations_with_ids( const comma::command_line_options& options )
         }
         
     }
-    
     output_current_block( min_map, max_map );
-    
+    return 0;
+}
+
+static int random( const comma::command_line_options& options ) // --random: output the input records in pseudo-random order; returns 0 on success, 1 on a truncated binary record
+{
+    auto seed = options.optional< int >( "--random-seed,--seed" );
+    std::default_random_engine generator = seed ? std::default_random_engine( *seed ) : std::default_random_engine(); // without --seed the engine is default-constructed
+    std::deque< std::string > records;
+    if( csv.has_field( "block" ) )
+    {
+        comma::csv::input_stream< input_with_block > is( std::cin, csv );
+        while( is.ready() || std::cin.good() )
+        {
+            const input_with_block* p = is.read();
+            if( !p || block != *p ) // end of input or the block counter reports a change: shuffle and flush what was accumulated
+            {
+                // records may be empty here (e.g. empty input); std::shuffle takes the generator directly, so no distribution object is constructed
+                std::shuffle( records.begin(), records.end(), generator );
+                for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
+                if( csv.flush ) { std::cout.flush(); }
+                records.clear();
+                if( p ) { block.update( *p ); }
+            }
+            if( !p ) { break; }
+            if( csv.binary() )
+            {
+                records.push_back( std::string() );
+                records.back().resize( csv.format().size() );
+                std::memcpy( &records.back()[0], is.binary().last(), csv.format().size() );
+            }
+            else
+            {
+                records.push_back( comma::join( is.ascii().last(), csv.delimiter ) + "\n" );
+            }
+        }
+    }
+    else
+    {
+        // todo: quick and dirty, code duplication
+        // todo: implement --sliding-window
+        if( csv.binary() )
+        {
+            std::string s( csv.format().size(), 0 );
+            while( std::cin.good() )
+            {
+                std::cin.read( &s[0], s.size() );
+                if( std::cin.gcount() == 0 ) { break; }
+                if( std::cin.gcount() != int( s.size() ) ) { std::cerr << "csv-sort: --random: expected " << s.size() << " bytes; got " << std::cin.gcount() << std::endl; return 1; }
+                records.push_back( std::string() );
+                records.back().resize( csv.format().size() );
+                std::memcpy( &records.back()[0], &s[0], csv.format().size() );
+            }
+        }
+        else
+        {
+            while( std::cin.good() )
+            {
+                std::string s;
+                std::getline( std::cin, s );
+                if( !s.empty() ) { records.push_back( s + "\n" ); } // empty lines are skipped
+            }
+        }
+        // no block field: the whole input is one set; records may be empty, which std::shuffle handles as a no-op
+        std::shuffle( records.begin(), records.end(), generator );
+        for( const auto& r: records ) { std::cout.write( &r[0], r.size() ); }
+    }
     return 0;
 }
 
 static int sort( const comma::command_line_options& options )
 {
     input_with_block default_input;
-    std::vector< std::string > v = comma::split( csv.fields, ',' );
-    std::vector< std::string > order = options.exists( "--order" ) ? comma::split( options.value< std::string >( "--order" ), ',' ) : v;
+    std::vector< std::string > v = comma::split( csv.fields, ',', true );
+    std::vector< std::string > order = options.exists( "--order" ) ? comma::split( options.value< std::string >( "--order" ), ',', true ) : v;
     std::vector< std::string > w( v.size() );
     bool unique = options.exists( "--unique,-u" );
     for( std::size_t k = 0; k < v.size(); ++k ) { if( v[k] == "block" ) { w[k] = "block"; } }
     std::string first_line;
     comma::csv::format f;
-    if( csv.binary() ) { f = csv.format(); }
-    else if( options.exists( "--format" ) ) { f = comma::csv::format( options.value< std::string >( "--format" ) ); }
+    if( csv.binary() )
+    {
+        f = csv.format();
+    }
+    else if( options.exists( "--format" ) )
+    {
+        f = comma::csv::format( options.value< std::string >( "--format" ) );
+    }
     else
     {
         while( std::cin.good() && first_line.empty() ) { std::getline( std::cin, first_line ); }
@@ -602,13 +640,19 @@ static int sort( const comma::command_line_options& options )
         f = comma::csv::impl::unstructured::guess_format( first_line, csv.delimiter, options.exists( "--numeric-keys-are-floats,--floats" ) );
         if( verbose ) { std::cerr << "csv-sort: guessed format: " << f.string() << std::endl; }
     }
+    if( order.empty() ) // quick and dirty for now (really should be a method in unstructured or alike)
+    {
+        order.resize( f.count() );
+        for( unsigned int i = 0; i < order.size(); ++i ) { order[i] = std::to_string( i ); }
+        if( v.empty() ) { v = order; w.resize( v.size() ); }
+    }
     for( std::size_t i = 0; i < order.size(); ++i ) // quick and dirty, wasteful, but who cares
     {
         if( order[i].empty() || order[i] == "block" ) { continue; }
         for( std::size_t k = 0; k < v.size(); ++k )
         {
-            if( v[k].empty() || v[k] != order[i] ) 
-            { 
+            if( v[k].empty() || v[k] != order[i] )
+            {
                 if( k + 1 == v.size() ) { std::cerr << "csv-sort: order field name \"" << order[i] << "\" not found in input fields \"" << csv.fields << "\"" << std::endl; return 1; }
                 continue; 
             }
@@ -634,25 +678,28 @@ static int sort( const comma::command_line_options& options )
     if( options.exists( "--discard-out-of-order,--discard-unsorted" ) ) { return handle_discard_out_of_order( istream, first_line, default_input, reverse ); }
     auto sliding_window = options.optional< unsigned int >( "--sliding-window,--window" );
     if( sliding_window ) { return handle_sliding_window( istream, first_line, default_input, reverse, *sliding_window ); }
-    comma::uint32 block = 0;
     input_t::map map;
     if( !first_line.empty() )
-    { 
+    {
         input_with_block input = comma::csv::ascii< input_with_block >( csv, default_input ).get( first_line );
-        block = input.block;
+        block.update( input );
         input_t::map::mapped_type& d = map[ input ];
         d.push_back( first_line );
     }
     while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) || !map.empty() )
     {
         const input_with_block* p = istream.read();
-        if( !p || p->block != block )
+        //if( p ) { std::cerr << "==> a: block != *p: " << ( block != *p ) << " size: " << block.size() << " current_size: " << block.current_size() << " map.size(): " << map.size() << std::endl; }
+        if( !p || block != *p )
         {
+            //std::cerr << "==> b: block != *p: " << ( block != *p ) << " size: " << block.size() << " current_size: " << block.current_size() << std::endl;
             if( reverse ) { output_( map.rbegin(), map.rend() ); } else { output_( map.begin(), map.end() ); }
             map.clear();
         }
         if( !p ) { break; }
-        block = p->block;
+        //std::cerr << "==> c: block: " << block() << " current_size: " << block.current_size() << std::endl;
+        block.update( *p );
+        //std::cerr << "==> d: block: " << block() << " current_size: " << block.current_size() << std::endl;
         input_t::map::mapped_type& d = map[ *p ];
         if( unique && !d.empty() ) { continue; }
         if( istream.is_binary() )
@@ -674,12 +721,18 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--min,--sliding-window,--window,--unique" );
-        options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--max,--sliding-window,--window,--unique" );
+        options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--min,--sliding-window,--window,--unique,--random" );
+        options.assert_mutually_exclusive( "--discard-out-of-order,--discard-unsorted,--first,--max,--sliding-window,--window,--unique,--random" );
+        if( options.exists( "--last" ) ) { std::cerr << "csv-sort: --last: not implemented; todo" << std::endl; return 1; }
         verbose = options.exists( "--verbose,-v" );
         csv = comma::csv::options( options );
-        csv.full_xpath = true;
-        return options.exists( "--first,--min,--max" ) ? handle_operations_with_ids( options ) : sort( options );
+        block = comma::csv::block_counter( 0, options.value( "--block-size,--size", 0 ) );
+        if( csv.has_field( "block" ) && block.fixed() ) { comma::say() << "'block' field and --block-size are mutually exclusive; got csv fields: '" << csv.fields << "'" << std::endl; return 1; }
+        return   options.exists( "--first,--min,--max" )
+               ? handle_operations_with_ids( options )
+               : options.exists( "--random" )
+               ? random( options )
+               : sort( options );
     }
     catch( std::exception& ex ) { std::cerr << "csv-sort: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-sort: unknown exception" << std::endl; }
diff --git a/csv/applications/csv-split.cpp b/csv/applications/csv-split.cpp
index 6defbc18e..504f28ded 100644
--- a/csv/applications/csv-split.cpp
+++ b/csv/applications/csv-split.cpp
@@ -15,7 +15,7 @@
 //
 // NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
 // GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED
 // WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
 // MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 // DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #ifdef WIN32
@@ -38,22 +37,24 @@
 
 #include <boost/optional.hpp>
 #include <boost/program_options.hpp>
-#include "../../application/contact_info.h"
+#include "../../application/command_line_options.h"
 #include "../../csv/impl/program_options.h"
 #include "../../csv/traits.h"
 #include "split/split.h"
 
-comma::csv::options csv;
-std::vector< std::string > streams;
-boost::optional< boost::posix_time::time_duration > duration;
-std::string suffix;
-unsigned int size = 0;
-bool passthrough;
+static comma::csv::options csv;
+static std::vector< std::string > streams;
+static boost::optional< boost::posix_time::time_duration > duration;
+static std::string suffix;
+static unsigned int size = 0;
+static bool passthrough;
+static std::string files;
+static std::string default_filename;
+static std::string timestamps;
 
-template < typename T >
-void run()
+template < typename T > static int run()
 {
-    comma::csv::applications::split< T > split( duration, suffix, csv, streams, passthrough );
+    comma::csv::applications::split< T > split( duration, suffix, csv, streams, passthrough, files, default_filename, timestamps );
     if( size == 0 )
     {
         std::string line;
@@ -63,22 +64,36 @@ void run()
             if( line.empty() ) { break; }
             split.write( line );
         }
+        return 0;
     }
-    else
+    #ifdef WIN32
+        _setmode( _fileno( stdin ), _O_BINARY );
+    #endif
+    bool has_size = csv.has_field( "size" );
+    std::vector< char > buffer( std::max< unsigned int >( size, 32768 )); // quick and dirty
+    typedef comma::csv::applications::input< T > input_t;
+    comma::csv::binary< input_t > binary( csv );
+    input_t header;
+    while( std::cin.good() && !std::cin.eof() )
     {
-        #ifdef WIN32
-            _setmode( _fileno( stdin ), _O_BINARY );
-        #endif
-        std::vector< char > packet( size );
-        while( std::cin.good() && !std::cin.eof() )
+        std::cin.read( &buffer[0], size );
+        if( std::cin.gcount() == 0 ) { break; }
+        COMMA_ASSERT_BRIEF( std::cin.gcount() == int( size ), "expected " << size << " bytes; got: " << std::cin.gcount() ); // report the actual number of bytes read
+        unsigned int total_size = size;
+        if( has_size )
         {
-            std::cin.read( &packet[0], size );
-            if( std::cin.gcount() > 0 ) { split.write( &packet[0], size ); }
+            binary.get( header, &buffer[0] );
+            total_size += header.size;
+            if( buffer.size() < total_size ) { buffer.resize( total_size ); }
+            std::cin.read( &buffer[size], header.size );
+            COMMA_ASSERT_BRIEF( std::cin.gcount() == int( header.size ), "expected " << header.size << " bytes; got: " << std::cin.gcount() ); // report the actual number of payload bytes read
         }
+        split.write( &buffer[0], total_size );
     }
+    return 0;
 }
 
-int main( int argc, char** argv )
+int main( int ac, char** av )
 {
     try
     {
@@ -87,90 +102,130 @@ int main( int argc, char** argv )
         boost::program_options::options_description description( "options" );
         description.add_options()
             ( "help,h", "display help message" )
-            ( "size,c", boost::program_options::value< unsigned int >( &size ), "packet size, only full packets will be written" )
+            ( "default-file", boost::program_options::value< std::string >( &default_filename ), "todo: if --files present, unmatched ids will be put in the file with a given name; otherwise, unmatched values will be ignored" )
+            ( "files", boost::program_options::value< std::string >( &files ), "if 'block' or 'id' field present, list of output files (see examples below)" )
+            ( "passthrough,pass", "pass data through to stdout" )
             ( "period,t", boost::program_options::value< double >( &period ), "period in seconds after which a new file is created" )
-            ( "suffix,s", boost::program_options::value< std::string >( &extension ), "filename extension; default will be csv or bin, depending whether it is ascii or binary" )
+            ( "size,c", boost::program_options::value< unsigned int >( &size ), "packet size, only full packets will be written" )
             ( "string", "id is string; default: 32-bit integer" )
+            ( "suffix,s", boost::program_options::value< std::string >( &extension ), "filename extension; default will be csv or bin, depending whether it is ascii or binary" )
             ( "time", "id is time; default: 32-bit integer" )
-            ( "passthrough,pass", "pass data through to stdout" );
+            ( "timestamps", boost::program_options::value< std::string >( &timestamps ), "<filename>[;<csv options>]: split by timestamps (assuming both input and timestamps are in ascending order)" );
         description.add( comma::csv::program_options::description() );
         boost::program_options::variables_map vm;
-        boost::program_options::store( boost::program_options::parse_command_line( argc, argv, description), vm );
-        boost::program_options::parsed_options parsed = boost::program_options::command_line_parser(argc, argv).options( description ).allow_unregistered().run();
+        boost::program_options::store( boost::program_options::parse_command_line( ac, av, description ), vm );
+        boost::program_options::parsed_options parsed = boost::program_options::command_line_parser( ac, av ).options( description ).allow_unregistered().run();
         boost::program_options::notify( vm );
         if ( vm.count( "help" ) || vm.count( "long-help" ) )
         {
-            std::cerr << std::endl;
-            std::cerr << "read from stdin by packet or by line and split into files named by field value or time (if split by time)." << std::endl;
-            std::cerr << "if splitting by id, input can also be splitted into streams" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "usage: csv-split [options] [outputs]*" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "use cases" << std::endl;
-            std::cerr << "    split by id field, output to files" << std::endl;
-            std::cerr << "        if id field present in --fields:" << std::endl;
-            std::cerr << "        for each id value, output records with this id to a separate file, e.g. 0.csv, 1.csv, etc" << std::endl;
-            std::cerr << "        example: ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) | csv-split --fields id" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "    split by block field, output to files" << std::endl;
-            std::cerr << "        if block field present in --fields:" << std::endl;
-            std::cerr << "        output records with this block to a separate file, on change of block, open a new file, e.g. 0.csv, 1.csv, etc" << std::endl;
-            std::cerr << "        example: ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "    split by t field, output to files" << std::endl;
-            std::cerr << "        if t (timestamp) field present in --fields:" << std::endl;
-            std::cerr << "        separate records into different time periods, outputting in separate files" << std::endl;
-            std::cerr << "        example: ( echo 20170101T000001,a; echo 20170101T000003,b; echo 20170101T000007,c ) | csv-split --fields=t --period=4" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "    split by id field, output to streams" << std::endl;
-            std::cerr << "        if output streams (see example below) are present on the command line and id field present in --fields:" << std::endl;
-            std::cerr << "        output records with the given ids to the corresponding streams, while outputing the rest into files" << std::endl;
-            std::cerr << "        records with ids for which output stream is not specified will be discarded, unless ... stream is specified:" << std::endl;
-	    std::cerr << std::endl;
-	    std::cerr << "        outputs: <keys>;<stream>; to send records with a given set of ids to this stream" << std::endl;
-            std::cerr << "            keys:" << std::endl;
-            std::cerr << "                <id>[,<id>]*: comma-separated list of ids, e.g: '5' or '2,5,7', etc" << std::endl;
-            std::cerr << "                ...: three dots mean: send to this stream all the records with ids for which no other stream is specified (see example below)" << std::endl;
-            std::cerr << "            stream:" << std::endl;
-	    std::cerr << "                tcp:<port>: e.g. tcp:1234" << std::endl;
-	    std::cerr << "                udp:<port>: e.g. udp:1234 (todo)" << std::endl;
-	    std::cerr << "                local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket" << std::endl;
-	    std::cerr << "                <named pipe name>: named pipe, which will be re-opened, if client reconnects" << std::endl;
-	    std::cerr << "                <filename>: a regular file" << std::endl;
-            std::cerr << "        example: ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) | csv-split --fields id \"0,1;tcp:5999\" \"...;local:/tmp/named_fifo\"" << std::endl;
-            std::cerr << std::endl;
-            std::cerr << description << std::endl;
-            std::cerr << std::endl;
-            std::cerr << "fields to split by listed in descending precedence" << std::endl;
-            std::cerr << "    block: split on the block number change" << std::endl;
-            std::cerr << "    id: split by id (same as block, except does not have to be contiguous by the price of worse performance)" << std::endl;
-            std::cerr << "    t: if present, use timestamp from the packet; if absent, use system time" << std::endl;
-	    std::cerr << std::endl;
-            std::cerr << comma::contact_info << std::endl;
-            std::cerr << std::endl;
-            return 1;
+            std::cerr << R"(
+read from stdin by packet or by line and split into files
+files are named by field value or time (if split by time)
+if splitting by id, input can also be split into streams
+
+usage: csv-split [options] [outputs]*
+)";
+            std::cerr << description;
+            std::cerr << R"(
+
+--fields=<fields>; <fields>: t,block,id,size
+    data is split by one of the following fields (listed in descending precedence)
+        block: split on the block number change
+        id   : split by id (same as block, except does not have to be contiguous
+                           with the price of worse performance)
+        t    : if present, use timestamp from the packet; if absent, use system time
+    size: if present, assume that fixed-width data is followed by <n> bytes
+          where <n> is the value of the size field; used only in binary mode
+          e.g: for the command: csv-split --fields t,,,size --binary=t,3ui,2f
+          the record has a fixed part (header) with format t,3ui,2f followed
+          by variable payload of size read from 'size' field (which can be 0 as well)
+
+examples:
+    --- split by block field, output to files ---
+    output records for each block to a separate file
+    on change of block, open a new file, e.g. 0.csv, 1.csv, etc
+
+    with default filenames:
+    ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields block
+
+    with specified filenames:
+    ( echo 0; echo 1; echo 2 ) \
+        | csv-split --fields block --files <( echo a; echo b; echo c )
+
+    with filenames mapped to block ids:
+    ( echo 0; echo 1; echo 2 ) \
+        | csv-split --fields block \
+              --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'
+
+    --- split by id field, output to files ---
+    for each id value, output records with this id to a separate file,
+    e.g. 0.csv, 1.csv, etc
+
+    with default filenames:
+    ( echo 0,a; echo 1,b; echo 1,c; echo 2,d ) | csv-split --fields id
+
+    with specified filenames:
+    ( echo 0; echo 1; echo 2 ) \
+        | csv-split --fields id --files <( echo a; echo b; echo c )
+
+    with filenames mapped to ids:
+    ( echo 0; echo 1; echo 2 ) \
+        | csv-split --fields id \
+              --files <( echo 0,a; echo 1,b; echo 2,c )';fields=id,filename'
+
+    --- split by t field, output to files ---
+    separate records into different time periods, outputting in separate files
+    ( echo 20170101T000001,a; echo 20170101T000003,b; echo 20170101T000007,c ) \
+        | csv-split --fields=t --period=4
+
+    --- split by id field, output to streams ---
+    if output streams (see example below) are present on the command line and
+    id field is present in --fields, output records with the given ids to the
+    corresponding streams, while outputting the rest into files
+
+    records with ids for which output stream is not specified will be discarded,
+    unless ... stream is specified:
+
+    outputs: <keys>;<stream>; send records with given set of ids to this stream
+        keys:
+            <id>[,<id>]*: comma-separated list of ids, e.g: '5' or '2,5,7', etc
+            ... (three dots): send to this stream all the records with ids
+                for which no other stream is specified (see example below)
+        stream:
+            tcp:<port>: e.g. tcp:1234
+            udp:<port>: e.g. udp:1234 (todo)
+            local:<name>: linux/unix local server socket
+                          e.g. local:./tmp/my_socket
+            <named pipe name>: named pipe, re-opened if client reconnects
+            <filename>: a regular file
+
+        ( echo 0,a; echo 1,b; echo 0,c; echo 2,d ) \
+            | csv-split --fields id "0,1;tcp:5999" "...;local:/tmp/named_fifo"
+        ( echo 0,a; echo 1,b ) | csv-split --fields id --files \
+                  <( echo '1,one.csv'; echo '0,zero.csv' )';fields=id,filename'
+
+)";
+            return 0;
         }
-        csv = comma::csv::program_options::get( vm );
+        comma::command_line_options options( ac, av );
+        csv = comma::csv::options( options );
+        COMMA_ASSERT_BRIEF( !vm.count( "period" ) || !vm.count( "timestamps" ), "csv-split: --period and --timestamps are mutually exclusive (todo? combine them? just ask)" );
+        COMMA_ASSERT_BRIEF( default_filename.empty(), "csv-split: --default-file: todo, just ask" )
         if( csv.binary() ) { size = csv.format().size(); }
         bool id_is_string = vm.count( "string" );
         bool id_is_time = vm.count( "time" );
         passthrough = vm.count("passthrough");
-        
-        if( id_is_string && id_is_time ) { std::cerr << "csv-split: either --string or --time" << std::endl; }
-        if( period > 0 ) { duration = boost::posix_time::microseconds( static_cast<unsigned int> (period * 1e6 )); }
+        COMMA_ASSERT_BRIEF( !id_is_string || !id_is_time, "csv-split: --string and --time are mutually exclusive" );
+        if( period > 0 ) { duration = boost::posix_time::microseconds( static_cast< unsigned int >( period * 1e6 )); }
         if( extension.empty() ) { suffix = csv.binary() || size > 0 ? ".bin" : ".csv"; }
         else { suffix += "."; suffix += extension; }
-
         streams = boost::program_options::collect_unrecognized( parsed.options, boost::program_options::include_positional );
-        if( !streams.empty() && ( csv.has_field( "block" ) || id_is_time ) ) { std::cerr << "publisher streams are not compatible with splitting by block or timestamp." << std::endl; return 1; }
-
-        if( id_is_string ) { run< std::string >(); }
-        else if( id_is_time ) { run< boost::posix_time::ptime >(); }
-        else { run< comma::uint32 >(); }
-        return 0;
+        COMMA_ASSERT_BRIEF( !( !streams.empty() && ( csv.has_field( "block" ) || id_is_time ) ), "publisher streams are not compatible with splitting by block or timestamp." );
+        if( id_is_string ) { return run< std::string >(); }
+        if( id_is_time ) { return run< boost::posix_time::ptime >(); }
+        return run< comma::uint32 >();
     }
-    catch( std::exception& ex ) { std::cerr << argv[0] << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << argv[0] << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }
-
diff --git a/csv/applications/csv-strings.cpp b/csv/applications/csv-strings.cpp
new file mode 100644
index 000000000..be7510b40
--- /dev/null
+++ b/csv/applications/csv-strings.cpp
@@ -0,0 +1,383 @@
+// Copyright (c) 2018 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#include <deque>
+#include <functional>
+#include <iostream>
+
+#include <boost/lexical_cast.hpp>
+
+#include "../../application/command_line_options.h"
+#include "../../base/exception.h"
+#include "../../csv/stream.h"
+#include "../../csv/traits.h"
+#include "../../io/impl/filesystem.h"
+#include "../../string/string.h"
+
+static void usage( bool verbose ) // prints csv-strings help to stderr and exits; verbose is forwarded to the csv options usage
+{
+    std::cerr << '\n';
+    std::cerr << "operations on strings\n";
+    std::cerr << '\n';
+    std::cerr << "    usage: cat input.csv | csv-strings <operation> [<options>] > output.csv\n";
+    std::cerr << '\n';
+    std::cerr << "operations\n";
+    std::cerr << "    add\n";
+    std::cerr << "    path-basename,basename\n";
+    std::cerr << "    path-common\n";
+    std::cerr << "    path-dirname,dirname\n";
+    std::cerr << "    path-real,path-canonical\n";
+    std::cerr << '\n';
+    std::cerr << "options\n";
+    std::cerr << "    --emplace; perform operation emplace\n";
+    std::cerr << "    --fields=[<fields>]; will perform operation on any non-empty fields\n";
+    std::cerr << "                         unless different semantics specified for operation\n";
+    std::cerr << "                         default: perform operation on the first field\n";
+    std::cerr << "    --strict; exit on strings on which operation does not make sense\n";
+    std::cerr << '\n';
+    std::cerr << "add\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --prefix=[<prefix>]; add prefix\n";
+    std::cerr << "        --suffix=[<suffix>]; add suffix\n";
+    std::cerr << '\n';
+    std::cerr << "path-basename,basename\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --head=<depth>; default=0; number of path elements at the beginning of the path to remove\n";
+    std::cerr << "        --tail=<depth>; default=1; number of path elements at the end of the path to keep\n";
+    std::cerr << "        --path-delimiter,-p=<delimiter>; default: '/'\n";
+    std::cerr << '\n';
+    std::cerr << "path-common\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --once; output only the common path, do not append or emplace\n";
+    std::cerr << "        --dirname-on-single-record; if only one input record, output its 'dirname'; e.g: on a single\n";
+    std::cerr << "                                    input record 'a/b/c' output 'a/b'\n";
+    std::cerr << "        --dirname-on-full-match; if there is an input record that fully matches the common path\n";
+    std::cerr << "                                 output its 'dirname'; e.g: on 'a/b/c' and 'a/b/c/d' output 'a/b'\n";
+    std::cerr << "        --path-delimiter,-p=<delimiter>; default: '/'\n";
+    std::cerr << '\n';
+    std::cerr << "path-dirname,dirname\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --head=<depth>; default=0; number of path elements at the beginning of the path to keep\n";
+    std::cerr << "        --tail=<depth>; default=1; number of path elements at the end of the path to remove\n";
+    std::cerr << "        --path-delimiter,-p=<delimiter>; default: '/'\n";
+    std::cerr << '\n';
+    std::cerr << "path-real,path-canonical\n";
+    std::cerr << "    options\n";
+    std::cerr << "        --base=[<path>]; base path, default: current directory\n";
+    std::cerr << '\n';
+    std::cerr << "csv options\n";
+    std::cerr << comma::csv::options::usage( "", verbose ) << '\n';
+    std::cerr << '\n';
+    exit( EXIT_SUCCESS ); // help is not an error: terminate the process with success status
+}
+
+static bool strict;
+static comma::csv::options csv;
+
+namespace comma { namespace applications { namespace strings {
+
+template < typename T >
+struct record // csv record: a list of values of type T, bound to csv fields values[0], values[1], ...
+{ 
+    std::vector< T > values; // one element per field the operation is applied to
+    record( unsigned int n = 0 ) : values( n ) {} // constructs a record with n value-initialized elements
+};
+
+typedef record< std::string > input;
+
+} } } // namespace comma { namespace applications { namespace strings {
+
+namespace comma { namespace visiting {
+
+template < typename T > struct traits< comma::applications::strings::record< T > > // visiting traits: the only visited member is "values"
+{
+    template < typename K, typename V > static void visit( const K&, const comma::applications::strings::record< T >& p, V& v ) { v.apply( "values", p.values ); } // overload for const records
+    template < typename K, typename V > static void visit( const K&, comma::applications::strings::record< T >& p, V& v ) { v.apply( "values", p.values ); } // overload for mutable records
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace applications { namespace strings {
+
+template < typename T >
+static int run( const comma::command_line_options& options ) // reads records from stdin, applies T::convert() to each selected field, writes to stdout; returns 0
+{
+    if( ::csv.binary() && !options.exists( "--emplace") ) { std::cerr << "csv-strings: path-" << T::name() << ": binary mode supported only for --emplace; todo, just ask\n"; exit( 1 ); } // NOTE(review): the "path-" prefix is printed for every T, including add
+    auto v = comma::split( ::csv.fields, options.value( "--delimiter", ',' ) );
+    unsigned int n = 0; // number of non-empty field names
+    for( unsigned int i = 0; i < v.size(); ++i )
+    {
+        if( v[i].empty() ) { continue; } // unnamed fields are not operated on
+        v[i] = "values[" + boost::lexical_cast< std::string >( n ) + "]"; // any non-empty field name is mapped to the next element of record::values
+        ++n;
+    }
+    ::csv.fields = n == 0 ? std::string( "values[0]" ) : comma::join( v, ',' ); // no fields given: operate on the first field
+    if( n == 0 ) { ++n; }
+    comma::csv::input_stream< input > istream( std::cin, ::csv, input( n ) );
+    std::function< void( const typename T::output_t& p ) > write; // output strategy, assigned below before run_() is called
+    auto run_ = [&]() -> int
+    {
+        T t( options ); // the operation is configured from the command line
+        while( istream.ready() || std::cin.good() )
+        {
+            const input* p = istream.read();
+            if( !p ) { break; } // no more input
+            typename T::output_t r( n );
+            for( unsigned int i = 0; i < p->values.size(); ++i ) { r.values[i] = t.convert( p->values[i] ); }
+            write( r );
+            if( ::csv.flush ) { std::cout.flush(); }
+        }
+        return 0;
+    };
+    if( options.exists( "--emplace" ) )
+    {
+        comma::csv::passed< input > passed( istream, std::cout, ::csv.flush ); // presumably writes the last input record with the converted fields substituted; confirm against comma::csv::passed
+        write = [&]( const typename T::output_t& p ) { passed.write( p ); };
+        return run_();
+    }
+    comma::csv::options output_csv = ::csv;
+    output_csv.fields = "values"; // output all converted values
+    comma::csv::output_stream< typename T::output_t > ostream( std::cout, output_csv, input( n ) );
+    comma::csv::tied< input, typename T::output_t > tied( istream, ostream ); // presumably appends the output to the corresponding input record; confirm against comma::csv::tied
+    write = [&]( const typename T::output_t& p ) { tied.append( p ); };
+    return run_();
+}
+
+namespace path {
+
+struct basename // path-basename operation: removes leading path elements (--head) or keeps trailing ones (--tail)
+{
+    typedef input output_t;
+
+    unsigned int head; // --head, default 0; when positive, takes precedence over tail in convert()
+    unsigned int tail; // --tail, default 1
+    char delimiter; // --path-delimiter,-p, default '/'
+
+    static const char* name() { return "basename"; }
+
+    basename( const comma::command_line_options& options )
+        : head( options.value( "--head", 0 ) )
+        , tail( options.value( "--tail", 1 ) )
+        , delimiter( options.value( "--path-delimiter,-p", '/' ) )
+    {
+        options.assert_mutually_exclusive( "--head,--tail" );
+    }
+
+    std::string convert( const std::string& t ) const // returns the basename of t; throws comma::exception on too shallow paths if the global strict flag is set
+    {
+        bool is_absolute = !t.empty() && t[0] == delimiter;
+        const auto& s = comma::split( t, delimiter );
+        if( head > 0 )
+        {
+            if( s.size() >= head ) { return comma::join( s.begin() + head, s.end(), delimiter ); } // drop the first head elements
+            if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
+            return ""; // non-strict: path shallower than head yields an empty string
+        }
+        if( s.size() >= tail )
+        {
+            auto o = comma::join( s.end() - tail, s.end(), delimiter ); // keep the last tail elements
+            if ( is_absolute && o.empty() ) { o = delimiter; } // absolute path with an empty result becomes the bare delimiter
+            return o;
+        }
+        if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
+        return t; // non-strict: path shallower than tail is returned unchanged
+    }
+};
+
+struct dirname // path-dirname operation: keeps leading path elements (--head) or removes trailing ones (--tail)
+{
+    typedef input output_t;
+    unsigned int head; // --head, default 0; when positive, takes precedence over tail in convert()
+    unsigned int tail; // --tail, default 1
+    char delimiter; // --path-delimiter,-p, default '/'
+
+    static const char* name() { return "dirname"; }
+
+    dirname( const comma::command_line_options& options )
+        : head( options.value( "--head", 0 ) )
+        , tail( options.value( "--tail", 1 ) )
+        , delimiter( options.value( "--path-delimiter,-p", '/' ) )
+    {
+        options.assert_mutually_exclusive( "--head,--tail" );
+    }
+
+    std::string convert( const std::string& t ) const // returns the dirname of t; throws comma::exception on too shallow paths if the global strict flag is set
+    {
+        bool is_absolute = !t.empty() && t[0] == delimiter;
+        const auto& s = comma::split( t, delimiter );
+        if( head > 0 )
+        {
+            if( s.size() >= head )
+            {
+                auto o = comma::join( s.begin(), s.begin() + head, delimiter ); // keep the first head elements
+                if( is_absolute && o.empty() ) { o = delimiter; } // absolute path with an empty result becomes the bare delimiter
+                return o;
+            }
+            if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << head << "; got: '" << comma::join( s, delimiter ) << "'" ); }
+            return t; // non-strict: path shallower than head is returned unchanged
+        }
+        if( s.size() >= tail )
+        {
+            auto o = comma::join( s.begin(), s.end() - tail, delimiter ); // drop the last tail elements
+            if( is_absolute && o.empty() ) { o = delimiter; } // absolute path with an empty result becomes the bare delimiter
+            return o;
+        }
+        if( strict ) { COMMA_THROW( comma::exception, "expected path depth at least " << tail << "; got: '" << comma::join( s, delimiter ) << "'" ); }
+        return is_absolute ? std::string( 1, delimiter ) : ""; // non-strict: path shallower than tail collapses to the root delimiter or an empty string
+    }
+};
+
+struct canonical // path-real/path-canonical operation: resolves a path against a base directory
+{
+    typedef input output_t;
+    
+    comma::filesystem::path base; // --base if given, otherwise the current directory at construction time
+
+    static constexpr char const* name() { return "canonical"; }
+    
+    canonical( const comma::command_line_options& options )
+        : base( options.exists( "--base" )
+        ? comma::filesystem::path( options.value< std::string >( "--base" ) )
+        : comma::filesystem::current_path() )
+    {
+        if( ( options.value( "--path-delimiter,-p", '/' ) ) != '/' ) { COMMA_THROW( comma::exception, "path-canonical: expected path delimiter '/'; got: '" << options.value( "--path-delimiter,-p", '/' ) << "'" ); } // only '/' is accepted as path delimiter
+    }
+
+    std::string convert( const std::string& s ) const // returns the canonical form of base / s
+    {
+        try { return comma::filesystem::canonical( base / comma::filesystem::path( s )).string(); } catch( ... ) { if( strict ) { throw; } } // rethrow only if the global strict flag is set
+        return s; // non-strict: on failure the input is returned unchanged
+    }
+};
+
+namespace common {
+
+typedef input output_t;
+
+static int run( const comma::command_line_options& options ) // path-common: finds the common leading path per field over all stdin records; returns 0
+{
+    if( ::csv.binary() ) { std::cerr << "csv-strings: path-common: binary mode: todo, just ask" << std::endl; exit( 1 ); }
+    if( options.exists( "--emplace" ) ) { std::cerr << "csv-strings: path-common: --emplace: todo, just ask" << std::endl; exit( 1 ); } // fixed: option name had a trailing space, so the check never fired
+    auto v = comma::split( ::csv.fields, options.value( "--delimiter", ',' ) );
+    unsigned int n = 0; // number of non-empty field names
+    for( unsigned int i = 0; i < v.size(); ++i )
+    {
+        if( v[i].empty() ) { continue; } // unnamed fields are not operated on
+        v[i] = "values[" + boost::lexical_cast< std::string >( n ) + "]";
+        ++n;
+    }
+    ::csv.fields = n == 0 ? std::string( "values[0]" ) : comma::join( v, ',' ); // no fields given: operate on the first field
+    if( n == 0 ) { ++n; }
+    comma::csv::input_stream< input > istream( std::cin, ::csv, input( n ) );
+    std::deque< std::string > inputs; // raw input lines, kept only when the result is appended to each record
+    output_t output; // common path found so far, per field
+    char delimiter = options.value( "--path-delimiter,-p", '/' );
+    bool once = options.exists( "--once" );
+    bool dirname_on_single_record = options.exists( "--dirname-on-single-record" );
+    bool dirname_on_full_match = options.exists( "--dirname-on-full-match" );
+    std::vector< char > full_match( n, true );
+    unsigned int count = 0; // number of records read after the first one
+    while( istream.ready() || std::cin.good() )
+    {
+        auto p = istream.read();
+        if( !p ) { break; } // no more input
+        if( !once ) { inputs.emplace_back( istream.last() ); }
+        if( output.values.empty() ) { output.values = p->values; continue; } // first record initialises the common path
+        for( std::size_t i = 0; i < p->values.size(); ++i )
+        {
+            const std::string& common = comma::common_front( output.values[i], p->values[i], delimiter );
+            if( dirname_on_full_match ) { full_match[i] = ( full_match[i] && output.values[i] == common ) || ( !full_match[i] && p->values[i] == common ); }
+            output.values[i] = common;
+        }
+        ++count;
+    }
+    if( dirname_on_full_match || ( dirname_on_single_record && count == 0 ) ) // fixed: count excludes the first record, so single-record input means count == 0
+    {
+        for( unsigned int i = 0; i < output.values.size(); ++i )
+        {
+            if( !full_match[i] ) { continue; }
+            bool is_absolute = output.values[i][0] == delimiter;
+            const auto& s = comma::split( output.values[i], delimiter );
+            output.values[i] = comma::join( s.begin(), s.end() - 1, delimiter ); // drop the last path element
+            if ( is_absolute && output.values[i].empty() ) { output.values[i] = std::string( 1, delimiter ); } // absolute path with an empty result becomes the bare delimiter
+        }
+    }
+    if( once )
+    {
+        if( ::csv.binary() ) { COMMA_THROW( comma::exception, "todo" ); } // not reachable: binary mode has already exited above
+        else
+        {
+            std::string comma;
+            for( std::size_t i = 0; i < output.values.size(); ++i )
+            {
+                std::cout << comma << output.values[i];
+                comma = ::csv.delimiter;
+            }
+            std::cout << std::endl;
+        }
+    }
+    else
+    {
+        for( const auto& input : inputs ) // output every input line with the common paths appended
+        {
+            std::cout.write( &input[0], input.size() );
+            for( std::size_t i = 0; i < output.values.size(); ++i ) { std::cout << ::csv.delimiter << output.values[i]; }
+            std::cout << std::endl;
+        }
+    }
+    return 0;
+}
+
+} } // namespace common { namespace path {
+
+struct add // add operation: surrounds each value with a fixed prefix and suffix
+{
+    typedef input output_t;
+
+    std::string prefix; // --prefix, default: empty
+    std::string suffix; // --suffix, default: empty
+
+    static constexpr char const* name() { return "add"; }
+
+    explicit add( const comma::command_line_options& options )
+        : prefix( options.value( "--prefix", std::string() ) )
+        , suffix( options.value( "--suffix", std::string() ) ) {}
+
+    std::string convert( const std::string& t ) const { return prefix + t + suffix; } // returns prefix + t + suffix
+};
+    
+} } } // namespace comma { namespace applications { namespace strings {
+
+// todo
+// - basename
+//   - fix absolute path behaviour
+//   - fix --head; add tests
+//   - fix --tail; add tests
+// - dirname
+//   - fix absolute path behaviour
+//   - fix --head; add tests
+//   - fix --tail; add tests
+
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        const auto& unnamed = options.unnamed( "--flush,--verbose,-v,--emplace,--strict,--once,--dirname-on-single-record,--dirname-on-full-match", "-.*" );
+        if( unnamed.empty() ) { std::cerr << "csv-strings: please specify operation\n"; return 1; }
+        std::string operation = unnamed[0];
+        strict = options.exists( "--strict" );
+        csv = comma::csv::options( options );
+        if( operation == "add" ) { return comma::applications::strings::run< comma::applications::strings::add >( options ); }
+        if( operation == "path-basename" || operation == "basename" ) { return comma::applications::strings::run< comma::applications::strings::path::basename >( options ); }
+        if( operation == "path-dirname" || operation == "dirname" ) { return comma::applications::strings::run< comma::applications::strings::path::dirname >( options ); }
+        if( operation == "path-real" || operation == "path-canonical" ) { return comma::applications::strings::run< comma::applications::strings::path::canonical >( options ); }
+        if( operation == "path-common" ) { return comma::applications::strings::path::common::run( options ); }
+        std::cerr << "csv-strings: expection operation; got: '" << operation << "'\n";
+        return 1;
+    }
+    catch( std::exception& ex ) { std::cerr << "csv-strings: " << ex.what() << '\n'; }
+    catch( ... ) { std::cerr << "csv-strings: unknown exception\n"; }
+    return 1;
+}
diff --git a/csv/applications/csv-thin.cpp b/csv/applications/csv-thin.cpp
index 3ee53466f..238a5c506 100644
--- a/csv/applications/csv-thin.cpp
+++ b/csv/applications/csv-thin.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -42,7 +15,6 @@
 #include <boost/random/uniform_real.hpp>
 #include <boost/random/variate_generator.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../io/file_descriptor.h"
@@ -53,50 +25,42 @@
 
 using namespace comma;
 
-static void usage(bool detail=false)
+static void usage( bool verbose = false )
 {
     std::cerr << std::endl;
-    std::cerr << "Read input data and thin them down by the given percentage;" << std::endl;
+    std::cerr << "read input data and thin them down by the given percentage;" << std::endl;
     std::cerr << "buffer handling optimized for a high-output producer" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "Usage: cat full.csv | csv-thin [<rate>] [<options>] > thinned.csv" << std::endl;
+    std::cerr << "usage: cat full.csv | csv-thin [<rate>] [<options>] > thinned.csv" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "options:" << std::endl;
-    std::cerr << "    --binary,-b=<format>: data is packets of fixed size given by <format>." << std::endl;
-    std::cerr << "                          Alternatively use --size" << std::endl;
-    std::cerr << "    --deterministic,-d: input is downsampled by a factor of int( 1 / <rate> )." << std::endl;
-    std::cerr << "                That is, if <rate> is 0.33, output every third packet." << std::endl;
-    std::cerr << "                Default is to output each packet with a probability of <rate>." << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --binary,-b=<format>: data is packets of fixed size given by <format>" << std::endl;
+    std::cerr << "                          alternatively use --size" << std::endl;
+    std::cerr << "    --deterministic,-d: input is downsampled by a factor of int( 1 / <rate> )" << std::endl;
+    std::cerr << "                        that is, if <rate> is 0.33, output every third packet" << std::endl;
+    std::cerr << "                        default is to output each packet with a probability of <rate>" << std::endl;
     std::cerr << "    --fields=<fields>: use timestamp in fields to determine time for --period" << std::endl;
-    std::cerr << "    --fps,--frames-per-second=<d>: deprecated and removed" << std::endl;
+    std::cerr << "    --invert,-i; invert selection logic; e.g. to split data" << std::endl;
     std::cerr << "    --period=<n>: output once every <n> seconds, ignores <rate>" << std::endl;
     std::cerr << "    --size,-s=<size>: data is packets of fixed size, otherwise data is expected" << std::endl;
     std::cerr << "                      line-wise. Alternatively use --binary" << std::endl;
+    std::cerr << "    --seed=[<value>]; random seed" << std::endl;
     std::cerr << std::endl;
-    if( detail )
-    {
-        std::cerr << "csv options:" << std::endl;
-        std::cerr<< comma::csv::options::usage() << std::endl;
-        std::cerr << std::endl;
-    }
-    else
-    {
-        std::cerr << "use -v or --verbose to see more detail" << std::endl;
-        std::cerr << std::endl;
-    }
-    std::cerr << "examples:" << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << "examples" << std::endl;
     std::cerr << "    output 70% of data:          cat full.csv | csv-thin 0.7" << std::endl;
     std::cerr << "    output once every 2 seconds: cat full.csv | csv-thin --period 2" << std::endl;
     std::cerr << "    using timestamp from input:  cat full.csv | csv-thin --period 2 --fields t" << std::endl;
     std::cerr << "    binary data:                 cat full.bin | csv-thin 0.1 --binary 3d" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 static double rate;
 static bool deterministic;
+static bool invert;
+static boost::optional< comma::uint32 > seed;
 static boost::optional< boost::posix_time::microseconds > period;
 
 struct timestamped
@@ -116,18 +80,15 @@ template <> struct traits< timestamped >
 
 } } // namespace comma { namespace visiting {
 
-static bool ignore()
+static bool skip()
 {
     if( period )
     {
         static boost::posix_time::ptime next_time = boost::posix_time::microsec_clock::universal_time();
         boost::posix_time::ptime now = boost::posix_time::microsec_clock::universal_time();
-        if( now > next_time )
-        {
-            next_time += *period;
-            return false;
-        }
-        return true;
+        if( now <= next_time ) { return true; }
+        next_time += *period;
+        return false;
     }
     if( deterministic )
     {
@@ -147,29 +108,24 @@ static bool ignore()
         ++count;
         if( count < ( step + 1 ) / rate ) { return true; }
         ++step;
-        if( step == size )
-        {
-            count = 0;
-            step = 0;
-        }
+        if( step == size ) { count = step = 0; }
         return false;
     }
-    static boost::mt19937 rng;
+    static boost::mt19937 rng = seed ? boost::mt19937( *seed ) : boost::mt19937();
     static boost::uniform_real<> dist( 0, 1 );
     static boost::variate_generator< boost::mt19937&, boost::uniform_real<> > random( rng, dist );
     static bool do_ignore = comma::math::less( rate, 1.0 );
     return do_ignore && random() > rate;
 }
 
-static bool ignore_with_timestamp( boost::posix_time::ptime timestamp )
+static bool keep() { return skip() == invert; }
+
+static bool skip_by_timestamp( boost::posix_time::ptime timestamp )
 {
     static boost::posix_time::ptime next_time = timestamp;
-    if( timestamp > next_time )
-    {
-        next_time += *period;
-        return false;
-    }
-    return true;
+    if( timestamp < next_time ) { return true; }
+    while( next_time <= timestamp ) { next_time += *period; }
+    return false;
 }
 
 int main( int ac, char** av )
@@ -178,41 +134,40 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         bool binary = options.exists( "--size,-s,--binary,-b" );
+        bool flush = options.exists( "--flush" );
         deterministic = options.exists( "--deterministic,-d" );
-        if( options.exists( "--period" )) { period = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--period" ) * 1000000 )); }
-        if(options.exists("--fps,--frames-per-second")) { COMMA_THROW( comma::exception, "ERROR: --fps option is deprecated and removed! Please talk to software team if you are using it"); }
+        invert = options.exists( "--invert,-i" );
+        seed = options.optional< comma::uint32 >( "--seed" );
+        if( options.exists( "--period" )) { period = boost::posix_time::microseconds( static_cast< unsigned int >( options.value< double >( "--period" ) * 1000000 ) ); }
         #ifdef WIN32
         if( binary ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
-
         if( options.exists( "--fields" ))
         {
-            if( !period ) { COMMA_THROW( comma::exception, "--fields requires --period option" ); }
-            comma::csv::options csv( options );
-            comma::csv::input_stream< timestamped > istream( std::cin, csv );
+            if( !period ) { comma::say() << "--fields requires --period option" << std::endl; return 1; } // must bail out: skip_by_timestamp() dereferences period unconditionally
+            comma::csv::input_stream< timestamped > istream( std::cin, comma::csv::options( options ) );
             while( std::cin.good() && !std::cin.eof() )
             {
                 const timestamped* p = istream.read();
                 if( !p ) { break; }
-                if( !ignore_with_timestamp( p->timestamp ))
+                if( skip_by_timestamp( p->timestamp ) != invert ) { continue; }
+                if( istream.is_binary())
                 {
-                    if( istream.is_binary()) { std::cout.write( istream.binary().last(), istream.binary().size() ); }
-                    else { std::cout << comma::join( istream.ascii().last(), istream.ascii().ascii().delimiter() )<< std::endl; }
+                    std::cout.write( istream.binary().last(), istream.binary().size() );
+                    if( flush ) { std::cout.flush(); }
                 }
+                else { std::cout << comma::join( istream.ascii().last(), istream.ascii().ascii().delimiter() ) << std::endl; }
             }
             return 0;
         }
-        
         std::vector< std::string > v;
-
         if( !period )
         {
             v = options.unnamed( "--deterministic,-d", "-.*" );
-            if( v.empty() ) { std::cerr << "csv-thin: please specify rate" << std::endl; usage(); }
+            if( v.empty() ) { comma::say() << "please specify rate" << std::endl; return 1; }
             rate = boost::lexical_cast< double >( v[0] );
-            if( comma::math::less( rate, 0 ) || comma::math::less( 1, rate ) ) { std::cerr << "csv-thin: expected rate between 0 and 1, got " << rate << std::endl; usage(); }
+            if( comma::math::less( rate, 0 ) || comma::math::less( 1, rate ) ) { comma::say() << "expected rate between 0 and 1, got " << rate << std::endl; return 1; }
         }
-
         if( binary ) // quick and dirty, improve performance by reading larger buffer
         {
             std::size_t size = options.value( "--size,-s", 0u );
@@ -220,7 +175,7 @@ int main( int ac, char** av )
             boost::optional< comma::csv::format > f;
             if( !format_string.empty() ) { f.reset( comma::csv::format( format_string ) ); }
             if( !size ) { size = f->size(); }
-            if( f && f->size() != size ) { std::cerr << "csv-thin: expected consistent size, got --size " << size << " and --binary of size " << f->size() << std::endl; return 1; }
+            if( f && f->size() != size ) { comma::say() << "expected consistent size, got --size " << size << " and --binary of size " << f->size() << std::endl; return 1; }
             unsigned int factor = 65536 / size; // arbitrary
             if( factor == 0 ) { factor = 1; }
             std::vector< char > buf( size * factor );
@@ -234,8 +189,8 @@ int main( int ac, char** av )
                 //std::size_t e = available < int( size ) ? size : available - available % size;
                 std::cin.read( &buf[0], size ); // quick and dirty
                 if( std::cin.gcount() <= 0 ) { break; }
-                if( std::cin.gcount() < int( size ) ) { std::cerr << "csv-thin: expected " << size << " bytes; got only " << std::cin.gcount() << std::endl; exit( 1 ); }
-                { if( !ignore() ) { std::cout.write( &buf[0], size ); std::cout.flush(); } }
+                if( std::cin.gcount() < int( size ) ) { comma::say() << "expected " << size << " bytes; got only " << std::cin.gcount() << std::endl; return 1; }
+                if( keep() ) { std::cout.write( &buf[0], size ); std::cout.flush(); }
             }
             #else
             char* cur = &buf[0];
@@ -246,14 +201,14 @@ int main( int ac, char** av )
                 int count = ::read( comma::io::stdin_fd, cur + offset, capacity );
                 if( count <= 0 )
                 {
-                    if( offset != 0 ) { std::cerr << "csv-thin: expected at least " << size << " bytes, got only " << offset << std::endl; return 1; }
+                    if( offset != 0 ) { comma::say() << "expected at least " << size << " bytes, got only " << offset << std::endl; return 1; }
                     break;
                 }
                 offset += count;
                 capacity -= count;
                 for( ; offset >= size; cur += size, offset -= size )
                 {
-                    if( !ignore() ) { std::cout.write( cur, size ); }
+                    if( keep() ) { std::cout.write( cur, size ); }
                 }
                 if( capacity == 0 ) { cur = &buf[0]; offset = 0; capacity = buf.size(); }
                 std::cout.flush();
@@ -266,201 +221,12 @@ int main( int ac, char** av )
             while( std::cin.good() && !std::cin.eof() )
             {
                 std::getline( std::cin, line );
-                if( !line.empty() && !ignore() ) { std::cout << line << std::endl; }
+                if( !line.empty() && keep() ) { std::cout << line << std::endl; }
             }
         }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << "csv-size: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-size: unknown exception" << std::endl; }
-    usage();
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
+    return 1;
 }
-
-// // This file is part of comma, a generic and flexible library
-// // Copyright (c) 2011 The University of Sydney
-// // All rights reserved.
-// //
-// // Redistribution and use in source and binary forms, with or without
-// // modification, are permitted provided that the following conditions are met:
-// // 1. Redistributions of source code must retain the above copyright
-// //    notice, this list of conditions and the following disclaimer.
-// // 2. Redistributions in binary form must reproduce the above copyright
-// //    notice, this list of conditions and the following disclaimer in the
-// //    documentation and/or other materials provided with the distribution.
-// // 3. All advertising materials mentioning features or use of this software
-// //    must display the following acknowledgement:
-// //    This product includes software developed by the University of Sydney.
-// // 4. Neither the name of the University of Sydney nor the
-// //    names of its contributors may be used to endorse or promote products
-// //    derived from this software without specific prior written permission.
-// //
-// // NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// // GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// // HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// // WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// // MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// // DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// // BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-//
-// /// @author vsevolod vlaskine
-//
-// #ifdef WIN32
-// #include <stdio.h>
-// #include <fcntl.h>
-// #include <io.h>
-// #endif
-//
-// #include <iostream>
-// #include <boost/random/mersenne_twister.hpp>
-// #include <boost/random/uniform_real.hpp>
-// #include <boost/random/variate_generator.hpp>
-// #include <comma/application/command_line_options.h>
-// #include <comma/application/contact_info.h>
-// #include <comma/base/exception.h>
-// #include <comma/base/types.h>
-// #include <comma/io/file_descriptor.h>
-// #include <comma/math/compare.h>
-//
-// using namespace comma;
-//
-// static void usage()
-// {
-//     std::cerr << std::endl;
-//     std::cerr << "Read input data and thin them down by the given percentage;" << std::endl;
-//     std::cerr << "buffer handling optimized for a high-output producer" << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << "Usage: cat full.csv | csv-thin <rate> [<options>] > thinned.csv" << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << "e.g. output 70% of data:  cat full.csv | csv-thin 0.7 > thinned.csv" << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << "<options>" << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << "    --size,-s <size>: if given, data is packets of fixed size" << std::endl;
-//     std::cerr << "                      otherwise data is line-based" << std::endl;
-//     std::cerr << "    --deterministic,-d: if given, input is downsampled by a factor of int(1 / <rate>)." << std::endl;
-//     std::cerr << "                     That is, if <rate> is 0.33, output every third packet." << std::endl;
-//     std::cerr << "                     Default is to output each packet with a probability of <rate>." << std::endl;
-//     std::cerr << std::endl;
-//     std::cerr << comma::contact_info << std::endl;
-//     std::cerr << std::endl;
-//     exit( 1 );
-// }
-//
-// static double rate;
-// static bool deterministic;
-// static unsigned long long count_size;
-//
-// static bool ignore()
-// {
-//     if( deterministic )
-//     {
-//         static unsigned long long count = count_size - 1;
-//         if( ++count == count_size ) { count = 0; }
-//         if(rate<0.5)
-//         {
-//             return count != 0;
-//         }
-//         else
-//         {
-//             return count == 0;
-//         }
-//     }
-//     static boost::mt19937 rng;
-//     static boost::uniform_real<> dist( 0, 1 );
-//     static boost::variate_generator< boost::mt19937&, boost::uniform_real<> > random( rng, dist );
-//     static bool do_ignore = comma::math::less( rate, 1.0 );
-//     return do_ignore && random() > rate;
-//
-// }
-//
-// int main( int ac, char** av )
-// {
-//     try
-//     {
-//         comma::command_line_options options( ac, av );
-//         if( options.exists( "--help,-h" ) || ac == 1 ) { usage(); }
-//         bool binary = options.exists( "--size,-s" );
-//         deterministic = options.exists( "--deterministic,-d" );
-//         std::size_t size = options.value( "--size,-s", 0u );
-//         #ifdef WIN32
-//         if( binary ) { _setmode( _fileno( stdin ), _O_BINARY ); _setmode( _fileno( stdout ), _O_BINARY ); }
-//         #endif
-//         std::vector< std::string > v = options.unnamed( "--deterministic,-d", "-.*" );
-//         if( v.empty() ) { std::cerr << "csv-thin: please specify rate" << std::endl; usage(); }
-//         rate = boost::lexical_cast< double >( v[0] );
-//         if( comma::math::less( rate, 0 ) || comma::math::less( 1, rate ) ) { std::cerr << "csv-thin: expected rate between 0 and 1, got " << rate << std::endl; usage(); }
-//
-//         if( deterministic )
-//         {
-//             if(rate<0.5)
-//             {
-//                 count_size = static_cast< unsigned long long >( 1.0 / rate );
-//             }
-//             else
-//             {
-//                 count_size = static_cast< unsigned long long >( 1.0 / (1-rate) );
-//             }
-//         }
-//
-//         if( binary ) // quick and dirty, improve performance by reading larger buffer
-//         {
-//             unsigned int factor = 65536 / size; // arbitrary
-//             if( factor == 0 ) { factor = 1; }
-//             std::vector< char > buf( size * factor );
-//             #ifdef WIN32
-//             while( std::cin.good() && !std::cin.eof() )
-//             {
-//                 // it all does not seem to work: in_avail() always returns 0
-//                 //std::streamsize available = std::cin.rdbuf()->in_avail();
-//                 //if( available < 0 ) { continue; }
-//                 //if( available > 0 ) { std::cerr << "available = " << available << std::endl; }
-//                 //std::size_t e = available < int( size ) ? size : available - available % size;
-//                 std::cin.read( &buf[0], size ); // quick and dirty
-//                 if( std::cin.gcount() <= 0 ) { break; }
-//                 if( std::cin.gcount() < int( size ) ) { std::cerr << "csv-thin: expected " << size << " bytes; got only " << std::cin.gcount() << std::endl; exit( 1 ); }
-//                 { if( !ignore() ) { std::cout.write( &buf[0], size ); std::cout.flush(); } }
-//             }
-//             #else
-//             char* cur = &buf[0];
-//             unsigned int offset = 0;
-//             unsigned int capacity = buf.size();
-//             while( std::cin.good() && !std::cin.eof() )
-//             {
-//                 int count = ::read( comma::io::stdin_fd, cur + offset, capacity );
-//                 if( count <= 0 )
-//                 {
-//                     if( offset != 0 ) { std::cerr << "csv-thin: expected at least " << size << " bytes, got only " << offset << std::endl; return 1; }
-//                     break;
-//                 }
-//                 offset += count;
-//                 capacity -= count;
-//                 for( ; offset >= size; cur += size, offset -= size )
-//                 {
-//                     if( !ignore() ) { std::cout.write( cur, size ); }
-//                 }
-//                 if( capacity == 0 ) { cur = &buf[0]; offset = 0; capacity = buf.size(); }
-//                 std::cout.flush();
-//             }
-//             #endif
-//         }
-//         else
-//         {
-//             std::string line;
-//             while( std::cin.good() && !std::cin.eof() )
-//             {
-//                 std::getline( std::cin, line );
-//                 if( !line.empty() && !ignore() ) { std::cout << line << std::endl; }
-//             }
-//         }
-//         return 0;
-//     }
-//     catch( std::exception& ex ) { std::cerr << "csv-size: " << ex.what() << std::endl; }
-//     catch( ... ) { std::cerr << "csv-size: unknown exception" << std::endl; }
-//     usage();
-// }
diff --git a/csv/applications/csv-time-delay.cpp b/csv/applications/csv-time-delay.cpp
index 187838166..2b715a8ae 100644
--- a/csv/applications/csv-time-delay.cpp
+++ b/csv/applications/csv-time-delay.cpp
@@ -33,7 +33,6 @@
 #include <iostream>
 #include <string>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../name_value/parser.h"
@@ -50,7 +49,6 @@ static void usage()
     std::cerr << "<options>" << std::endl;
     std::cerr << comma::csv::options::usage( "t" ) << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( -1 );
 }
@@ -78,7 +76,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av );
         if( options.exists( "--help" ) || options.exists( "-h" ) || ac == 1 ) { usage(); }
-        const std::vector< std::string >& v = options.unnamed( "--flush", "--binary,-b,--delimiter,-d,--fields,-f,--full-xpath,--precision,--quote" );
+        const std::vector< std::string >& v = options.unnamed( "--flush", "--binary,-b,--delimiter,-d,--fields,-f,--precision,--quote" );
         if( v.empty() ) { std::cerr << "csv-time-delay: expected time delay, got none" << std::endl; return 1; }
         double d = boost::lexical_cast< double >( v[0] );
         int sign = d < 0 ? -1 : 1;
@@ -90,6 +88,7 @@ int main( int ac, char** av )
         microseconds *= sign;
         boost::posix_time::time_duration delay = boost::posix_time::minutes( minutes ) + boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( microseconds );
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         comma::csv::input_stream< Point > istream( std::cin, csv );
         comma::csv::output_stream< Point > ostream( std::cout, csv );
         while( std::cin.good() && !std::cin.eof() )
diff --git a/csv/applications/csv-time-join.cpp b/csv/applications/csv-time-join.cpp
index 80e3ef85b..227f8fea0 100644
--- a/csv/applications/csv-time-join.cpp
+++ b/csv/applications/csv-time-join.cpp
@@ -1,476 +1,433 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-
-/// @author vsevolod vlaskine
-
-#include <deque>
-#include <iostream>
-#include <string>
-#include <boost/date_time/posix_time/posix_time.hpp>
-#include <boost/optional.hpp>
-#include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
-#include "../../application/signal_flag.h"
-#include "../../base/types.h"
-#include "../../csv/stream.h"
-#include "../../io/stream.h"
-#include "../../csv/traits.h"
-#include "../../io/select.h"
-#include "../../name_value/parser.h"
-#include "../../string/string.h"
-#include "../../visiting/traits.h"
-
-static void bash_completion( unsigned const ac, char const * const * av )
-{
-    static const char* completion_options =
-        " --help --verbose"
-        " --by-lower --by-upper --nearest --realtime"
-        " --binary --delimiter --fields"
-        " --bound --do-not-append --select --timestamp-only"
-        " --buffer --discard-bounding"
-        ;
-    std::cout << completion_options << std::endl;
-    exit( 0 );
-}
-
-static void usage( bool verbose )
-{
-    std::cerr << std::endl;
-    std::cerr << "join timestamped data from stdin with corresponding timestamped data from the" << std::endl;
-    std::cerr << "second input" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "timestamps are expected to be fully ordered" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "note: on windows only files are supported as bounding data" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: cat a.csv | csv-time-join <how> [<options>] bounding.csv [-] > joined.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<how>" << std::endl;
-    std::cerr << "    --by-lower: join by lower timestamp (default)" << std::endl;
-    std::cerr << "    --by-upper: join by upper timestamp" << std::endl;
-    std::cerr << "    --nearest:  join by nearest timestamp" << std::endl;
-    std::cerr << "                if 'block' given in --fields, output the whole block" << std::endl;
-    std::cerr << "    --realtime: (streams only) output input immediately joined with current" << std::endl;
-    std::cerr << "                latest bounding timestamp. The joined bounding timestamp may" << std::endl;
-    std::cerr << "                be less than or greater than the timestamp from stdin." << std::endl;
-    std::cerr << "                No timestamp comparisons are made before outputting a record." << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<input/output options>" << std::endl;
-    std::cerr << "    -: if csv-time-join - b.csv, concatenate output as: <stdin><b.csv>" << std::endl;
-    std::cerr << "       if csv-time-join b.csv -, concatenate output as: <b.csv><stdin>" << std::endl;
-    std::cerr << "       default: csv-time-join - b.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    --help,-h:                  this help" << std::endl;
-    std::cerr << "    --verbose,-v:               more output" << std::endl;
-    std::cerr << "    --binary,-b <format>:       binary format" << std::endl;
-    std::cerr << "    --delimiter,-d <delimiter>: ascii only; default ','" << std::endl;
-    std::cerr << "    --fields,-f <fields>:       input fields; default: t" << std::endl;
-    std::cerr << "    --bound=<seconds>:          output only points within given bound" << std::endl;
-    std::cerr << "    --do-not-append,--select:   do not append any field from the second input" << std::endl;
-    std::cerr << "    --timestamp-only:           append only timestamp from the second input" << std::endl;
-    std::cerr << "    --buffer:                   bounding data buffer size; default: infinite" << std::endl;
-    std::cerr << "    --discard-bounding:         discard bounding data if buffer size reached;" << std::endl;
-    std::cerr << "                                default is to block until stdin catches up" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << "    first field on stdin is timestamp, the first field of filter is timestamp" << std::endl;
-    std::cerr << "        - default:" << std::endl;
-    std::cerr << "            cat a.csv | csv-time-join b.csv" << std::endl;
-    std::cerr << "        - explicit:" << std::endl;
-    std::cerr << "            cat a.csv | csv-time-join --fields=t \"b.csv;fields=t\"" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    3rd field on stdin is timestamp, the 2nd field of filter is timestamp" << std::endl;
-    std::cerr << "        cat a.csv | csv-time-join --fields=,,t \"b.csv;fields=,t\"" << std::endl;
-    std::cerr << std::endl;
-    if( verbose )
-    {
-        std::cerr << "    echo \"20170101T115955,a\" >  a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120001,b\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120002,c\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120007,d\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120012,e\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120015,f\" >> a.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120000,y\" >  b.csv" << std::endl;
-        std::cerr << "    echo \"20170101T120010,z\" >> b.csv" << std::endl;
-        std::cerr << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --by-upper" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2 --select" << std::endl;
-        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2 --timestamp-only" << std::endl;
-        std::cerr << std::endl;
-        std::cerr << "    ( sleep 1; cat a.csv ) | csv-play |" << std::endl;
-        std::cerr << "        csv-time-join --realtime <( cat b.csv | csv-play )" << std::endl;
-}
-    else
-    {
-        std::cerr << "    try --help --verbose for more examples" << std::endl;
-    }
-    std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( 0 );
-}
-
-struct Point
-{
-    boost::optional<boost::posix_time::ptime> timestamp;
-    Point() {}
-    Point( const boost::posix_time::ptime& timestamp ) : timestamp( timestamp ) {}
-};
-
-namespace comma { namespace visiting {
-
-template <> struct traits< Point >
-{
-    template < typename K, typename V > static void visit( const K&, const Point& p, V& v )
-    { 
-        v.apply( "t", p.timestamp );
-    }
-    
-    template < typename K, typename V > static void visit( const K&, Point& p, V& v )
-    {
-        v.apply( "t", p.timestamp );
-    }
-};
-    
-} } // namespace comma { namespace visiting {
-
-enum class how { by_lower, by_upper, nearest, realtime };
-how method = how::by_lower;
-bool timestamp_only;
-bool select_only;
-
-comma::csv::options stdin_csv;
-comma::csv::options bounding_csv;
-boost::optional< boost::posix_time::time_duration > bound;
-
-typedef std::pair< boost::posix_time::ptime, std::string > timestring_t;
-
-boost::posix_time::ptime get_time( const Point& p )
-{
-    return p.timestamp ? *p.timestamp : boost::posix_time::microsec_clock::universal_time();
-}
-
-static void output_bounding( std::ostream& os, const timestring_t& bounding, bool stdin_first )
-{
-    if( !select_only )
-    {
-        if( stdin_csv.binary() )
-        {
-            if( timestamp_only )
-            {
-                static const unsigned int time_size = comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::size;
-                static char timestamp[ time_size ];
-                comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::to_bin( bounding.first, timestamp );
-                os.write( (char*)&timestamp, time_size );
-            }
-            else
-            {
-                os.write( &bounding.second[0], bounding.second.size() );
-            }
-        }
-        else
-        {
-            if( stdin_first ) { os << stdin_csv.delimiter; }
-            os << ( timestamp_only ? boost::posix_time::to_iso_string( bounding.first ) : bounding.second );
-            if( !stdin_first ) { os << stdin_csv.delimiter; }
-        }
-    }
-}
-
-static void output_input( std::ostream& os, const timestring_t& input )
-{
-    if( stdin_csv.binary() ) { os.write( &input.second[0], stdin_csv.format().size() ); }
-    else { os << input.second; }
-}
-
-static void output( const timestring_t& input, const timestring_t& bounding, bool stdin_first )
-{
-    if( bounding.first.is_infinity() ) { return; }
-
-    if( bound && ( input.first - bounding.first > bound || bounding.first - input.first > bound )) { return; }
-
-    if( stdin_first )
-    {
-        output_input( std::cout, input );
-        output_bounding( std::cout, bounding, stdin_first );
-    }
-    else
-    {
-        output_bounding( std::cout, bounding, stdin_first );
-        output_input( std::cout, input );
-    }
-
-    if( !stdin_csv.binary() ) { std::cout << '\n'; }
-    std::cout.flush();
-}
-
-int main( int ac, char** av )
-{
-    try
-    {
-        comma::signal_flag is_shutdown(comma::signal_flag::hard);
-        comma::command_line_options options( ac, av, usage );
-
-        if( options.exists( "--bash-completion" )) bash_completion( ac, av );
-        options.assert_mutually_exclusive( "--by-lower,--by-upper,--nearest,--realtime" );
-        if( options.exists( "--by-upper" )) { method = how::by_upper; }
-        if( options.exists( "--nearest" )) { method = how::nearest; }
-        if( options.exists( "--realtime" )) { method = how::realtime; }
-        timestamp_only = options.exists( "--timestamp-only,--time-only" );
-        select_only = options.exists( "--do-not-append,--select" );
-        if( select_only && timestamp_only ) { std::cerr << "csv-time-join: --timestamp-only specified with --select, ignoring --timestamp-only" << std::endl; }
-        bool discard_bounding = options.exists( "--discard-bounding" );
-        boost::optional< unsigned int > buffer_size = options.optional< unsigned int >( "--buffer" );
-        if( options.exists( "--bound" ) ) { bound = boost::posix_time::microseconds( static_cast<unsigned int>(options.value< double >( "--bound" ) * 1000000 )); }
-        stdin_csv = comma::csv::options( options, "t" );
-
-        std::vector< std::string > unnamed = options.unnamed(
-            "--by-lower,--by-upper,--nearest,--realtime,--select,--do-not-append,--timestamp-only,--time-only,--discard-bounding",
-            "--binary,-b,--delimiter,-d,--fields,-f,--bound,--buffer,--verbose,-v" );
-        std::string properties;
-        bool stdin_first = true;
-        switch( unnamed.size() )
-        {
-            case 0:
-                std::cerr << "csv-time-join: please specify bounding source" << std::endl;
-                return 1;
-            case 1:
-                properties = unnamed[0];
-                break;
-            case 2:
-                if( unnamed[0] == "-" ) { properties = unnamed[1]; }
-                else if( unnamed[1] == "-" ) { properties = unnamed[0]; stdin_first = false; }
-                else { std::cerr << "csv-time-join: expected either '- <bounding>' or '<bounding> -'; got : " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
-                break;
-            default:
-                std::cerr << "csv-time-join: expected either '- <bounding>' or '<bounding> -'; got : " << comma::join( unnamed, ' ' ) << std::endl;
-                return 1;
-        }
-        comma::name_value::parser parser( "filename" );
-        bounding_csv = parser.get< comma::csv::options >( properties );
-        if( bounding_csv.fields.empty() ) { bounding_csv.fields = "t"; }
-
-        comma::csv::input_stream< Point > stdin_stream( std::cin, stdin_csv );
-        #ifdef WIN32
-        if( stdin_csv.binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
-        #endif // #ifdef WIN32
-
-        comma::io::istream bounding_istream( comma::split( properties, ';' )[0]
-                                           , bounding_csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii );
-        comma::csv::input_stream< Point > bounding_stream( *bounding_istream, bounding_csv );
-
-        #ifndef WIN32
-        comma::io::select select;
-        comma::io::select bounding_stream_select;
-        select.read().add( 0 );
-        select.read().add( bounding_istream.fd() );
-        bounding_stream_select.read().add( bounding_istream.fd() );
-        #endif // #ifndef WIN32
-
-        const Point* p = NULL;
-
-        if( method == how::realtime )
-        {
-            #ifndef WIN32
-            bool end_of_input = false;
-            bool end_of_bounds = false;
-            
-            boost::optional<timestring_t> joined_line;
-            
-            while (!is_shutdown && !end_of_input)
-            {
-                if ( !bounding_stream.ready() && !stdin_stream.ready() )
-                {
-                    select.wait(boost::posix_time::milliseconds(1));
-                }
-                
-                if ( !is_shutdown && !end_of_input && ( stdin_stream.ready() || ( select.check() && select.read().ready( comma::io::stdin_fd ) ) ) )
-                {
-                    p = stdin_stream.read();
-                    if( p )
-                    {
-                        timestring_t input_line = std::make_pair( get_time( *p ), stdin_stream.last() );
-                        if( joined_line ) { output( input_line, *joined_line, stdin_first ); }
-                    }
-                    else
-                    {
-                        comma::verbose << "end of input stream" << std::endl;
-                        end_of_input = true;
-                    }
-                }
-                
-                if ( !is_shutdown && !end_of_bounds &&
-                   ( bounding_stream.ready() || ( select.check() && select.read().ready( bounding_istream.fd() ))))
-                {
-                    p = bounding_stream.read();
-                    if( p )
-                    {
-                        joined_line = std::make_pair( get_time( *p ), bounding_stream.last() );
-                    }
-                    else
-                    {
-                        comma::verbose << "end of bounding stream" << std::endl;
-                        end_of_bounds = true;
-                    }
-                }
-            }
-            if (is_shutdown) { comma::verbose << "got a signal" << std::endl; return 0; }
-            #else
-            COMMA_THROW(comma::exception, "--realtime mode not supported in WIN32");
-            #endif
-        }
-        else
-        {
-            std::deque<timestring_t> bounding_queue;
-            bool next = true;
-            bool bounding_data_available;
-            bool upper_bound_added = false;
-
-            // add a fake entry for an lower bound to allow stdin before first bound to match
-            bounding_queue.push_back( std::make_pair( boost::posix_time::neg_infin, "" ));
-
-            while( ( stdin_stream.ready() || ( std::cin.good() && !std::cin.eof() ) ) )
-            {
-                if( !std::cin.good() ) { select.read().remove( 0 ); }
-                if( !bounding_istream->good() ) { select.read().remove( bounding_istream.fd() ); }
-                bounding_data_available = bounding_stream.ready() || ( bounding_istream->good() && !bounding_istream->eof() );
-                #ifdef WIN32
-                bool bounding_stream_ready = true;
-                bool stdin_stream_ready = true;
-                #else // #ifdef WIN32
-                //check so we do not block
-                bool bounding_stream_ready = bounding_stream.ready();
-                bool stdin_stream_ready = stdin_stream.ready();
-
-                if( next )
-                {
-                    if( !bounding_stream_ready || !stdin_stream_ready )
-                    {
-                        if( !bounding_stream_ready && !stdin_stream_ready )
-                        {
-                            select.wait( boost::posix_time::milliseconds(10) );
-                        }
-                        else
-                        {
-                            select.check();
-                        }
-                        if( select.read().ready( bounding_istream.fd() )) { bounding_stream_ready = true; }
-                        if( select.read().ready(0) ) { stdin_stream_ready=true; }
-                    }
-                }
-                else
-                {
-                    if( !bounding_stream_ready )
-                    {
-                        bounding_stream_select.wait( boost::posix_time::milliseconds(10) );
-                        if( bounding_stream_select.read().ready( bounding_istream.fd() )) { bounding_stream_ready=true; }
-                    }
-                }
-                #endif //#ifdef WIN32
-
-                //keep storing available bounding data
-                if( bounding_stream_ready )
-                {
-                    if( !buffer_size || bounding_queue.size() < *buffer_size || discard_bounding )
-                    {
-                        const Point* q = bounding_stream.read();
-                        if( q )
-                        {
-                            bounding_queue.push_back( std::make_pair( get_time( *q ), bounding_stream.last() ));
-                        }
-                        else
-                        {
-                            bounding_data_available=false;
-                        }
-                    }
-                    if( buffer_size && bounding_queue.size() > *buffer_size && discard_bounding )
-                    {
-                        bounding_queue.pop_front();
-                    }
-                }
-                if( !upper_bound_added && bounding_istream->eof() )
-                {
-                    // add a fake entry for an upper bound to allow stdin data above last bound to match
-                    bounding_queue.push_back( std::make_pair( boost::posix_time::pos_infin, "" ));
-                    upper_bound_added = true;
-                }
-
-                //if we are done with the last bounded point get next
-                if( next )
-                {
-                    if(!stdin_stream_ready) { continue; }
-                    p = stdin_stream.read();
-                    if( !p ) { break; }
-                }
-
-                boost::posix_time::ptime t = get_time(*p);
-              
-                //get bound
-                while(bounding_queue.size()>=2)
-                {
-                    if( t < bounding_queue[1].first ) { break; }
-                    bounding_queue.pop_front();
-                }
-
-                if(bounding_queue.size()<2)
-                {
-                    //bound not found
-                    //do we have more data?
-                    if(!bounding_data_available) { break; }
-                    next=false;
-                    continue;
-                }
-
-                //bound available
-
-                if( method == how::by_lower && t < bounding_queue.front().first )
-                {
-                    next = true;
-                    continue;
-                }
-
-                bool is_first = ( method == how::by_lower )
-                    || ( method == how::nearest && ( t - bounding_queue[0].first ) < ( bounding_queue[1].first - t ));
-
-                const timestring_t& chosen_bound = is_first ? bounding_queue[0] : bounding_queue[1];;
-                timestring_t input_line = std::make_pair( t, stdin_stream.last() );
-
-                output( input_line, chosen_bound, stdin_first );
-                next=true;
-            }
-        }
-        return 0;     
-    }
-    catch( std::exception& ex ) { std::cerr << "csv-time-join: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "csv-time-join: unknown exception" << std::endl; }
-}
+// This file is part of comma, a generic and flexible library
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+
+/// @author vsevolod vlaskine
+
+#include <cmath>
+#include <deque>
+#include <iostream>
+#include <string>
+#include <boost/date_time/posix_time/posix_time.hpp>
+#include <boost/optional.hpp>
+#include "../../application/command_line_options.h"
+#include "../../application/signal_flag.h"
+#include "../../base/types.h"
+#include "../../csv/stream.h"
+#include "../../io/stream.h"
+#include "../../csv/traits.h"
+#include "../../io/select.h"
+#include "../../name_value/parser.h"
+#include "../../string/string.h"
+#include "../../visiting/traits.h"
+
+static void bash_completion( unsigned const ac, char const * const * av ) // print the completion words to stdout and exit with status 0; ac and av are not used
+{
+    static const char* completion_options =
+        " --help --verbose"
+        " --by-lower --by-upper --nearest --realtime"
+        " --binary --delimiter --fields"
+        " --bound --do-not-append --select --timestamp-only --time-only"
+        " --output-diff --diff --output-diff-abs --abs-diff" // keep in sync with the options parsed in main()
+        " --buffer --discard-bounding";
+    std::cout << completion_options << std::endl;
+    exit( 0 );
+}
+
+static void usage( bool verbose ) // print help to stderr (with the extended examples if verbose), then exit with status 0
+{
+    std::cerr << std::endl;
+    std::cerr << "join timestamped data from stdin with corresponding timestamped data from the" << std::endl;
+    std::cerr << "second input" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "timestamps are expected to be fully ordered" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "note: on windows only files are supported as bounding data" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: cat a.csv | csv-time-join <how> [<options>] bounding.csv [-] > joined.csv" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "<how>" << std::endl;
+    std::cerr << "    --by-lower: join by lower timestamp (default)" << std::endl;
+    std::cerr << "    --by-upper: join by upper timestamp" << std::endl;
+    std::cerr << "    --nearest:  join by nearest timestamp" << std::endl;
+    std::cerr << "                if 'block' given in --fields, output the whole block" << std::endl;
+    std::cerr << "    --realtime: (streams only) output input immediately joined with current" << std::endl;
+    std::cerr << "                latest bounding timestamp. The joined bounding timestamp may" << std::endl;
+    std::cerr << "                be less than or greater than the timestamp from stdin." << std::endl;
+    std::cerr << "                No timestamp comparisons are made before outputting a record." << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "<input/output options>" << std::endl;
+    std::cerr << "    -: if csv-time-join - b.csv, concatenate output as: <stdin><b.csv>" << std::endl;
+    std::cerr << "       if csv-time-join b.csv -, concatenate output as: <b.csv><stdin>" << std::endl;
+    std::cerr << "       default: csv-time-join - b.csv" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    --help,-h:                    this help" << std::endl;
+    std::cerr << "    --verbose,-v:                 more output" << std::endl;
+    std::cerr << "    --binary,-b <format>:         binary format" << std::endl;
+    std::cerr << "    --delimiter,-d <delimiter>:   ascii only; default ','" << std::endl;
+    std::cerr << "    --fields,-f <fields>:         input fields; default: t" << std::endl;
+    std::cerr << "    --bound=[<seconds>]:          output only points within given bound" << std::endl;
+    std::cerr << "    --buffer=[<records>]:         bounding data buffer size; default: infinite" << std::endl;
+    std::cerr << "    --discard-bounding:           discard bounding data if buffer size reached;" << std::endl;
+    std::cerr << "                                  default is to block until stdin catches up" << std::endl;
+    std::cerr << "    --do-not-append,--select:     do not append any field from the second input" << std::endl;
+    std::cerr << "    --output-diff-abs,--abs-diff: append abs difference between first and second" << std::endl;
+    std::cerr << "                                  input timestamps as seconds (double)" << std::endl;
+    std::cerr << "    --output-diff,--diff:         append difference between first and second" << std::endl;
+    std::cerr << "                                  input timestamps as seconds (double)" << std::endl;
+    std::cerr << "    --timestamp-only,--time-only: append only timestamp from the second input" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "examples" << std::endl;
+    std::cerr << "    first field on stdin is timestamp, the first field of filter is timestamp" << std::endl;
+    std::cerr << "        - default:" << std::endl;
+    std::cerr << "            cat a.csv | csv-time-join b.csv" << std::endl;
+    std::cerr << "        - explicit:" << std::endl;
+    std::cerr << "            cat a.csv | csv-time-join --fields=t \"b.csv;fields=t\"" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    3rd field on stdin is timestamp, the 2nd field of filter is timestamp" << std::endl;
+    std::cerr << "        cat a.csv | csv-time-join --fields=,,t \"b.csv;fields=,t\"" << std::endl;
+    std::cerr << std::endl;
+    if( verbose )
+    {
+        std::cerr << "    echo \"20170101T115955,a\" >  a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120001,b\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120002,c\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120007,d\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120012,e\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120015,f\" >> a.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120000,y\" >  b.csv" << std::endl;
+        std::cerr << "    echo \"20170101T120010,z\" >> b.csv" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --by-upper" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2 --select" << std::endl;
+        std::cerr << "    cat a.csv | csv-time-join b.csv --nearest --bound=2 --timestamp-only" << std::endl;
+        std::cerr << std::endl;
+        std::cerr << "    ( sleep 1; cat a.csv ) | csv-play |" << std::endl;
+        std::cerr << "        csv-time-join --realtime <( cat b.csv | csv-play )" << std::endl;
+    }
+    else
+    {
+        std::cerr << "    try --help --verbose for more examples" << std::endl;
+    }
+    std::cerr << std::endl;
+    std::cerr << std::endl;
+    exit( 0 );
+}
+
+struct Point // input record as seen by this application: only its optional timestamp is of interest
+{
+    boost::optional< boost::posix_time::ptime > timestamp; // left empty by the default constructor; get_time() then falls back to the current time
+    Point() {}
+    Point( const boost::posix_time::ptime& t ) : timestamp( t ) {}
+};
+
+namespace comma { namespace visiting {
+
+// visiting traits for Point: both overloads hand the timestamp member to the visitor under the name "t"
+template <> struct traits< Point >
+{
+    template < typename Key, typename Visitor > static void visit( const Key&, const Point& point, Visitor& visitor ) { visitor.apply( "t", point.timestamp ); } // const point
+    template < typename Key, typename Visitor > static void visit( const Key&, Point& point, Visitor& visitor ) { visitor.apply( "t", point.timestamp ); } // non-const point
+};
+} } // namespace comma { namespace visiting {
+
+enum class how { by_lower, by_upper, nearest, realtime }; // join methods, one per <how> option described in usage()
+static how method = how::by_lower; // join method in effect; main() overrides it for --by-upper, --nearest and --realtime
+static bool timestamp_only; // set from --timestamp-only,--time-only: append only the bounding timestamp
+static bool output_diff_abs; // set from --output-diff-abs,--abs-diff
+static bool output_diff; // set from --output-diff,--diff
+static bool select_only; // set from --do-not-append,--select: output_bounding() then writes nothing
+static comma::csv::options stdin_csv; // csv options for stdin; the output functions also take the delimiter and binary/ascii choice from it
+static comma::csv::options bounding_csv; // csv options for the bounding input, parsed from its name-value string in main()
+static boost::optional< boost::posix_time::time_duration > bound; // set from --bound; when set, output() skips pairs further apart than this
+typedef std::pair< boost::posix_time::ptime, std::string > timestring_t; // a timestamp together with the record returned by input_stream::last()
+
+static boost::posix_time::ptime get_time( const Point& p ) { if( p.timestamp ) { return *p.timestamp; } return boost::posix_time::microsec_clock::universal_time(); } // timestamp of p or, if p has none, the current UTC time
+
+// Write the bounding part of a joined record to os; writes nothing when select_only is set.
+// ascii:  the bounding record, or only its timestamp as an iso string if timestamp_only, with the
+//         delimiter before it if stdin_first and after it otherwise
+// binary: the bounding record bytes as is, or only its timestamp converted to binary if timestamp_only
+static void output_bounding( std::ostream& os, const timestring_t& bounding, bool stdin_first )
+{
+    if( select_only ) { return; }
+    if( !stdin_csv.binary() ) // ascii or binary is decided by the stdin options, not by bounding_csv
+    {
+        if( stdin_first ) { os << stdin_csv.delimiter; }
+        if( timestamp_only ) { os << boost::posix_time::to_iso_string( bounding.first ); }
+        else { os << bounding.second; }
+        if( !stdin_first ) { os << stdin_csv.delimiter; }
+        return;
+    }
+    if( !timestamp_only )
+    {
+        os.write( &bounding.second[0], bounding.second.size() );
+        return;
+    }
+    typedef comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time > time_traits;
+    static const unsigned int time_size = time_traits::size;
+    static char buffer[ time_size ]; // static scratch buffer, reused by every call
+    time_traits::to_bin( bounding.first, buffer );
+    os.write( buffer, time_size );
+}
+
+static void _output_diff( std::ostream& os, boost::posix_time::ptime bounded, boost::posix_time::ptime bounding ) // append ( bounded - bounding ) in seconds; NOTE(review): names starting with an underscore are reserved at global scope, consider renaming together with the caller
+{
+    if( !( output_diff || output_diff_abs ) ) { return; } // neither --output-diff nor --output-diff-abs requested
+    const double signed_seconds = static_cast< double >( ( bounded - bounding ).total_microseconds() ) * 1e-6;
+    const double seconds = output_diff_abs ? std::abs( signed_seconds ) : signed_seconds;
+    if( !stdin_csv.binary() ) { os << stdin_csv.delimiter << seconds; } else { os.write( reinterpret_cast< const char* >( &seconds ), sizeof( double ) ); } // ascii: formatted with the current stream settings; binary: the raw bytes of the double
+}
+
+static void output_input( std::ostream& os, const timestring_t& input ) // write the stdin record: ascii as is, binary as stdin_csv.format().size() bytes
+{
+    if( !stdin_csv.binary() ) { os << input.second; } else { os.write( &input.second[0], stdin_csv.format().size() ); }
+}
+
+// Write one joined record to stdout and flush: the stdin record and the bounding part in the order given by
+// stdin_first, then the optional time difference, then a newline in ascii mode. Nothing is written if the bounding
+// timestamp is infinite, or if bound is set and the two timestamps are further apart than bound in either direction.
+static void output( const timestring_t& input, const timestring_t& bounding, bool stdin_first )
+{
+    if( bounding.first.is_infinity() ) { return; } // e.g. the fake lower bound main() seeds the bounding queue with
+    if( bound )
+    {
+        if( input.first - bounding.first > bound ) { return; }
+        if( bounding.first - input.first > bound ) { return; }
+    }
+    if( !stdin_first ) { output_bounding( std::cout, bounding, stdin_first ); }
+    output_input( std::cout, input );
+    if( stdin_first ) { output_bounding( std::cout, bounding, stdin_first ); }
+    _output_diff( std::cout, input.first, bounding.first );
+    if( !stdin_csv.binary() ) { std::cout << '\n'; }
+    std::cout.flush();
+}
+
+int main( int ac, char** av )
+{
+    try
+    {
+        comma::signal_flag is_shutdown(comma::signal_flag::hard);
+        comma::command_line_options options( ac, av, usage );
+        if( options.exists( "--bash-completion" )) bash_completion( ac, av );
+        options.assert_mutually_exclusive( "--by-lower,--by-upper,--nearest,--realtime" );
+        options.assert_mutually_exclusive( "--output-diff,--diff", "--output-diff-abs,--abs-diff" );
+        if( options.exists( "--by-upper" )) { method = how::by_upper; }
+        if( options.exists( "--nearest" )) { method = how::nearest; }
+        if( options.exists( "--realtime" )) { method = how::realtime; }
+        timestamp_only = options.exists( "--timestamp-only,--time-only" );
+        output_diff = options.exists( "--output-diff,--diff" );
+        output_diff_abs = options.exists( "--output-diff-abs,--abs-diff" );
+        select_only = options.exists( "--do-not-append,--select" );
+        if( select_only && timestamp_only ) { std::cerr << "csv-time-join: --timestamp-only specified with --select, ignoring --timestamp-only" << std::endl; }
+        bool discard_bounding = options.exists( "--discard-bounding" );
+        boost::optional< unsigned int > buffer_size = options.optional< unsigned int >( "--buffer" );
+        if( options.exists( "--bound" ) ) { bound = boost::posix_time::microseconds( static_cast<unsigned int>(options.value< double >( "--bound" ) * 1000000 )); }
+        stdin_csv = comma::csv::options( options, "t" );
+        std::vector< std::string > unnamed = options.unnamed(
+            "--by-lower,--by-upper,--nearest,--realtime,--select,--do-not-append,--timestamp-only,--time-only,--discard-bounding",
+            "--binary,-b,--delimiter,-d,--fields,-f,--bound,--buffer,--verbose,-v,--output-diff-abs,--abs-diff,--diff-abs,--diff" );
+        std::string properties;
+        bool stdin_first = true;
+        switch( unnamed.size() )
+        {
+            case 0:
+                std::cerr << "csv-time-join: please specify bounding source" << std::endl;
+                return 1;
+            case 1:
+                properties = unnamed[0];
+                break;
+            case 2:
+                if( unnamed[0] == "-" ) { properties = unnamed[1]; }
+                else if( unnamed[1] == "-" ) { properties = unnamed[0]; stdin_first = false; }
+                else { std::cerr << "csv-time-join: expected either '- <bounding>' or '<bounding> -'; got : " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
+                break;
+            default:
+                std::cerr << "csv-time-join: expected either '- <bounding>' or '<bounding> -'; got : " << comma::join( unnamed, ' ' ) << std::endl;
+                return 1;
+        }
+        comma::name_value::parser parser( "filename" );
+        bounding_csv = parser.get< comma::csv::options >( properties );
+        if( bounding_csv.fields.empty() ) { bounding_csv.fields = "t"; }
+
+        comma::csv::input_stream< Point > stdin_stream( std::cin, stdin_csv );
+        #ifdef WIN32
+        if( stdin_csv.binary() ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        #endif // #ifdef WIN32
+
+        comma::io::istream bounding_istream( comma::split( properties, ';' )[0], bounding_csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii );
+        comma::csv::input_stream< Point > bounding_stream( *bounding_istream, bounding_csv );
+
+        #ifndef WIN32
+        comma::io::select select;
+        comma::io::select bounding_stream_select;
+        select.read().add( 0 );
+        select.read().add( bounding_istream.fd() );
+        bounding_stream_select.read().add( bounding_istream.fd() );
+        #endif // #ifndef WIN32
+
+        const Point* p = NULL;
+        if( method == how::realtime )
+        {
+            #ifdef WIN32
+            COMMA_THROW( comma::exception, "--realtime mode not supported in WIN32" );
+            #else
+            bool end_of_input = false;
+            bool end_of_bounds = false;
+            boost::optional< timestring_t > joined_line;
+            while( !is_shutdown && !end_of_input )
+            {
+                if( !bounding_stream.ready() && !stdin_stream.ready() ) { select.wait(boost::posix_time::milliseconds(1)); }
+                if( !is_shutdown && !end_of_input && ( stdin_stream.ready() || ( select.check() && select.read().ready( comma::io::stdin_fd ) ) ) )
+                {
+                    p = stdin_stream.read();
+                    if( p )
+                    {
+                        timestring_t input_line = std::make_pair( get_time( *p ), stdin_stream.last() );
+                        if( joined_line ) { output( input_line, *joined_line, stdin_first ); }
+                    }
+                    else
+                    {
+                        comma::verbose << "end of input stream" << std::endl;
+                        end_of_input = true;
+                    }
+                }
+                if( !is_shutdown && !end_of_bounds && ( bounding_stream.ready() || ( select.check() && select.read().ready( bounding_istream.fd() ) ) ) )
+                {
+                    p = bounding_stream.read();
+                    if( p )
+                    {
+                        joined_line = std::make_pair( get_time( *p ), bounding_stream.last() );
+                    }
+                    else
+                    {
+                        comma::verbose << "end of bounding stream" << std::endl;
+                        end_of_bounds = true;
+                    }
+                }
+            }
+            if( is_shutdown ) { comma::verbose << "got a signal" << std::endl; return 0; }
+            #endif // #ifdef WIN32
+        }
+        else
+        {
+            std::deque< timestring_t > bounding_queue;
+            bool next = true;
+            bool bounding_data_available;
+            bool upper_bound_added = false;
+            bounding_queue.push_back( std::make_pair( boost::posix_time::neg_infin, "" ) ); // add a fake entry for a lower bound to allow stdin data before the first bound to match
+            while( stdin_stream.ready() || ( std::cin.good() && !std::cin.eof() ) )
+            {
+                if( !std::cin.good() ) { select.read().remove( 0 ); }
+                if( !bounding_istream->good() ) { select.read().remove( bounding_istream.fd() ); }
+                bounding_data_available = bounding_stream.ready() || ( bounding_istream->good() && !bounding_istream->eof() );
+                #ifdef WIN32
+                bool bounding_stream_ready = true;
+                bool stdin_stream_ready = true;
+                #else // #ifdef WIN32
+                //check so we do not block
+                bool bounding_stream_ready = bounding_stream.ready();
+                bool stdin_stream_ready = stdin_stream.ready();
+                if( next )
+                {
+                    if( !bounding_stream_ready || !stdin_stream_ready )
+                    {
+                        if( !bounding_stream_ready && !stdin_stream_ready ) { select.wait( boost::posix_time::milliseconds( 10 ) ); }
+                        else { select.check(); }
+                        if( select.read().ready( bounding_istream.fd() )) { bounding_stream_ready = true; }
+                        if( select.read().ready(0) ) { stdin_stream_ready = true; }
+                    }
+                }
+                else
+                {
+                    if( !bounding_stream_ready )
+                    {
+                        bounding_stream_select.wait( boost::posix_time::milliseconds( 10 ) );
+                        if( bounding_stream_select.read().ready( bounding_istream.fd() )) { bounding_stream_ready=true; }
+                    }
+                }
+                #endif //#ifdef WIN32
+                //keep storing available bounding data
+                if( bounding_stream_ready )
+                {
+                    if( !buffer_size || bounding_queue.size() < *buffer_size || discard_bounding )
+                    {
+                        const Point* q = bounding_stream.read();
+                        if( q ) { bounding_queue.push_back( std::make_pair( get_time( *q ), bounding_stream.last() )); }
+                        else { bounding_data_available = false; }
+                    }
+                    if( buffer_size && bounding_queue.size() > *buffer_size && discard_bounding ) { bounding_queue.pop_front(); }
+                }
+                if( !upper_bound_added && bounding_istream->eof() )
+                {
+                    // add a fake entry for an upper bound to allow stdin data above last bound to match
+                    bounding_queue.push_back( std::make_pair( boost::posix_time::pos_infin, "" ));
+                    upper_bound_added = true;
+                }
+                //if we are done with the last bounded point get next
+                if( next )
+                {
+                    if( !stdin_stream_ready ) { continue; }
+                    p = stdin_stream.read();
+                    if( !p ) { break; }
+                }
+                boost::posix_time::ptime t = get_time( *p );
+                //get bound
+                for( ; bounding_queue.size() >= 2 && t >= bounding_queue[1].first; bounding_queue.pop_front() );
+                if( bounding_queue.size() < 2 )
+                {
+                    //bound not found
+                    //do we have more data?
+                    if( !bounding_data_available ) { break; }
+                    next = false;
+                    continue;
+                }
+                //bound available
+                if( method == how::by_lower && t < bounding_queue.front().first )
+                {
+                    next = true;
+                    continue;
+                }
+                bool is_first = ( method == how::by_lower )
+                    || ( method == how::nearest && ( t - bounding_queue[0].first ) < ( bounding_queue[1].first - t ));
+                const timestring_t& chosen_bound = is_first ? bounding_queue[0] : bounding_queue[1];;
+                timestring_t input_line = std::make_pair( t, stdin_stream.last() );
+                output( input_line, chosen_bound, stdin_first );
+                next = true;
+            }
+        }
+        return 0;     
+    }
+    catch( std::exception& ex ) { std::cerr << "csv-time-join: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "csv-time-join: unknown exception" << std::endl; }
+    return 1;
+}
diff --git a/csv/applications/csv-time-stamp.cpp b/csv/applications/csv-time-stamp.cpp
index b77dece7e..e989c1a1f 100644
--- a/csv/applications/csv-time-stamp.cpp
+++ b/csv/applications/csv-time-stamp.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author cedric wohlleber
 
@@ -40,11 +12,10 @@
 #include <string>
 #include <boost/optional.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/format.h"
 
-static void usage()
+static void usage( bool verbose )
 {
     std::cerr << std::endl;
     std::cerr << "prepend input with timestamp" << std::endl;
@@ -55,6 +26,7 @@ static void usage()
     std::cerr << "    --binary,-b=<format>: binary format" << std::endl;
     std::cerr << "    --size=<size>: binary input of size" << std::endl;
     std::cerr << "    --delimiter,-d <delimiter>: ascii only; default ','" << std::endl;
+    std::cerr << "    --flush; flush stdout after each record" << std::endl;
     std::cerr << "    --local: if present, local time; default: utc" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples:" << std::endl;
@@ -62,30 +34,22 @@ static void usage()
     std::cerr << "    cat input.bin | csv-time-stamp --binary=3ui" << std::endl;
     std::cerr << "    cat input.bin | csv-time-stamp --size=12" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( -1 );
+    exit( 1 );
 }
 
 int main( int ac, char** av )
 {
     try
     {
-        comma::command_line_options options( ac, av );
-        if( options.exists( "--help" ) || options.exists( "-h" ) ) { usage(); }
-
+        comma::command_line_options options( ac, av, usage );
         bool local = options.exists( "--local" );
         char delimiter = options.value( "--delimiter,-d", ',' );
-
         boost::optional< comma::csv::format > format;
-        if( options.exists( "--binary,-b" ))
-        {
-            format = comma::csv::format( options.value< std::string >( "--binary,-b" ));
-        }
+        if( options.exists( "--binary,-b" )) { format = comma::csv::format( options.value< std::string >( "--binary,-b" )); }
         bool binary = options.exists( "--binary,-b,--size" );
         std::size_t size = options.value( "--size", 0 );
+        bool flush = options.exists( "--flush" );
         if( binary && size == 0 ) { size = format->size(); }
-
         #ifdef WIN32
         if( binary )
         {
@@ -93,7 +57,6 @@ int main( int ac, char** av )
             _setmode( _fileno( stdout ), _O_BINARY );
         }
         #endif
-
         if( binary )
         {
             boost::array< char, 65536 > buf;
@@ -114,7 +77,7 @@ int main( int ac, char** av )
                         std::cout.write( ( char* )( &timestamp ), time_size );
                         std::cout.write( cur, size );
                     }
-                    std::cout.flush();
+                    if( flush ) { std::cout.flush(); }
                     if( cur == end ) { cur = begin; }
                 }
                 int r = ::read( 0, cur + offset, end - cur - offset );
@@ -137,5 +100,5 @@ int main( int ac, char** av )
     }
     catch( std::exception& ex ) { std::cerr << "csv-time-stamp: " << ex.what() << std::endl; }
     catch( ... ) { std::cerr << "csv-time-stamp: unknown exception" << std::endl; }
-    usage();
+    return 1;
 }
diff --git a/csv/applications/csv-time.cpp b/csv/applications/csv-time.cpp
index 78308a2ba..273cc24e6 100644
--- a/csv/applications/csv-time.cpp
+++ b/csv/applications/csv-time.cpp
@@ -27,9 +27,7 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
-/// @author vsevolod vlaskine
-/// @author mathew hounsell
+/// @authors vsevolod vlaskine, mathew hounsell
 
 #include <string.h>
 #include <time.h>
@@ -43,72 +41,72 @@
 #include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/date_time/local_time/local_time.hpp>
 #include <boost/date_time/c_local_time_adjustor.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../csv/impl/epoch.h"
 #include "../../string/string.h"
+#include "../../timing/tai.h"
 #include "../../visiting/traits.h"
 
 static void usage( bool )
 {
-    static char const * const msg_general =
-        "\n"
-        "\nConvert between a couple of common time representation"
-        "\n"
-        "\nUsage:"
-        "\n    cat log.csv | csv-time <options> > converted.csv"
-        "\n"
-        "\nOptions"
-        "\n    --from <what>: input format: any, iso, seconds, sql, xsd, local; default iso"
-        "\n    --to <what>: output format: iso, seconds, sql, xsd, local; default iso"
-        "\n    --delimiter,-d <delimiter> : default: ','"
-        "\n    --fields <fields> : time field names or field numbers as in \"cut\""
-        "\n                        e.g. \"1,5,7\" or \"a,b,,d\""
-        "\n                        defaults to \"a\" (first field only is datetime)"
-        "\n    --empty-as-not-a-date-time,--accept-empty,-e: if time field is empty, consider it as not-a-date-time"
-        "\n"
-        "\nNote: no --binary option, do not use this utility on binary; instead read as unsigned long-long (time in microseconds)"
-        "\n"
-        "\nTime formats"
-        "\n    - any, guess"
-        "\n            a special input format - try to convert from all those supported,"
-        "\n            default input format, will be slower"
-        "\n    - format"
-        "\n            user given time format, for e.g 'format;%Y%m%dT%H%M%S' will also convert to/from iso format"
-        "\n            see man date for details about time format specifications"
-        "\n    - iso, iso-8601-basic"
-        "\n            YYYYMMDDTHHMMSS.FFFFFF, e.g. 20140101T001122.333000"
-        "\n    - iso-always-with-fractions"
-        "\n            YYYYMMDDTHHMMSS.FFFFFF"
-        "\n            output 20140101T000000.000000, not 20140101T000000"
-        "\n    - local"
-        "\n            same as iso but converts from/to local time adjusted using current machine settings"
-        "\n    - microseconds, us"
-        "\n            microseconds since UNIX epoch as integer"
-        "\n    - seconds"
-        "\n            seconds since UNIX epoch as double"
-        "\n    - sql, posix, ieee-std-1003.1"
-        "\n            e.g. 2014-01-01 00:11:22"
-        "\n    - xsd, iso-8601-extended"
-        "\n            used in xsd:dateTime, xs:dateTime, gml and derivatives"
-        "\n            e.g. 2014-12-25T00:00:00.000Z"
-        "\n                 2014-12-25T00:00:00.000+11:00"
-        "\n                 2014-12-25T00:00:00.000+1100"
-        "\n                 2014-12-25T00:00:00.000+11"
-        "\n"
-        "\nDeprecated options:"
-        "\n    --to-seconds,--sec,-s: iso input expected; use --from, --to"
-        "\n    --to-iso-string,--iso,-i: input as seconds expected; use --from, --to"
-        "\n"
-        "\n";
-    std::cerr << msg_general << comma::contact_info << std::endl << std::endl;
+    std::cerr << "\n"
+                 "\nConvert between a couple of common time representation"
+                 "\n"
+                 "\nUsage:"
+                 "\n    cat log.csv | csv-time <options> > converted.csv"
+                 "\n"
+                 "\nOptions"
+                 "\n    --from <what>: input format: any, iso, seconds, sql, xsd, local, tai; default iso"
+                 "\n    --to <what>: output format: iso, seconds, sql, xsd, local, tai; default iso"
+                 "\n    --delimiter,-d <delimiter> : default: ','"
+                 "\n    --fields <fields> : time field names or field numbers as in \"cut\""
+                 "\n                        e.g. \"1,5,7\" or \"a,b,,d\""
+                 "\n                        defaults to \"a\" (first field only is datetime)"
+                 "\n    --empty-as-not-a-date-time,--accept-empty,-e: if time field is empty, consider it as not-a-date-time"
+                 "\n"
+                 "\nNote: no --binary option, do not use this utility on binary; instead read as unsigned long-long (time in microseconds)"
+                 "\n"
+                 "\nTime formats"
+                 "\n    - any, guess"
+                 "\n            a special input format - try to convert from all those supported,"
+                 "\n            default input format, will be slower"
+                 "\n    - format"
+                 "\n            user given time format, for e.g 'format;%Y%m%dT%H%M%S' will also convert to/from iso format"
+                 "\n            see man date for details about time format specifications"
+                 "\n    - iso, iso-8601-basic"
+                 "\n            YYYYMMDDTHHMMSS.FFFFFF, e.g. 20140101T001122.333000"
+                 "\n    - iso-always-with-fractions"
+                 "\n            YYYYMMDDTHHMMSS.FFFFFF"
+                 "\n            output 20140101T000000.000000, not 20140101T000000"
+                 "\n    - local"
+                 "\n            same as iso but converts from/to local time adjusted using current machine settings"
+                 "\n    - microseconds, us"
+                 "\n            microseconds since UNIX epoch as integer"
+                 "\n    - seconds"
+                 "\n            seconds since UNIX epoch as double"
+                 "\n    - sql, posix, ieee-std-1003.1"
+                 "\n            e.g. 2014-01-01 00:11:22"
+                 "\n    - tai"
+                 "\n            same as iso but converts from/to the TAI time standard"
+                 "\n    - xsd, iso-8601-extended"
+                 "\n            used in xsd:dateTime, xs:dateTime, gml and derivatives"
+                 "\n            e.g. 2014-12-25T00:00:00.000Z"
+                 "\n                 2014-12-25T00:00:00.000+11:00"
+                 "\n                 2014-12-25T00:00:00.000+1100"
+                 "\n                 2014-12-25T00:00:00.000+11"
+                 "\n"
+                 "\nDeprecated options:"
+                 "\n    --to-seconds,--sec,-s: iso input expected; use --from, --to"
+                 "\n    --to-iso-string,--iso,-i: input as seconds expected; use --from, --to"
+                 "\n"
+                 "\n";
     exit( 0 );
 }
 
-enum what_t { guess, iso, seconds, microseconds, sql, xsd, local, format, iso_always_with_fractions };
+enum what_t { guess, iso, seconds, microseconds, sql, xsd, local, format, iso_always_with_fractions, tai };
 static what_t from = guess;
 static what_t to = iso;
 static std::string from_format;
@@ -179,19 +177,20 @@ static what_t what( const std::string& option, const comma::command_line_options
         {
             return local;
         }
+        else if( s == "tai" )
+        {
+            return tai;
+        }
     }
-    std::cerr << "csv-time: expected seconds, sql, or iso; got: \"" << s << "\"" << std::endl;
+    std::cerr << "csv-time: expected seconds, sql, tai, or iso; got: \"" << s << "\"" << std::endl;
     exit( 1 );
 }
 
 static boost::posix_time::ptime from_string_xsd( const std::string& s )
 {
     std::string t = s;
-
-    // Set the delimiter between date and time to be what time_from_string expects
-    const size_t idx_t = t.find( 'T' );
+    const size_t idx_t = t.find( 'T' ); // Set the delimiter between date and time to be what time_from_string expects
     if ( std::string::npos != idx_t ) t[idx_t] = ' ';
-
     // Determine the timezone offset. Could be any of Z,+-hh:mm,+-hhmm,+-hh
     signed hrs = 0;
     signed mins = 0;
@@ -220,7 +219,7 @@ static boost::posix_time::ptime from_string_xsd( const std::string& s )
     }
     // Construct the time from the string and apply the offset
     boost::posix_time::ptime result = boost::posix_time::time_from_string( t );
-    result += boost::posix_time::hours(hrs) + boost::posix_time::minutes(mins);
+    result += boost::posix_time::hours( hrs ) + boost::posix_time::minutes( mins );
     return result;
 }
 
@@ -265,6 +264,9 @@ static boost::posix_time::ptime from_string( const std::string& s, const what_t
         case sql:
             return s == "NULL" || s == "null" ? boost::posix_time::not_a_date_time : boost::posix_time::time_from_string( s );
 
+        case tai:
+            return comma::timing::tai::to_utc( boost::posix_time::from_iso_string( s ));
+
         case xsd: // 2014-03-05T23:00:00.000Z
             return from_string_xsd( s );
 
@@ -364,6 +366,9 @@ std::string to_string( const boost::posix_time::ptime& t, what_t w )
         case sql:
             return t.is_not_a_date_time() ? std::string( "NULL" ) : comma::split( boost::replace_all_copy( boost::posix_time::to_iso_extended_string( t ), "T", " " ), '.' )[0];
 
+        case tai:
+            return boost::posix_time::to_iso_string( comma::timing::tai::from_utc( t ));
+
         case xsd: // 2014-03-05T23:00:00.000Z
             return boost::posix_time::to_iso_extended_string( t );
 
@@ -388,7 +393,6 @@ namespace comma { namespace visiting {
 template <> struct traits< input_t >
 {
     template < typename K, typename V > static void visit( const K&, const input_t& p, V& v ) { v.apply( "values", p.values ); }
-
     template < typename K, typename V > static void visit( const K&, input_t& p, V& v ) { v.apply( "values", p.values ); }
 };
 
@@ -434,8 +438,7 @@ static void init_input()
         {
             fields += comma;
             comma = ",";
-            if( keep[i] )
-                fields += "values[" + boost::lexical_cast< std::string >( size++ ) + "]";
+            if( keep[i] ) { fields += "values[" + boost::lexical_cast< std::string >( size++ ) + "]"; }
         }
     }
     else
@@ -444,14 +447,11 @@ static void init_input()
         {
             fields += comma;
             comma = ",";
-
-            if( ! names[i].empty() )
-                fields += "values[" + boost::lexical_cast< std::string >( size++ ) + "]";
+            if( ! names[i].empty() ) { fields += "values[" + boost::lexical_cast< std::string >( size++ ) + "]"; }
         }
     }
 
     csv.fields = fields;
-    csv.full_xpath = true;
     input.values.resize( size );
 }
 
@@ -477,6 +477,7 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         accept_empty = options.exists( "--empty-as-not-a-date-time,--accept-empty,-e" );
         csv = comma::csv::options( options );
+        csv.full_xpath = false;
         csv.precision = 16;
         if( csv.fields.empty() ) { csv.fields="a"; }
         init_input();
diff --git a/csv/applications/csv-to-bin.cpp b/csv/applications/csv-to-bin.cpp
index d3b029ca6..22c8d024a 100644
--- a/csv/applications/csv-to-bin.cpp
+++ b/csv/applications/csv-to-bin.cpp
@@ -38,7 +38,6 @@
 
 #include <stdlib.h>
 #include <iostream>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../csv/format.h"
 #include "../../string/string.h"
@@ -58,7 +57,6 @@ static void usage( bool )
     std::cerr << std::endl;
     std::cerr << csv::format::usage() << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
@@ -76,7 +74,8 @@ int main( int ac, char** av )
         char delimiter = options.value( "--delimiter", ',' );
         bool flush = options.exists( "--flush" );
         comma::csv::format format( av[1] );
-        //{ ProfilerStart( "csv-to-bin.prof" );
+        if( !flush ) { std::cin.tie( NULL ); }
+        //{ ProfilerStart( "csv-to-bin.prof" );
         while( std::cin.good() && !std::cin.eof() )
         {
             std::getline( std::cin, line );
diff --git a/csv/applications/csv-to-sql.cpp b/csv/applications/csv-to-sql.cpp
index d7e8f8b59..4dc5df12b 100644
--- a/csv/applications/csv-to-sql.cpp
+++ b/csv/applications/csv-to-sql.cpp
@@ -148,6 +148,7 @@ int main( int ac, char** av )
         if( options.exists( "--help,-h" ) ) { usage( true ); }
 
         comma::csv::options csv( options );
+        csv.full_xpath = false;
         if ( csv.binary() ) { std::cerr << app_name << ": binary not handled" << std::endl; return 1; }
 
         std::string null_value = default_null_value;
diff --git a/csv/applications/csv-units.cpp b/csv/applications/csv-units.cpp
index 8a74d546a..fa7addbe8 100644
--- a/csv/applications/csv-units.cpp
+++ b/csv/applications/csv-units.cpp
@@ -1,39 +1,13 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 /// @author kai huang
 
+#include <functional>
 #include <iostream>
 #include <boost/array.hpp>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
+#include <boost/optional.hpp>
 #include <boost/unordered/unordered_map.hpp>
 
 #include <boost/units/systems/si.hpp>
@@ -53,7 +27,6 @@
 #include <boost/units/base_units/angle/degree.hpp>
 
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../csv/stream.h"
 #include "../../visiting/traits.h"
@@ -114,7 +87,6 @@ static void usage(char const * const txt = "")
     std::cerr << msg_general << std::endl; // endl to make this function easier to debug by flushing
     std::cerr << "\ncsv options\n" << comma::csv::options::usage() << std::endl;
     std::cerr << msg_examples << std::endl;
-    std::cerr << '\n' << comma::contact_info << '\n' << std::endl;
     exit( 1 );
 }
 
@@ -133,7 +105,7 @@ typedef boost::units::absolute< boost::units::si::temperature > kelvin_t;
 typedef boost::units::absolute< boost::units::celsius::temperature > celsius_t;
 typedef boost::units::absolute< boost::units::fahrenheit::temperature > fahrenheit_t;
 
-/// Converts the given value between the two template measurement units 
+/// Converts the given value between the two template measurement units
 template < typename From, typename To >
 double cast( double input )
 {
@@ -201,7 +173,7 @@ namespace units {
               count,
               invalid
     };
-    
+
     static boost::array< et, count > metric = {{ kelvin
                                                , radians
                                                , kelvin
@@ -254,7 +226,7 @@ namespace units {
     /// returns a name even if the value is invalid
     std::string debug_name( const et val ) { return val < 0 || val > invalid ? "ERROR:" + boost::lexical_cast<std::string>(val) : name( val ); }
 
-    /// Given a canonical name or an alias of a measurement unit 
+    /// Given a canonical name or an alias of a measurement unit
     /// retrieve the canonical enumeration.
     et value( std::string const & str )
     {
@@ -298,18 +270,18 @@ namespace units {
         if( map.cend() != citr ) { return citr->second; }
         COMMA_THROW( comma::exception, "expected unit name, got \"" << str << "\"" );
     }
-    
+
     /// A type to allow a lookup table for converting units
     //typedef double (* cast_function)( double );
-    typedef boost::function< double( double ) > cast_function;
-    
+    typedef std::function< double( double ) > cast_function;
+
     /// Retrieve a function that will convert between the two given
     /// measurement units.
     /// @returns NULL if the conversion is not supported.
     cast_function cast_lookup( const et from, const et to ) // quick and dirty
     {
         if ( from < 0 || from >= count ) { COMMA_THROW( comma::exception, "can not cast lookup for invalid unit (from) " << from ); }
-        if ( to < 0 || to >= count ) { COMMA_THROW( comma::exception, "can not cast lookup for invalid unit (to) " << to ); }        
+        if ( to < 0 || to >= count ) { COMMA_THROW( comma::exception, "can not cast lookup for invalid unit (to) " << to ); }
         static cast_function map[count][count] = { { NULL, }, };
         static bool initialised = false;
         if (! initialised )
@@ -340,18 +312,18 @@ namespace units {
             map[metres][feet] = cast< length_t, imperial_us_length_t >;
             map[metres][nautical_miles] = cast< length_t, nautical_mile_t >;
             map[metres][statute_miles] = cast< length_t, statute_mile_t >;
-            map[hours][minutes] = boost::bind( &scale, _1, 60.0 );
-            map[hours][seconds] = boost::bind( &scale, _1, 3600.0 );
-            map[minutes][seconds] = boost::bind( &scale, _1, 60.0 );
-            map[minutes][hours] = boost::bind( &scale, _1, 1.0 / 60.0 );
-            map[seconds][hours] = boost::bind( &scale, _1, 1.0 / 3600.0 );
-            map[seconds][minutes] = boost::bind( &scale, _1, 1.0 / 60.0 );
-            map[percent][fraction] = boost::bind( &scale, _1, 0.01 );
-            map[fraction][percent] = boost::bind( &scale, _1, 100.0 );
+            map[hours][minutes] = std::bind( &scale, std::placeholders::_1, 60.0 );
+            map[hours][seconds] = std::bind( &scale, std::placeholders::_1, 3600.0 );
+            map[minutes][seconds] = std::bind( &scale, std::placeholders::_1, 60.0 );
+            map[minutes][hours] = std::bind( &scale, std::placeholders::_1, 1.0 / 60.0 );
+            map[seconds][hours] = std::bind( &scale, std::placeholders::_1, 1.0 / 3600.0 );
+            map[seconds][minutes] = std::bind( &scale, std::placeholders::_1, 1.0 / 60.0 );
+            map[percent][fraction] = std::bind( &scale, std::placeholders::_1, 0.01 );
+            map[fraction][percent] = std::bind( &scale, std::placeholders::_1, 100.0 );
         }
         return map[from][to];
     }
-    
+
     /// Test if the conversion between two measurement units is supported.
     bool can_convert( const et from, const et to ) { return NULL != cast_lookup(from, to); }
 }
@@ -379,7 +351,7 @@ struct item_t
 
 struct input_t
 {
-    std::vector< item_t > values;    
+    std::vector< item_t > values;
 };
 
 namespace comma { namespace visiting {
@@ -423,7 +395,7 @@ static std::string init_input_field( const std::string& v )
 {
     const std::string stripped( comma::strip( v, ' ' ) );
     if( stripped.empty() ) { return std::string(); }
-    
+
     const size_t pos = stripped.rfind( '/' );
     std::string head, tail;
     if ( std::string::npos == pos ) // just a
@@ -441,11 +413,11 @@ static std::string init_input_field( const std::string& v )
             tail = "value";
         }
     }
-    
+
     unsigned idx = input_fields.size();
     if ( input_fields.cend() == input_fields.find( head ) ) { input_fields[head] = idx; }
     else { idx = input_fields.at( head ); }
-    
+
     return "values[" + boost::lexical_cast< std::string >( idx ) + "]/" + tail;
 }
 
@@ -461,7 +433,6 @@ static void init_input()
         fields += init_input_field( v[i] );
     }
     csv.fields = fields;
-    csv.full_xpath = true;
     input.values.resize( input_fields.size() ); //input.values.resize( size );
 }
 
@@ -487,7 +458,7 @@ static int run( const units::et from, const units::et to )
 
     units::cast_function const default_cast_function = units::cast_lookup( from, to );
     if (NULL == default_cast_function) { COMMA_THROW( comma::exception, "unsupported default conversion from " << debug_name(from) << " to " << debug_name(to) ); }
-    
+
     unsigned line = 0;
     while( istream.ready() || ( std::cin.good() && !std::cin.eof() ) )
     {
@@ -518,7 +489,7 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av );
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
-        
+
         if( options.exists( "--help,-h" ) ) usage();
         verbose = options.exists( "--verbose,-v" );
         csv = comma::csv::options( options );
diff --git a/csv/applications/csv-update.cpp b/csv/applications/csv-update.cpp
index 98f0ff463..32b09b537 100644
--- a/csv/applications/csv-update.cpp
+++ b/csv/applications/csv-update.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
@@ -41,7 +14,6 @@
 #include <boost/unordered_map.hpp>
 #include <boost/graph/graph_concepts.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/types.h"
 #include "../../csv/stream.h"
 #include "../../csv/impl/unstructured.h"
@@ -59,25 +31,11 @@ static void usage( bool more )
     std::cerr << std::endl;
     std::cerr << "       if update input specified (update.csv above), update" << std::endl;
     std::cerr << "       records from stdin by the ones in the update file" << std::endl;
-    if( more )
-    {
-        std::cerr << "       todo" << std::endl;
-    }
-    else
-    {
-        std::cerr << "       ... use --help --verbose for more" << std::endl;
-    }
+    if( more ) { std::cerr << "       todo" << std::endl; } else { std::cerr << "       ... use --help --verbose for more" << std::endl; }
     std::cerr << std::endl;
     std::cerr << "       if update input not specified, apply updates received" << std::endl;
     std::cerr << "       on stdin itself" << std::endl;
-    if( more )
-    {
-        std::cerr << "       todo" << std::endl;
-    }
-    else
-    {
-        std::cerr << "       ... use --help --verbose for more" << std::endl;
-    }
+    if( more ) { std::cerr << "       todo" << std::endl; } else { std::cerr << "       ... use --help --verbose for more" << std::endl; }
     std::cerr << std::endl;
     std::cerr << "    fields:" << std::endl;
     std::cerr << "        block: block number" << std::endl;
@@ -109,7 +67,7 @@ static void usage( bool more )
     std::cerr << "    --update-non-empty-fields,--update-non-empty,-u:" << std::endl;
     std::cerr << "        if update has empty fields, use the field value from stdin (for binary, empty fields must be defined with --empty)" << std::endl;
     std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
-    if( more ) { std::cerr << std::endl << "csv options:" << std::endl << comma::csv::options::usage() << std::endl; }
+    if( more ) { std::cerr << std::endl << "csv options:" << std::endl << comma::csv::options::usage() << std::endl; } else { std::cerr << std::endl << "csv options ... use --help --verbose for more" << std::endl; }
     std::cerr << std::endl;
     if( more )
     {
@@ -154,8 +112,6 @@ static void usage( bool more )
         std::cerr << "examples ... use --help --verbose" << std::endl;
     }
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
     exit( 0 );
 }
 
@@ -163,7 +119,7 @@ struct input_t
 {
     comma::csv::impl::unstructured key;
     comma::csv::impl::unstructured value;
-    comma::uint32 block;
+    comma::uint32 block{0};
 
     input_t() : block( 0 ) {}
     input_t( comma::csv::impl::unstructured key, comma::csv::impl::unstructured value, comma::uint32 block ): key( key ), value( value ), block( block ) {}
@@ -175,8 +131,8 @@ struct map_t
 {
     struct value_type
     {
-        unsigned int index;
-        input_t value;
+        unsigned int index{0};
+        input_t value{};
         std::string string;
 
         value_type() {}
@@ -215,7 +171,7 @@ static bool last_block = false;
 static bool last_only = false;
 static bool matched_only = false;
 static bool update_non_empty = false;
-static input_t default_input;
+static input_t default_input{};
 static comma::csv::impl::unstructured empty;
 static boost::optional< comma::csv::impl::unstructured > erase;
 static map_t::type filter_map;
@@ -244,8 +200,7 @@ static void output_and_clear( map_t::type& map, bool do_output, comma::csv::outp
         }
         for( output_map_t::const_iterator it = m.begin(); it != m.end(); ++it )
         {   
-            if( ostream ) { ostream->write( it->second->value, it->second->string ); }
-            else { std::cout << it->second->string; }
+            if( ostream ) { ostream->write( it->second->value, it->second->string ); } else { std::cout << it->second->string; }
         }
     }
     map.clear();
@@ -256,7 +211,6 @@ static input_t::input_stream_t* make_filter_stream()
     if( filter_transport ) { return new input_t::input_stream_t( **filter_transport, csv, default_input ); }
     if( filter_line.empty() ) { return NULL; }
     comma::csv::options c;
-    c.full_xpath = true;
     c.fields = csv.fields;
     static std::istringstream iss( filter_line );
     return new input_t::input_stream_t( iss, c, default_input );
@@ -390,7 +344,6 @@ int main( int ac, char** av )
         comma::command_line_options options( ac, av, usage );
         verbose = options.exists( "--verbose,-v" );
         csv = comma::csv::options( options );
-        csv.full_xpath = true;
         csv.quote.reset();
         last_only = options.exists( "--last-only,--last" );
         last_block = options.exists( "--last-block" );
@@ -448,7 +401,6 @@ int main( int ac, char** av )
             std::string s = options.value< std::string >( "--empty" ) + std::string( f.count(), ',' );
             std::istringstream iss( s );
             comma::csv::options c;
-            c.full_xpath = true;
             c.fields = csv.fields;
             comma::csv::input_stream< input_t > isstream( iss, c, default_input );
             empty = ( isstream.read() )->value;
@@ -460,7 +412,6 @@ int main( int ac, char** av )
             std::string s = options.value< std::string >( "--remove,--reset,--unset,--erase" ) + std::string( f.count(), ',' );
             std::istringstream iss( s );
             comma::csv::options c;
-            c.full_xpath = true;
             c.fields = csv.fields;
             comma::csv::input_stream< input_t > isstream( iss, c, default_input );
             erase = ( isstream.read() )->value;
diff --git a/csv/applications/play/multiplay.cpp b/csv/applications/play/multiplay.cpp
index ac590b0ee..bdb81e305 100644
--- a/csv/applications/play/multiplay.cpp
+++ b/csv/applications/play/multiplay.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
 #include <sstream>
@@ -35,13 +34,8 @@
 #include "../../../string/string.h"
 #include "multiplay.h"
 
-namespace comma {
-
+namespace comma { namespace csv { namespace applications { namespace play {
 
-/*!
-    @brief Constructor
-    @param configs csv options
-*/
 Multiplay::Multiplay( const std::vector< SourceConfig >& configs
                     , double speed
                     , bool quiet
@@ -51,8 +45,8 @@ Multiplay::Multiplay( const std::vector< SourceConfig >& configs
                     , bool flush )
     : m_configs( configs )
     , istreams_( configs.size() )
-    , m_inputStreams( configs.size() )
-    , m_publishers( configs.size() )
+    , _input_streams( configs.size() )
+    , _publishers( configs.size() )
     , m_play( speed, quiet, resolution )
     , m_timestamps( configs.size() )
     , m_started( false )
@@ -66,18 +60,26 @@ Multiplay::Multiplay( const std::vector< SourceConfig >& configs
         // todo: quick and dirty for now: blocking streams for named pipes
         istreams_[i].reset( new io::istream( configs[i].options.filename, m_configs[i].options.binary() ? io::mode::binary : io::mode::ascii, io::mode::blocking ) );
         if( !( *istreams_[i] )() ) { COMMA_THROW( comma::exception, "named pipe " << configs[i].options.filename << " is closed (todo: support closed named pipes)" ); }
-        m_inputStreams[i].reset( new csv::input_stream< time >( *( *istreams_[i] )(), m_configs[i].options ) );
+        _input_streams[i].reset( new csv::input_stream< time >( *( *istreams_[i] )(), m_configs[i].options ) );
         unsigned int j;
         for( j = 0; j < i && configs[j].outputFileName != configs[i].outputFileName; ++j ); // quick and dirty: unique publishers
-        if( j == i ) { m_publishers[i].reset( new io::publisher( configs[i].outputFileName, m_configs[i].options.binary() ? io::mode::binary : io::mode::ascii, true, flush ) ); }
-        else { m_publishers[i] = m_publishers[j]; }
+        if( j == i )
+        {
+            const auto& s = comma::split( configs[i].outputFileName, ':' ); // todo: quick and dirty for now; add usage semantics for local sockets
+            if( s.size() > 2 && s[0] == "tcp" ) { _publishers[i].reset( new comma::csv::applications::play::client_publisher( configs[i].outputFileName, m_configs[i].options.binary(), flush ) ); }
+            else { _publishers[i].reset( new comma::csv::applications::play::server_publisher( configs[i].outputFileName, m_configs[i].options.binary(), flush ) ); }
+        }
+        else
+        {
+            _publishers[i] = _publishers[j];
+        }
         boost::posix_time::time_duration d;
         if( configs[i].offset.total_microseconds() != 0 )
         {
             if( m_configs[i].options.binary() )
             {
                 binary_[i].reset( new csv::binary< time >( m_configs[i].options.fields ) );
-                buf_fer.resize( m_configs[i].options.format().size() );
+                _buffer.resize( m_configs[i].options.format().size() );
             }
             else
             {
@@ -92,7 +94,7 @@ void Multiplay::close()
     for( unsigned int i = 0U; i < m_configs.size(); i++ )
     {
         istreams_[i]->close();
-        m_publishers[i]->close();
+        _publishers[i]->close();
     }
 }
 
@@ -112,21 +114,14 @@ bool Multiplay::ready() // quick and dirty; should not it be in io::Publisher?
     if( m_started ) { return true; }
     for( unsigned int i = 0; i < m_configs.size(); ++i )
     {
-        m_publishers[i]->accept();
-        if( m_publishers[i]->size() < m_configs[i].minNumberOfClients )
-        {
-            boost::this_thread::sleep( boost::posix_time::millisec( 200 ) );
-            return false;
-        }
+        _publishers[i]->accept();
+        if( _publishers[i]->size() < m_configs[i].minNumberOfClients ) { boost::this_thread::sleep( boost::posix_time::millisec( 200 ) ); return false; }
     }
     m_started = true;
     return true;
 }
     
-/*!
-    @brief try to read from all files and write the oldest
-    @return true if at least one file could be read
-*/
+/// @brief try to read from all files and write the oldest; return true if at least one file could be read
 bool Multiplay::read()
 {
     if( !ready() ) { return true; }
@@ -134,19 +129,12 @@ bool Multiplay::read()
     for( unsigned int i = 0U; i < m_configs.size(); ++i )
     {
         if( !m_timestamps[i].is_not_a_date_time() ) { end = false; continue; }
-        const time* time = m_inputStreams[i]->read();
+        const time* time = _input_streams[i]->read();
         if( time == NULL ) { continue; }
         boost::posix_time::ptime t = time->timestamp;
-        if( m_configs[i].offset.total_microseconds() != 0 )
-        {
-            t += m_configs[i].offset;
-        }
+        if( m_configs[i].offset.total_microseconds() != 0 ) { t += m_configs[i].offset; }
         end = false;
-        if( ( ( !m_from.is_not_a_date_time() ) && ( t < m_from ) ) || ( ( !m_to.is_not_a_date_time() ) && ( t > m_to ) ) )
-        {            
-            i--;
-            continue;
-        }
+        if( ( ( !m_from.is_not_a_date_time() ) && ( t < m_from ) ) || ( ( !m_to.is_not_a_date_time() ) && ( t > m_to ) ) ) { i--; continue; }
         m_timestamps[i] = t;
     }
     if( end ) { return false; }
@@ -158,23 +146,20 @@ bool Multiplay::read()
         oldest = m_timestamps[i];
         index = i;
     }
-    if( ( ( !m_from.is_not_a_date_time() ) && ( oldest < m_from ) ) || ( ( !m_to.is_not_a_date_time() ) && ( oldest > m_to ) ) )
-    {
-        return true;
-    }
+    if( ( ( !m_from.is_not_a_date_time() ) && ( oldest < m_from ) ) || ( ( !m_to.is_not_a_date_time() ) && ( oldest > m_to ) ) ) { return true; }
     now_ = oldest;
     m_play.wait( oldest );
     if( m_configs[index].options.binary() )
     {
         if( binary_[index] )
         {
-            ::memcpy( &buf_fer[0], m_inputStreams[index]->binary().last(), buf_fer.size() );
-            binary_[index]->put( time( oldest ), &buf_fer[0] );
-            m_publishers[index]->write( &buf_fer[0], buf_fer.size() );
+            ::memcpy( &_buffer[0], _input_streams[index]->binary().last(), _buffer.size() );
+            binary_[index]->put( time( oldest ), &_buffer[0] );
+            _publishers[index]->write( &_buffer[0], _buffer.size() );
         }
         else
         {
-            m_publishers[index]->write( m_inputStreams[index]->binary().last(), m_configs[index].options.format().size() );
+            _publishers[index]->write( _input_streams[index]->binary().last(), m_configs[index].options.format().size() );
         }
     }
     else
@@ -182,18 +167,17 @@ bool Multiplay::read()
         static std::string endl = impl::endl(); // quick and dirty, since publisher is not std::stream
         if( ascii_[index] )
         {
-            std::vector< std::string > last = m_inputStreams[index]->ascii().last();
+            std::vector< std::string > last = _input_streams[index]->ascii().last();
             ascii_[index]->put( time( oldest ), last );
-            ( *m_publishers[index] ) << comma::join( last, m_configs[index].options.delimiter ) << endl;
+            _publishers[index]->write_line( comma::join( last, m_configs[index].options.delimiter ) );
         }
         else
         {
-            ( *m_publishers[index] ) << comma::join( m_inputStreams[index]->ascii().last(), m_configs[index].options.delimiter ) << endl;
+            _publishers[index]->write_line( comma::join( _input_streams[index]->ascii().last(), m_configs[index].options.delimiter ) );
         }
     }
     m_timestamps[index] = boost::posix_time::not_a_date_time;
     return true;
 }
 
-} // namespace comma {
-
+} } } } // namespace comma { namespace csv { namespace applications { namespace play {
diff --git a/csv/applications/play/multiplay.h b/csv/applications/play/multiplay.h
index 6486854f1..5e1e32304 100644
--- a/csv/applications/play/multiplay.h
+++ b/csv/applications/play/multiplay.h
@@ -30,17 +30,54 @@
 
 /// @author cedric wohlleber
 
-#ifndef COMMA_CSV_MULTIPLAY_H
-#define COMMA_CSV_MULTIPLAY_H
+#pragma once
 
 #include <vector>
 #include <boost/thread/thread_time.hpp>
 #include "../../../csv/options.h"
 #include "../../../csv/stream.h"
 #include "../../../io/publisher.h"
+#include "../../../io/stream.h"
 #include "play.h"
 
-namespace comma {
+namespace comma { namespace csv { namespace applications { namespace play {
+
+struct publisher // abstract output sink used by Multiplay; todo? quick and dirty; improve and put someplace generic
+{
+    virtual ~publisher() = default; // virtual: Multiplay holds implementations through pointers to this base
+    virtual unsigned int size() const = 0; // count that Multiplay::ready() compares against minNumberOfClients
+    virtual void close() = 0; // close the underlying output
+    virtual void accept() {} // called by Multiplay::ready() on every poll; does nothing unless overridden
+    virtual void write( const char* buf, unsigned int size ) = 0; // write size bytes starting at buf (used for binary records)
+    virtual void write_line( const std::string& ) = 0; // write one ascii record followed by an end of line
+};
+
+class server_publisher: public publisher // publisher that forwards every call to an io::oserver
+{
+    public:
+        server_publisher( const std::string& name, bool binary, bool flush ): _oserver( name, binary ? io::mode::binary : io::mode::ascii, true, flush || !binary ) {} // last argument: flush is forced on for ascii output
+        unsigned int size() const override { return _oserver.size(); }
+        void close() override { _oserver.close(); }
+        void accept() override { _oserver.accept(); }
+        void write( const char* buf, unsigned int size ) override { _oserver.write( buf, size ); }
+        void write_line( const std::string& s ) override { _oserver.write( &s[0], s.size() ); _oserver.write( "\n", 1 ); } // line body first, then the terminating newline
+    private:
+        io::oserver _oserver;
+};
+
+class client_publisher: public publisher // publisher that writes to a single io::ostream opened in non-blocking mode
+{
+    public:
+        client_publisher( const std::string& name, bool binary, bool flush ): _ostream( name, binary ? io::mode::binary : io::mode::ascii, io::mode::non_blocking ), _flush( flush ) {}
+        unsigned int size() const override { return 1; } // always reports exactly one
+        void close() override { _ostream.close(); }
+        void accept() override {} // nothing to accept
+        void write( const char* buf, unsigned int size ) override { _ostream->write( buf, size ); if( _flush ) { _ostream->flush(); } }
+        void write_line( const std::string& s ) override { _ostream->write( &s[0], s.size() ); ( *_ostream ) << std::endl; } // std::endl appends the newline and flushes, so no separate flush is needed
+    private:
+        io::ostream _ostream;
+        bool _flush{false}; // if true, write() flushes after every call
+};
 
 /// gets data from multiple input files, and output in a real time manner to output files,  using timestamps
 class Multiplay
@@ -59,21 +96,18 @@ class Multiplay
             std::size_t minNumberOfClients;
             csv::options options;
             boost::posix_time::time_duration offset;
-            SourceConfig( const std::string& output, const csv::options& csv ) :
-                outputFileName( output ), minNumberOfClients( 0 ), options( csv ) {}
-            SourceConfig( const std::string& output, std::size_t n, const csv::options& csv ) :
-                outputFileName( output ), minNumberOfClients( n ), options( csv ) {}
-            SourceConfig() {};
+            SourceConfig( const std::string& output, const csv::options& csv ): outputFileName( output ), minNumberOfClients( 0 ), options( csv ) {}
+            SourceConfig( const std::string& output, std::size_t n, const csv::options& csv ): outputFileName( output ), minNumberOfClients( n ), options( csv ) {}
+            SourceConfig() { options.full_xpath = false; };
         };
 
         Multiplay( const std::vector< SourceConfig >& configs
-                , double speed = 1.0
-                , bool quiet = false
-                , const boost::posix_time::time_duration& resolution = boost::posix_time::milliseconds( 1 )
-                , boost::posix_time::ptime from = boost::posix_time::not_a_date_time
-                , boost::posix_time::ptime to = boost::posix_time::not_a_date_time
-                , bool flush = true
-                 );
+                 , double speed = 1.0
+                 , bool quiet = false
+                 , const boost::posix_time::time_duration& resolution = boost::posix_time::milliseconds( 1 )
+                 , boost::posix_time::ptime from = boost::posix_time::not_a_date_time
+                 , boost::posix_time::ptime to = boost::posix_time::not_a_date_time
+                 , bool flush = true );
 
         void close();
 
@@ -81,11 +115,13 @@ class Multiplay
         
         boost::posix_time::ptime now() const { return now_; }
 
+        void paused_for( const boost::posix_time::time_duration& pause_duration ) { m_play.paused_for( pause_duration ); }
+
     private:
         std::vector<SourceConfig> m_configs;
         std::vector< boost::shared_ptr< comma::io::istream > > istreams_;
-        std::vector< boost::shared_ptr< csv::input_stream< time > > > m_inputStreams;
-        std::vector< boost::shared_ptr< comma::io::publisher > > m_publishers;
+        std::vector< boost::shared_ptr< csv::input_stream< time > > > _input_streams;
+        std::vector< boost::shared_ptr< comma::csv::applications::play::publisher > > _publishers;
         csv::impl::play m_play;
         std::vector< boost::posix_time::ptime > m_timestamps;
         boost::posix_time::ptime now_;
@@ -94,33 +130,25 @@ class Multiplay
         boost::posix_time::ptime m_to;
         std::vector< boost::shared_ptr< csv::ascii< time > > > ascii_;
         std::vector< boost::shared_ptr< csv::binary< time > > > binary_;
-        std::vector< char > buf_fer;
+        std::vector< char > _buffer;
         bool ready();
 };
 
-} // namespace comma {
+} } } } // namespace comma { namespace csv { namespace applications { namespace play {
 
 namespace comma { namespace visiting {
 
-template <> struct traits< comma::Multiplay::time >
+template <> struct traits< comma::csv::applications::play::Multiplay::time >
 {
-    template < typename Key, class Visitor >
-    static void visit( Key, comma::Multiplay::time& t, Visitor& v )
-    {
-        v.apply( "t", t.timestamp );
-    }
-
-    template < typename Key, class Visitor >
-    static void visit( Key, const comma::Multiplay::time& t, Visitor& v )
-    {
-        v.apply( "t", t.timestamp );
-    }
+    typedef comma::csv::applications::play::Multiplay::time type_t;
+    template < typename Key, class Visitor > static void visit( Key, type_t& t, Visitor& v ) { v.apply( "t", t.timestamp ); }
+    template < typename Key, class Visitor > static void visit( Key, const type_t& t, Visitor& v ) { v.apply( "t", t.timestamp ); }
 };
 
-template <> struct traits< comma::Multiplay::SourceConfig >
+template <> struct traits< comma::csv::applications::play::Multiplay::SourceConfig >
 {
-    template < typename Key, class Visitor >
-    static void visit( Key, comma::Multiplay::SourceConfig& c, Visitor& v )
+    typedef comma::csv::applications::play::Multiplay::SourceConfig type_t;
+    template < typename Key, class Visitor > static void visit( Key, type_t& c, Visitor& v )
     {
         v.apply( "options", c.options );
         v.apply( "output", c.outputFileName );
@@ -130,8 +158,7 @@ template <> struct traits< comma::Multiplay::SourceConfig >
 		c.offset = boost::posix_time::microseconds( static_cast< boost::int64_t >( duration * 1e6 ) );
     }
 
-    template < typename Key, class Visitor >
-    static void visit( Key, const comma::Multiplay::SourceConfig& c, Visitor& v )
+    template < typename Key, class Visitor > static void visit( Key, const type_t& c, Visitor& v )
     {
         v.apply( "options", c.options );
         v.apply( "output", c.outputFileName );
@@ -143,5 +170,3 @@ template <> struct traits< comma::Multiplay::SourceConfig >
 };
 
 } } // namespace comma { namespace visiting {
-
-#endif // COMMA_CSV_MULTIPLAY_H
diff --git a/csv/applications/play/play.cpp b/csv/applications/play/play.cpp
index 69566cd90..f138045e8 100644
--- a/csv/applications/play/play.cpp
+++ b/csv/applications/play/play.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
 #include <boost/thread/thread.hpp>
@@ -37,57 +36,39 @@
 namespace comma { namespace csv { namespace impl {
     
 /// constructor    
-play::play( double speed, bool quiet, const boost::posix_time::time_duration& resolution ):
-    m_speed( speed ),
-    m_resolution( resolution ),
-    m_lag( false ),
-    m_lagCounter( 0U ),
-    m_quiet( quiet )
-{
-}
-
-/// constructor
-/// @param first first timestamp
-/// @param speed slow-down factor: 1.0 = real time, 2.0 = twice as slow etc...
+/// @param speed speed-up factor: 1.0 = real time, 0.5 = half speed etc
 /// @param quiet if true, do not output warnings if we can not keep up with the desired playback speed
 /// @param resolution expected resolution from the sleep function
-play::play( const boost::posix_time::ptime& first, double speed, bool quiet, const boost::posix_time::time_duration& resolution ):
-
-    m_systemFirst( boost::get_system_time() ),
-    m_offset( m_systemFirst - first ),
-    m_first( first ),
-    m_last( first ),
-    m_speed( speed ),
-    m_resolution( resolution ),
-    m_lag( false ),
-    m_lagCounter( 0U ),
-    m_quiet( quiet )
+play::play( double speed, bool quiet, const boost::posix_time::time_duration& resolution )
+    : m_times_initialized( false )
+    , m_speed( speed )
+    , m_resolution( resolution )
+    , m_lag( false )
+    , m_lagCounter( 0U )
+    , m_quiet( quiet )
 {
-    
 }
 
-
 /// wait until a timestamp
 /// @param time timestamp as ptime
 void play::wait( const boost::posix_time::ptime& time )
 {
-
-    if ( !m_offset )
+    if ( !m_times_initialized )
     {
         boost::posix_time::ptime systemTime = boost::get_system_time();
-        m_offset = systemTime - time;
         m_systemFirst = systemTime;
         m_first = time;
         m_last = time;
+        m_times_initialized = true;
     }
     else
     {        
         if ( time > m_last )
         {
             boost::posix_time::ptime systemTime = boost::get_system_time();
-            const boost::posix_time::ptime target = m_systemFirst + boost::posix_time::milliseconds( static_cast<long>(( time - m_first ).total_milliseconds() * m_speed ) );
+            const boost::posix_time::ptime target = m_systemFirst + boost::posix_time::milliseconds( static_cast<long>(( time - m_first ).total_milliseconds() / m_speed ) );
             const boost::posix_time::time_duration lag = systemTime - target;
-            if ( !m_quiet && ( lag > m_resolution ) ) // no need to be alarmed for a lag less than the expected accuracy
+            if ( !m_quiet && lag > m_resolution ) // no need to be alarmed for a lag less than the expected accuracy
             {
                 if( !m_lag )
                 {
@@ -100,14 +81,11 @@ void play::wait( const boost::posix_time::ptime& time )
             {
                 if( !m_quiet && m_lag )
                 {
-                    m_lag = false;
                     std::cerr << "csv-play: recovered after " << m_lagCounter << " packets " << std::endl;
+                    m_lag = false;
                     m_lagCounter = 0U;
                 }
-                if ( lag < -m_resolution ) // no need to sleep less than the expected accuracy
-                {
-                    boost::this_thread::sleep( target );
-                }
+                if( lag < -m_resolution ) { boost::this_thread::sleep( target ); } // no need to sleep less than the expected accuracy
             }
             m_last = time;
         }
@@ -120,10 +98,10 @@ void play::wait( const boost::posix_time::ptime& time )
 
 /// wait until a timestamp
 /// @param isoTime timestamp in iso format
-void play::wait( const std::string& isoTime )
-{
-    wait( boost::posix_time::from_iso_string( isoTime ) );
-}
+void play::wait( const std::string& isoTime ) { wait( boost::posix_time::from_iso_string( isoTime ) ); } // parse the iso string, then defer to the ptime overload
+
+/// allow for a pause in playback: shift the system-time reference forward by the pause so that targets computed by later wait() calls move by the same amount; does nothing until the first wait() has initialised the times
+/// @param pause_duration duration of pause
+void play::paused_for( const boost::posix_time::time_duration& pause_duration ) { if( m_times_initialized ) { m_systemFirst += pause_duration; } }
 
 } } } // namespace comma { namespace csv { namespace impl {
-    
\ No newline at end of file
diff --git a/csv/applications/play/play.h b/csv/applications/play/play.h
index 9ae95c6eb..e4b0815ff 100644
--- a/csv/applications/play/play.h
+++ b/csv/applications/play/play.h
@@ -27,11 +27,9 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
-#ifndef COMMA_CSV_APPLICATIONS_PLAY_H
-#define COMMA_CSV_APPLICATIONS_PLAY_H
+#pragma once
 
 #include <boost/optional.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
@@ -43,15 +41,16 @@ class play
 {
 public:
     play( double speed = 1.0, bool quiet = false, const boost::posix_time::time_duration& resolution = boost::posix_time::milliseconds(1) );
-    play( const boost::posix_time::ptime& first, double speed = 1.0, bool quiet = false, const boost::posix_time::time_duration& resolution = boost::posix_time::milliseconds(1) );
 
     void wait( const boost::posix_time::ptime& time );
 
     void wait( const std::string& isoTime );
 
+    void paused_for( const boost::posix_time::time_duration& pause_duration );
+
 private:
+    bool m_times_initialized;
     boost::posix_time::ptime m_systemFirst; /// system time at first timestamp
-    boost::optional< boost::posix_time::time_duration > m_offset; /// offset between timestamps and system time
     boost::posix_time::ptime m_first; /// first timestamp
     boost::posix_time::ptime m_last; /// last timestamp received
     const double m_speed;
@@ -62,5 +61,3 @@ class play
 };
 
 } } } // namespace comma { namespace csv { namespace impl {
-
-#endif // COMMA_CSV_APPLICATIONS_PLAY_H
diff --git a/csv/applications/split/split.cpp b/csv/applications/split/split.cpp
index 71f7f8a62..e38aba81e 100644
--- a/csv/applications/split/split.cpp
+++ b/csv/applications/split/split.cpp
@@ -27,7 +27,6 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #ifdef WIN32
@@ -39,100 +38,196 @@
 #include <sys/resource.h>
 #endif
 
+#include <unordered_map>
 #include <boost/lexical_cast.hpp>
-#include "../../../io/file_descriptor.h"
 #include "../../../base/exception.h"
+#include "../../../csv/stream.h"
+#include "../../../csv/traits.h"
+#include "../../../io/file_descriptor.h"
+#include "../../../io/impl/filesystem.h"
+#include "../../../name_value/parser.h"
+#include "../../../visiting/traits.h"
 #include "split.h"
 
 namespace comma { namespace csv { namespace applications {
 
+template < typename T > struct filename_record // a single id-to-filename entry, as read from the filename list
+{
+    T id; // key the file is looked up by
+    std::string filename; // name of the file to write to
+    filename_record( const T& i = 0, const std::string& f = "" ): id( i ), filename( f ) {}
+};
+
+} } } // namespace comma { namespace csv { namespace applications {
+
+namespace comma { namespace visiting {
+
+template < typename T > struct traits< comma::csv::applications::filename_record< T > > // visiting traits: expose record members as "id" and "filename"
+{
+    template< typename K, typename V > static void visit( const K&, comma::csv::applications::filename_record< T >& t, V& v ) // non-const record; key is not used, hence unnamed
+    {
+        v.apply( "id", t.id );
+        v.apply( "filename", t.filename );
+    }
+
+    template< typename K, typename V > static void visit( const K&, const comma::csv::applications::filename_record< T >& t, V& v ) // const record; key is not used, hence unnamed
+    {
+        v.apply( "id", t.id );
+        v.apply( "filename", t.filename );
+    }
+};
+
+template <> struct traits< comma::csv::applications::timestamp > // visiting traits: the only member is exposed under the name "t"
+{
+    template< typename K, typename V > static void visit( const K&, comma::csv::applications::timestamp& s, V& visitor ) { visitor.apply( "t", s.t ); }
+    template< typename K, typename V > static void visit( const K&, const comma::csv::applications::timestamp& s, V& visitor ) { visitor.apply( "t", s.t ); }
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace csv { namespace applications {
+
+static std::pair< std::unordered_map< comma::uint32, std::string >, bool > filenames( const std::string& filename ) // returns id-to-filename map and whether ids were read from the input
+{
+    std::pair< std::unordered_map< comma::uint32, std::string >, bool > result;
+    result.second = false;
+    if( filename.empty() ) { return result; } // nothing given: empty map, no ids
+    auto options = comma::name_value::parser( "filename" ).get< comma::csv::options >( filename );
+    if( options.fields.empty() ) { options.fields = "filename"; }
+    std::ifstream ifs( options.filename );
+    if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "could not open --files='" << options.filename << "'" ); }
+    comma::csv::input_stream< filename_record< comma::uint32 > > is( ifs, options ); // quick and dirty; todo: support templated map
+    result.second = options.has_field( "id" );
+    comma::uint32 index = 0; // running record number; used as the key, if the input has no id field
+    while( is.ready() || ifs.good() )
+    {
+        auto record = is.read();
+        if( record == nullptr ) { break; }
+        result.first[ result.second ? record->id : index++ ] = record->filename; // quick and dirty
+    }
+    if( result.first.empty() ) { COMMA_THROW( comma::exception, "got no filenames from '" << options.filename << "'" ); }
+    return result;
+}
+
 template < typename T >
-split< T >::split( boost::optional< boost::posix_time::time_duration > period
-            , const std::string& suffix
-            , const comma::csv::options& csv
-            , bool pass )
+void split< T >::timestamps_stream_make_( const std::string& timestamps ) // open the timestamps stream, if given, and read the first timestamp from it
+{
+    if( timestamps.empty() ) { return; }
+    auto options = comma::name_value::parser( "filename", ';', '=', false ).get< comma::csv::options >( timestamps );
+    timestamps_ifstream_.reset( new std::ifstream( options.filename ) );
+    if( !timestamps_ifstream_->is_open() ) { COMMA_THROW( comma::exception, "could not open --timestamps='" << options.filename << "'" ); }
+    timestamps_.reset( new comma::csv::input_stream< csv::applications::timestamp >( *timestamps_ifstream_, options ) );
+    auto first = timestamps_->read();
+    if( !first ) { COMMA_THROW( comma::exception, "could not read from --timestamps='" << options.filename << "'" ); } // quick and dirty
+    timestamps_last_.second = first->t;
+    // the interval start, timestamps_last_.first, is not assigned here
+}
+
+template < typename T > bool split< T >::timestamps_stream_seek_( boost::posix_time::ptime t )
+{
+    bool advanced = false;
+    // move the interval forward until t is before its end or the timestamps are exhausted (end becomes +infinity)
+    for( ; t >= timestamps_last_.second && !timestamps_last_.second.is_pos_infinity(); advanced = true )
+    {
+        auto next = timestamps_->read();
+        timestamps_last_.first = timestamps_last_.second;
+        if( next ) { timestamps_last_.second = next->t; } else { timestamps_last_.second = boost::posix_time::pos_infin; }
+    }
+    return advanced; // true, if the interval has changed
+}
+
+template < typename T > // constructor for file output: picks how records are split (by block, by id, or by time) from csv fields
+split< T >::split( const boost::optional< boost::posix_time::time_duration >& period
+                 , const std::string& suffix
+                 , const comma::csv::options& csv
+                 , bool pass
+                 , const std::string& filenames
+                 , const std::string& default_filename
+                 , const std::string& timestamps )
     : ofstream_( std::bind( &split< T >::ofstream_by_time_, this ) )
     , period_( period )
     , suffix_( suffix )
+    , timestamps_last_( boost::posix_time::neg_infin, boost::posix_time::not_a_date_time ) // interval start is unknown until the timestamps stream has been advanced
     , pass_ ( pass )
     , flush_( csv.flush )
     , is_shutdown_( false )
 {
-    if( ( csv.has_field( "t" ) || csv.fields.empty() ) && !period ) { COMMA_THROW( comma::exception, "please specify --period" ); }
-    if( csv.fields.empty() ) { return; }
-    if( csv.binary() ) { binary_.reset( new comma::csv::binary< input >( csv ) ); }
-    else { ascii_.reset( new comma::csv::ascii< input >( csv ) ); }
-    if( csv.has_field( "block" ) ) { ofstream_ = std::bind( &split< T >::ofstream_by_block_, this ); }
-    else if( csv.has_field( "id" ) ) { ofstream_ = std::bind( &split< T >::ofstream_by_id_, this ); }
+    if( csv.fields.empty() ) { if( !period && timestamps.empty() ) { COMMA_THROW( comma::exception, "splitting by time; please specify either --period or --timestamps" ); } timestamps_stream_make_( timestamps ); return; } // no fields: ofstream_ stays ofstream_by_time_, so the time-splitting prerequisites must hold and the timestamps stream must exist before the first write
+    if( csv.binary() ) { binary_.reset( new comma::csv::binary< input >( csv ) ); } else { ascii_.reset( new comma::csv::ascii< input >( csv ) ); }
+    boost::tie( filenames_, filenames_have_id_ ) = applications::filenames( filenames );
+    if( csv.has_field( "block" ) )
+    {
+        ofstream_ = std::bind( &split< T >::ofstream_by_block_, this );
+    }
+    else if( csv.has_field( "id" ) )
+    {
+        ofstream_ = std::bind( &split< T >::ofstream_by_id_, this );
+    }
+    else   // splitting by time
+    {
+        if( !filenames_.empty() ) { COMMA_THROW( comma::exception, "--files given, but no block field specified in --fields" ); }
+        if( !period && timestamps.empty() ) { COMMA_THROW( comma::exception, "splitting by time; please specify either --period or --timestamps" ); }
+    }
+    timestamps_stream_make_( timestamps );
 }
 
-//to-do
 template < typename T >
-split< T >::split( boost::optional< boost::posix_time::time_duration > period
+split< T >::split( const boost::optional< boost::posix_time::time_duration >& period // constructor for stream output: delegates common setup, then creates a publisher per given stream
                   , const std::string& suffix
                   , const comma::csv::options& csv
                   , const std::vector< std::string >& streams //to-do
-                 , bool pass )
-    : split( period, suffix, csv, pass )
+                 , bool pass
+                 , const std::string& filenames
+                 , const std::string& default_filename
+                 , const std::string& timestamps )
+    : split( period, suffix, csv, pass, filenames, default_filename, timestamps )
 {
-    if( 0 < streams.size() )
+    if( streams.empty() ) { return; } // no streams given: no publishers and no acceptor thread
+    auto const io_mode = csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii;
+    for( auto const& si : streams )
     {
-        auto const io_mode = csv.binary() ? comma::io::mode::binary : comma::io::mode::ascii;
-
-        for( auto const& si : streams )
+        auto const stream_values = comma::split( si, ';' ); // expected format: <id>;<stream>
+        if( 2 > stream_values.size() || stream_values[ 0 ].empty() || stream_values[ 1 ].empty() ) { COMMA_THROW( comma::exception, "please specify <id> and output <stream> in format <id>;<stream>, got: " << si ); }
+        transaction t( publishers_ );
+        std::unique_ptr< comma::io::publisher > publisher( new comma::io::publisher( stream_values[1], io_mode, false, csv.flush ) );
+        if( "..." == stream_values[0] ) // id "..." denotes the default publisher; at most one is allowed
         {
-            auto const stream_values = comma::split( si, ';' );
-            if( 2 > stream_values.size() || stream_values[ 0 ].empty() || stream_values[ 1 ].empty() )
-            {
-                COMMA_THROW( comma::exception, "please specify <id> and output <stream> in format <id>;<stream>, got: " << si );
-            }
-
-            transaction t( publishers_ );
-            std::unique_ptr< comma::io::publisher > publisher( new comma::io::publisher( stream_values[1], io_mode, false, csv.flush ) );
-
-            if( "..." == stream_values[0] )
+            if( default_publisher_ ) { COMMA_THROW( comma::exception, "multiple output streams have the id: ..." ); }
+            default_publisher_ = std::move( publisher );
+        }
+        else
+        {
+            auto publisher_pos = t->insert( std::move( publisher ) );
+            auto const keys = comma::split( stream_values[0], ',' ); // one stream may be given several comma-separated ids
+            for( auto const& ki : keys )
             {
-                if( default_publisher_ ) { COMMA_THROW( comma::exception, "multiple output streams have the id: ..." ); }
-                default_publisher_ = std::move( publisher );
-            }
-            else
-            {
-                auto publisher_pos = t->insert( std::move( publisher ) );
-                auto const keys = comma::split( stream_values[0], ',' );
-
-                for( auto const& ki : keys )
-                {
-                    auto const kii = boost::lexical_cast< T >( ki );
-                    if( seen_ids_.end() !=  seen_ids_.find( kii ) ) { COMMA_THROW( comma::exception, "multiple output streams have the id: " << ki ); }
-                    seen_ids_.insert( kii );
-
-                    mapped_publishers_.insert( std::make_pair( kii, publisher_pos.first->get() ) );
-                }
+                auto const kii = boost::lexical_cast< T >( ki );
+                if( seen_ids_.end() !=  seen_ids_.find( kii ) ) { COMMA_THROW( comma::exception, "multiple output streams have the id: " << ki ); }
+                seen_ids_.insert( kii );
+                mapped_publishers_.insert( std::make_pair( kii, publisher_pos.first->get() ) );
             }
         }
-        acceptor_thread_ = std::thread( std::bind( &split< T >::accept_, std::ref( *this )));
     }
+    acceptor_thread_ = std::thread( std::bind( &split< T >::accept_, std::ref( *this ))); // reached only if streams were given, see the early return above
 }
 
-template < typename T >
-split< T >::~split()
+template < typename T > split< T >::~split() // raise the shutdown flag; if the acceptor thread is running, join it and close all publishers
 {
     is_shutdown_ = true;
     if( acceptor_thread_.joinable() )
     {
         acceptor_thread_.join();
         transaction t( publishers_ );
-        for( auto& ii : *t ) { ii->close(); } 
+        for( auto& ii : *t ) { ii->close(); } // publishers are closed only after the acceptor thread has been joined
     }
 }
 
-template < typename T >
-void split< T >::accept_()
+template < typename T > void split< T >::accept_()
 {
     comma::io::select select;
     {
         transaction t( publishers_ );
-        for( auto& ii : *t ) { if( ii->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ii->acceptor_file_descriptor() ); } } 
+        for( auto& ii : *t ) { if( ii->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ii->acceptor_file_descriptor() ); } }
         if( default_publisher_ ) { if( default_publisher_->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( default_publisher_->acceptor_file_descriptor() ); } }
     }
     while( !is_shutdown_ )
@@ -144,9 +239,7 @@ void split< T >::accept_()
     }
 }
 
-
-template < typename T >
-bool split< T >::published_on_stream( const char* data, unsigned int size )
+template < typename T > bool split< T >::published_on_stream( const char* data, unsigned int size )
 {
     transaction t( publishers_ );
     if( t->empty() && !default_publisher_ ) { return false; }
@@ -157,22 +250,24 @@ bool split< T >::published_on_stream( const char* data, unsigned int size )
     return true;
 }
 
-template < typename T >
-void split< T >::write( const char* data, unsigned int size )
+template < typename T > void split< T >::write( const char* data, unsigned int size ) // binary record: publish on stream or write to the file selected by ofstream_; optionally pass through to stdout
 {
     mode_ = std::ofstream::out | std::ofstream::binary;
     if( binary_ ) { binary_->get( current_, data ); }
     else { current_.timestamp = boost::get_system_time(); }
     if( !published_on_stream( data, size ) ) // todo? or bind write function on initialisation and call it here?
     {
-        ofstream_().write( data, size );
-        if( flush_ ) { ofstream_().flush(); }
+        auto ofs = ofstream_(); // selected once per record
+        if( ofs ) // null means: there is no file for this record; it is not written to any file
+        {
+            ofs->write( data, size );
+            if( flush_ ) { ofs->flush(); }
+        }
     }
-    if ( pass_ ) { std::cout.write( data, size ); std::cout.flush(); }
+    if( pass_ ) { std::cout.write( data, size ); std::cout.flush(); } // pass-through does not depend on whether the record was written to a file
 }
 
-template < typename T >
-void split< T >::write ( std::string line )
+template < typename T > void split< T >::write( std::string line )
 {
     mode_ = std::ofstream::out; // quick and dirty
     if( ascii_ ) { ascii_->get( current_, line ); }
@@ -180,54 +275,70 @@ void split< T >::write ( std::string line )
     line += '\n';
     if( !published_on_stream( &line[0], line.size()) ) // todo? or bind write function on initialisation and call it here?
     {
-        std::ofstream& ofs = ofstream_();
-        ofs.write( &line[0], line.size() );
-        //ofs.put( '\n' );
-        if( flush_ ) { ofs.flush(); }
+        auto ofs = ofstream_();
+        if( ofs )
+        {
+            ofs->write( &line[0], line.size() );
+            //ofs.put( '\n' );
+            if( flush_ ) { ofs->flush(); }
+        }
     }
-    if ( pass_ ) { std::cout.write( &line[0], line.size() ); /*std::cout.put('\n');*/ std::cout.flush(); }
+    if( pass_ ) { std::cout.write( &line[0], line.size() ); /*std::cout.put('\n');*/ std::cout.flush(); }
 }
 
-template < typename T >
-std::ofstream& split< T >::ofstream_by_time_()
+template < typename T > std::ofstream* split< T >::ofstream_by_time_() // returns the file for the current record, opening a new one whenever the time interval changes
 {
-    if( !last_ || current_.timestamp > ( last_->timestamp + *period_ ) )
+    bool changed = period_ ? !last_ || current_.timestamp > last_->timestamp + *period_ : timestamps_stream_seek_( current_.timestamp ); // with period: first record or period elapsed; otherwise: timestamps interval has moved
+    if( !last_ || changed )
     {
         file_.close();
-        std::string time = boost::posix_time::to_iso_string( current_.timestamp );
+        std::string time = boost::posix_time::to_iso_string( period_ || timestamps_last_.first.is_neg_infinity() ? current_.timestamp : timestamps_last_.first ); // file is named after interval start, if there is one, otherwise after the record timestamp
         if( time.find_first_of( '.' ) == std::string::npos ) { time += ".000000"; }
         file_.open( ( time + suffix_ ).c_str(), mode_ );
         last_ = current_;
     }
-    return file_;
+    return &file_; // never null in this mode
 }
 
-template < typename T >
-std::ofstream& split< T >::ofstream_by_block_()
+template < typename T > std::ofstream* split< T >::ofstream_by_block_() // returns the file for the current block, opening a new one on block change; null, if filenames are given, but there is none for this block
 {
+    static comma::uint32 id = 0; // number of files opened so far; note: function-local static, i.e. shared by all split< T > objects of the same T
     if( !last_ || last_->block != current_.block )
     {
         file_.close();
-        std::string name = boost::lexical_cast< std::string >( current_.block ) + suffix_;
-        file_.open( name.c_str(), mode_ );
+        std::string filename;
+        if( !filenames_.empty() )
+        {
+            auto it = filenames_.find( filenames_have_id_ ? current_.block : id ); // key is block number, if filenames came with ids, otherwise the running file number
+            if( it == filenames_.end() ) { return nullptr; } // last_ is left unchanged, thus the lookup is repeated for the next record
+            filename = it->second;
+            const auto dirname = comma::filesystem::path( filename ).parent_path();
+            COMMA_ASSERT( dirname.empty() || comma::filesystem::is_directory( dirname ) || comma::filesystem::create_directories( dirname ), "failed to create directory '" << dirname << "' for file: '" << filename << "'" );
+        }
+        if( filename.empty() ) { filename = boost::lexical_cast< std::string >( current_.block ) + suffix_; } // default name: <block><suffix>
+        file_.open( filename.c_str(), mode_ );
+        COMMA_ASSERT( file_.is_open(), "failed to open '" << filename << "'" );
         last_ = current_;
+        ++id;
     }
-    return file_;
+    return &file_;
 }
 
-template < typename T >
-static std::string make_filename_from_id(const T& id, std::string suffix )
-{
-    return boost::lexical_cast< std::string >( id ) + suffix;
-}
+template < typename T > static std::string to_string( const T& value ) { return boost::lexical_cast< std::string >( value ); } // generic ids: lexical cast
 
-static std::string make_filename_from_id(const boost::posix_time::ptime& id, std::string suffix )
+template <> std::string to_string< boost::posix_time::ptime >( const boost::posix_time::ptime& value ) { return boost::posix_time::to_iso_string( value ); } // time ids: iso string
+
+template < typename T, typename M > static std::string find_( const M&, const T& ) { COMMA_THROW( comma::exception, "id-to-filename map not implemented for this type" ); } // fallback for id types without a specialisation
+
+template <> std::string find_< comma::uint32, std::unordered_map< comma::uint32, std::string > >( const std::unordered_map< comma::uint32, std::string >& filenames, const comma::uint32& id ) // returns empty string, if id is not in the map
 {
-    return boost::posix_time::to_iso_string( id ) + suffix;
+    const auto found = filenames.find( id );
+    if( found == filenames.end() ) { return std::string(); } else { return found->second; }
 }
 
-template < typename T >
-std::ofstream& split< T >::ofstream_by_id_()
+template < typename T > std::string split< T >::filename_from_id_( const T& id ) { if( filenames_.empty() ) { return to_string( id ) + suffix_; } return find_( filenames_, id ); } // no filenames given: <id><suffix>
+
+template < typename T > std::ofstream* split< T >::ofstream_by_id_()
 {
     typename Files::iterator it = files_.find( current_.id );
     if( it == files_.end() )
@@ -237,18 +348,21 @@ std::ofstream& split< T >::ofstream_by_id_()
         #else
         static struct rlimit r;
         static int q = getrlimit( RLIMIT_NOFILE, &r );
-        if( q != 0 ) { COMMA_THROW( comma::exception, "getrlimit() failed" ); }
+        if( q != 0 ) { COMMA_THROW( comma::exception, "getting resource limit (getrlimit()) for number of open files failed" ); }
         static unsigned int max_number_of_open_files = static_cast< unsigned int >( r.rlim_cur );
         #endif
         if( files_.size() + 10 > max_number_of_open_files ) { files_.clear(); } // quick and dirty, may be too drastic...
         std::ios_base::openmode mode = mode_;
         if( seen_ids_.find( current_.id ) == seen_ids_.end() ) { seen_ids_.insert( current_.id ); }
         else { mode |= std::ofstream::app; }
-        std::string name = make_filename_from_id( current_.id, suffix_);
-        std::shared_ptr< std::ofstream > stmp( new std::ofstream( name.c_str(), mode ) );
+        std::string name = filename_from_id_( current_.id );
+        if( name.empty() ) { return nullptr; }
+        const auto& dirname = comma::filesystem::path( name ).parent_path();
+        COMMA_ASSERT( dirname.empty() || comma::filesystem::is_directory( dirname ) || comma::filesystem::create_directories( dirname ), "failed to create directory '" << dirname << "' for file: '" << name << "'" );
+        std::shared_ptr< std::ofstream > stmp( new std::ofstream( &name[0], mode ) );
         it = files_.insert( std::make_pair( current_.id, stmp ) ).first;
     }
-    return *it->second;
+    return it->second.get();
 }
 
 template class split< comma::uint32 >;
diff --git a/csv/applications/split/split.h b/csv/applications/split/split.h
index 053097a31..5e1d4bfa4 100644
--- a/csv/applications/split/split.h
+++ b/csv/applications/split/split.h
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2022 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -30,22 +31,22 @@
 /// @author vsevolod vlaskine
 /// @author cedric wohlleber
 
-#ifndef COMMA_CSV_SPLIT_H
-#define COMMA_CSV_SPLIT_H
+#pragma once
 
 #include <fstream>
 #include <fstream>
 #include <functional>
 #include <memory>
+#include <type_traits>
 #include <unordered_map>
 #include <unordered_set>
 #include <thread>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/optional.hpp>
-#include <boost/static_assert.hpp>
 #include "../../../base/types.h"
 #include "../../../csv/ascii.h"
 #include "../../../csv/binary.h"
+#include "../../../csv/stream.h"
 #include "../../../visiting/traits.h"
 #include "../../../io/publisher.h"
 #include "../../../sync/synchronized.h"
@@ -55,10 +56,13 @@ namespace comma { namespace csv { namespace applications {
 template < typename T > struct input // quick and dirty
 {
     boost::posix_time::ptime timestamp;
-    comma::uint32 block;
+    comma::uint32 block{0};
+    comma::uint32 size{0};
-    T id;
+    T id{}; // value-initialised like block and size: the whole record gets copied, even when the id field is absent from the input
 };
 
+struct timestamp { boost::posix_time::ptime t; }; // record type holding a single time value t
+
 } } } // namespace comma { namespace csv { namespace applications {
 
 namespace comma { namespace visiting {
@@ -69,6 +73,7 @@ template < typename T > struct traits< comma::csv::applications::input< T > >
     {
         v.apply( "t", p.timestamp );
         v.apply( "block", p.block );
+        v.apply( "size", p.size );
         v.apply( "id", p.id );
     }
 
@@ -76,6 +81,7 @@ template < typename T > struct traits< comma::csv::applications::input< T > >
     {
         v.apply( "t", p.timestamp );
         v.apply( "block", p.block );
+        v.apply( "size", p.size );
         v.apply( "id", p.id );
     }
 };
@@ -100,7 +106,7 @@ template <> struct traits< boost::posix_time::ptime >
     {
         std::size_t operator()( const boost::posix_time::ptime& t ) const
         {
-            BOOST_STATIC_ASSERT( sizeof( t ) == sizeof( comma::uint64 ) );
+            static_assert( sizeof( t ) == sizeof( comma::uint64 ), "expected time of size 8" );
             std::size_t seed = 0;
             boost::hash_combine( seed, reinterpret_cast< const comma::uint64& >( t ) ); // quick and dirty
             return seed;
@@ -119,32 +125,36 @@ class split
 {
     public:
         typedef applications::input< T > input;
-
-        split( boost::optional< boost::posix_time::time_duration > period
+        split( const boost::optional< boost::posix_time::time_duration >& period
              , const std::string& suffix
              , const comma::csv::options& csv
-             , bool passthrough );
-
-        void write( const char* data, unsigned int size );
-        void write( std::string line );
-
-        //to-do
-        split( boost::optional< boost::posix_time::time_duration > period
+             , bool passthrough
+             , const std::string& filenames
+             , const std::string& default_filename = ""
+             , const std::string& timestamps = "" );
+        split( const boost::optional< boost::posix_time::time_duration >& period
              , const std::string& suffix
              , const comma::csv::options& csv
              , const std::vector< std::string >& streams
-             , bool passthrough );
+             , bool passthrough
+             , const std::string& filenames
+             , const std::string& default_filename = ""
+             , const std::string& timestamps = "" );
         ~split();
-
+        void write( const char* data, unsigned int size );
+        void write( std::string line );
     private:
-        std::ofstream& ofstream_by_time_();
-        std::ofstream& ofstream_by_block_();
-        std::ofstream& ofstream_by_id_();
+        std::ofstream* ofstream_by_time_();
+        std::ofstream* ofstream_by_block_();
+        std::ofstream* ofstream_by_id_();
+        std::string filename_from_id_( const T& id );
         void update_( const char* data, unsigned int size );
         void update_( const std::string& line );
         void accept_();
+        void timestamps_stream_make_( const std::string& timestamps );
+        bool timestamps_stream_seek_( boost::posix_time::ptime t );
 
-        std::function< std::ofstream&() > ofstream_;
+        std::function< std::ofstream*() > ofstream_;
         std::unique_ptr< comma::csv::ascii< input > > ascii_;
         std::unique_ptr< comma::csv::binary< input > > binary_;
         boost::optional< boost::posix_time::time_duration > period_;
@@ -153,6 +163,9 @@ class split
         boost::optional< input > last_;
         std::ios_base::openmode mode_;
         std::ofstream file_;
+        std::unique_ptr< std::ifstream > timestamps_ifstream_;
+        std::unique_ptr< comma::csv::input_stream< applications::timestamp > > timestamps_;
+        std::pair< boost::posix_time::ptime, boost::posix_time::ptime > timestamps_last_;
 
         using Files = typename traits< T >::map;
         using ids_type_ = typename traits< T >::set;
@@ -162,6 +175,9 @@ class split
         ids_type_ seen_ids_;
         bool pass_;
         bool flush_;
+        std::unordered_map< comma::uint32, std::string > filenames_;
+        // todo? std::unique_ptr< comma::io::publisher > default_file_;
+        bool filenames_have_id_;
 
         //to-do
         bool published_on_stream( const char* data, unsigned int size );
@@ -174,5 +190,3 @@ class split
 };
 
 } } } // namespace comma { namespace csv { namespace applications {
-
-#endif // COMMA_CSV_SPLIT_H
diff --git a/csv/ascii.h b/csv/ascii.h
index 0e1fdf3ed..cb653b627 100644
--- a/csv/ascii.h
+++ b/csv/ascii.h
@@ -87,6 +87,9 @@ class ascii
         
         /// return quote sign
         boost::optional< char > quote() const { return quote_; }
+        
+        /// return const reference to the stored sample, i.e. the default value
+        const S& sample() const { return sample_; }
 
     private:
         char delimiter_;
diff --git a/csv/block.h b/csv/block.h
new file mode 100644
index 000000000..62cfe1617
--- /dev/null
+++ b/csv/block.h
@@ -0,0 +1,52 @@
+// Copyright (c) 2022 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include "../base/types.h"
+
+namespace comma { namespace csv {
+
+/// keeps track of the current block of a record stream; two modes:
+/// - size == 0: block number is taken from the block member of the records passed in
+/// - size > 0: blocks have fixed size; block number is incremented, once more than size records have been counted
+class block_counter
+{
+    public:
+        /// @param b initial block number
+        /// @param s fixed block size; 0: take block from records
+        block_counter( comma::uint32 b = 0, comma::uint32 s = 0 ): _block( b ), _size( s ) {}
+        /// return current block number
+        comma::uint32 operator()() const { return _block; }
+        /// return fixed block size; 0, if blocks are not fixed-size
+        comma::uint32 size() const { return _size; }
+        /// return number of records counted in the current block (fixed-size mode only; otherwise stays 0)
+        comma::uint32 current_size() const { return _current_size; }
+        /// return true, if blocks are fixed-size
+        bool fixed() const { return _size > 0; }
+        /// fixed-size mode: true, if current block is not full yet, t is ignored; otherwise: true, if t.block equals current block
+        template < typename T > bool operator==( const T& t ) const { return _size > 0 ? _current_size < _size : t.block == _block; } // dodgy?
+        template < typename T > bool operator!=( const T& t ) const { return !operator==( t ); }
+        /// update counter on record t
+        template < typename T > void update( const T& t );
+        /// fixed-size mode: true, if current block is full, t is ignored; otherwise: true, if t.block differs from current block
+        template < typename T > bool ready( const T& t ) const { return _size > 0 ? _current_size == _size : t.block != _block; }
+    private:
+        comma::uint32 _block{0};
+        comma::uint32 _size{0};
+        comma::uint32 _current_size{0};
+};
+
+/// size == 0: take block number from t.block
+/// size > 0: count the record; once the count exceeds block size, move to the next block with the count reset to 1
+template < typename T > inline void block_counter::update( const T& t )
+{
+    if( _size == 0 ) { _block = t.block; return; }
+    ++_current_size;
+    if( _current_size <= _size ) { return; }
+    _current_size = 1;
+    ++_block;
+}
+
+} } // namespace comma { namespace csv {
diff --git a/csv/examples/applications/CMakeLists.txt b/csv/examples/applications/CMakeLists.txt
new file mode 100644
index 000000000..1445ca4c6
--- /dev/null
+++ b/csv/examples/applications/CMakeLists.txt
@@ -0,0 +1,15 @@
+# cmake_minimum_required() has to come first: it sets the policies that project() relies on
+cmake_minimum_required( VERSION 3.1 )
+project( comma-csv-sample-application )
+
+# request c++14 through cmake rather than through a raw compiler flag
+set( CMAKE_CXX_STANDARD 14 )
+set( CMAKE_CXX_STANDARD_REQUIRED ON )
+set( CMAKE_CXX_EXTENSIONS OFF )
+
+find_package( Boost REQUIRED COMPONENTS thread filesystem system date_time iostreams program_options regex )
+find_package( comma REQUIRED PATHS "/usr/local/CMakeFiles" )
+add_executable( comma-csv-sample-application-append comma-csv-sample-application-append.cpp )
+target_link_libraries( comma-csv-sample-application-append PRIVATE ${comma_ALL_LIBRARIES} )
+add_executable( comma-csv-sample-application-emplace comma-csv-sample-application-emplace.cpp )
+target_link_libraries( comma-csv-sample-application-emplace PRIVATE ${comma_ALL_LIBRARIES} )
diff --git a/csv/examples/applications/comma-csv-sample-application-append.cpp b/csv/examples/applications/comma-csv-sample-application-append.cpp
new file mode 100644
index 000000000..f56e7f75e
--- /dev/null
+++ b/csv/examples/applications/comma-csv-sample-application-append.cpp
@@ -0,0 +1,139 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+#include <cmath>
+#include <exception>
+#include <iostream>
+#include <comma/application/command_line_options.h>
+#include <comma/csv/stream.h>
+#include <comma/string/string.h>
+#include <comma/visiting/traits.h>
+
+static void usage( bool verbose ) // print help to stderr; verbose is passed on to csv options help
+{
+    std::cerr << std::endl
+              << "example: read csv/binary fixed-width data on stdin (angle and factor)" << std::endl
+              << "         count input records, calculate sin and cos of angle, and sign of factor" << std::endl
+              << "         append to input, output to stdout" << std::endl
+              << std::endl
+              << "usage: cat values.csv | ./comma-csv-sample-application-append [<options>] > result.csv" << std::endl
+              << std::endl
+              << "options" << std::endl
+              << "    --input-fields; print input fields to stdout and exit" << std::endl
+              << "    --output-fields; print output fields to stdout and exit" << std::endl
+              << "    --output-format; print output format to stdout and exit" << std::endl
+              << "    --no-append; do not output stdin records to stdout, output only result" << std::endl
+              << std::endl
+              << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl;
+    std::cerr << std::endl
+              << "examples" << std::endl
+              << "    ascii" << std::endl
+              << "        ( echo 45,20; echo 30,-10 ) | ./comma-csv-sample-application-append" << std::endl
+              << "    binary" << std::endl
+              << "        ( echo 45,20; echo 30,-10 ) \\" << std::endl
+              << "            | csv-to-bin 2d \\" << std::endl
+              << "            | ./comma-csv-sample-application-append --binary 2d \\" << std::endl
+              << "            | csv-from-bin 2d,ui,3d" << std::endl
+              << std::endl;
+}
+
+namespace comma { namespace csv { namespace examples { namespace application {
+
+struct input // record read from stdin
+{
+    double angle{0}; // in degrees: it is multiplied by pi/180 before sin and cos are taken
+    double factor{0}; // only its sign is used in the output
+};
+
+struct output // result calculated for each input record
+{
+    struct trigonometric_t
+    {
+        double sin{0}; // zero-initialised, consistently with the other members of output
+        double cos{0};
+    };
+    unsigned int count{0}; // number of input records seen so far
+    trigonometric_t trigonometric;
+    double factor_sign{0}; // 1, -1, or 0
+};
+
+} } } } // namespace comma { namespace csv { namespace examples { namespace application {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::csv::examples::application::input > // visiting traits: members are exposed as "angle" and "factor"
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input& value, Visitor& visitor )
+    {
+        visitor.apply( "angle", value.angle );
+        visitor.apply( "factor", value.factor );
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input& value, Visitor& visitor )
+    {
+        visitor.apply( "angle", value.angle );
+        visitor.apply( "factor", value.factor );
+    }
+};
+
+template <> struct traits< comma::csv::examples::application::output::trigonometric_t > // visiting traits, const only: members are exposed as "sin" and "cos"
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::output::trigonometric_t& value, Visitor& visitor )
+    {
+        visitor.apply( "sin", value.sin );
+        visitor.apply( "cos", value.cos );
+    }
+};
+
+template <> struct traits< comma::csv::examples::application::output > // visiting traits, const only: "count", nested "trigonometric", "factor_sign"
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::output& value, Visitor& visitor )
+    {
+        visitor.apply( "count", value.count );
+        visitor.apply( "trigonometric", value.trigonometric );
+        visitor.apply( "factor_sign", value.factor_sign );
+    }
+};
+
+} } // namespace comma { namespace visiting {
+
+static comma::csv::examples::application::output& populate_output( const comma::csv::examples::application::input& input, comma::csv::examples::application::output& output )
+{
+    const double radians = input.angle * M_PI / 180; // input angle is in degrees
+    output.count += 1; // output is reused between calls, thus count is the running number of records
+    output.trigonometric.sin = std::sin( radians );
+    output.trigonometric.cos = std::cos( radians );
+    output.factor_sign = input.factor > 0 ? 1 : ( input.factor < 0 ? -1 : 0 );
+    return output;
+}
+
+int main( int ac, char** av ) // returns 0 on success, 1 on exception
+{
+    try
+    {
+        comma::command_line_options options( ac, av, usage );
+        comma::csv::options csv( options );
+        typedef comma::csv::examples::application::input input_t;
+        typedef comma::csv::examples::application::output output_t;
+        if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< input_t >(), ',' ) << std::endl; return 0; }
+        if( options.exists( "--output-fields" ) ) { std::cout << comma::join( comma::csv::names< output_t >(), ',' ) << std::endl; return 0; }
+        if( options.exists( "--output-format" ) ) { std::cout << comma::csv::format::value< output_t >() << std::endl; return 0; }
+        comma::csv::input_stream< input_t > is( std::cin, csv );
+        comma::csv::output_stream< output_t > os( std::cout, csv.binary() );
+        auto tied = comma::csv::make_tied( is, os ); // used for appending output to the input record
+        bool append = !options.exists( "--no-append" );
+        output_t output; // reused for all records: carries the running count
+        while( is.ready() || std::cin.good() )
+        {
+            auto p = is.read();
+            if( !p ) { break; } // end of input
+            if( append ) { tied.append( populate_output( *p, output ) ); }
+            else { os.write( populate_output( *p, output ) ); }
+        }
+        return 0;
+    }
+    catch( const std::exception& e ) { std::cerr << av[0] << ": " << e.what() << std::endl; }
+    catch( ... ) { std::cerr << av[0] << ": unknown exception" << std::endl; }
+    return 1;
+}
diff --git a/csv/examples/applications/comma-csv-sample-application-emplace.cpp b/csv/examples/applications/comma-csv-sample-application-emplace.cpp
new file mode 100644
index 000000000..63a2e7ff6
--- /dev/null
+++ b/csv/examples/applications/comma-csv-sample-application-emplace.cpp
@@ -0,0 +1,107 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+#include <exception>
+#include <iostream>
+#include <comma/application/command_line_options.h>
+#include <comma/csv/stream.h>
+#include <comma/string/string.h>
+#include <comma/visiting/traits.h>
+
+static void usage( bool verbose ) // print help for this example to stderr; verbose is forwarded to comma::csv::options::usage()
+{
+    std::cerr << std::endl;
+    std::cerr << "example: read csv/binary fixed-width data on stdin, calculate some result" << std::endl;
+    std::cerr << "         update input values in place, output to stdout" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "usage: cat values.csv | ./comma-csv-sample-application-emplace [<options>] > result.csv" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "options" << std::endl;
+    std::cerr << "    --input-fields; print input fields to stdout and exit" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "csv options" << std::endl;
+    std::cerr << comma::csv::options::usage( verbose ) << std::endl; // generic csv options help provided by the library
+    std::cerr << std::endl;
+    std::cerr << "examples" << std::endl;
+    std::cerr << "    ascii" << std::endl;
+    std::cerr << "        ( echo 1,2; echo 3,4 ) | ./comma-csv-sample-application-emplace" << std::endl;
+    std::cerr << "    binary" << std::endl;
+    std::cerr << "        ( echo 1,2; echo 3,4 ) \\" << std::endl;
+    std::cerr << "            | csv-to-bin 2ui \\" << std::endl;
+    std::cerr << "            | ./comma-csv-sample-application-emplace --binary 2ui \\" << std::endl;
+    std::cerr << "            | csv-from-bin 2ui" << std::endl;
+    std::cerr << std::endl;
+}
+
+namespace comma { namespace csv { namespace examples { namespace application {
+
+struct input
+{
+    struct nested { double c = 0; }; // inner record with a single value, zero by default
+    double a = 0; // top-level value, zero by default
+    nested b; // nested record, b.c is zero by default
+};
+
+} } } } // namespace comma { namespace csv { namespace examples { namespace application {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::csv::examples::application::input::nested > // exposes the single field of input::nested to visitors under the name "c"
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input::nested& value, Visitor& visitor )
+    {
+        visitor.apply( "c", value.c );
+    }
+    // overload for a non-const object: c is passed to the visitor as a non-const lvalue
+    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input::nested& value, Visitor& visitor )
+    {
+        visitor.apply( "c", value.c );
+    }
+};
+
+template <> struct traits< comma::csv::examples::application::input > // exposes the fields of input to visitors under the names "a" and "b", in that order
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::csv::examples::application::input& value, Visitor& visitor )
+    {
+        visitor.apply( "a", value.a );
+        visitor.apply( "b", value.b );
+    }
+    // overload for a non-const object: a and b are passed to the visitor as non-const lvalues
+    template < typename Key, class Visitor > static void visit( const Key&, comma::csv::examples::application::input& value, Visitor& visitor )
+    {
+        visitor.apply( "a", value.a );
+        visitor.apply( "b", value.b );
+    }
+};
+
+} } // namespace comma { namespace visiting {
+
+static comma::csv::examples::application::input updated( const comma::csv::examples::application::input& input )
+{
+    comma::csv::examples::application::input result( input ); // start from a copy, so b.c is returned unchanged
+    result.a += result.b.c; // a becomes a + b.c
+    return result;
+}
+
+int main( int ac, char** av ) // read records on stdin, write the updated records via passed.write(); returns 0 on success, 1 if an exception was caught
+{
+    try
+    {
+        using input_t = comma::csv::examples::application::input;
+        comma::command_line_options options( ac, av, usage );
+        comma::csv::options csv( options );
+        if( options.exists( "--input-fields" ) ) { std::cout << comma::join( comma::csv::names< input_t >(), ',' ) << std::endl; return 0; }
+        comma::csv::input_stream< input_t > is( std::cin, csv );
+        auto passed = comma::csv::make_passed( is, std::cout, csv.flush );
+        while( is.ready() || std::cin.good() )
+        {
+            auto record = is.read();
+            if( !record ) { break; } // read() returned nothing: stop
+            passed.write( updated( *record ) );
+        }
+        return 0;
+    }
+    catch( const std::exception& ex ) { std::cerr << av[0] << ": " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << av[0] << ": unknown exception" << std::endl; }
+    return 1;
+}
\ No newline at end of file
diff --git a/csv/examples/bash/irregular-stream-to-csv b/csv/examples/bash/irregular-stream-to-csv
new file mode 100755
index 000000000..55bfb2ce9
--- /dev/null
+++ b/csv/examples/bash/irregular-stream-to-csv
@@ -0,0 +1,40 @@
+#!/bin/bash
+
+# suppose we have an ascii stream (e.g. produced by a sensor) that mixes several
+# values appearing in the stream at various times and we can distinguish different
+# input record types by some keywords
+#
+# we want to convert it into a csv stream with each record containing
+# the latest values
+#
+# notes
+# - the same is possible with a bit more effort with binary data
+# - --unbuffered in sed is required, if your stream has to be realtime
+
+function test-input()
+{
+    # print a fixed sample of the irregular "keyword: value" stream, one record per line
+    printf '%s\n' \
+        'greeting: hello' \
+        'which: holy' \
+        'who: cow' \
+        'greeting: bye' \
+        'which: wicked' \
+        'greeting: hi' \
+        'which: lazy' \
+        'who: fox' \
+        'greeting: jump' \
+        'which: brown'
+}
+
+test-input \
+    | sed --unbuffered \
+          -e 's#\(greeting: .*\)#\1,,#' \
+          -e 's#\(which: .*\)#,\1,#' \
+          -e 's#\(who: .*\)#,,\1#' \
+    | csv-update --update-non-empty \
+    | sed --unbuffered \
+          -e 's#greeting: ##' \
+          -e 's#which: ##' \
+          -e 's#who: ##' \
+    | tr ',' ' '
\ No newline at end of file
diff --git a/csv/examples/bin_load.m b/csv/examples/matlab/load-binary-file.m
similarity index 100%
rename from csv/examples/bin_load.m
rename to csv/examples/matlab/load-binary-file.m
diff --git a/csv/examples/bin_save.m b/csv/examples/matlab/save-binary-file.m
similarity index 100%
rename from csv/examples/bin_save.m
rename to csv/examples/matlab/save-binary-file.m
diff --git a/csv/examples/iso2seconds.m b/csv/examples/matlab/time-iso-to-seconds.m
similarity index 100%
rename from csv/examples/iso2seconds.m
rename to csv/examples/matlab/time-iso-to-seconds.m
diff --git a/csv/examples/seconds2iso.m b/csv/examples/matlab/time-seconds-to-iso.m
similarity index 100%
rename from csv/examples/seconds2iso.m
rename to csv/examples/matlab/time-seconds-to-iso.m
diff --git a/csv/format.cpp b/csv/format.cpp
index 048535ed6..c2415b636 100644
--- a/csv/format.cpp
+++ b/csv/format.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -41,7 +13,6 @@
 #include "../base/types.h"
 #include "../string/string.h"
 #include "../csv/format.h"
-#include "impl/epoch.h"
 
 namespace comma { namespace csv {
 
@@ -132,7 +103,7 @@ static boost::array< unsigned int, 14 > Sizesimpl()
 {
     boost::array< unsigned int, 14 > sizes;
     sizes[ format::char_t ] = sizeof( char );
-    sizes[ format::int8 ] = sizeof( char );
+    sizes[ format::int8 ] = sizeof( signed char );
     sizes[ format::uint8 ] = sizeof( unsigned char );
     sizes[ format::int16 ] = sizeof( int16 );
     sizes[ format::uint16 ] = sizeof( uint16 );
@@ -226,8 +197,8 @@ static boost::posix_time::ptime time_from_iso_string( const std::string& s )
     if ( s.empty() || s == "not-a-date-time" ) { return boost::posix_time::not_a_date_time; }
     else if ( s == "+infinity" || s == "+inf" || s == "inf" ) { return boost::posix_time::pos_infin; }
     else if ( s == "-infinity" || s == "-inf" ) { return boost::posix_time::neg_infin; }
-    else 
-    { 
+    else
+    {
         try { return boost::posix_time::from_iso_string( s ); }
         catch ( ... ) { return boost::posix_time::not_a_date_time; }
     }
@@ -243,9 +214,9 @@ static std::size_t csv_to_bin( char* buf, const std::string& s, format::types_en
             case format::int8:
             {
                 int i = boost::lexical_cast< int >( s );
-                if( i < -127 || i > 128 ) { COMMA_THROW( comma::exception, "expected byte, got " << i ); }
-                *buf = static_cast< char >( i );
-                return sizeof( char );
+                if( i < -128 || i > 127 ) { COMMA_THROW( comma::exception, "expected byte, got " << i ); }
+                *buf = static_cast< signed char >( i );
+                return sizeof( signed char );
             }
             case format::uint8:
             {
@@ -287,14 +258,8 @@ static std::size_t csv_to_bin( char* buf, const std::string& s, format::types_en
             default: COMMA_THROW( comma::exception, "todo: not implemented" );
         }
     }
-    catch( std::exception& ex )
-    {
-        COMMA_THROW( comma::exception, "failed to convert \"" << s << "\" to type \"" << format::to_format(type) << "\": "  << ex.what() );
-    }
-    catch( ... )
-    {
-        throw;
-    }
+    catch( std::exception& ex ) { COMMA_THROW( comma::exception, "failed to convert \"" << s << "\" to type \"" << format::to_format(type) << "\": "  << ex.what() ); }
+    catch( ... ) { throw; }
 }
 
 static std::size_t bin_to_csv( std::ostringstream& oss, const char* buf, format::types_enum type, std::size_t size, const boost::optional< unsigned int >& precision )
@@ -302,7 +267,7 @@ static std::size_t bin_to_csv( std::ostringstream& oss, const char* buf, format:
     switch( type ) // todo: tear down bin_to_csv, use format::traits
     {
         case format::int8:
-            oss << static_cast< int >( *buf );
+            oss << static_cast< int >( static_cast< signed char >( *buf ));
             return sizeof( char );
         case format::uint8:
             oss << static_cast< unsigned int >( static_cast< unsigned char >( *buf ) );
@@ -377,7 +342,7 @@ std::string format::csv_to_bin( const std::vector< std::string >& csv ) const
 std::string format::bin_to_csv( const std::string& bin, char delimiter, const boost::optional< unsigned int >& precision ) const
 {
     if( bin.length() != size_ ) { COMMA_THROW( comma::exception, "expected binary string of size " << size_ << ", got " << bin.length() << " bytes" ); }
-    return bin_to_csv( bin.c_str(), delimiter, precision );
+    return bin_to_csv( &bin[0], delimiter, precision );
 }
 
 std::string format::bin_to_csv( const char* buf, char delimiter, const boost::optional< unsigned int >& precision ) const
@@ -459,7 +424,7 @@ std::string format::collapsed_string() const
 
 // formats for not-a-date-time, +infinity, -infinity
 // note: these are not boost representations. in boost, +infinity = int64::max() - 1, -infinity = int64::min(), not-a-date-time = int64::max()
-// not-a-date-time is chosen to matche python numpy.datetime64('NaT') = int64::min()
+// not-a-date-time is chosen to match python numpy.datetime64('NaT') = int64::min()
 static const comma::int64 bin_not_a_date_time = std::numeric_limits< comma::int64 >::min();
 static const comma::int64 bin_time_pos_infin = std::numeric_limits< comma::int64 >::max();
 static const comma::int64 bin_time_neg_infin = std::numeric_limits< comma::int64 >::min() + 1;
@@ -501,27 +466,13 @@ boost::posix_time::ptime format::traits< boost::posix_time::ptime, format::time
     //::memcpy( &microseconds, buf, sizeof( comma::int64 ) );
 	(void)size;
     comma::int64 microseconds = *reinterpret_cast< const comma::int64* >( buf );
-    if( microseconds == bin_not_a_date_time ) { return boost::posix_time::not_a_date_time; }
-    if( microseconds == bin_time_pos_infin ) { return boost::posix_time::pos_infin; }
-    if( microseconds == bin_time_neg_infin ) { return boost::posix_time::neg_infin; }
-    long seconds = static_cast< long >( microseconds / 1000000 ); // todo: due to bug in boost, will be casted down to int32, but for the dates we use seconds will never overflow, thus, leave it like this now
-    microseconds -= static_cast< comma::int64 >( seconds ) * 1000000;
-    return boost::posix_time::ptime( csv::impl::epoch, boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( static_cast< long >( microseconds ) ) );
+    return comma::csv::time::from_microseconds( microseconds );
 }
 
 void format::traits< boost::posix_time::ptime, format::time >::to_bin( const boost::posix_time::ptime& t, char* buf, std::size_t size )
 {
-    if( t.is_not_a_date_time() ) { *reinterpret_cast< comma::int64* >( buf ) = bin_not_a_date_time; return; }
-    if( t.is_pos_infinity() ) { *reinterpret_cast< comma::int64* >( buf ) = bin_time_pos_infin; return; }
-    if( t.is_neg_infinity() ) { *reinterpret_cast< comma::int64* >( buf ) = bin_time_neg_infin; return; }
 	(void)size;
-    static const boost::posix_time::ptime base( csv::impl::epoch );
-    const boost::posix_time::time_duration duration = t - base;
-    long seconds = duration.total_seconds(); // boost uses long, which is a bug for 32-bit
-    comma::int64 microseconds = static_cast< comma::int64 >( seconds ) * 1000000l;
-    microseconds += ( duration - boost::posix_time::seconds( seconds ) ).total_microseconds();
-    *reinterpret_cast< comma::int64* >( buf ) = microseconds; // ::memcpy( buf, &microseconds, sizeof( comma::int64 ) );
-
+    *reinterpret_cast< comma::int64* >( buf ) = comma::csv::time::to_microseconds(t);
 }
 
 std::string format::traits< std::string, format::fixed_string >::from_bin( const char* buf, std::size_t size )
@@ -536,4 +487,31 @@ void format::traits< std::string, format::fixed_string >::to_bin( const std::str
     if( t.length() < size ) { ::memset( buf + t.length(), 0, size - t.length() ); }
 }
 
+namespace time {
+
+boost::posix_time::ptime from_microseconds(comma::int64 microseconds, boost::gregorian::date epoch)
+{
+    if( microseconds == bin_not_a_date_time ) { return boost::posix_time::not_a_date_time; } // reserved values map to the boost special values
+    if( microseconds == bin_time_pos_infin ) { return boost::posix_time::pos_infin; }
+    if( microseconds == bin_time_neg_infin ) { return boost::posix_time::neg_infin; }
+    const long whole_seconds = static_cast< long >( microseconds / 1000000 ); // todo: due to a bug in boost, this gets cast down to int32; for the dates in use seconds will not overflow, so left as is for now
+    const long remainder = static_cast< long >( microseconds - static_cast< comma::int64 >( whole_seconds ) * 1000000 ); // microseconds left over after the whole seconds
+    return boost::posix_time::ptime( epoch, boost::posix_time::seconds( whole_seconds ) + boost::posix_time::microseconds( remainder ) );
+}
+
+comma::int64 to_microseconds(const boost::posix_time::ptime& t, boost::gregorian::date epoch)
+{
+    if( t.is_not_a_date_time() ) { return bin_not_a_date_time; } // special values map to the reserved binary values
+    if( t.is_pos_infinity() ) { return bin_time_pos_infin; }
+    if( t.is_neg_infinity() ) { return bin_time_neg_infin; }
+    const boost::posix_time::ptime base( epoch ); // deliberately not static: epoch is a parameter, a static would keep the epoch of the first call for all later calls
+    const boost::posix_time::time_duration duration = t - base;
+    long seconds = duration.total_seconds(); // boost uses long, which is a bug for 32-bit
+    comma::int64 microseconds = static_cast< comma::int64 >( seconds ) * 1000000l;
+    microseconds += ( duration - boost::posix_time::seconds( seconds ) ).total_microseconds(); // add the sub-second part
+    return microseconds;
+}
+
+} // namespace time {
+
 } } // namespace comma { namespace csv {
diff --git a/csv/format.h b/csv/format.h
index c167ecc49..7bd874db4 100644
--- a/csv/format.h
+++ b/csv/format.h
@@ -1,37 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_APPLICATIONS_FORMAT_HEADER_GUARD_
-#define COMMA_CSV_APPLICATIONS_FORMAT_HEADER_GUARD_
+#pragma once
 
 #include <stdlib.h>
 #include <iostream>
@@ -48,12 +20,21 @@
 #include "../visiting/visit.h"
 #include "../visiting/while.h"
 #include "../xpath/xpath.h"
+#include "impl/epoch.h" 
 
 namespace comma { namespace csv {
 
 /// forward declaration
 namespace impl { class to_format; }
 
+namespace time {
+/// convert microseconds counted from epoch to ptime; reserved int64 values map to not-a-date-time and +/-infinity
+boost::posix_time::ptime from_microseconds(comma::int64 microseconds, boost::gregorian::date epoch=csv::impl::epoch);
+/// convert ptime to microseconds counted from epoch; not-a-date-time and +/-infinity map to reserved int64 values
+comma::int64 to_microseconds(const boost::posix_time::ptime& t, boost::gregorian::date epoch=csv::impl::epoch);
+
+} // namespace time {
+
 /// csv to/from bin format
 /// @todo the interface has got real messy; fully refactor!
 class format
@@ -77,6 +58,7 @@ class format
             //static void to_bin( const T& t, char* buf, std::size_t size = sizeof( T ) ) { ::memcpy( buf, &t, sizeof( T ) ); }
             static T from_bin( const char* buf, std::size_t size = sizeof( T ) ) { (void)size; return *reinterpret_cast< const T* >( buf ); }
             static void to_bin( const T& t, char* buf, std::size_t size = sizeof( T ) ) { (void)size; *reinterpret_cast< T* >( buf ) = t; }
+            static T zero() { return 0; }
         };
 
         /// struct containing offsets
@@ -166,7 +148,6 @@ class format
         template < typename T > static std::string value_impl( const T& t );
 };
 
-
 namespace impl {
 
 class to_format
@@ -257,6 +238,7 @@ inline std::string format::value( const std::string& fields, bool full_xpath, co
 
 template <> inline std::string format::value_impl< bool >( const bool& ) { return "b"; }
 template <> inline std::string format::value_impl< char >( const char& ) { return "b"; }
+template <> inline std::string format::value_impl< signed char >( const signed char& ) { return "b"; }
 template <> inline std::string format::value_impl< unsigned char >( const unsigned char& ) { return "ub"; }
 template <> inline std::string format::value_impl< int16 >( const comma::int16& ) { return "w"; }
 template <> inline std::string format::value_impl< comma::uint16 >( const comma::uint16& ) { return "uw"; }
@@ -282,7 +264,13 @@ template <> struct format::type_to_enum< bool >
     static const char* as_string() { return "b"; }
 };
 
-template <> struct format::type_to_enum< char >
+template <> struct format::type_to_enum< char > // ATTENTION: char is unsigned on arm
+{
+    static const format::types_enum value = format::int8;
+    static const char* as_string() { return "b"; }
+};
+
+template <> struct format::type_to_enum< signed char >
 {
     static const format::types_enum value = format::int8;
     static const char* as_string() { return "b"; }
@@ -367,6 +355,7 @@ template <> struct format::traits< boost::posix_time::ptime, format::long_time >
     static const char* as_string() { return "lt"; }
     static boost::posix_time::ptime from_bin( const char* buf, std::size_t size = 12 );
     static void to_bin( const boost::posix_time::ptime& t, char* buf, std::size_t size = 12 );
+    static boost::posix_time::ptime zero() { return boost::posix_time::ptime(); }
 };
 
 template <> struct format::traits< boost::posix_time::ptime, format::time >
@@ -376,6 +365,7 @@ template <> struct format::traits< boost::posix_time::ptime, format::time >
     static const char* as_string() { return "t"; }
     static boost::posix_time::ptime from_bin( const char* buf, std::size_t size = 8 );
     static void to_bin( const boost::posix_time::ptime& t, char* buf, std::size_t size = 8 );
+    static boost::posix_time::ptime zero() { return boost::posix_time::ptime(); }
 };
 
 template <> struct format::traits< std::string, format::fixed_string >
@@ -384,8 +374,7 @@ template <> struct format::traits< std::string, format::fixed_string >
     static const char* as_string() { return type_to_enum< std::string >::as_string(); }
     static std::string from_bin( const char* buf, std::size_t size );
     static void to_bin( const std::string& t, char* buf, std::size_t size );
+    static std::string zero() { return std::string(); }
 };
 
 } } // namespace comma { namespace csv {
-
-#endif // #ifndef COMMA_CSV_APPLICATIONS_FORMAT_HEADER_GUARD_
diff --git a/csv/impl/epoch.h b/csv/impl/epoch.h
index a428e3bb1..6b5dff0f4 100644
--- a/csv/impl/epoch.h
+++ b/csv/impl/epoch.h
@@ -1,44 +1,14 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_IMPL_EPOCH_H_
-#define COMMA_CSV_IMPL_EPOCH_H_
+#pragma once
 
-#include <boost/date_time/posix_time/posix_time.hpp>
+#include "../../timing/epoch.h"
 
 namespace comma { namespace csv { namespace impl {
 
-static const boost::gregorian::date epoch( 1970, 1, 1 );
+static const boost::gregorian::date epoch = comma::timing::epoch;
 
 } } } // namespace comma { namespace csv { namespace impl {
-
-#endif // #ifndef COMMA_CSV_IMPL_EPOCH_H_
diff --git a/csv/impl/fieldwise.cpp b/csv/impl/fieldwise.cpp
index 53f16dde9..724efa32a 100644
--- a/csv/impl/fieldwise.cpp
+++ b/csv/impl/fieldwise.cpp
@@ -42,6 +42,7 @@ fieldwise::fieldwise( const std::string& fields, char delimiter )
     , binary_( this )
 {
     csv::options o;
+    o.full_xpath = false;
     o.fields = fields;
     o.delimiter = delimiter;
     init_( o, split( fields, ',' ) );
diff --git a/csv/impl/from_ascii.h b/csv/impl/from_ascii.h
index 94dd64296..1b69ebe7c 100644
--- a/csv/impl/from_ascii.h
+++ b/csv/impl/from_ascii.h
@@ -55,8 +55,8 @@ class from_ascii_
     public:
         /// constructor
         from_ascii_( const std::vector< boost::optional< std::size_t > >& indices
-                  , const std::deque< bool >& optional
-                  , const std::vector< std::string >& line );
+                   , const std::deque< bool >& optional
+                   , const std::vector< std::string >& line );
 
         /// apply
         template < typename K, typename T > void apply( const K& name, boost::optional< T >& value );
@@ -83,6 +83,7 @@ class from_ascii_
         std::size_t index_;
         std::size_t optional_index;
         static void lexical_cast_( char& v, const std::string& s ) { v = s.at( 0 ) == '\'' && s.at( 2 ) == '\'' && s.length() == 3 ? s.at( 1 ) : static_cast< char >( boost::lexical_cast< int >( s ) ); }
+        static void lexical_cast_( signed char& v, const std::string& s ) { v = s.at( 0 ) == '\'' && s.at( 2 ) == '\'' && s.length() == 3 ? s.at( 1 ) : static_cast< signed char >( boost::lexical_cast< int >( s ) ); }
         static void lexical_cast_( unsigned char& v, const std::string& s ) { v = s.at( 0 ) == '\'' && s.at( 2 ) == '\'' && s.length() == 3 ? s.at( 1 ) : static_cast< unsigned char >( boost::lexical_cast< unsigned int >( s ) ); }
         static void lexical_cast_( boost::posix_time::ptime& v, const std::string& s )
         { 
diff --git a/csv/impl/program_options.h b/csv/impl/program_options.h
index 7dd400ae4..9aa7bc424 100644
--- a/csv/impl/program_options.h
+++ b/csv/impl/program_options.h
@@ -55,7 +55,6 @@ inline boost::program_options::options_description program_options::description(
         ( "fields", boost::program_options::value< std::string >()->default_value( default_fields ), "csv fields" )
         ( "binary,b", boost::program_options::value< std::string >(), "csv binary format" )
         ( "delimiter,d", boost::program_options::value< char >()->default_value( ',' ), "csv delimiter" )
-        ( "full-xpath", "expect full xpaths as field names" )
         ( "precision", boost::program_options::value< unsigned int >()->default_value( 12 ), "floating point precision" )
         ( "quote", boost::program_options::value< std::string >()->default_value( "\"" ), "quote sign to quote strings (ascii only)" )
         ( "flush", "flush output stream after each record" );
@@ -69,7 +68,6 @@ inline csv::options program_options::get( const boost::program_options::variable
     if( vm.count( "delimiter ") ) { csv.delimiter = vm[ "delimiter" ].as< char >(); }
     if( vm.count( "precision" ) ) { csv.precision = vm[ "precision" ].as< unsigned int >(); }
     if( vm.count( "binary" ) ) { csv.format( vm[ "binary" ].as< std::string >() ); }
-    csv.full_xpath = vm.count( "full-xpath" ) > 0;
     csv.flush = vm.count( "flush" ) > 0;
     if( vm.count( "quote" ) )
     {
diff --git a/csv/impl/to_ascii.h b/csv/impl/to_ascii.h
index 79b7ce91c..37f44cee3 100644
--- a/csv/impl/to_ascii.h
+++ b/csv/impl/to_ascii.h
@@ -29,8 +29,7 @@
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_IMPL_TOASCII_HEADER_GUARD_
-#define COMMA_CSV_IMPL_TOASCII_HEADER_GUARD_
+#pragma once
 
 #include <vector>
 #include <boost/date_time/posix_time/posix_time.hpp>
@@ -40,6 +39,7 @@
 #include <boost/shared_ptr.hpp>
 #include <boost/type_traits.hpp>
 #include "../../base/exception.h"
+#include "../../base/none.h"
 #include "../../string/string.h"
 #include "../../visiting/visit.h"
 #include "../../visiting/while.h"
@@ -84,13 +84,14 @@ class to_ascii
         const std::vector< boost::optional< std::size_t > >& indices_;
         std::vector< std::string >& row_;
         std::size_t index_;
-        boost::optional< unsigned int > precision_;
-        boost::optional< char > quote_;
+        boost::optional< unsigned int > precision_{ comma::silent_none< unsigned int >() };
+        boost::optional< char > quote_{ comma::silent_none< char >() };
 
         std::string as_string_( const boost::posix_time::ptime& v ) { return to_iso_string( v ); }
         std::string as_string_( const std::string& v ) { return quote_ ? *quote_ + v + *quote_ : v; } // todo: escape/unescape
         // todo: better output semantics for char/unsigned char
         std::string as_string_( const char& v ) { std::ostringstream oss; oss << static_cast< int >( v ); return oss.str(); }
+        std::string as_string_( const signed char& v ) { std::ostringstream oss; oss << static_cast< int >( v ); return oss.str(); }
         std::string as_string_( const unsigned char& v ) { std::ostringstream oss; oss << static_cast< unsigned int >( v ); return oss.str(); }
         void set_precision_( std::ostringstream& oss ) const;
 
@@ -156,5 +157,3 @@ inline void to_ascii::apply_final( const K&, const T& value )
 }
 
 } } } // namespace comma { namespace csv { namespace impl {
-
-#endif // #ifndef COMMA_CSV_IMPL_TOASCII_HEADER_GUARD_
diff --git a/csv/impl/to_names.h b/csv/impl/to_names.h
index 6be9c5f12..fe877901e 100644
--- a/csv/impl/to_names.h
+++ b/csv/impl/to_names.h
@@ -30,9 +30,12 @@
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_IMPL_TONAMES_H_
-#define COMMA_CSV_IMPL_TONAMES_H_
+#pragma once
 
+#include <memory>
+#if __cplusplus >= 201703L
+#include <optional>
+#endif // #if __cplusplus >= 201703L
 #include <sstream>
 #include <boost/optional.hpp>
 #include <boost/scoped_ptr.hpp>
@@ -51,74 +54,60 @@ namespace comma { namespace csv { namespace impl {
 class to_names
 {
     public:
-        /// constructor
-        to_names( bool full_path_as_name = true );
+        to_names( bool full_path_as_name = true ): _full_path_as_name( full_path_as_name ) {}
         
-        /// constructor
-        to_names( const xpath& root, bool full_path_as_name );
+        to_names( const xpath& root, bool full_path_as_name ): _full_path_as_name( full_path_as_name ), _root( root ) {}
         
-        /// traverse
         template < typename K, typename T >
-        void apply( const K& name, const boost::optional< T >& value );
+        void apply( const K& name, const boost::optional< T >& value ) { apply( name, value ? *value : T() ); }
+
+        #if __cplusplus >= 201703L
+        template < typename K, typename T >
+        void apply( const K& name, const std::optional< T >& value ) { apply( name, value ? *value : T() ); }
+        #endif // #if __cplusplus >= 201703L
         
-        /// traverse
         template < typename K, typename T >
         void apply( const K& name, const boost::scoped_ptr< T >& value );
         
-        /// traverse
         template < typename K, typename T >
         void apply( const K& name, const boost::shared_ptr< T >& value );
+
+        template < typename K, typename T >
+        void apply( const K& name, const std::unique_ptr< T >& value );
         
-        /// traverse
         template < typename K, typename T >
         void apply( const K& name, const T& value );
         
-        /// traverse
         template < typename K, typename T >
         void apply_next( const K& name, const T& value );
         
-        /// output a non-string type
         template < typename K, typename T >
         void apply_final( const K& name, const T& value );
         
-        /// return string
-        const std::vector< std::string >& operator()() const;
+        const std::vector< std::string >& operator()() const { return _names; }
         
     private:
-        bool full_path_as_name_;
-        xpath xpath_;
-        xpath root_;
-        boost::optional< std::size_t > index_;
-        std::vector< std::string > names_;
-        const xpath& append( std::size_t index ) { xpath_.elements.back().index = index; return xpath_; }
-        const xpath& append( const char* name ) { xpath_ /= xpath::element( name ); return xpath_; }
-        const xpath& append( const std::string& name ) { xpath_ /= xpath::element( name ); return xpath_; }
-        const xpath& trim( std::size_t ) { xpath_.elements.back().index = boost::optional< std::size_t >(); return xpath_; }
-        const xpath& trim( const char* ) { xpath_ = xpath_.head(); return xpath_; }
-        const xpath& trim( const std::string& ) { xpath_ = xpath_.head(); return xpath_; }
+        bool _full_path_as_name;
+        xpath _xpath;
+        xpath _root;
+        boost::optional< std::size_t > _index;
+        std::vector< std::string > _names;
+        const xpath& _append( std::size_t index ) { _xpath.elements.back().index = index; return _xpath; }
+        const xpath& _append( const char* name ) { _xpath /= xpath::element( name ); return _xpath; }
+        const xpath& _append( const std::string& name ) { _xpath /= xpath::element( name ); return _xpath; }
+        const xpath& _trim( std::size_t ) { _xpath.elements.back().index = boost::optional< std::size_t >(); return _xpath; }
+        const xpath& _trim( const char* ) { _xpath = _xpath.head(); return _xpath; }
+        const xpath& _trim( const std::string& ) { _xpath = _xpath.head(); return _xpath; }
 };
 
-inline to_names::to_names( bool full_path_as_name ) : full_path_as_name_( full_path_as_name ) {}
-
-inline to_names::to_names( const xpath& root, bool full_path_as_name ) : full_path_as_name_( full_path_as_name ), root_( root ) {}
-
 template < typename K, typename T >
-inline void to_names::apply( const K& name, const boost::optional< T >& value )
-{
-    apply( name, value ? *value : T() );
-}
+inline void to_names::apply( const K& name, const boost::scoped_ptr< T >& value ) { if( value ) { apply( name, *value ); } else { T v; apply( name, v ); } }
 
 template < typename K, typename T >
-inline void to_names::apply( const K& name, const boost::scoped_ptr< T >& value )
-{
-    if( value ) { apply( name, *value ); } else { T v; apply( name, v ); }
-}
+inline void to_names::apply( const K& name, const boost::shared_ptr< T >& value ) { if( value ) { apply( name, *value ); } else { T v; apply( name, v ); } }
 
 template < typename K, typename T >
-inline void to_names::apply( const K& name, const boost::shared_ptr< T >& value )
-{
-    if( value ) { apply( name, *value ); } else { T v; apply( name, v ); }
-}
+inline void to_names::apply( const K& name, const std::unique_ptr< T >& value ) { if( value ) { apply( name, *value ); } else { T v; apply( name, v ); } }
 
 template < typename K, typename T >
 inline void to_names::apply( const K& name, const T& value )
@@ -131,21 +120,17 @@ inline void to_names::apply( const K& name, const T& value )
 template < typename K, typename T >
 inline void to_names::apply_next( const K& name, const T& value )
 {
-    append( name );
+    _append( name );
     comma::visiting::visit( name, value, *this );
-    trim( name );
+    _trim( name );
 }
 
 template < typename K, typename T >
 inline void to_names::apply_final( const K& name, const T& )
 {
-    append( name );
-    if( xpath_ <= root_ ) { names_.push_back( full_path_as_name_ ? xpath_.to_string() : xpath_.elements.back().to_string() ); }
-    trim( name );
+    _append( name );
+    if( _xpath <= _root ) { _names.push_back( _full_path_as_name ? _xpath.to_string() : _xpath.elements.back().to_string() ); }
+    _trim( name );
 }
 
-inline const std::vector< std::string >& to_names::operator()() const { return names_; }
-
 } } } // namespace comma { namespace csv { namespace impl {
-
-#endif // COMMA_CSV_IMPL_TONAMES_H_
diff --git a/csv/impl/unstructured.h b/csv/impl/unstructured.h
index 21d0426d8..617f77b19 100644
--- a/csv/impl/unstructured.h
+++ b/csv/impl/unstructured.h
@@ -27,14 +27,13 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #pragma once
 
 #include <string>
+#include <type_traits>
 #include <vector>
-#include <boost/static_assert.hpp>
 #include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/functional/hash.hpp>
 #include <boost/lexical_cast.hpp>
@@ -67,9 +66,9 @@ struct unstructured
                 return true;
             }
             
-            struct hash : public std::unary_function< values, std::size_t >
+            struct hash // was: public std::unary_function< values, std::size_t > (deprecated in c++11, removed in c++17)
             {
-                std::size_t operator()( values const& p ) const
+                std::size_t operator()( const values& p ) const
                 {
                     std::size_t seed = 0;
                     for( std::size_t i = 0; i < p.size(); ++i ) { hash_combine_impl_( seed, p[i] ); }
@@ -80,7 +79,7 @@ struct unstructured
         private:
             static void hash_combine_impl_( std::size_t& s, const boost::posix_time::ptime& t ) // quick and dirty
             {
-                BOOST_STATIC_ASSERT( sizeof( boost::posix_time::ptime ) == 8 ); // quick and dirty
+                static_assert( sizeof( boost::posix_time::ptime ) == 8, "expected time of size 8" ); // quick and dirty
                 boost::hash_combine( s, reinterpret_cast< const comma::uint64& >( t ) );
             }
             
@@ -198,21 +197,15 @@ struct unstructured
         return f;
     }
     
-    bool operator==( const unstructured& rhs ) const
-    {
-        return longs == rhs.longs && doubles == rhs.doubles && time == rhs.time && strings == rhs.strings;        
-    }
+    bool operator==( const unstructured& rhs ) const { return longs == rhs.longs && doubles == rhs.doubles && time == rhs.time && strings == rhs.strings; }
     
-    bool operator<( const unstructured& rhs ) const
-    {
-        return doubles < rhs.doubles && time < rhs.time && strings < rhs.strings;        
-    }
+    bool operator<( const unstructured& rhs ) const { return longs < rhs.longs || ( !( rhs.longs < longs ) && ( doubles < rhs.doubles || ( !( rhs.doubles < doubles ) && ( time < rhs.time || ( !( rhs.time < time ) && strings < rhs.strings ) ) ) ) ); } // lexicographic by longs, doubles, time, strings: a strict weak ordering over the same members operator== compares (member-wise '<' joined with '&&' is not one and ignored longs)
     
     template < typename T > values< T >& get();
     
     template < typename T > const values< T >& get() const;
         
-    struct hash : public std::unary_function< unstructured, std::size_t >
+    struct hash //: public std::unary_function< unstructured, std::size_t >
     {
         std::size_t operator()( unstructured const& p ) const
         {
diff --git a/csv/names.cpp b/csv/names.cpp
index 76666407c..1a29c5f71 100644
--- a/csv/names.cpp
+++ b/csv/names.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
@@ -36,10 +8,11 @@
 
 namespace comma { namespace csv {
 
-bool fields_exist( const std::vector< std::string >& fields, const std::vector< std::string >& subset )
+bool fields_exist( const std::vector< std::string >& fields, const std::vector< std::string >& subset, bool allow_empty )
 {
     for( unsigned int i = 0; i < subset.size(); ++i )
     {
+        if( allow_empty && subset[i].empty() ) { continue; }
         bool found = false;
         for( unsigned int j = 0; !found && j < fields.size(); found = fields[j] == subset[i], ++j );
         if( !found ) { return false; }
@@ -47,9 +20,6 @@ bool fields_exist( const std::vector< std::string >& fields, const std::vector<
     return true;
 }
 
-bool fields_exist( const std::string& fields, const std::string& subset, char delimiter )
-{
-    return fields_exist( comma::split( fields, delimiter ), comma::split( subset, delimiter ) );
-}
+bool fields_exist( const std::string& fields, const std::string& subset, char delimiter, bool allow_empty ) { return fields_exist( comma::split( fields, delimiter, true ), comma::split( subset, delimiter, true ), allow_empty ); }
 
 } } // namespace comma { namespace csv {
diff --git a/csv/names.h b/csv/names.h
index 37a4d2ede..1fe53f86d 100644
--- a/csv/names.h
+++ b/csv/names.h
@@ -1,38 +1,12 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_NAMES_H_
-#define COMMA_CSV_NAMES_H_
+#pragma once
 
+#include <algorithm>
+#include <vector>
+#include <unordered_map>
 #include "../csv/impl/to_names.h"
 #include "../string/string.h"
 #include "../visiting/apply.h"
@@ -42,28 +16,33 @@ namespace comma { namespace csv {
 
 /// the most generic way: return default column names for
 /// a given sample and given subtree in comma-separated xpaths
-template < typename S >
-std::vector< std::string > names( const std::string& paths, bool useFullxpath = true, const S& sample = S() );
+template < typename S > std::vector< std::string > names( const std::string& paths, bool use_full_xpath = true, const S& sample = S() );
 
 /// return default column names for a given sample and given subtree in comma-separated xpaths
-template < typename S >
-std::vector< std::string > names( const char* paths, bool useFullxpath = true, const S& sample = S() ) { return names( std::string( paths ), useFullxpath, sample ); }
+template < typename S > std::vector< std::string > names( const char* paths, bool use_full_xpath = true, const S& sample = S() ) { return names( std::string( paths ), use_full_xpath, sample ); }
 
 /// return default column names for a given sample
-template < typename S >
-std::vector< std::string > names( bool useFullxpath, const S& sample = S() ) { return names( "", useFullxpath, sample ); }
+template < typename S > std::vector< std::string > names( bool use_full_xpath, const S& sample = S() ) { return names( "", use_full_xpath, sample ); }
+
+/// return default column names for a given sample, replacing full field names with the given aliases
+/// also see the csv::options constructor taking field aliases
+/// attention! aliases: key-value pairs as passed to csv::options: key: alias; value: name
+template < typename S > std::vector< std::string > names( const std::unordered_map< std::string, std::string >& aliases, bool use_full_xpath = true, const S& sample = S() );
 
 /// return default column names for a given sample, use full xpath
-template < typename S >
-std::vector< std::string > names( const S& sample = S() ) { return names( true, sample ); }
+template < typename S > std::vector< std::string > names( const S& sample = S() ) { return names( true, sample ); }
+
+template < typename S > std::unordered_map< std::string, std::string > leaves( const std::string& paths, const S& sample = S() );
+template < typename S > std::unordered_map< std::string, std::string > leaves( const char* paths, const S& sample = S() ) { return leaves( std::string( paths ), sample ); }
+template < typename S > std::unordered_map< std::string, std::string > leaves( const S& sample = S() ) { return leaves( "", sample ); }
 
 /// return true, if all the fields from subset present in fields
 /// @todo make a generic subset application
-bool fields_exist( const std::vector< std::string >& fields, const std::vector< std::string >& subset );
-bool fields_exist( const std::string& fields, const std::string& subset, char delimiter = ',' );
+bool fields_exist( const std::vector< std::string >& fields, const std::vector< std::string >& subset, bool allow_empty = false );
+bool fields_exist( const std::string& fields, const std::string& subset, char delimiter = ',', bool allow_empty = false );
 
 template < typename S >
-inline std::vector< std::string > names( const std::string& paths, bool useFullxpath, const S& sample )
+inline std::vector< std::string > names( const std::string& paths, bool use_full_xpath, const S& sample )
 {
     std::vector< std::string > p = split( paths, ',' );
     std::vector< std::string > r;
@@ -75,7 +54,7 @@ inline std::vector< std::string > names( const std::string& paths, bool useFullx
         }
         else
         {
-            impl::to_names v( p[i], useFullxpath );
+            impl::to_names v( p[i], use_full_xpath );
             visiting::apply( v, sample );
             if( v().empty() ) { r.push_back( p[i] ); } // unknown name, don't replace
             else { r.insert( r.end(), v().begin(), v().end() ); }
@@ -84,6 +63,22 @@ inline std::vector< std::string > names( const std::string& paths, bool useFullx
     return r;
 }
 
-} } // namespace comma { namespace csv {
+template < typename S > // map the names obtained with use_full_xpath = false to the names obtained with use_full_xpath = true, for the given comma-separated paths
+inline std::unordered_map< std::string, std::string > leaves( const std::string& paths, const S& sample )
+{
+    const std::vector< std::string > flat = names< S >( paths, false, sample ); // keys: names with use_full_xpath = false
+    const std::vector< std::string > full = names< S >( paths, true, sample ); // values: names with use_full_xpath = true
+    std::unordered_map< std::string, std::string > m;
+    for( std::size_t i = 0; i < flat.size() && i < full.size(); ++i ) { m.emplace( flat[i], full[i] ); } // plain bounded loop: no std::inserter, hence no dependency on <iterator>, and no read past the end of full; on repeated keys the first entry is kept, as with insert
+    return m;
+}
+
+template < typename S > // default column names of sample in which every name that has an alias is replaced by that alias
+inline std::vector< std::string > names( const std::unordered_map< std::string, std::string >& aliases, bool use_full_xpath, const S& sample )
+{
+    auto n = names( use_full_xpath, sample );
+    for( auto& m: n ) { for( const auto& i: aliases ) { if( i.second == m ) { m = i.first; break; } } } // quick and dirty: linear search by value (key: alias; value: name); const auto& avoids copying both strings of each pair on every iteration
+    return n;
+}
 
-#endif // COMMA_CSV_NAMES_H_
+} } // namespace comma { namespace csv {
diff --git a/csv/options.cpp b/csv/options.cpp
index ce369090e..8fd16e0db 100644
--- a/csv/options.cpp
+++ b/csv/options.cpp
@@ -27,11 +27,11 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #include <boost/regex.hpp>
 #include "../base/exception.h"
+#include "../base/none.h"
 #include "../csv/options.h"
 #include "../string/split.h"
 #include "../string/string.h"
@@ -50,17 +50,18 @@ bool options::binary() const { return static_cast< bool >( format_ ); }
 
 namespace impl {
 
-inline static void init( comma::csv::options& csv_options, const comma::command_line_options& options, const std::string& defaultFields )
+static void init( comma::csv::options& csv_options
+                , const comma::command_line_options& options
+                , const std::string& default_fields
+                , bool full_xpath
+                , const std::unordered_map< std::string, std::string >& field_aliases )
 {
-    csv_options.full_xpath = options.exists( "--full-xpath" );
-    csv_options.fields = options.value( "--fields,-f", defaultFields );
+    csv_options.full_xpath = full_xpath;
+    csv_options.fields = comma::replace( options.value( "--fields,-f", default_fields ), field_aliases );
     if( options.exists( "--binary,-b" ) )
     {
         boost::optional< std::string > format = options.optional< std::string >( "--binary,-b" );
-        if( format )
-        {
-            csv_options.format( options.value< std::string >( "--binary,-b" ) );
-        }
+        if( format ) { csv_options.format( options.value< std::string >( "--binary,-b" ) ); }
     }
     csv_options.precision = options.value< unsigned int >( "--precision", 12 );
     csv_options.delimiter = options.exists( "--delimiter" ) ? options.value( "--delimiter", ',' ) : options.value( "-d", ',' );
@@ -69,9 +70,9 @@ inline static void init( comma::csv::options& csv_options, const comma::command_
     {
         switch( quote_character->size() )
         {
-            case 0: csv_options.quote.reset(); break;
+            case 0: csv_options.quote = silent_none< char >(); break;
             case 1: csv_options.quote = ( *quote_character )[0]; break;
-            case 2: COMMA_THROW( comma::exception, "expected a quote character, got \"" << *quote_character << "\"" );
+            default: COMMA_THROW( comma::exception, "expected a quote character, got \"" << *quote_character << "\"" );
         }
     }
     csv_options.flush = options.exists( "--flush" );
@@ -79,18 +80,13 @@ inline static void init( comma::csv::options& csv_options, const comma::command_
 
 } // namespace impl {
 
-options::options() : full_xpath( false ), delimiter( ',' ), precision( 12 ), quote( '"' ), flush( false ) {}
+options::options(): full_xpath( true ), delimiter( ',' ), precision( 12 ), quote( '"' ), flush( false ) {}
 
-options::options( int argc, char** argv, const std::string& defaultFields )
-{
-    impl::init( *this, comma::command_line_options( argc, argv ), defaultFields );
-}
+options::options( int argc, char** argv, const std::string& default_fields, bool full_xpath ): options( comma::command_line_options( argc, argv ), default_fields, full_xpath ) {}
 
-options::options( const comma::command_line_options& options, const std::string& defaultFields, bool set_full_xpath )
-{
-    impl::init( *this, options, defaultFields );
-    if(set_full_xpath) { full_xpath = true; }
-}
+options::options( const comma::command_line_options& options, const std::string& default_fields, bool full_xpath ) { impl::init( *this, options, default_fields, full_xpath, {} ); }
+
+options::options( const comma::command_line_options& options, const std::unordered_map< std::string, std::string >& field_aliases, const std::string& default_fields ) { impl::init( *this, options, default_fields, true, field_aliases ); }
 
 std::string options::usage( const std::string& default_fields, bool verbose )
 {
@@ -101,9 +97,6 @@ std::string options::usage( const std::string& default_fields, bool verbose )
         oss << "    --fields,-f <names>: comma-separated field names";
         if( !default_fields.empty() ) { oss << "; default: " << default_fields; }
         oss << std::endl;
-        oss << "    --full-xpath: expect full xpaths as field names; default: false" << std::endl;
-        oss << "                  default false was a wrong choice, but changing it" << std::endl;
-        oss << "                  to true now may break too many things" << std::endl;
         oss << "    --precision <precision>: floating point precision; default: 12" << std::endl;
         oss << "    --quote=[<quote_character>]: quote sign to quote strings (ascii only); default: '\"'" << std::endl;
         oss << "    --flush: if present, flush output stream after each record" << std::endl;
@@ -129,12 +122,20 @@ std::string options::usage( const std::string& default_fields, bool verbose )
 bool options::has_field( const std::string& field ) const
 {
     if( field.empty() ) { return false; }
-    const std::vector< std::string >& v = split( fields, ',' );
-    const std::vector< std::string >& f = split( field, ',' );
+    const auto& v = split( fields, ',' );
+    const auto& f = split( field, ',' );
     for( unsigned int i = 0; i < f.size(); ++i ) { if( std::find( v.begin(), v.end(), f[i] ) == v.end() ) { return false; } }
     return true;
 }
 
+std::map< std::string, unsigned int > options::indices() const // non-empty field name -> its position in the comma-separated fields; for a repeated name the last position wins
+{
+    std::map< std::string, unsigned int > positions;
+    unsigned int column = 0;
+    for( const auto& name: split( fields, ',' ) ) { if( !name.empty() ) { positions[name] = column; } ++column; } // empty names are skipped, but still occupy a column
+    return positions;
+}
+
 bool options::has_some_of_fields( const std::string& field ) const
 {
     if( field.empty() ) { return false; }
@@ -174,6 +175,6 @@ bool options::has_some_of_paths( const std::string& paths ) const
     return false;
 }
 
-std::string options::valueless_options() { return "--full-xpath,--flush"; }
+std::string options::valueless_options() { return "--flush"; }
 
 } } // namespace comma { namespace csv {
diff --git a/csv/options.h b/csv/options.h
index 01c561a2a..a3489e9c0 100644
--- a/csv/options.h
+++ b/csv/options.h
@@ -1,36 +1,11 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
 #pragma once
 
+#include <map>
+#include <unordered_map>
 #include <boost/optional.hpp>
 #include "../application/command_line_options.h"
 #include "format.h"
@@ -45,14 +20,22 @@ class options
         options();
 
         /// constructor
-        options( int argc, char** argv, const std::string& defaultFields = "" );
+        options( int argc, char** argv, const std::string& default_fields = "", bool full_xpath = true );
 
         /// constructor
-        options( const comma::command_line_options& options, const std::string& defaultFields = "", bool set_full_xpath = false );
+        options( const comma::command_line_options& options, const std::string& default_fields = "", bool full_xpath = true );
+
+        /// constructor
+        options( const comma::command_line_options& options, const std::unordered_map< std::string, std::string >& field_aliases, const std::string& default_fields = "" );
+
+        /// make options from input options (propagate binary setting, flush, delimiter, etc)
+        /// typical use: make output stream options compatible with the input stream options
+        template < typename T >
+        static options make_same_kind( const options& rhs );
 
         /// return usage to incorporate into application usage
         static std::string usage( const std::string& default_fields = "", bool verbose = true );
-        
+
         /// return usage to incorporate into application usage
         static std::string usage( bool verbose ) { return usage( "", verbose ); }
 
@@ -71,10 +54,10 @@ class options
 
         /// precision
         unsigned int precision;
-        
+
         /// quote sign for strings
         boost::optional< char > quote;
-        
+
         /// if true, flush output stream after each record
         bool flush;
 
@@ -96,21 +79,24 @@ class options
         /// return true, if fields have all given fields (convenience function, slow)
         /// @param field comma-separated fields, e.g. "x,y,z"
         bool has_field( const std::string& fields_to_check ) const;
-        
+
         /// return true, if fields have some given fields (convenience function, slow)
         /// @param field comma-separated fields, e.g. "x,y,z"
         bool has_some_of_fields( const std::string& fields_to_check ) const;
-        
+
         /// return true, if fields have all given paths (convenience function, slow)
         /// @param field comma-separated fields, e.g. fields "centre/position/x,centre/position/y,centre/position/z,..."
         ///              have paths 'centre/position', 'centre', 'centre/position/x', etc
         bool has_paths( const std::string& paths ) const;
-        
+
         /// return true, if fields have some given paths (convenience function, slow)
         /// @param field comma-separated fields, e.g. fields "centre/position/x,centre/position/y,centre/position/z,..."
         ///              have paths 'centre/position', 'centre', 'centre/position/x', etc
         bool has_some_of_paths( const std::string& paths ) const;
 
+        /// return field indices
+        std::map< std::string, unsigned int > indices() const;
+
         /// returns comma separated list of valueless csv options that can be passed to command_line_options.unnamed
         static std::string valueless_options();
 
@@ -118,4 +104,17 @@ class options
         boost::optional< csv::format > format_;
 };
 
+template < typename T > // T: type passed to format::value< T >() to obtain the format when rhs is binary
+inline options options::make_same_kind( const options& rhs )
+{
+    options same; // starts from the defaults of options(); fields is not copied from rhs
+    same.delimiter = rhs.delimiter;
+    same.quote = rhs.quote;
+    same.precision = rhs.precision;
+    same.full_xpath = rhs.full_xpath;
+    same.flush = rhs.flush;
+    if( rhs.binary() ) { same.format( format::value< T >() ); } // binary rhs: result is binary, too, with the format of T; otherwise format is left unset
+    return same;
+}
+
 } } // namespace comma { namespace csv {
diff --git a/csv/split.cpp b/csv/split.cpp
new file mode 100644
index 000000000..bd63fb87f
--- /dev/null
+++ b/csv/split.cpp
@@ -0,0 +1,47 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#include <sstream>
+#include "../timing/conversions.h"
+#include "split.h"
+
+namespace comma { namespace csv { namespace splitting {
+
+/// return help on split/log options, each line prefixed with size spaces;
+/// verbose: list splitting methods and their parameters, otherwise: hint at --help --verbose
+std::string usage( unsigned int size, bool verbose )
+{
+    const std::string indent( size, ' ' );
+    std::ostringstream oss;
+    oss << indent << "split:<options>      : todo" << std::endl;
+    oss << indent << "log:<dir>;<options>  : log in timestamped files" << std::endl;
+    if( !verbose ) { oss << indent << "    run --help --verbose for details..." << std::endl; return oss.str(); }
+    static const char* const details[] =
+    {
+        "    <options>: <how>[;<parameters>]",
+        "        by-time;period=<seconds>[;align]",
+        "            period=<seconds>: create a new file if next",
+        "                              timestamp passes <seconds> deadline",
+        "            align : align deadline timestamp and respective filename",
+        "                    exactly with the period (todo, just ask)",
+        "        by-size;size=<bytes>",
+        "            size=<bytes>: create files not larger than <bytes>",
+        "                          may not be exact on ascii output",
+        "        by-block"
+    };
+    for( const char* line: details ) { oss << indent << line << std::endl; }
+    return oss.str();
+}
+
+std::ofstream* ofstream::update( boost::posix_time::ptime t ) // start a new file <dir>/<iso string of t>.<suffix>
+{
+    _ofs.reset(); // close the previous file, if any, before the next one is opened
+    _time = t;
+    _filename = _dir + "/" + timing::to_iso_string( t ) + "." + _suffix;
+    _ofs = std::make_unique< std::ofstream >( _filename );
+    COMMA_ASSERT( _ofs->is_open(), "failed to open '" << _filename << "'" );
+    return _ofs.get();
+}
+
+} } } // namespace comma { namespace csv { namespace splitting {
diff --git a/csv/split.h b/csv/split.h
new file mode 100644
index 000000000..cdb346ab0
--- /dev/null
+++ b/csv/split.h
@@ -0,0 +1,288 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <fstream>
+#include "../base/exception.h"
+#include "../base/none.h"
+#include "../io/stream.h"
+#include "../string/string.h"
+#include "../timing/duration.h"
+#include "options.h"
+#include "stream.h"
+
+namespace comma { namespace csv {
+
+namespace splitting {
+
+std::string usage( unsigned int indent = 0, bool verbose = false );
+
+template < typename T >
+struct type_traits // accessors used by the splitting methods; this generic version reads the members t, block, and id of T
+{
+    static boost::posix_time::ptime time( const T& t ) { return t.t; } // timestamp of the record
+    static unsigned int block( const T& t ) { return t.block; } // block number of the record
+    static unsigned int id( const T& t ) { return t.id; } // id of the record
+};
+
+class ofstream // owns at most one output file at a time, named <dir>/<timestamp>.<suffix> (see update() in split.cpp)
+{
+    public:
+        ofstream( const std::string& dir, const std::string& suffix ): _dir( dir ), _suffix( suffix ) {}
+        ofstream( const std::string& dir, const options& csv ): _dir( dir ), _suffix( csv.binary() ? "bin" : "csv" ) {} // suffix follows the csv kind
+        std::ofstream* update( boost::posix_time::ptime t ); // close the current file, if any, and open a new one stamped with t
+        template < typename T > std::ofstream* update( const T& t ) { return update( splitting::type_traits< T >::time( t ) ); } // same, with the time taken from the record
+        std::ofstream* operator()() { return _ofs.get(); } // current file; nullptr before the first update()
+        boost::posix_time::ptime time() const { return _time; } // time passed to the last update()
+        const std::string& dir() const { return _dir; }
+        const std::string& filename() const { return _filename; } // name of the current file; empty before the first update()
+    
+    protected:
+        std::string _dir;
+        std::string _suffix;
+        std::string _filename;
+        boost::posix_time::ptime _time;
+        std::unique_ptr< std::ofstream > _ofs;
+};
+
+template < typename T >
+struct method // interface of a splitting method: decides which stream each record goes to
+{
+    virtual ~method() {}
+    virtual void wrote( unsigned int size ) {} // called by split::write() with the number of bytes just written; no-op by default
+    virtual std::ostream* stream( const T& t, unsigned int size = 0 ) = 0; // stream to write record t to; split::write() treats nullptr as end of stream
+    virtual boost::posix_time::ptime time() const { return boost::posix_time::ptime(); } // quick and dirty for now
+    virtual const std::string& address() const = 0; // pure: it was declared, but never defined in this header, leaving an undefined symbol in the vtable
+};
+
+template < typename T >
+class to_timestamped_files: public method< T > // base of the methods that write to files managed by splitting::ofstream
+{
+    public:
+        to_timestamped_files( const std::string& dir, const options& csv ): _ofs( dir, csv ) {}
+        boost::posix_time::ptime time() const { return _ofs.time(); } // time the current file was started with
+        const splitting::ofstream& ofs() const { return _ofs; }
+        const std::string& address() const { return _ofs.dir(); } // address of such a method is its output directory
+
+    protected:
+        splitting::ofstream _ofs;
+};
+
+template < typename T >
+class none: public method< T > // no splitting: every record goes to the one stream constructed from address
+{
+    public:
+        none( const std::string& address ): _address( address ), _ostream( address ) {} // initialisers in declaration order (they were reversed: -Wreorder)
+        std::ostream* stream( const T&, unsigned int ) { return _ostream(); } // same stream for all records
+        const std::string& address() const { return _address; }
+    
+    private:
+        std::string _address;
+        io::ostream _ostream;
+};
+
+template < typename T >
+class by_time: public to_timestamped_files< T > // starts a new file, once a record is stamped at or after the current deadline
+{
+    public:
+        by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv, bool align = false ); // throws, if align is true: not implemented yet
+        by_time( double max_duration, const std::string& dir, const options& csv, bool align ): by_time( timing::duration::from_seconds( max_duration ), dir, csv, align ) {} // same, with max_duration in seconds
+        std::ostream* stream( const T& t, unsigned int ) { auto d = splitting::type_traits< T >::time( t ); return _is_due( d ) ? this->_ofs.update( d ) : this->_ofs(); } // a new file, if due, the current one otherwise
+    
+    private:
+        boost::posix_time::time_duration _max_duration;
+        bool _align{false};
+        boost::posix_time::ptime _deadline; // time of the record that started the current file plus _max_duration
+
+        bool _is_due( boost::posix_time::ptime t );
+};
+
+template < typename T >
+class by_size: public to_timestamped_files< T > // starts a new file, when the next record is not expected to fit into the remaining byte budget
+{
+    public:
+        by_size( std::size_t size, const std::string& dir, const options& csv );
+        std::ostream* stream( const T& t, unsigned int size = 0 ) { return _is_due( size ) ? this->_ofs.update( t ) : this->_ofs(); } // a new file, if due, the current one otherwise
+        void wrote( unsigned int size ); // deduct size bytes from the budget of the current file
+
+    private:
+        std::size_t _size{0}; // byte budget per file
+        std::size_t _record_size{0}; // fixed record size for binary; 0 for ascii
+        double _average_record_size{0}; // ascii only: running average of the sizes passed to wrote()
+        std::size_t _count{0}; // ascii only: number of wrote() calls
+        std::size_t _remaining{0}; // bytes left in the budget of the current file
+
+        bool _is_due( unsigned int extra_size );
+};
+
+template < typename T >
+class by_block: public to_timestamped_files< T > // starts a new file, whenever the block of a record differs from the block of the previous record
+{
+    public:
+        by_block( const std::string& dir, const options& csv ): to_timestamped_files< T >( dir, csv ), _block( silent_none< unsigned int >() ) {}
+        std::ostream* stream( const T& t, unsigned int ) { return _is_due( splitting::type_traits< T >::block( t ) ) ? this->_ofs.update( t ) : this->_ofs(); } // a new file, if due, the current one otherwise
+
+    private:
+        boost::optional< unsigned int > _block; // block of the previous record; not set before the first record
+
+        bool _is_due( unsigned int block );
+};
+
+template < typename T >
+class by_id; // todo
+
+} // namespace splitting {
+
+template < typename T >
+class split // csv output that lets a splitting method choose the destination stream of each record
+{
+    public:
+        split( splitting::method< T >* how, const options& csv, const T& sample = T() ): _how( how ), _options( csv ), _sample( sample ) {} // takes ownership of how
+        split& write( const T& t, const char* buf, unsigned int size, bool flush = false ); // write record t, then size bytes of buf, if buf is not null
+        void flush() { if( _os ) { _os->flush(); } }
+        split& operator<<( const T& t ) { return write( t, nullptr, 0 ); } // record only, no extra payload
+        bool eof() const { return _eof || ( _os && _os->eof() ); }
+        static split< T >* make( const std::string& options, const csv::options& csv, bool permissive = false, const T& sample = T() ); // parse e.g. 'log:<dir>;by-block'; returns a new split
+        const splitting::method< T >& how() { return *_how; }
+
+    protected:
+        std::unique_ptr< splitting::method< T > > _how;
+        options _options;
+        T _sample;
+        bool _eof{false}; // set by write(), once the method returns no stream or a stream at eof
+        std::ostream* _os{nullptr}; // stream last returned by _how; not owned
+        std::unique_ptr< output_stream< T > > _ostream; // csv writer bound to *_os
+        void _init(); // NOTE(review): no definition visible in this header - confirm it is still needed
+};
+
+/// write record t and then, if buf is not null, size bytes of buf to the stream chosen by the splitting method
+/// @param size number of bytes in buf; also passed to the splitting method as the size of extra payload
+/// @param flush if true, flush the stream after writing
+/// @return *this; once the method returns no stream or a stream at eof, eof() becomes true and nothing is written
+template < typename T > inline split< T >& split< T >::write( const T& t, const char* buf, unsigned int size, bool flush )
+{
+    COMMA_ASSERT( !_eof, "end of stream" );
+    std::ostream* os = _how->stream( t, size ); // size was not passed before, so by-size never saw the extra payload, when deciding whether a new file is due
+    if( !os || os->eof() ) { _eof = true; _os = nullptr; return *this; }
+    // NOTE(review): streams are compared by address only - confirm a new file can never reuse the address of the closed one
+    if( _os != os )
+    {
+        _ostream.reset();
+        _os = os;
+        _ostream = std::make_unique< output_stream< T > >( *_os, _options, _sample );
+    }
+    _ostream->write( t );
+    if( buf ) { _os->write( buf, size ); }
+    if( flush ) { _os->flush(); }
+    _how->wrote( _ostream->last_size() + size );
+    return *this;
+}
+
+/// make a split from a string: 'log:<dir>;by-time;period=<seconds>', 'log:<dir>;by-size;size=<bytes>', or 'log:<dir>;by-block'
+/// @param permissive if true, return nullptr rather than throw on an unknown keyword or method, or on a missing period or size;
+///                   'split:...' and 'log:...' without <dir>;<method> throw regardless
+template < typename T > inline split< T >* split< T >::make( const std::string& options, const csv::options& csv, bool permissive, const T& sample )
+{
+    const auto& v = comma::split_head( options, 2, ':' );
+    if( v[0] == "split" ) { COMMA_THROW( comma::exception, "on '" << options << "': 'split': todo, just ask" ); }
+    if( v[0] == "log" ) // todo: reimplement using comma::variant
+    {
+        const auto& w = comma::split( v.size() > 1 ? v[1] : std::string(), ';' ); // guard: v may have a single element, if options has no ':' - TODO confirm split_head()
+        COMMA_ASSERT( w.size() >= 2, "expected log:<dir>;<method>[;<options>]; got: '" << options << "'" );
+        std::string dir = w[0];
+        std::string method = w[1];
+        if( method == "by-time" )
+        {
+            boost::optional< double > period = silent_none< double >();
+            bool align{false};
+            for( unsigned int i = 2; i < w.size(); ++i )
+            {
+                const auto& s = comma::split( w[i], '=' );
+                if( s[0] == "period" && s.size() == 2 ) { period = boost::lexical_cast< double >( s[1] ); }
+                else if( ( s[0] == "align" && s.size() == 1 ) || w[i] == "align=true" || w[i] == "align=1" ) { align = true; }
+            }
+            if( period ) { return new split< T >( new splitting::by_time< T >( *period, dir, csv, align ), csv, sample ); }
+            if( permissive ) { return nullptr; }
+            COMMA_THROW( comma::exception, "expected 'log:<dir>;by-time;period=<seconds>[;align]'; got: '" << options << "'" );
+        }
+        if( method == "by-size" )
+        {
+            for( unsigned int i = 2; i < w.size(); ++i )
+            {
+                const auto& s = comma::split( w[i], '=' );
+                if( s[0] == "size" && s.size() == 2 )
+                {
+                    // a valid spec is honoured in permissive mode, too (it used to return nullptr): permissive only replaces throwing
+                    return new split< T >( new splitting::by_size< T >( boost::lexical_cast< unsigned int >( s[1] ), dir, csv ), csv, sample );
+                }
+            }
+            if( permissive ) { return nullptr; }
+            COMMA_THROW( comma::exception, "expected 'log:<dir>;by-size;size=<bytes>'; got: '" << options << "'" );
+        }
+        if( method == "by-block" ) { return new split< T >( new splitting::by_block< T >( dir, csv ), csv, sample ); }
+        if( permissive ) { return nullptr; }
+        COMMA_THROW( comma::exception, "expected 'by-time', 'by-size' or 'by-block', got: '" << method << "' in '" << options << "'" );
+    }
+    if( permissive ) { return nullptr; }
+    COMMA_THROW( comma::exception, "expected 'split' or 'log', got: '" << v[0] << "' in '" << options << "'" );
+}
+
+namespace splitting {
+
+template < typename T >
+inline by_time< T >::by_time( boost::posix_time::time_duration max_duration, const std::string& dir, const options& csv, bool align )
+    : to_timestamped_files< T >( dir, csv )
+    , _max_duration( max_duration )
+    , _align( align )
+{
+    COMMA_THROW_IF( align, "align: todo, just ask" ); // alignment is not implemented yet: refuse it rather than silently ignore it
+}
+
+template < typename T > inline bool by_time< T >::_is_due( boost::posix_time::ptime t ) // true, if record stamped with t has to start a new file
+{
+    const bool started = !_deadline.is_not_a_date_time(); // deadline gets set on the first record
+    if( started && t < _deadline ) { return false; }
+    _deadline = t + _max_duration; // the file started now lasts until a record is stamped at or after this time
+    return true;
+}
+
+template < typename T >
+inline by_size< T >::by_size( std::size_t size, const std::string& dir, const options& csv )
+    : to_timestamped_files< T >( dir, csv )
+    , _size( size )
+    , _record_size( csv.binary() ? csv.format().size() : 0 ) // fixed record size for binary; 0 for ascii, where wrote() keeps a running average instead
+{
+}
+
+template < typename T > inline bool by_size< T >::_is_due( unsigned int extra_size ) // true (and the byte budget is reset), if the next record has to start a new file
+{
+    const std::size_t expected = _record_size ? _record_size + extra_size : ( unsigned int )( _average_record_size );
+    if( this->_ofs() && expected <= _remaining ) { return false; } // no file open yet: always due; otherwise ascii (average 0, remaining 0) would never get its first file
+    _remaining = _size + extra_size;
+    return true;
+}
+
+/// update the byte budget of the current file after a record has been written
+/// @param size number of bytes written
+template < typename T > inline void by_size< T >::wrote( unsigned int size )
+{
+    if( _remaining >= size ) { _remaining -= size; } else { _remaining = 0; } // clamp at zero rather than wrap around
+    if( _record_size != 0 ) { return; } // fixed record size: nothing to estimate
+    if( ++_count == 1 ) { _average_record_size = size; return; }
+    const double weight = 1. / _count;
+    _average_record_size = ( 1 - weight ) * _average_record_size + weight * size; // quick and dirty
+}
+
+template < typename T > inline bool by_block< T >::_is_due( unsigned int block ) // true, if block differs from the block of the previous record
+{
+    const bool same = _block && *_block == block; // _block is not set before the first record
+    if( same ) { return false; }
+    _block = block;
+    return true;
+}
+
+} // namespace splitting {
+
+} } // namespace comma { namespace csv {
diff --git a/csv/stream.h b/csv/stream.h
index 815878ad1..93a829353 100644
--- a/csv/stream.h
+++ b/csv/stream.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_STREAM_H_
-#define COMMA_CSV_STREAM_H_
+#pragma once
 
 #ifdef WIN32
 #include <stdio.h>
@@ -39,6 +10,7 @@
 #include <io.h>
 #endif
 
+#include <fstream>
 #include <iostream>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/noncopyable.hpp>
@@ -53,10 +25,28 @@ namespace comma { namespace csv {
 /// @todo document
 namespace detail { void unsynchronize_with_stdio(); }
 
-template < typename S > class output_stream;
+/// generic input stream
 template < typename S > class input_stream;
+
+/// generic output stream
+template < typename S > class output_stream;
+
+/// tied input and output streams
 template < typename S, typename T > class tied;
 
+/// input stream passed through
+template < typename S > class passed;
+
+/// convenience functions: read input stream into a container that has push_back() method
+template < typename V > V read_as( const options& o, const typename V::value_type& default_value = typename V::value_type(), std::size_t size = 0 );
+template < typename V > V read_as( std::istream& is, const options& o = options(), std::size_t size = 0 );
+template < typename V > V read_as( const std::string& filename, const options& o = options(), std::size_t size = 0 );
+template < typename V > V read_as( std::istream& is, const options& o, const typename V::value_type& default_value, std::size_t size = 0 );
+template < typename V > V read_as( const std::string& filename, const options& o, const typename V::value_type& default_value, std::size_t size = 0 );
+
+/// convenience functions: write to output stream from a non-mapped container
+template < typename V > void write( const V& v, std::ostream& os, const options& o, const typename V::value_type& default_value );
+template < typename V > void write( const V& v, std::ostream& os, const options& o = options() );
 
 /// ascii csv input stream
 template < typename S >
@@ -64,7 +54,7 @@ class ascii_input_stream : public boost::noncopyable
 {
     public:
         /// constructor
-        ascii_input_stream( std::istream& is, const std::string& column_names = "", char delimiter = ',', bool full_path_as_name = false, const S& sample = S() );
+        ascii_input_stream( std::istream& is, const std::string& column_names = "", char delimiter = ',', bool full_path_as_name = true, const S& sample = S() );
 
         /// constructor from csv options
         ascii_input_stream( std::istream& is, const options& o, const S& sample = S() );
@@ -115,7 +105,7 @@ class ascii_output_stream : public boost::noncopyable
 {
     public:
         /// constructor
-        ascii_output_stream( std::ostream& os, const std::string& column_names = "", char delimiter = ',', bool full_path_as_name = false, const S& sample = S() );
+        ascii_output_stream( std::ostream& os, const std::string& column_names = "", char delimiter = ',', bool full_path_as_name = true, const S& sample = S() );
 
         /// constructor from csv options
         ascii_output_stream( std::ostream& os, const options& o, const S& sample = S() );
@@ -148,8 +138,11 @@ class ascii_output_stream : public boost::noncopyable
         /// return fields
         const std::vector< std::string >& fields() const { return fields_; }
 
+        /// return size of last output record in bytes
+        unsigned int last_size() const { return _last_size; }
+
     private:
-        friend class output_stream<S>;
+        friend class output_stream< S >;
         template < typename W, typename T>
         friend class tied;
         template < typename V, typename T, typename Data >
@@ -158,6 +151,7 @@ class ascii_output_stream : public boost::noncopyable
         std::ostream& os_;
         csv::ascii< S > ascii_;
         std::vector< std::string > fields_;
+        unsigned int _last_size{0};
 };
 
 /// binary csv input stream
@@ -166,7 +160,7 @@ class binary_input_stream : public boost::noncopyable
 {
     public:
         /// constructor
-        binary_input_stream( std::istream& is, const std::string& format = "", const std::string& column_names = "", bool full_path_as_name = false, const S& sample = S() );
+        binary_input_stream( std::istream& is, const std::string& format = "", const std::string& column_names = "", bool full_path_as_name = true, const S& sample = S() );
 
         /// constructor from options
         binary_input_stream( std::istream& is, const options& o, const S& sample = S() );
@@ -215,7 +209,7 @@ class binary_output_stream : public boost::noncopyable
 {
     public:
         /// constructor
-        binary_output_stream( std::ostream& os, const std::string& format = "", const std::string& column_names = "", bool full_path_as_name = false, bool flush = false, const S& sample = S() );
+        binary_output_stream( std::ostream& os, const std::string& format = "", const std::string& column_names = "", bool full_path_as_name = true, bool flush = false, const S& sample = S() );
 
         /// constructor from options
         binary_output_stream( std::ostream& os, const options& o, const S& sample = S() );
@@ -238,6 +232,9 @@ class binary_output_stream : public boost::noncopyable
         /// return fields
         const std::vector< std::string >& fields() const { return fields_; }
 
+        /// record size
+        unsigned int size() const { return _size; }
+
     private:
         template < typename W, typename T>
         friend class tied;
@@ -254,6 +251,7 @@ class binary_output_stream : public boost::noncopyable
         //char* cur_;
         std::vector< std::string > fields_;
         bool flush_;
+        unsigned int _size{};
         /// bool is_stdout;
 };
 
@@ -320,7 +318,7 @@ class output_stream : public boost::noncopyable
         /// construct from csv options
         output_stream( std::ostream& os, const csv::options& o, const S& sample = S() );
 
-        output_stream( std::ostream& os, bool binary, bool full_xpath = false, bool flush = false, const S& sample = S() );
+        output_stream( std::ostream& os, bool binary, bool full_xpath = true, bool flush = false, const S& sample = S() );
 
         /// write
         void write( const S& s ) { if( ascii_ ) { ascii_->write( s ); } else { binary_->write( s ); } }
@@ -359,6 +357,9 @@ class output_stream : public boost::noncopyable
 
         std::ostream& os() { return binary_ ? binary_->os_ : ascii_->os_; }
 
+        /// return size of last output record in bytes
+        unsigned int last_size() const { return binary_ ? binary_->size() : ascii_->last_size(); }
+
     private:
         boost::scoped_ptr< ascii_output_stream< S > > ascii_;
         boost::scoped_ptr< binary_output_stream< S > > binary_;
@@ -436,11 +437,29 @@ template < typename S >
 class passed
 {
     public:
-        passed( const input_stream< S >& is, std::ostream& os, bool flush=false ) : is_( is ), os_( os ), flush(flush)
-        {
-            #ifdef WIN32
-            if( is_.is_binary() && os == std::cout ) { _setmode( _fileno( stdout ), _O_BINARY ); }
-            #endif // #ifdef WIN32
+        passed( const input_stream< S >& is, std::ostream& os, bool flush = false );
+
+        void write();
+        
+        void write( const S& s );
+
+    private:
+        const input_stream< S >& is_;
+        std::ostream& os_;
+        std::string buffer_;
+        bool flush;
+        bool is_stdout_;
+};
+
+template < typename S >
+inline passed< S > make_passed( const input_stream< S >& is, std::ostream& os, bool flush = false ) { return passed< S >( is, os, flush ); }
+ 
+template < typename S >
+inline passed< S >::passed( const input_stream< S >& is, std::ostream& os, bool flush ) : is_( is ), os_( os ), flush( flush )
+{
+    #ifdef WIN32
+    if( is_.is_binary() && os == std::cout ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+    #endif // #ifdef WIN32
 // In using view-points in 'pass' mode there were issues with the write method.
 // How to reproduce: take some nav data in t,6d format. Store as in.bin and other.bin.
 //
@@ -485,29 +504,59 @@ class passed
 //  - according to git grep, only view-points was using this class template at the moment; therefore,
 //    the change is very localized and we preserve it in this class
 //  - however, all the other similar modifications have been commented out using /// symbol
-            is_stdout_ = os.rdbuf() == std::cout.rdbuf();
-        }
+    is_stdout_ = os.rdbuf() == std::cout.rdbuf();
+}
 
-        void write()
+template < typename S >
+inline void passed< S >::write()
+{
+    if( is_.is_binary() )
+    {
+        if( is_stdout_ )
         {
-            if( is_.is_binary() ) {
-                if ( is_stdout_ ) {
-                    ::write( 1, is_.binary().last(), is_.binary().size() );
-                    if(flush) { ::fflush( stdout ); }
-                } else {
-                    os_.write( is_.binary().last(), is_.binary().size() );
-                    if(flush) { os_.flush(); }
-                }
-            }
-            else os_ << comma::join( is_.ascii().last(), is_.ascii().ascii().delimiter() ) << std::endl;
+            auto r = ::write( 1, is_.binary().last(), is_.binary().size() );
+            ( void ) r;
+            if( flush ) { ::fflush( stdout ); }
         }
+        else
+        {
+            os_.write( is_.binary().last(), is_.binary().size() );
+            if( flush ) { os_.flush(); }
+        }
+    }
+    else
+    {
+        os_ << comma::join( is_.ascii().last(), is_.ascii().ascii().delimiter() ) << std::endl;
+    }
+}
 
-    private:
-        const input_stream< S >& is_;
-        std::ostream& os_;
-        bool flush;
-        bool is_stdout_;
-};
+/// output a copy of the last input record with s put into it
+template < typename S > inline void passed< S >::write( const S& s )
+{
+    if( !is_.is_binary() ) // ascii: put s into a copy of the last line's fields and re-join them
+    {
+        std::vector< std::string > fields = is_.ascii().last();
+        is_.ascii().ascii().put( s, fields );
+        os_ << comma::join( fields, is_.ascii().ascii().delimiter() ) << std::endl;
+        return;
+    }
+    const auto size = is_.binary().size();
+    buffer_.resize( size );
+    char* const record = &buffer_[0];
+    ::memcpy( record, is_.binary().last(), size ); // quick and dirty
+    is_.binary().binary().put( s, record );
+    if( is_stdout_ ) // stdout is written with ::write() on descriptor 1 rather than through os_
+    {
+        const auto written = ::write( 1, record, size );
+        ( void ) written; // result deliberately ignored
+        if( flush ) { ::fflush( stdout ); }
+    }
+    else
+    {
+        os_.write( record, size );
+        if( flush ) { os_.flush(); }
+    }
+}
 
 template < typename S >
 inline ascii_input_stream< S >::ascii_input_stream( std::istream& is, const std::string& column_names, char delimiter, bool full_path_as_name, const S& sample )
@@ -600,8 +649,7 @@ inline void ascii_output_stream< S >::write( const S& s )
 template < typename S >
 inline void ascii_output_stream< S >::write( const S& s, const std::string& line )
 {
-    write( s, split
-( line, ascii_.delimiter() ) );
+    write( s, split( line, ascii_.delimiter() ) );
 }
 
 template < typename S >
@@ -617,7 +665,8 @@ inline void ascii_output_stream< S >::write( const S& s, std::vector< std::strin
     ascii_.put( s, v );
     if( v.empty() ) { return; } // never here, though
     os_ << v[0];
-    for( std::size_t i = 1; i < v.size(); ++i ) { os_ << ascii_.delimiter() << v[i]; }
+    _last_size = v[0].size() + 1; // first field and the end of line were not counted; the loop adds each delimiter and remaining field
+    for( std::size_t i = 1; i < v.size(); ++i ) { os_ << ascii_.delimiter() << v[i]; _last_size += v[i].size() + 1; }
     os_ << std::endl;
 }
 
@@ -681,6 +730,7 @@ inline binary_output_stream< S >::binary_output_stream( std::ostream& os, const
     //, cur_( begin_ )
     , fields_( split( column_names, ',' ) )
     , flush_( flush )
+    , _size( binary_.format().size() )
     /// , is_stdout( os_.rdbuf() == std::cout.rdbuf() )
 {
     #ifdef WIN32
@@ -701,6 +751,7 @@ inline binary_output_stream< S >::binary_output_stream( std::ostream& os, const
     , fields_( split( o.fields, ',' ) )
     , flush_( o.flush )
     /// , is_stdout( os_.rdbuf() == std::cout.rdbuf() )
+    , _size( binary_.format().size() )
 {
     #ifdef WIN32
     if( &os == &std::cout ) { _setmode( _fileno( stdout ), _O_BINARY ); }
@@ -804,6 +855,45 @@ inline void output_stream< S >::append_output( input_stream< T >& is, const S& s
     }
 }*/
 
-} } // namespace comma { namespace csv {
+template < typename V > inline void write( const V& v, std::ostream& os, const options& o ) { if( v.empty() ) { return; } write( v, os, o, typename V::value_type() ); } // sample: default-constructed element
+
+template < typename V > inline void write( const V& v, std::ostream& os, const options& o, const typename V::value_type& default_value ) // write all elements of v to os
+{
+    if( v.empty() ) { return; } // nothing to write: do not even construct the output stream
+    output_stream< typename V::value_type > ostream( os, o, default_value );
+    for( auto it = v.begin(); it != v.end(); ++it )
+    {
+        COMMA_ASSERT( os.good(), "output stream not good" );
+        ostream.write( *it );
+    }
+    if( o.flush ) { os.flush(); }
+}
 
-#endif /*COMMA_CSV_STREAM_H_*/
+template < typename V > inline V read_as( std::istream& is, const options& o, const typename V::value_type& default_value, std::size_t size ) // read up to size records; all records, if size is 0
+{
+    input_stream< typename V::value_type > istream( is, o, default_value );
+    V records;
+    for( std::size_t count = 0; ( size == 0 || count < size ) && ( istream.ready() || is.good() ); ++count )
+    {
+        const auto record = istream.read();
+        if( !record ) { break; } // nothing more to read
+        records.push_back( *record );
+    }
+    return records;
+}
+
+template < typename V > inline V read_as( const std::string& filename, const options& o, const typename V::value_type& default_value, std::size_t size ) // read records from file; throws, if it cannot be opened
+{
+    const std::ios_base::openmode mode = o.binary() ? std::ios_base::in | std::ios_base::binary : std::ios_base::in;
+    std::ifstream ifs( filename.c_str(), mode );
+    if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "failed to open '" << filename << "'" ); }
+    return read_as< V >( ifs, o, default_value, size );
+}
+
+template < typename V > inline V read_as( const std::string& filename, const options& o, std::size_t size ) { return read_as< V >( filename, o, typename V::value_type(), size ); } // from file, with default-constructed sample
+
+template < typename V > inline V read_as( std::istream& is, const options& o, std::size_t size ) { return read_as< V >( is, o, typename V::value_type(), size ); } // from stream, with default-constructed sample
+
+template < typename V > inline V read_as( const options& o, const typename V::value_type& default_value, std::size_t size ) { return read_as< V >( o.filename, o, default_value, size ); } // from the file named in o.filename
+
+} } // namespace comma { namespace csv {
diff --git a/csv/test/CMakeLists.txt b/csv/test/CMakeLists.txt
index 6e6184332..4bbc487c2 100644
--- a/csv/test/CMakeLists.txt
+++ b/csv/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT csv )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_xpath comma_string comma_csv ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# unit tests of comma_csv: one gtest executable built from all *test.cpp in ${KIT}/test
+set( KIT csv )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name}
+    PRIVATE comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
+# COMMAND is given as the target name, so that it resolves to the built executable
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    # install the built target itself, rather than copying the binary from ${PROJECT_BINARY_DIR}/bin
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/csv/test/ascii_test.cpp b/csv/test/ascii_test.cpp
index a6f61643c..3a2e3e521 100644
--- a/csv/test/ascii_test.cpp
+++ b/csv/test/ascii_test.cpp
@@ -30,6 +30,9 @@
 
 #include <gtest/gtest.h>
 #include <boost/date_time/posix_time/posix_time.hpp>
+#if ( BOOST_VERSION >= 107400 ) // quick and dirty; fixing trivial compilation error
+#include <boost/optional/optional_io.hpp>
+#endif
 #include "../../csv/ascii.h"
 #include "../../string/string.h"
 
@@ -37,25 +40,23 @@ namespace comma { namespace csv { namespace ascii_test {
 
 struct nested
 {
-    int x;
-    int y;
-    nested() : x( 0 ), y( 0 ) {}
+    int x{0};
+    int y{0};
 };
 
 struct simple_struct
 {
-    int a;
-    double b;
-    char c;
+    int a{0};
+    double b{0};
+    char c{0};
     std::string s;
     boost::posix_time::ptime t;
     ascii_test::nested nested;
-    simple_struct() : a( 0 ), b( 0 ), c( 0 ) {}
 };
 
 struct test_struct
 {
-    int a;
+    int a{0};
     boost::optional< int > z;
     boost::optional< ascii_test::nested > nested;
 };
@@ -209,6 +210,26 @@ TEST( csv, ascii_get )
 
 TEST( csv, ascii_put )
 {
+}
+
+TEST( csv, ascii_put_string )
+{
+    typedef comma::csv::ascii_test::simple_struct value_t;
+    typedef comma::csv::ascii< value_t > ascii_t;
+    EXPECT_EQ( ascii_t().put( value_t{} ), "0,0,0,\"\",not-a-date-time,0,0" );
+    EXPECT_EQ( ascii_t().put( value_t{1,2,3,"XXX"} ), "1,2,3,\"XXX\",not-a-date-time,0,0" );
+    {
+        comma::csv::options csv;
+        csv.quote.reset();
+        EXPECT_EQ( ascii_t( csv ).put( value_t{} ), "0,0,0,,not-a-date-time,0,0" );
+        EXPECT_EQ( ascii_t( csv ).put( value_t{1,2,3,"XXX"} ), "1,2,3,XXX,not-a-date-time,0,0" );
+    }
+    {
+        comma::csv::options csv;
+        csv.quote = '#';
+        EXPECT_EQ( ascii_t( csv ).put( value_t{} ), "0,0,0,##,not-a-date-time,0,0" );
+        EXPECT_EQ( ascii_t( csv ).put( value_t{1,2,3,"XXX"} ), "1,2,3,#XXX#,not-a-date-time,0,0" );
+    }
     // todo
 }
 
diff --git a/csv/test/binary_test.cpp b/csv/test/binary_test.cpp
index f61d4b50d..87cd46bb4 100644
--- a/csv/test/binary_test.cpp
+++ b/csv/test/binary_test.cpp
@@ -1,34 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 #include <gtest/gtest.h>
+#include <array>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include "../../csv/binary.h"
 #include "../../csv/format.h"
@@ -309,11 +283,11 @@ static void test_binary_cast( const char* format, T t, S expected )
 {
     comma::csv::binary< test_cast< T > > bt( format );
     comma::csv::binary< test_cast< S > > bs( format );
-    char buf[16] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 }; // just to trash it
+    std::string buf = "abcdefghijklmnop"; // just to trash it
     test_cast< T > vt( t );
     test_cast< S > vs;
-    bt.put( vt, buf );
-    bs.get( vs, buf );
+    bt.put( vt, &buf[0] );
+    bs.get( vs, &buf[0] );
     test_traits< T >::expect_equal( vs.value, expected );
 }
 
diff --git a/csv/test/csv-blocks/group/expected b/csv/test/csv-blocks/group/expected
new file mode 100644
index 000000000..52255b96a
--- /dev/null
+++ b/csv/test/csv-blocks/group/expected
@@ -0,0 +1,112 @@
+group/scalar/gap[0]/output/line[0]="1.1,0"
+group/scalar/gap[0]/output/line[1]="2,1"
+group/scalar/gap[0]/output/line[2]="5,2"
+group/scalar/gap[0]/output/line[3]="5.9,3"
+group/scalar/gap[0]/status=0
+group/scalar/gap[1]/output/line[0]="1.1,0"
+group/scalar/gap[1]/output/line[1]="2,0"
+group/scalar/gap[1]/output/line[2]="5,1"
+group/scalar/gap[1]/output/line[3]="5.9,1"
+group/scalar/gap[1]/status=0
+group/scalar/gap[2]/output/line[0]="1.1,0"
+group/scalar/gap[2]/output/line[1]="2,0"
+group/scalar/gap[2]/output/line[2]="5,0"
+group/scalar/gap[2]/output/line[3]="5.9,0"
+group/scalar/gap[2]/status=0
+group/scalar/gap[3]/output/line[0]="19700101T000001.100000,0"
+group/scalar/gap[3]/output/line[1]="19700101T000002,1"
+group/scalar/gap[3]/output/line[2]="19700101T000005,2"
+group/scalar/gap[3]/output/line[3]="19700101T000005.900000,3"
+group/scalar/gap[3]/status=0
+group/scalar/gap[4]/output/line[0]="19700101T000001.100000,0"
+group/scalar/gap[4]/output/line[1]="19700101T000002,0"
+group/scalar/gap[4]/output/line[2]="19700101T000005,1"
+group/scalar/gap[4]/output/line[3]="19700101T000005.900000,1"
+group/scalar/gap[4]/status=0
+group/scalar/gap[5]/output/line[0]="19700101T000001.100000,0"
+group/scalar/gap[5]/output/line[1]="19700101T000002,0"
+group/scalar/gap[5]/output/line[2]="19700101T000005,0"
+group/scalar/gap[5]/output/line[3]="19700101T000005.900000,0"
+group/scalar/gap[5]/status=0
+
+group/scalar/span[0]/output/line[0]="1.1,0"
+group/scalar/span[0]/output/line[1]="2,1"
+group/scalar/span[0]/output/line[2]="5,2"
+group/scalar/span[0]/output/line[3]="5.9,3"
+group/scalar/span[0]/status=0
+group/scalar/span[1]/output/line[0]="1.1,0"
+group/scalar/span[1]/output/line[1]="2,0"
+group/scalar/span[1]/output/line[2]="5,1"
+group/scalar/span[1]/output/line[3]="5.9,1"
+group/scalar/span[1]/status=0
+group/scalar/span[2]/output/line[0]="1.1,0"
+group/scalar/span[2]/output/line[1]="2,0"
+group/scalar/span[2]/output/line[2]="5,0"
+group/scalar/span[2]/output/line[3]="5.9,1"
+group/scalar/span[2]/status=0
+group/scalar/span[3]/output/line[0]="19700101T000001.100000,0"
+group/scalar/span[3]/output/line[1]="19700101T000002,1"
+group/scalar/span[3]/output/line[2]="19700101T000005,2"
+group/scalar/span[3]/output/line[3]="19700101T000005.900000,3"
+group/scalar/span[3]/status=0
+group/scalar/span[4]/output/line[0]="19700101T000001.100000,0"
+group/scalar/span[4]/output/line[1]="19700101T000002,0"
+group/scalar/span[4]/output/line[2]="19700101T000005,1"
+group/scalar/span[4]/output/line[3]="19700101T000005.900000,1"
+group/scalar/span[4]/status=0
+group/scalar/span[5]/output/line[0]="19700101T000001.100000,0"
+group/scalar/span[5]/output/line[1]="19700101T000002,0"
+group/scalar/span[5]/output/line[2]="19700101T000005,0"
+group/scalar/span[5]/output/line[3]="19700101T000005.900000,0"
+group/scalar/span[5]/status=0
+
+group/scalar/gap_and_span[0]/output/line[0]="1,0"
+group/scalar/gap_and_span[0]/output/line[1]="2,0"
+group/scalar/gap_and_span[0]/output/line[2]="5,1"
+group/scalar/gap_and_span[0]/output/line[3]="6,1"
+group/scalar/gap_and_span[0]/output/line[4]="7,1"
+group/scalar/gap_and_span[0]/output/line[5]="8,1"
+group/scalar/gap_and_span[0]/output/line[6]="9,2"
+group/scalar/gap_and_span[0]/status=0
+
+group/scalar/range[0]/output/line[0]="1,0"
+group/scalar/range[0]/output/line[1]="2,1"
+group/scalar/range[0]/output/line[2]="3,1"
+group/scalar/range[0]/output/line[3]="1,2"
+group/scalar/range[0]/output/line[4]="2,3"
+group/scalar/range[0]/output/line[5]="3,3"
+group/scalar/range[0]/status=0
+group/scalar/range[1]/output/line[0]="2,0"
+group/scalar/range[1]/output/line[1]="3,0"
+group/scalar/range[1]/output/line[2]="2,1"
+group/scalar/range[1]/output/line[3]="3,1"
+group/scalar/range[1]/status=0
+group/scalar/range[2]/output/line[0]="1,0"
+group/scalar/range[2]/output/line[1]="2,1"
+group/scalar/range[2]/output/line[2]="3,1"
+group/scalar/range[2]/output/line[3]="1,2"
+group/scalar/range[2]/output/line[4]="2,3"
+group/scalar/range[2]/output/line[5]="3,3"
+group/scalar/range[2]/status=0
+group/scalar/range[3]/output/line[0]="1,0"
+group/scalar/range[3]/output/line[1]="1,1"
+group/scalar/range[3]/status=0
+group/scalar/range[4]/output/line[0]="1,0"
+group/scalar/range[4]/output/line[1]="2,1"
+group/scalar/range[4]/output/line[2]="3,2"
+group/scalar/range[4]/output/line[3]="1,2"
+group/scalar/range[4]/output/line[4]="2,3"
+group/scalar/range[4]/output/line[5]="3,4"
+group/scalar/range[4]/status=0
+group/scalar/range[5]/output/line[0]="2,0"
+group/scalar/range[5]/output/line[1]="2,1"
+group/scalar/range[5]/status=0
+group/scalar/range[6]/output/line[0]="1,0"
+group/scalar/range[6]/output/line[1]="2,0"
+group/scalar/range[6]/output/line[2]="3,0"
+group/scalar/range[6]/output/line[3]="1,0"
+group/scalar/range[6]/output/line[4]="2,0"
+group/scalar/range[6]/output/line[5]="3,0"
+group/scalar/range[6]/status=0
+group/scalar/range[7]/output=""
+group/scalar/range[7]/status=0
diff --git a/csv/test/csv-blocks/group/input b/csv/test/csv-blocks/group/input
new file mode 100644
index 000000000..627a1e016
--- /dev/null
+++ b/csv/test/csv-blocks/group/input
@@ -0,0 +1,24 @@
+group/scalar/gap[0]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --gap 0.5"
+group/scalar/gap[1]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --gap 1"
+group/scalar/gap[2]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --gap 5"
+group/scalar/gap[3]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --gap 0.5"
+group/scalar/gap[4]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --gap 1"
+group/scalar/gap[5]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --gap 5"
+
+group/scalar/span[0]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --span 0.5"
+group/scalar/span[1]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --span 1"
+group/scalar/span[2]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-blocks group --fields scalar --span 4"
+group/scalar/span[3]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --span 0.5"
+group/scalar/span[4]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --span 1"
+group/scalar/span[5]="( echo 1.1; echo 2; echo 5; echo 5.9 ) | csv-time --from seconds | csv-blocks group --fields scalar --span 5"
+
+group/scalar/gap_and_span[0]="( echo 1; echo 2; echo 5; echo 6; echo 7; echo 8; echo 9 ) | csv-blocks group --fields scalar --gap 2 --span 4"
+
+group/scalar/range[0]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5"
+group/scalar/range[1]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --discard-out-of-range"
+group/scalar/range[2]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 1.5"
+group/scalar/range[3]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 1.5 --discard-out-of-range"
+group/scalar/range[4]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --max 2.5"
+group/scalar/range[5]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --min 1.5 --max 2.5 --discard-out-of-range"
+group/scalar/range[6]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 0"
+group/scalar/range[7]="( seq 3; seq 3 ) | csv-blocks group --fields scalar --max 0 --discard-out-of-range"
diff --git a/csv/test/csv-crc/check/ascii-bad/expected b/csv/test/csv-crc/check/ascii-bad/expected
new file mode 100644
index 000000000..efcad8ed9
--- /dev/null
+++ b/csv/test/csv-crc/check/ascii-bad/expected
@@ -0,0 +1,2 @@
+output[0]/line="0,0,0,54755"
+count=1
diff --git a/csv/test/csv-crc/check/ascii-bad/input b/csv/test/csv-crc/check/ascii-bad/input
new file mode 100644
index 000000000..272285034
--- /dev/null
+++ b/csv/test/csv-crc/check/ascii-bad/input
@@ -0,0 +1,5 @@
+operation=check
+0,0,0,54755
+1,1,1,0
+2,2,2,57154
+3,3,3,20994
diff --git a/csv/test/csv-crc/check/ascii-good/expected b/csv/test/csv-crc/check/ascii-good/expected
new file mode 100644
index 000000000..36a88a0d7
--- /dev/null
+++ b/csv/test/csv-crc/check/ascii-good/expected
@@ -0,0 +1,5 @@
+output[0]/line="0,0,0,54755"
+output[1]/line="1,1,1,22691"
+output[2]/line="2,2,2,57154"
+output[3]/line="3,3,3,20994"
+count=4
diff --git a/csv/test/csv-crc/check/ascii-good/input b/csv/test/csv-crc/check/ascii-good/input
new file mode 100644
index 000000000..f64d1713f
--- /dev/null
+++ b/csv/test/csv-crc/check/ascii-good/input
@@ -0,0 +1,5 @@
+operation=check
+0,0,0,54755
+1,1,1,22691
+2,2,2,57154
+3,3,3,20994
diff --git a/csv/test/csv-crc/check/big-endian/expected b/csv/test/csv-crc/check/big-endian/expected
new file mode 100644
index 000000000..016496f83
--- /dev/null
+++ b/csv/test/csv-crc/check/big-endian/expected
@@ -0,0 +1,5 @@
+output[0]/line="0,0,0,63876"
+output[1]/line="1,1,1,60342"
+output[2]/line="2,2,2,56800"
+output[3]/line="3,3,3,53202"
+count=4
diff --git a/csv/test/csv-crc/check/big-endian/input b/csv/test/csv-crc/check/big-endian/input
new file mode 100644
index 000000000..e9f01c460
--- /dev/null
+++ b/csv/test/csv-crc/check/big-endian/input
@@ -0,0 +1,7 @@
+operation=check
+binary=3ui,uw
+args="--big-endian"
+0,0,0,63876
+1,1,1,60342
+2,2,2,56800
+3,3,3,53202
diff --git a/csv/test/csv-crc/check/binary-bad/expected b/csv/test/csv-crc/check/binary-bad/expected
new file mode 100644
index 000000000..98ac01605
--- /dev/null
+++ b/csv/test/csv-crc/check/binary-bad/expected
@@ -0,0 +1,2 @@
+output[0]/line="0,0,0,34041"
+count=1
diff --git a/csv/test/csv-crc/check/binary-bad/input b/csv/test/csv-crc/check/binary-bad/input
new file mode 100644
index 000000000..0873c8bc1
--- /dev/null
+++ b/csv/test/csv-crc/check/binary-bad/input
@@ -0,0 +1,6 @@
+operation=check
+binary=3ui,uw
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/check/binary-good/expected b/csv/test/csv-crc/check/binary-good/expected
new file mode 100644
index 000000000..d5a50a50a
--- /dev/null
+++ b/csv/test/csv-crc/check/binary-good/expected
@@ -0,0 +1,5 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="1,1,1,46827"
+output[2]/line="2,2,2,57565"
+output[3]/line="3,3,3,53967"
+count=4
diff --git a/csv/test/csv-crc/check/binary-good/input b/csv/test/csv-crc/check/binary-good/input
new file mode 100644
index 000000000..362856496
--- /dev/null
+++ b/csv/test/csv-crc/check/binary-good/input
@@ -0,0 +1,6 @@
+operation=check
+binary=3ui,uw
+0,0,0,34041
+1,1,1,46827
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/recover/binary-bad-1/expected b/csv/test/csv-crc/recover/binary-bad-1/expected
new file mode 100644
index 000000000..87d9b518d
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-1/expected
@@ -0,0 +1,10 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="2,2,2,57565"
+output[2]/line="3,3,3,53967"
+output[3]/line="4,4,4,19633"
+output[4]/line="5,5,5,32419"
+output[5]/line="6,6,6,10389"
+output[6]/line="7,7,7,6791"
+output[7]/line="8,8,8,1096"
+output[8]/line="9,9,9,13914"
+count=9
diff --git a/csv/test/csv-crc/recover/binary-bad-1/input b/csv/test/csv-crc/recover/binary-bad-1/input
new file mode 100644
index 000000000..e07603006
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-1/input
@@ -0,0 +1,12 @@
+operation=recover
+binary=3ui,uw
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/binary-bad-2/expected b/csv/test/csv-crc/recover/binary-bad-2/expected
new file mode 100644
index 000000000..da2800f25
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-2/expected
@@ -0,0 +1,9 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="3,3,3,53967"
+output[2]/line="4,4,4,19633"
+output[3]/line="5,5,5,32419"
+output[4]/line="6,6,6,10389"
+output[5]/line="7,7,7,6791"
+output[6]/line="8,8,8,1096"
+output[7]/line="9,9,9,13914"
+count=8
diff --git a/csv/test/csv-crc/recover/binary-bad-2/input b/csv/test/csv-crc/recover/binary-bad-2/input
new file mode 100644
index 000000000..98a092270
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-2/input
@@ -0,0 +1,12 @@
+operation=recover
+binary=3ui,uw
+0,0,0,34041
+1,1,1,0
+2,2,2,0
+3,3,3,53967
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/binary-bad-3/expected b/csv/test/csv-crc/recover/binary-bad-3/expected
new file mode 100644
index 000000000..f03fe1cbc
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-3/expected
@@ -0,0 +1,8 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="4,4,4,19633"
+output[2]/line="5,5,5,32419"
+output[3]/line="6,6,6,10389"
+output[4]/line="7,7,7,6791"
+output[5]/line="8,8,8,1096"
+output[6]/line="9,9,9,13914"
+count=7
diff --git a/csv/test/csv-crc/recover/binary-bad-3/input b/csv/test/csv-crc/recover/binary-bad-3/input
new file mode 100644
index 000000000..ed36c0e4a
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-bad-3/input
@@ -0,0 +1,12 @@
+operation=recover
+binary=3ui,uw
+0,0,0,34041
+1,1,1,0
+2,2,2,0
+3,3,3,0
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/binary-good/expected b/csv/test/csv-crc/recover/binary-good/expected
new file mode 100644
index 000000000..d5a50a50a
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-good/expected
@@ -0,0 +1,5 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="1,1,1,46827"
+output[2]/line="2,2,2,57565"
+output[3]/line="3,3,3,53967"
+count=4
diff --git a/csv/test/csv-crc/recover/binary-good/input b/csv/test/csv-crc/recover/binary-good/input
new file mode 100644
index 000000000..28a29aa1e
--- /dev/null
+++ b/csv/test/csv-crc/recover/binary-good/input
@@ -0,0 +1,6 @@
+operation=recover
+binary=3ui,uw
+0,0,0,34041
+1,1,1,46827
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/recover/discard-after-1/expected b/csv/test/csv-crc/recover/discard-after-1/expected
new file mode 100644
index 000000000..da2800f25
--- /dev/null
+++ b/csv/test/csv-crc/recover/discard-after-1/expected
@@ -0,0 +1,9 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="3,3,3,53967"
+output[2]/line="4,4,4,19633"
+output[3]/line="5,5,5,32419"
+output[4]/line="6,6,6,10389"
+output[5]/line="7,7,7,6791"
+output[6]/line="8,8,8,1096"
+output[7]/line="9,9,9,13914"
+count=8
diff --git a/csv/test/csv-crc/recover/discard-after-1/input b/csv/test/csv-crc/recover/discard-after-1/input
new file mode 100644
index 000000000..05462938c
--- /dev/null
+++ b/csv/test/csv-crc/recover/discard-after-1/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 1 --discard"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/discard-after-2/expected b/csv/test/csv-crc/recover/discard-after-2/expected
new file mode 100644
index 000000000..d89a4f109
--- /dev/null
+++ b/csv/test/csv-crc/recover/discard-after-2/expected
@@ -0,0 +1,6 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="6,6,6,10389"
+output[2]/line="7,7,7,6791"
+output[3]/line="8,8,8,1096"
+output[4]/line="9,9,9,13914"
+count=5
diff --git a/csv/test/csv-crc/recover/discard-after-2/input b/csv/test/csv-crc/recover/discard-after-2/input
new file mode 100644
index 000000000..3e55f6cc8
--- /dev/null
+++ b/csv/test/csv-crc/recover/discard-after-2/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 2 --discard"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,0
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/give-up-after-0/expected b/csv/test/csv-crc/recover/give-up-after-0/expected
new file mode 100644
index 000000000..98ac01605
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-0/expected
@@ -0,0 +1,2 @@
+output[0]/line="0,0,0,34041"
+count=1
diff --git a/csv/test/csv-crc/recover/give-up-after-0/input b/csv/test/csv-crc/recover/give-up-after-0/input
new file mode 100644
index 000000000..981369062
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-0/input
@@ -0,0 +1,7 @@
+operation=recover
+binary=3ui,uw
+args="--give-up-after 0"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/recover/give-up-after-21/expected b/csv/test/csv-crc/recover/give-up-after-21/expected
new file mode 100644
index 000000000..3b497e5a4
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-21/expected
@@ -0,0 +1,4 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="2,2,2,57565"
+output[2]/line="3,3,3,53967"
+count=3
diff --git a/csv/test/csv-crc/recover/give-up-after-21/input b/csv/test/csv-crc/recover/give-up-after-21/input
new file mode 100644
index 000000000..0d8b71097
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-21/input
@@ -0,0 +1,7 @@
+operation=recover
+binary=3ui,uw
+args="--give-up-after 21"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/recover/give-up-after-7/expected b/csv/test/csv-crc/recover/give-up-after-7/expected
new file mode 100644
index 000000000..98ac01605
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-7/expected
@@ -0,0 +1,2 @@
+output[0]/line="0,0,0,34041"
+count=1
diff --git a/csv/test/csv-crc/recover/give-up-after-7/input b/csv/test/csv-crc/recover/give-up-after-7/input
new file mode 100644
index 000000000..798df435b
--- /dev/null
+++ b/csv/test/csv-crc/recover/give-up-after-7/input
@@ -0,0 +1,7 @@
+operation=recover
+binary=3ui,uw
+args="--give-up-after 7"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
diff --git a/csv/test/csv-crc/recover/recover-after-1/expected b/csv/test/csv-crc/recover/recover-after-1/expected
new file mode 100644
index 000000000..87d9b518d
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-1/expected
@@ -0,0 +1,10 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="2,2,2,57565"
+output[2]/line="3,3,3,53967"
+output[3]/line="4,4,4,19633"
+output[4]/line="5,5,5,32419"
+output[5]/line="6,6,6,10389"
+output[6]/line="7,7,7,6791"
+output[7]/line="8,8,8,1096"
+output[8]/line="9,9,9,13914"
+count=9
diff --git a/csv/test/csv-crc/recover/recover-after-1/input b/csv/test/csv-crc/recover/recover-after-1/input
new file mode 100644
index 000000000..988d63176
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-1/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 1"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,53967
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/recover-after-10/expected b/csv/test/csv-crc/recover/recover-after-10/expected
new file mode 100644
index 000000000..d5a50a50a
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-10/expected
@@ -0,0 +1,5 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="1,1,1,46827"
+output[2]/line="2,2,2,57565"
+output[3]/line="3,3,3,53967"
+count=4
diff --git a/csv/test/csv-crc/recover/recover-after-10/input b/csv/test/csv-crc/recover/recover-after-10/input
new file mode 100644
index 000000000..9cd49614b
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-10/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 10"
+0,0,0,34041
+1,1,1,46827
+2,2,2,57565
+3,3,3,53967
+4,4,4,0
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/recover/recover-after-2/expected b/csv/test/csv-crc/recover/recover-after-2/expected
new file mode 100644
index 000000000..f03fe1cbc
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-2/expected
@@ -0,0 +1,8 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="4,4,4,19633"
+output[2]/line="5,5,5,32419"
+output[3]/line="6,6,6,10389"
+output[4]/line="7,7,7,6791"
+output[5]/line="8,8,8,1096"
+output[6]/line="9,9,9,13914"
+count=7
diff --git a/csv/test/csv-crc/recover/recover-after-2/input b/csv/test/csv-crc/recover/recover-after-2/input
new file mode 100644
index 000000000..687ae2121
--- /dev/null
+++ b/csv/test/csv-crc/recover/recover-after-2/input
@@ -0,0 +1,13 @@
+operation=recover
+binary=3ui,uw
+args="--recover-after 2"
+0,0,0,34041
+1,1,1,0
+2,2,2,57565
+3,3,3,0
+4,4,4,19633
+5,5,5,32419
+6,6,6,10389
+7,7,7,6791
+8,8,8,1096
+9,9,9,13914
diff --git a/csv/test/csv-crc/test b/csv/test/csv-crc/test
new file mode 100755
index 000000000..a36f24dfd
--- /dev/null
+++ b/csv/test/csv-crc/test
@@ -0,0 +1,25 @@
+#!/bin/bash
+
+# Test case arrives on stdin: lines containing '=' are settings (operation, binary, args); the rest is csv data.
+input=$( cat )
+eval "$( grep = <<< "$input" )"
+data=$( grep -v = <<< "$input" )
+[[ $operation && $data ]] || exit 1 # both are mandatory
+
+# Pipes the data through csv-crc; when binary is set, converts to binary before and back to ascii after.
+function run_test()
+{
+    local size output_format
+    if [[ $binary ]]; then
+        size=$( echo "$binary" | csv-format size )
+        output_format=$binary
+        [[ $operation == wrap ]] && output_format+=,uw # wrap: the output format gets an extra uw field
+        echo "$data" | csv-to-bin "$binary" | csv-crc "$operation" --size "$size" $args | csv-from-bin "$output_format"
+    else
+        echo "$data" | csv-crc "$operation" $args # args stays unquoted: it may hold several options
+    fi
+}
+
+output=$( run_test )
+echo "$output" | name-value-from-csv -f line -d : --line-number -p output
+if [[ $output ]]; then echo count=$( wc -l <<< "$output" ); else echo count=0; fi # a here-string adds a newline, so empty output would count as 1
\ No newline at end of file
diff --git a/csv/test/csv-crc/wrap/ascii/expected b/csv/test/csv-crc/wrap/ascii/expected
new file mode 100644
index 000000000..320309a98
--- /dev/null
+++ b/csv/test/csv-crc/wrap/ascii/expected
@@ -0,0 +1,11 @@
+output[0]/line="0,0,0,54755"
+output[1]/line="1,1,1,22691"
+output[2]/line="2,2,2,57154"
+output[3]/line="3,3,3,20994"
+output[4]/line="4,4,4,49313"
+output[5]/line="5,5,5,19937"
+output[6]/line="6,6,6,51712"
+output[7]/line="7,7,7,18240"
+output[8]/line="8,8,8,65383"
+output[9]/line="9,9,9,29223"
+count=10
diff --git a/csv/test/csv-crc/wrap/ascii/input b/csv/test/csv-crc/wrap/ascii/input
new file mode 100644
index 000000000..82e0e414b
--- /dev/null
+++ b/csv/test/csv-crc/wrap/ascii/input
@@ -0,0 +1,11 @@
+operation=wrap
+0,0,0
+1,1,1
+2,2,2
+3,3,3
+4,4,4
+5,5,5
+6,6,6
+7,7,7
+8,8,8
+9,9,9
diff --git a/csv/test/csv-crc/wrap/big-endian/expected b/csv/test/csv-crc/wrap/big-endian/expected
new file mode 100644
index 000000000..e0e2c23f7
--- /dev/null
+++ b/csv/test/csv-crc/wrap/big-endian/expected
@@ -0,0 +1,11 @@
+output[0]/line="0,0,0,63876"
+output[1]/line="1,1,1,60342"
+output[2]/line="2,2,2,56800"
+output[3]/line="3,3,3,53202"
+output[4]/line="4,4,4,45388"
+output[5]/line="5,5,5,41854"
+output[6]/line="6,6,6,38184"
+output[7]/line="7,7,7,34586"
+output[8]/line="8,8,8,18436"
+output[9]/line="9,9,9,23094"
+count=10
diff --git a/csv/test/csv-crc/wrap/big-endian/input b/csv/test/csv-crc/wrap/big-endian/input
new file mode 100644
index 000000000..3d773dbe0
--- /dev/null
+++ b/csv/test/csv-crc/wrap/big-endian/input
@@ -0,0 +1,13 @@
+operation=wrap
+binary=3ui
+args="--big-endian"
+0,0,0
+1,1,1
+2,2,2
+3,3,3
+4,4,4
+5,5,5
+6,6,6
+7,7,7
+8,8,8
+9,9,9
diff --git a/csv/test/csv-crc/wrap/binary/expected b/csv/test/csv-crc/wrap/binary/expected
new file mode 100644
index 000000000..a21ec8d4f
--- /dev/null
+++ b/csv/test/csv-crc/wrap/binary/expected
@@ -0,0 +1,11 @@
+output[0]/line="0,0,0,34041"
+output[1]/line="1,1,1,46827"
+output[2]/line="2,2,2,57565"
+output[3]/line="3,3,3,53967"
+output[4]/line="4,4,4,19633"
+output[5]/line="5,5,5,32419"
+output[6]/line="6,6,6,10389"
+output[7]/line="7,7,7,6791"
+output[8]/line="8,8,8,1096"
+output[9]/line="9,9,9,13914"
+count=10
diff --git a/csv/test/csv-crc/wrap/binary/input b/csv/test/csv-crc/wrap/binary/input
new file mode 100644
index 000000000..00e305daa
--- /dev/null
+++ b/csv/test/csv-crc/wrap/binary/input
@@ -0,0 +1,12 @@
+operation=wrap
+binary=3ui
+0,0,0
+1,1,1
+2,2,2
+3,3,3
+4,4,4
+5,5,5
+6,6,6
+7,7,7
+8,8,8
+9,9,9
diff --git a/csv/test/csv-enumerate/expected b/csv/test/csv-enumerate/expected
new file mode 100644
index 000000000..5ef5ab006
--- /dev/null
+++ b/csv/test/csv-enumerate/expected
@@ -0,0 +1,22 @@
+ascii[0]/output=""
+ascii[0]/status=1
+ascii[1]/output/line[0]="0,x,a,0"
+ascii[1]/output/line[1]="1,y,b,1"
+ascii[1]/output/line[2]="0,x,c,0"
+ascii[1]/status=0
+ascii[2]/output/line[0]="0,1,a,0"
+ascii[2]/output/line[1]="1,y,b,1"
+ascii[2]/output/line[2]="0,1,c,0"
+ascii[2]/status=0
+
+binary[0]/output/line[0]="0,1,a,0"
+binary[0]/output/line[1]="1,y,b,1"
+binary[0]/output/line[2]="0,1,c,0"
+binary[0]/status=0
+
+map[0]/output/line[0]="1,y,1,1"
+map[0]/output/line[1]="0,x,0,2"
+map[0]/status=0
+map[1]/output/line[0]="1,y,1,1"
+map[1]/output/line[1]="0,x,0,2"
+map[1]/status=0
diff --git a/csv/test/csv-enumerate/input b/csv/test/csv-enumerate/input
new file mode 100644
index 000000000..bf136d6bd
--- /dev/null
+++ b/csv/test/csv-enumerate/input
@@ -0,0 +1,10 @@
+ascii[0]="( echo 0,x,a ; echo 1,y,b; echo 0,x,c ) | csv-enumerate"
+ascii[1]="( echo 0,x,a ; echo 1,y,b; echo 0,x,c ) | csv-enumerate --fields a,b"
+ascii[2]="( echo 0,1,a ; echo 1,y,b; echo 0,1,c ) | csv-enumerate --fields a,b --format ui,s[16],s[16]"
+
+binary[0]="( echo 0,1,a ; echo 1,y,b; echo 0,1,c ) | csv-to-bin ui,s[16],s[16] | csv-enumerate --fields a,b --binary ui,s[16],s[16] | csv-from-bin ui,s[16],s[16],ui"
+
+map[0]="( echo 0,x,a ; echo 1,y,b; echo 0,x,c ) | csv-enumerate --fields a,b --map | sed 's#\"##g' "
+map[1]="( echo 0,x,a ; echo 1,y,b; echo 0,x,c ) | csv-to-bin ui,s[16],s[16] | csv-enumerate --fields a,b --map --binary ui,s[16],s[16] | csv-from-bin ui,s[16],2ui | sed 's#\"##g' "
+
+
diff --git a/csv/test/csv-fields/expected b/csv/test/csv-fields/expected
index 43a1a5ac8..443885c0a 100644
--- a/csv/test/csv-fields/expected
+++ b/csv/test/csv-fields/expected
@@ -18,6 +18,18 @@ numbers/fill[2]/output="f1,f2,f3,f4"
 numbers/fill[2]/status=0
 numbers/fill[3]/output="f1,f2,f3,f4"
 numbers/fill[3]/status=0
+numbers/fields[0]/output=""
+numbers/fields[0]/status=0
+numbers/fields[1]/output="1"
+numbers/fields[1]/status=0
+numbers/fields[2]/output="2"
+numbers/fields[2]/status=0
+numbers/fields[3]/output="2"
+numbers/fields[3]/status=0
+numbers/fields[4]/output="2,3"
+numbers/fields[4]/status=0
+numbers/fields[5]/output="2,3,4"
+numbers/fields[5]/status=0
 
 clear/keep[0]/output=",,,"
 clear/keep[0]/status=0
@@ -193,3 +205,15 @@ make_fixed[2]/output="a,b,c"
 make_fixed[2]/status=0
 make_fixed[3]/output="a:b:c:d::"
 make_fixed[3]/status=0
+make_fixed[4]/output="a,b,c,4,5,6"
+make_fixed[4]/status=0
+make_fixed[5]/output="a,b,c,4,5,"
+make_fixed[5]/status=0
+make_fixed[6]/output="a,b,c,,,"
+make_fixed[6]/status=0
+make_fixed[7]/output="a,b,c,,,"
+make_fixed[7]/status=0
+make_fixed[8]/output="a,b,,4,5,6"
+make_fixed[8]/status=0
+make_fixed[9]/output="a,b,c,4,5,6"
+make_fixed[9]/status=0
diff --git a/csv/test/csv-fields/input b/csv/test/csv-fields/input
index c4a92cbd8..7a8a3db2c 100644
--- a/csv/test/csv-fields/input
+++ b/csv/test/csv-fields/input
@@ -8,6 +8,12 @@ numbers/fill[0]="echo ,,, | csv-fields numbers --fill"
 numbers/fill[1]="echo a,,,b | csv-fields numbers --fill"
 numbers/fill[2]="echo ,,, | csv-fields numbers --fill --prefix f"
 numbers/fill[3]="echo a,,,b | csv-fields numbers --fill --prefix f"
+numbers/fields[0]="echo ,,, | csv-fields numbers --fields=a"
+numbers/fields[1]="echo a,,, | csv-fields numbers --fields=a"
+numbers/fields[2]="echo ,a,, | csv-fields numbers --fields=a"
+numbers/fields[3]="echo ,a,b, | csv-fields numbers --fields=a"
+numbers/fields[4]="echo ,a,b, | csv-fields numbers --fields=a,b"
+numbers/fields[5]="echo ,a,a,a | csv-fields numbers --fields=a"
 
 clear/keep[0]="echo a,b,c,d | csv-fields clear --keep ,,,"
 clear/keep[1]="echo a,b,c,d | csv-fields clear --keep a"
@@ -103,5 +109,9 @@ make_fixed[0]="echo a,b,c,d | csv-fields make-fixed --count=6"
 make_fixed[1]="echo a,b,c,d | csv-fields make-fixed --count=3"
 make_fixed[2]="echo a,b,c,d | csv-fields make-fixed --count=3 --force"
 make_fixed[3]="echo a:b:c:d | csv-fields make-fixed --count=6 --delimiter=:"
-
-
+make_fixed[4]="echo a,b,c | csv-fields make-fixed --count=6 --values 1,2,3,4,5,6"
+make_fixed[5]="echo a,b,c | csv-fields make-fixed --count=6 --values 1,2,3,4,5"
+make_fixed[6]="echo a,b,c | csv-fields make-fixed --count=6 --values 1,2,3"
+make_fixed[7]="echo a,b,c | csv-fields make-fixed --count=6 --values 1"
+make_fixed[8]="echo a,b, | csv-fields make-fixed --count=6 --values 1,2,3,4,5,6"
+make_fixed[9]="echo a,b,c | csv-fields make-fixed --values 1,2,3,4,5,6"
diff --git a/csv/test/csv-interval/ascii/test b/csv/test/csv-interval/ascii/test
deleted file mode 100755
index 074ec4ca8..000000000
--- a/csv/test/csv-interval/ascii/test
+++ /dev/null
@@ -1,3 +0,0 @@
-#!/bin/bash
-
-csv-interval $( cat options ) | gawk '{ printf( "interval[%d]=%s\n", NR, $0 ); }'
diff --git a/csv/test/csv-interval/overlap-count/input b/csv/test/csv-interval/overlap-count/input
deleted file mode 100644
index f4e21571d..000000000
--- a/csv/test/csv-interval/overlap-count/input
+++ /dev/null
@@ -1,16 +0,0 @@
-min[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 0"
-min[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 1"
-min[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 2"
-min[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 3"
-
-max[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-max 0"
-max[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-max 1"
-max[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-max 2"
-max[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-max 3"
-
-min_max[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count-min 1 --overlap-count-max 2"
-
-equal[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count 0"
-equal[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count 1"
-equal[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count 2"
-equal[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --overlap-count 3"
diff --git a/csv/test/csv-interval/append/expected b/csv/test/csv-intervals/append/expected
similarity index 100%
rename from csv/test/csv-interval/append/expected
rename to csv/test/csv-intervals/append/expected
diff --git a/csv/test/csv-interval/append/input b/csv/test/csv-intervals/append/input
similarity index 79%
rename from csv/test/csv-interval/append/input
rename to csv/test/csv-intervals/append/input
index 2f584bfa3..bf97c221d 100644
--- a/csv/test/csv-interval/append/input
+++ b/csv/test/csv-intervals/append/input
@@ -1,3 +1,3 @@
-append[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-interval --append"
+append[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --append"
 
 
diff --git a/csv/test/csv-intervals/ascii/test b/csv/test/csv-intervals/ascii/test
new file mode 100755
index 000000000..940042294
--- /dev/null
+++ b/csv/test/csv-intervals/ascii/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+
+csv-intervals make $( cat options ) | gawk '{ printf( "interval[%d]=%s\n", NR, $0 ); }'
diff --git a/csv/test/csv-interval/ascii/test.01/expected b/csv/test/csv-intervals/ascii/test.01/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.01/expected
rename to csv/test/csv-intervals/ascii/test.01/expected
diff --git a/csv/test/csv-interval/ascii/test.01/input b/csv/test/csv-intervals/ascii/test.01/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.01/input
rename to csv/test/csv-intervals/ascii/test.01/input
diff --git a/csv/test/csv-interval/ascii/test.01/options b/csv/test/csv-intervals/ascii/test.01/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.01/options
rename to csv/test/csv-intervals/ascii/test.01/options
diff --git a/csv/test/csv-interval/ascii/test.02/expected b/csv/test/csv-intervals/ascii/test.02/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.02/expected
rename to csv/test/csv-intervals/ascii/test.02/expected
diff --git a/csv/test/csv-interval/ascii/test.02/input b/csv/test/csv-intervals/ascii/test.02/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.02/input
rename to csv/test/csv-intervals/ascii/test.02/input
diff --git a/csv/test/csv-interval/ascii/test.02/options b/csv/test/csv-intervals/ascii/test.02/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.02/options
rename to csv/test/csv-intervals/ascii/test.02/options
diff --git a/csv/test/csv-interval/ascii/test.03/expected b/csv/test/csv-intervals/ascii/test.03/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.03/expected
rename to csv/test/csv-intervals/ascii/test.03/expected
diff --git a/csv/test/csv-interval/ascii/test.03/input b/csv/test/csv-intervals/ascii/test.03/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.03/input
rename to csv/test/csv-intervals/ascii/test.03/input
diff --git a/csv/test/csv-interval/ascii/test.03/options b/csv/test/csv-intervals/ascii/test.03/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.03/options
rename to csv/test/csv-intervals/ascii/test.03/options
diff --git a/csv/test/csv-interval/ascii/test.04/disabled b/csv/test/csv-intervals/ascii/test.04/disabled
similarity index 100%
rename from csv/test/csv-interval/ascii/test.04/disabled
rename to csv/test/csv-intervals/ascii/test.04/disabled
diff --git a/csv/test/csv-interval/ascii/test.04/expected b/csv/test/csv-intervals/ascii/test.04/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.04/expected
rename to csv/test/csv-intervals/ascii/test.04/expected
diff --git a/csv/test/csv-interval/ascii/test.04/input b/csv/test/csv-intervals/ascii/test.04/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.04/input
rename to csv/test/csv-intervals/ascii/test.04/input
diff --git a/csv/test/csv-interval/ascii/test.04/options b/csv/test/csv-intervals/ascii/test.04/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.04/options
rename to csv/test/csv-intervals/ascii/test.04/options
diff --git a/csv/test/csv-interval/ascii/test.05/expected b/csv/test/csv-intervals/ascii/test.05/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.05/expected
rename to csv/test/csv-intervals/ascii/test.05/expected
diff --git a/csv/test/csv-interval/ascii/test.05/input b/csv/test/csv-intervals/ascii/test.05/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.05/input
rename to csv/test/csv-intervals/ascii/test.05/input
diff --git a/csv/test/csv-interval/ascii/test.05/options b/csv/test/csv-intervals/ascii/test.05/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.05/options
rename to csv/test/csv-intervals/ascii/test.05/options
diff --git a/csv/test/csv-interval/ascii/test.06/expected b/csv/test/csv-intervals/ascii/test.06/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.06/expected
rename to csv/test/csv-intervals/ascii/test.06/expected
diff --git a/csv/test/csv-interval/ascii/test.06/input b/csv/test/csv-intervals/ascii/test.06/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.06/input
rename to csv/test/csv-intervals/ascii/test.06/input
diff --git a/csv/test/csv-interval/ascii/test.06/options b/csv/test/csv-intervals/ascii/test.06/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.06/options
rename to csv/test/csv-intervals/ascii/test.06/options
diff --git a/csv/test/csv-interval/ascii/test.07/expected b/csv/test/csv-intervals/ascii/test.07/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.07/expected
rename to csv/test/csv-intervals/ascii/test.07/expected
diff --git a/csv/test/csv-interval/ascii/test.07/input b/csv/test/csv-intervals/ascii/test.07/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.07/input
rename to csv/test/csv-intervals/ascii/test.07/input
diff --git a/csv/test/csv-interval/ascii/test.07/options b/csv/test/csv-intervals/ascii/test.07/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.07/options
rename to csv/test/csv-intervals/ascii/test.07/options
diff --git a/csv/test/csv-interval/ascii/test.08/expected b/csv/test/csv-intervals/ascii/test.08/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.08/expected
rename to csv/test/csv-intervals/ascii/test.08/expected
diff --git a/csv/test/csv-interval/ascii/test.08/input b/csv/test/csv-intervals/ascii/test.08/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.08/input
rename to csv/test/csv-intervals/ascii/test.08/input
diff --git a/csv/test/csv-interval/ascii/test.08/options b/csv/test/csv-intervals/ascii/test.08/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.08/options
rename to csv/test/csv-intervals/ascii/test.08/options
diff --git a/csv/test/csv-interval/ascii/test.09/expected b/csv/test/csv-intervals/ascii/test.09/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.09/expected
rename to csv/test/csv-intervals/ascii/test.09/expected
diff --git a/csv/test/csv-interval/ascii/test.09/input b/csv/test/csv-intervals/ascii/test.09/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.09/input
rename to csv/test/csv-intervals/ascii/test.09/input
diff --git a/csv/test/csv-interval/ascii/test.09/options b/csv/test/csv-intervals/ascii/test.09/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.09/options
rename to csv/test/csv-intervals/ascii/test.09/options
diff --git a/csv/test/csv-interval/ascii/test.10/expected b/csv/test/csv-intervals/ascii/test.10/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.10/expected
rename to csv/test/csv-intervals/ascii/test.10/expected
diff --git a/csv/test/csv-interval/ascii/test.10/input b/csv/test/csv-intervals/ascii/test.10/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.10/input
rename to csv/test/csv-intervals/ascii/test.10/input
diff --git a/csv/test/csv-interval/ascii/test.10/options b/csv/test/csv-intervals/ascii/test.10/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.10/options
rename to csv/test/csv-intervals/ascii/test.10/options
diff --git a/csv/test/csv-interval/ascii/test.11/expected b/csv/test/csv-intervals/ascii/test.11/expected
similarity index 100%
rename from csv/test/csv-interval/ascii/test.11/expected
rename to csv/test/csv-intervals/ascii/test.11/expected
diff --git a/csv/test/csv-interval/ascii/test.11/input b/csv/test/csv-intervals/ascii/test.11/input
similarity index 100%
rename from csv/test/csv-interval/ascii/test.11/input
rename to csv/test/csv-intervals/ascii/test.11/input
diff --git a/csv/test/csv-interval/ascii/test.11/options b/csv/test/csv-intervals/ascii/test.11/options
similarity index 100%
rename from csv/test/csv-interval/ascii/test.11/options
rename to csv/test/csv-intervals/ascii/test.11/options
diff --git a/csv/test/csv-interval/binary/test b/csv/test/csv-intervals/binary/test
similarity index 65%
rename from csv/test/csv-interval/binary/test
rename to csv/test/csv-intervals/binary/test
index 4f41eb06b..93e137d9e 100755
--- a/csv/test/csv-interval/binary/test
+++ b/csv/test/csv-intervals/binary/test
@@ -7,4 +7,4 @@ format_index=$( echo $options | fmt -1 | grep -n -- '--binary' | cut -d: -f1 )
 input_format="${args[$format_index]}"
 [[ -z "$output_format" ]] && output_format=$input_format
 
-csv-to-bin $input_format | csv-interval $options | csv-from-bin $output_format | gawk '{ printf( "interval[%d]=%s\n", NR, $0 ); }'
+csv-to-bin $input_format | csv-intervals make $options | csv-from-bin $output_format | gawk '{ printf( "interval[%d]=%s\n", NR, $0 ); }'
diff --git a/csv/test/csv-interval/binary/test.01/expected b/csv/test/csv-intervals/binary/test.01/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.01/expected
rename to csv/test/csv-intervals/binary/test.01/expected
diff --git a/csv/test/csv-interval/binary/test.01/input b/csv/test/csv-intervals/binary/test.01/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.01/input
rename to csv/test/csv-intervals/binary/test.01/input
diff --git a/csv/test/csv-interval/binary/test.01/options b/csv/test/csv-intervals/binary/test.01/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.01/options
rename to csv/test/csv-intervals/binary/test.01/options
diff --git a/csv/test/csv-interval/binary/test.02/expected b/csv/test/csv-intervals/binary/test.02/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.02/expected
rename to csv/test/csv-intervals/binary/test.02/expected
diff --git a/csv/test/csv-interval/binary/test.02/input b/csv/test/csv-intervals/binary/test.02/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.02/input
rename to csv/test/csv-intervals/binary/test.02/input
diff --git a/csv/test/csv-interval/binary/test.02/options b/csv/test/csv-intervals/binary/test.02/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.02/options
rename to csv/test/csv-intervals/binary/test.02/options
diff --git a/csv/test/csv-interval/binary/test.03/disabled b/csv/test/csv-intervals/binary/test.03/disabled
similarity index 100%
rename from csv/test/csv-interval/binary/test.03/disabled
rename to csv/test/csv-intervals/binary/test.03/disabled
diff --git a/csv/test/csv-interval/binary/test.03/expected b/csv/test/csv-intervals/binary/test.03/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.03/expected
rename to csv/test/csv-intervals/binary/test.03/expected
diff --git a/csv/test/csv-interval/binary/test.03/input b/csv/test/csv-intervals/binary/test.03/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.03/input
rename to csv/test/csv-intervals/binary/test.03/input
diff --git a/csv/test/csv-interval/binary/test.03/options b/csv/test/csv-intervals/binary/test.03/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.03/options
rename to csv/test/csv-intervals/binary/test.03/options
diff --git a/csv/test/csv-interval/binary/test.04/disabled b/csv/test/csv-intervals/binary/test.04/disabled
similarity index 100%
rename from csv/test/csv-interval/binary/test.04/disabled
rename to csv/test/csv-intervals/binary/test.04/disabled
diff --git a/csv/test/csv-interval/binary/test.04/expected b/csv/test/csv-intervals/binary/test.04/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.04/expected
rename to csv/test/csv-intervals/binary/test.04/expected
diff --git a/csv/test/csv-interval/binary/test.04/input b/csv/test/csv-intervals/binary/test.04/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.04/input
rename to csv/test/csv-intervals/binary/test.04/input
diff --git a/csv/test/csv-interval/binary/test.04/options b/csv/test/csv-intervals/binary/test.04/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.04/options
rename to csv/test/csv-intervals/binary/test.04/options
diff --git a/csv/test/csv-interval/binary/test.05/expected b/csv/test/csv-intervals/binary/test.05/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.05/expected
rename to csv/test/csv-intervals/binary/test.05/expected
diff --git a/csv/test/csv-interval/binary/test.05/input b/csv/test/csv-intervals/binary/test.05/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.05/input
rename to csv/test/csv-intervals/binary/test.05/input
diff --git a/csv/test/csv-interval/binary/test.05/options b/csv/test/csv-intervals/binary/test.05/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.05/options
rename to csv/test/csv-intervals/binary/test.05/options
diff --git a/csv/test/csv-interval/binary/test.06/expected b/csv/test/csv-intervals/binary/test.06/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.06/expected
rename to csv/test/csv-intervals/binary/test.06/expected
diff --git a/csv/test/csv-interval/binary/test.06/input b/csv/test/csv-intervals/binary/test.06/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.06/input
rename to csv/test/csv-intervals/binary/test.06/input
diff --git a/csv/test/csv-interval/binary/test.06/options b/csv/test/csv-intervals/binary/test.06/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.06/options
rename to csv/test/csv-intervals/binary/test.06/options
diff --git a/csv/test/csv-interval/binary/test.07/expected b/csv/test/csv-intervals/binary/test.07/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.07/expected
rename to csv/test/csv-intervals/binary/test.07/expected
diff --git a/csv/test/csv-interval/binary/test.07/input b/csv/test/csv-intervals/binary/test.07/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.07/input
rename to csv/test/csv-intervals/binary/test.07/input
diff --git a/csv/test/csv-interval/binary/test.07/options b/csv/test/csv-intervals/binary/test.07/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.07/options
rename to csv/test/csv-intervals/binary/test.07/options
diff --git a/csv/test/csv-interval/binary/test.08/expected b/csv/test/csv-intervals/binary/test.08/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.08/expected
rename to csv/test/csv-intervals/binary/test.08/expected
diff --git a/csv/test/csv-interval/binary/test.08/input b/csv/test/csv-intervals/binary/test.08/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.08/input
rename to csv/test/csv-intervals/binary/test.08/input
diff --git a/csv/test/csv-interval/binary/test.08/options b/csv/test/csv-intervals/binary/test.08/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.08/options
rename to csv/test/csv-intervals/binary/test.08/options
diff --git a/csv/test/csv-interval/binary/test.09/expected b/csv/test/csv-intervals/binary/test.09/expected
similarity index 100%
rename from csv/test/csv-interval/binary/test.09/expected
rename to csv/test/csv-intervals/binary/test.09/expected
diff --git a/csv/test/csv-interval/binary/test.09/input b/csv/test/csv-intervals/binary/test.09/input
similarity index 100%
rename from csv/test/csv-interval/binary/test.09/input
rename to csv/test/csv-intervals/binary/test.09/input
diff --git a/csv/test/csv-interval/binary/test.09/options b/csv/test/csv-intervals/binary/test.09/options
similarity index 100%
rename from csv/test/csv-interval/binary/test.09/options
rename to csv/test/csv-intervals/binary/test.09/options
diff --git a/csv/test/csv-intervals/contain/expected b/csv/test/csv-intervals/contain/expected
new file mode 100644
index 000000000..b307e5a5c
--- /dev/null
+++ b/csv/test/csv-intervals/contain/expected
@@ -0,0 +1,23 @@
+contain/ascii[0]/output/line[0]="1,1"
+contain/ascii[0]/output/line[1]="5,0"
+contain/ascii[0]/output/line[2]="9,1"
+contain/ascii[0]/output/line[3]="11,0"
+contain/ascii[0]/status=0
+contain/ascii[1]/output/line[0]="1,1"
+contain/ascii[1]/output/line[1]="5,0"
+contain/ascii[1]/status=0
+contain/fields[0]/output/line[0]=",1,1"
+contain/fields[0]/output/line[1]=",5,0"
+contain/fields[0]/status=0
+contain/fields[1]/output/line[0]=",1,1"
+contain/fields[1]/output/line[1]=",5,0"
+contain/fields[1]/status=0
+contain/binary[0]/output/line[0]="1,1"
+contain/binary[0]/output/line[1]="5,0"
+contain/binary[0]/status=0
+contain/binary[1]/output/line[0]="1,1"
+contain/binary[1]/output/line[1]="5,0"
+contain/binary[1]/status=0
+contain/binary[2]/output/line[0]="1,1"
+contain/binary[2]/output/line[1]="5,0"
+contain/binary[2]/status=0
diff --git a/csv/test/csv-intervals/contain/input b/csv/test/csv-intervals/contain/input
new file mode 100644
index 000000000..eac7bd818
--- /dev/null
+++ b/csv/test/csv-intervals/contain/input
@@ -0,0 +1,7 @@
+contain/ascii[0]="( echo 1; echo 5; echo 9; echo 11 ) | csv-intervals contain --intervals <( echo 0,2; echo 9,11 )"
+contain/ascii[1]="( echo 1; echo 5 ) | csv-intervals --fields scalar contain --intervals <( echo 0,2 )"
+contain/fields[0]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar contain --intervals <( echo 0,2 )"
+contain/fields[1]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar contain --intervals <( echo ,0,2 )';fields=,from,to'"
+contain/binary[0]="( echo 1; echo 5 ) | csv-to-bin ui | csv-intervals contain --binary ui --intervals <( echo 0,2; echo 9,11 ) | csv-from-bin ui,b"
+contain/binary[1]="( echo 1; echo 5 ) | csv-to-bin ui | csv-intervals contain --binary ui --intervals <( ( echo 0,2; echo 9,11 ) | csv-to-bin 2ui )';binary=2ui' | csv-from-bin ui,b"
+contain/binary[2]="( echo 1; echo 5 ) | csv-intervals contain --intervals <( ( echo 0,2; echo 9,11 ) | csv-to-bin 2ui )';binary=2ui'"
diff --git a/csv/test/csv-intervals/join/expected b/csv/test/csv-intervals/join/expected
new file mode 100644
index 000000000..2d0a5a80e
--- /dev/null
+++ b/csv/test/csv-intervals/join/expected
@@ -0,0 +1,27 @@
+join/ascii[0]/output/line[0]="1,0,2,a"
+join/ascii[0]/output/line[1]="9,9,11,b"
+join/ascii[0]/status=0
+join/ascii[1]/output/line[0]="9,0,10,b"
+join/ascii[1]/output/line[1]="9,0,10,c"
+join/ascii[1]/output/line[2]="9,0,20,d"
+join/ascii[1]/status=0
+join/fields[0]/output=",1,0,2,a"
+join/fields[0]/status=0
+join/fields[1]/output=",1,a,0,2,b"
+join/fields[1]/status=0
+join/binary[0]/output/line[0]="9,0,10,0"
+join/binary[0]/output/line[1]="9,0,10,1"
+join/binary[0]/output/line[2]="9,5,20,2"
+join/binary[0]/status=0
+join/matching[0]/output/line[0]="1"
+join/matching[0]/output/line[1]="9"
+join/matching[0]/status=0
+join/matching[1]/output/line[0]="1"
+join/matching[1]/output/line[1]="9"
+join/matching[1]/status=0
+join/not_matching[0]/output/line[0]="5"
+join/not_matching[0]/output/line[1]="11"
+join/not_matching[0]/status=0
+join/not_matching[1]/output/line[0]="5"
+join/not_matching[1]/output/line[1]="11"
+join/not_matching[1]/status=0
diff --git a/csv/test/csv-intervals/join/input b/csv/test/csv-intervals/join/input
new file mode 100644
index 000000000..4ffbfd8aa
--- /dev/null
+++ b/csv/test/csv-intervals/join/input
@@ -0,0 +1,9 @@
+join/ascii[0]="( echo 1; echo 5; echo 9; echo 11 ) | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b )"
+join/ascii[1]="( echo 9 ) | csv-intervals join --intervals <( echo 0,2,a; echo 0,10,b; echo 0,10,c; echo 0,20,d )"
+join/fields[0]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar join --intervals <( echo 0,2,a )"
+join/fields[1]="( echo ,1; echo ,5 ) | csv-intervals --fields ,scalar join --intervals <( echo a,0,2,b )';fields=,from,to'"
+join/binary[0]="( echo 9 ) | csv-to-bin ui | csv-intervals join --binary ui --intervals <( ( echo 0,10,0; echo 0,10,1; echo 5,20,2 ) | csv-to-bin 3ui )';binary=3ui' | csv-from-bin 4ui"
+join/matching[0]="( echo 1; echo 5; echo 9; echo 11 ) | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b ) --matching"
+join/matching[1]="( echo 1; echo 5; echo 9; echo 11 ) | csv-to-bin ui | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b ) --matching --binary ui | csv-from-bin ui"
+join/not_matching[0]="( echo 1; echo 5; echo 9; echo 11 ) | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b ) --not-matching"
+join/not_matching[1]="( echo 1; echo 5; echo 9; echo 11 ) | csv-to-bin ui | csv-intervals join --intervals <( echo 0,2,a; echo 9,11,b ) --not-matching --binary ui | csv-from-bin ui"
diff --git a/csv/test/csv-interval/overlap-count/expected b/csv/test/csv-intervals/overlap-count/expected
similarity index 100%
rename from csv/test/csv-interval/overlap-count/expected
rename to csv/test/csv-intervals/overlap-count/expected
diff --git a/csv/test/csv-intervals/overlap-count/input b/csv/test/csv-intervals/overlap-count/input
new file mode 100644
index 000000000..5fb97b7f1
--- /dev/null
+++ b/csv/test/csv-intervals/overlap-count/input
@@ -0,0 +1,16 @@
+min[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 0"
+min[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 1"
+min[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 2"
+min[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 3"
+
+max[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-max 0"
+max[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-max 1"
+max[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-max 2"
+max[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-max 3"
+
+min_max[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count-min 1 --overlap-count-max 2"
+
+equal[0]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count 0"
+equal[1]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count 1"
+equal[2]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count 2"
+equal[3]="( echo 0,5,a; echo 4,7,b; echo 2,8,c ) | csv-intervals make --overlap-count 3"
diff --git a/csv/test/csv-join/block_less/expected b/csv/test/csv-join/block_less/expected
new file mode 100644
index 000000000..784085d5d
--- /dev/null
+++ b/csv/test/csv-join/block_less/expected
@@ -0,0 +1,58 @@
+block_less/basics[0]/output/line[0]="0,0,0,0"
+block_less/basics[0]/output/line[1]="1,0,0,0"
+block_less/basics[0]/output/line[2]="2,0,0,0"
+block_less/basics[0]/output/line[3]="3,0,0,0"
+block_less/basics[0]/output/line[4]="4,0,0,0"
+block_less/basics[0]/output/line[5]="5,0,0,0"
+block_less/basics[0]/output/line[6]="6,0,0,0"
+block_less/basics[0]/output/line[7]="7,0,0,0"
+block_less/basics[0]/output/line[8]="8,0,0,0"
+block_less/basics[0]/output/line[9]="9,0,0,0"
+block_less/basics[0]/status=0
+block_less/basics[1]/output/line[0]="3,0,3,0"
+block_less/basics[1]/output/line[1]="4,0,3,0"
+block_less/basics[1]/output/line[2]="5,0,3,0"
+block_less/basics[1]/output/line[3]="6,0,3,0"
+block_less/basics[1]/output/line[4]="7,0,3,0"
+block_less/basics[1]/output/line[5]="8,0,3,0"
+block_less/basics[1]/output/line[6]="9,0,3,0"
+block_less/basics[1]/status=0
+block_less/basics[2]/output="9,0,9,0"
+block_less/basics[2]/status=0
+block_less/basics[3]/output=""
+block_less/basics[3]/status=0
+block_less/basics[4]/output/line[0]="0,0,0,0"
+block_less/basics[4]/output/line[1]="1,0,0,0"
+block_less/basics[4]/output/line[2]="2,0,0,0"
+block_less/basics[4]/output/line[3]="3,0,0,0"
+block_less/basics[4]/output/line[4]="4,0,0,0"
+block_less/basics[4]/output/line[5]="5,0,0,0"
+block_less/basics[4]/output/line[6]="6,0,6,0"
+block_less/basics[4]/output/line[7]="7,0,6,0"
+block_less/basics[4]/output/line[8]="8,0,6,0"
+block_less/basics[4]/output/line[9]="9,0,6,0"
+block_less/basics[4]/status=0
+block_less/basics[5]/output/line[0]="3,0,3,0"
+block_less/basics[5]/output/line[1]="4,0,3,0"
+block_less/basics[5]/output/line[2]="5,0,3,0"
+block_less/basics[5]/output/line[3]="6,0,6,0"
+block_less/basics[5]/output/line[4]="7,0,6,0"
+block_less/basics[5]/output/line[5]="8,0,6,0"
+block_less/basics[5]/output/line[6]="9,0,6,0"
+block_less/basics[5]/status=0
+block_less/basics[6]/output/line[0]="3,0,3,0"
+block_less/basics[6]/output/line[1]="4,0,3,0"
+block_less/basics[6]/output/line[2]="5,0,3,0"
+block_less/basics[6]/output/line[3]="6,0,3,0"
+block_less/basics[6]/output/line[4]="7,0,3,0"
+block_less/basics[6]/output/line[5]="8,0,3,0"
+block_less/basics[6]/output/line[6]="9,0,9,0"
+block_less/basics[6]/status=0
+block_less/basics[7]/output/line[0]="3,0,3,0"
+block_less/basics[7]/output/line[1]="4,0,3,0"
+block_less/basics[7]/output/line[2]="5,0,3,0"
+block_less/basics[7]/output/line[3]="6,0,3,0"
+block_less/basics[7]/output/line[4]="7,0,3,0"
+block_less/basics[7]/output/line[5]="8,0,3,0"
+block_less/basics[7]/output/line[6]="9,0,3,0"
+block_less/basics[7]/status=0
diff --git a/csv/test/csv-join/block_less/input b/csv/test/csv-join/block_less/input
new file mode 100644
index 000000000..1cdbff01b
--- /dev/null
+++ b/csv/test/csv-join/block_less/input
@@ -0,0 +1,8 @@
+block_less/basics[0]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 0,0 )';fields=block,id' --block-less"
+block_less/basics[1]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 3,0 )';fields=block,id' --block-less"
+block_less/basics[2]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 9,0 )';fields=block,id' --block-less"
+block_less/basics[3]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 10,0 )';fields=block,id' --block-less"
+block_less/basics[4]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 0,0; echo 6,0 )';fields=block,id' --block-less"
+block_less/basics[5]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 3,0; echo 6,0 )';fields=block,id' --block-less"
+block_less/basics[6]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 3,0; echo 9,0 )';fields=block,id' --block-less"
+block_less/basics[7]="csv-paste line-number value=0 | head | csv-join --fields block,id <( echo 3,0; echo 10,0 )';fields=block,id' --block-less"
\ No newline at end of file
diff --git a/csv/test/csv-join/drop-id/expected b/csv/test/csv-join/drop-id/expected
new file mode 100644
index 000000000..5a8109c1a
--- /dev/null
+++ b/csv/test/csv-join/drop-id/expected
@@ -0,0 +1,16 @@
+drop_id/ascii[0]/output="0,1,2,3,A,B,C"
+drop_id/ascii[1]/output="0,1,2,3,A,B,C"
+drop_id/ascii[2]/output="0,1,2,3,A,B,C"
+drop_id/ascii[3]/output="0,1,2,3,A,B,C"
+drop_id/ascii[4]/output="0,1,2,3,A,B"
+drop_id/ascii[5]/output="0,1,2,3,A,B"
+drop_id/ascii[6]/output/line[0]="a,1,b,3,A,B"
+drop_id/ascii[6]/output/line[1]="c,1,d,3,A,B"
+
+drop_id/binary[0]/output="0,1,2,3,111,222,333"
+drop_id/binary[1]/output="0,1,2,3,111,222"
+drop_id/binary[2]/output="0,1,2,3,111,222"
+drop_id/binary[3]/output="0,1,2,3,111,222"
+drop_id/binary[4]/output="0,1,2,3,111,222"
+drop_id/binary[5]/output/line[0]="111,1,222,3,111,222"
+drop_id/binary[5]/output/line[1]="333,1,444,3,111,222"
diff --git a/csv/test/csv-join/drop-id/input b/csv/test/csv-join/drop-id/input
new file mode 100644
index 000000000..864b7d21c
--- /dev/null
+++ b/csv/test/csv-join/drop-id/input
@@ -0,0 +1,14 @@
+drop_id/ascii[0]="echo 0,1,2,3 | csv-join --drop-id --fields ,x <( echo 1,A,B,C )';fields=x'"
+drop_id/ascii[1]="echo 0,1,2,3 | csv-join --drop-id --fields ,x <( echo 1,A,B,C )';fields=x,,,'"
+drop_id/ascii[2]="echo 0,1,2,3 | csv-join --drop-id --fields ,x <( echo A,1,B,C )';fields=,x'"
+drop_id/ascii[3]="echo 0,1,2,3 | csv-join --drop-id --fields ,,,x <( echo A,B,C,3 )';fields=,,,x'"
+drop_id/ascii[4]="echo 0,1,2,3 | csv-join --drop-id --fields ,x,,y <( echo 1,A,B,3 )';fields=x,,,y'"
+drop_id/ascii[5]="echo 0,1,2,3 | csv-join --drop-id --fields ,x,,y <( echo 3,A,B,1 )';fields=y,,,x'"
+drop_id/ascii[6]="( echo a,1,b,3; echo c,1,d,3 ) | csv-join --drop-id --fields ,x,,y <( echo 3,A,B,1 )';fields=y,,,x'"
+
+drop_id/binary[0]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x --binary=4ui <( echo 1,111,222,333 | csv-to-bin ui,d,ui,d )';fields=x;binary=ui,d,ui,d' | csv-from-bin 4ui,d,ui,d"
+drop_id/binary[1]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 1,111,222,3 | csv-to-bin ui,d,ui,ul )';fields=x,,,y;binary=ui,d,ui,ul' | csv-from-bin 4ui,d,ui"
+drop_id/binary[2]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 1,111,3,222 | csv-to-bin ui,d,ui,ul )';fields=x,,y,;binary=ui,d,ui,ul' | csv-from-bin 4ui,d,ul"
+drop_id/binary[3]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 3,111,1,222 | csv-to-bin ui,d,ui,ul )';fields=y,,x,;binary=ui,d,ui,ul' | csv-from-bin 4ui,d,ul"
+drop_id/binary[4]="echo 0,1,2,3 | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 111,3,1,222 | csv-to-bin ui,d,ui,ul )';fields=,y,x,;binary=ui,d,ui,ul' | csv-from-bin 4ui,ui,ul"
+drop_id/binary[5]="( echo 111,1,222,3; echo 333,1,444,3 ) | csv-to-bin 4ui | csv-join --drop-id --fields ,x,,y --binary=4ui <( echo 111,3,1,222 | csv-to-bin ui,d,ui,ul )';fields=,y,x,;binary=ui,d,ui,ul' | csv-from-bin 4ui,ui,ul"
diff --git a/csv/test/csv-paste/expected b/csv/test/csv-paste/expected
index ad48b2ffa..dce417c7f 100644
--- a/csv/test/csv-paste/expected
+++ b/csv/test/csv-paste/expected
@@ -47,3 +47,174 @@ line_number/multiple[1]/output="0,0;0,0;0,0;0,0;0,0;0,1;1,1;1,1;1,1;1,1;"
 line_number/multiple[1]/status=0
 line_number/multiple[2]/output="0,0;0,1;0,2;0,3;0,4;1,0;1,1;1,2;1,3;1,4;"
 line_number/multiple[2]/status=0
+
+line_number/binary[0]/output/line[0]="0"
+line_number/binary[0]/output/line[1]="1"
+line_number/binary[0]/output/line[2]="2"
+line_number/binary[0]/output/line[3]="3"
+line_number/binary[0]/status=0
+
+block_size/ascii[0]/output/line[0]="a,0"
+block_size/ascii[0]/output/line[1]="a,0"
+block_size/ascii[0]/output/line[2]="a,1"
+block_size/ascii[0]/output/line[3]="a,1"
+block_size/ascii[0]/output/line[4]="b,2"
+block_size/ascii[0]/output/line[5]="b,2"
+block_size/ascii[0]/output/line[6]="b,3"
+block_size/ascii[0]/output/line[7]="b,3"
+block_size/ascii[0]/status=0
+
+block_size/binary[0]/output/line[0]="0,0"
+block_size/binary[0]/output/line[1]="0,0"
+block_size/binary[0]/output/line[2]="0,1"
+block_size/binary[0]/output/line[3]="0,1"
+block_size/binary[0]/output/line[4]="1,2"
+block_size/binary[0]/output/line[5]="1,2"
+block_size/binary[0]/output/line[6]="1,3"
+block_size/binary[0]/output/line[7]="1,3"
+block_size/binary[0]/status=0
+
+line_number/step[0]/output/line[0]="0"
+line_number/step[0]/output/line[1]="2"
+line_number/step[0]/output/line[2]="4"
+line_number/step[0]/output/line[3]="6"
+line_number/step[0]/status=0
+line_number/step[1]/output/line[0]="0"
+line_number/step[1]/output/line[1]="2"
+line_number/step[1]/output/line[2]="4"
+line_number/step[1]/output/line[3]="6"
+line_number/step[1]/status=0
+line_number/step[2]/output/line[0]="0"
+line_number/step[2]/output/line[1]="2"
+line_number/step[2]/output/line[2]="4"
+line_number/step[2]/output/line[3]="6"
+line_number/step[2]/status=0
+line_number/step[3]/output/line[0]="0"
+line_number/step[3]/output/line[1]="0"
+line_number/step[3]/output/line[2]="0"
+line_number/step[3]/output/line[3]="0"
+line_number/step[3]/output/line[4]="0"
+line_number/step[3]/output/line[5]="2"
+line_number/step[3]/output/line[6]="2"
+line_number/step[3]/output/line[7]="2"
+line_number/step[3]/output/line[8]="2"
+line_number/step[3]/output/line[9]="2"
+line_number/step[3]/status=0
+line_number/step[4]/output/line[0]="0"
+line_number/step[4]/output/line[1]="2"
+line_number/step[4]/output/line[2]="4"
+line_number/step[4]/output/line[3]="6"
+line_number/step[4]/output/line[4]="8"
+line_number/step[4]/output/line[5]="0"
+line_number/step[4]/output/line[6]="2"
+line_number/step[4]/output/line[7]="4"
+line_number/step[4]/output/line[8]="6"
+line_number/step[4]/output/line[9]="8"
+line_number/step[4]/status=0
+line_number/step[5]/output/line[0]="8"
+line_number/step[5]/output/line[1]="6"
+line_number/step[5]/output/line[2]="4"
+line_number/step[5]/output/line[3]="2"
+line_number/step[5]/output/line[4]="0"
+line_number/step[5]/output/line[5]="8"
+line_number/step[5]/output/line[6]="6"
+line_number/step[5]/output/line[7]="4"
+line_number/step[5]/output/line[8]="2"
+line_number/step[5]/output/line[9]="0"
+line_number/step[5]/status=0
+line_number/step[6]/output/line[0]="20"
+line_number/step[6]/output/line[1]="18"
+line_number/step[6]/output/line[2]="16"
+line_number/step[6]/output/line[3]="14"
+line_number/step[6]/output/line[4]="12"
+line_number/step[6]/output/line[5]="20"
+line_number/step[6]/output/line[6]="18"
+line_number/step[6]/output/line[7]="16"
+line_number/step[6]/output/line[8]="14"
+line_number/step[6]/output/line[9]="12"
+line_number/step[6]/status=0
+line_number/step[7]/status=1
+
+head[0]/output=""
+head[0]/status=0
+head[1]/output="0"
+head[1]/status=0
+head[2]/output/line[0]="0"
+head[2]/output/line[1]="1"
+head[2]/status=0
+
+line_number/shape[0]/output/line[0]="0,0"
+line_number/shape[0]/output/line[1]="0,1"
+line_number/shape[0]/output/line[2]="0,2"
+line_number/shape[0]/output/line[3]="1,0"
+line_number/shape[0]/output/line[4]="1,1"
+line_number/shape[0]/output/line[5]="1,2"
+line_number/shape[0]/output/line[6]="0,0"
+line_number/shape[0]/output/line[7]="0,1"
+line_number/shape[0]/output/line[8]="0,2"
+line_number/shape[0]/output/line[9]="1,0"
+line_number/shape[0]/output/line[10]="1,1"
+line_number/shape[0]/output/line[11]="1,2"
+line_number/shape[0]/status=0
+
+line_number/shape[1]/output/line[0]="0,0"
+line_number/shape[1]/output/line[1]="0,1"
+line_number/shape[1]/output/line[2]="0,2"
+line_number/shape[1]/output/line[3]="1,0"
+line_number/shape[1]/output/line[4]="1,1"
+line_number/shape[1]/output/line[5]="1,2"
+line_number/shape[1]/output/line[6]="0,0"
+line_number/shape[1]/output/line[7]="0,1"
+line_number/shape[1]/output/line[8]="0,2"
+line_number/shape[1]/output/line[9]="1,0"
+line_number/shape[1]/output/line[10]="1,1"
+line_number/shape[1]/output/line[11]="1,2"
+line_number/shape[1]/status=0
+
+line_number/repeat[0]/output/line[0]="0"
+line_number/repeat[0]/output/line[1]="1"
+line_number/repeat[0]/output/line[2]="2"
+line_number/repeat[0]/status=0
+line_number/repeat[1]/output/line[0]="0"
+line_number/repeat[1]/output/line[1]="1"
+line_number/repeat[1]/output/line[2]="2"
+line_number/repeat[1]/status=0
+line_number/repeat[3]/output/line[0]="0"
+line_number/repeat[3]/output/line[1]="0"
+line_number/repeat[3]/output/line[2]="1"
+line_number/repeat[3]/output/line[3]="1"
+line_number/repeat[3]/status=0
+line_number/repeat[4]/output/line[0]="0"
+line_number/repeat[4]/output/line[1]="0"
+line_number/repeat[4]/output/line[2]="1"
+line_number/repeat[4]/output/line[3]="1"
+line_number/repeat[4]/output/line[4]="2"
+line_number/repeat[4]/output/line[5]="2"
+line_number/repeat[4]/status=0
+line_number/repeat[5]/output/line[0]="0"
+line_number/repeat[5]/output/line[1]="1"
+line_number/repeat[5]/output/line[2]="0"
+line_number/repeat[5]/output/line[3]="1"
+line_number/repeat[5]/output/line[4]="0"
+line_number/repeat[5]/output/line[5]="1"
+line_number/repeat[5]/status=0
+line_number/repeat[6]/output/line[0]="1"
+line_number/repeat[6]/output/line[1]="0"
+line_number/repeat[6]/output/line[2]="1"
+line_number/repeat[6]/output/line[3]="0"
+line_number/repeat[6]/output/line[4]="1"
+line_number/repeat[6]/output/line[5]="0"
+line_number/repeat[6]/status=0
+line_number/repeat[7]/output/line[0]="0,0"
+line_number/repeat[7]/output/line[1]="0,1"
+line_number/repeat[7]/output/line[2]="0,2"
+line_number/repeat[7]/output/line[3]="1,0"
+line_number/repeat[7]/output/line[4]="1,1"
+line_number/repeat[7]/output/line[5]="1,2"
+line_number/repeat[7]/output/line[6]="0,0"
+line_number/repeat[7]/output/line[7]="0,1"
+line_number/repeat[7]/output/line[8]="0,2"
+line_number/repeat[7]/output/line[9]="1,0"
+line_number/repeat[7]/output/line[10]="1,1"
+line_number/repeat[7]/output/line[11]="1,2"
+line_number/repeat[7]/status=0
diff --git a/csv/test/csv-paste/input b/csv/test/csv-paste/input
index fb5037a14..fa3d03564 100644
--- a/csv/test/csv-paste/input
+++ b/csv/test/csv-paste/input
@@ -12,15 +12,44 @@ line_number/command_line_options[6]="csv-paste line-number --size 5 --index --re
 line_number/command_line_options[7]="csv-paste line-number --size 5 --index --reverse --begin 3 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
 
 line_number/parametrized[0]="csv-paste 'line-number;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[1]="csv-paste 'line-number;size=5' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[2]="csv-paste 'line-number;size=5;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[3]="csv-paste 'line-number;size=5;index' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[4]="csv-paste 'line-number;size=5;index;reverse' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[5]="csv-paste 'line-number;size=5;index;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[6]="csv-paste 'line-number;size=5;index;reverse;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[7]="csv-paste 'line-number;size=5;index;reverse;begin=10' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/parametrized[8]="csv-paste 'line-number;size=5;index;reverse;begin=3' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[1]="csv-paste 'line-number;block-size=5' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[2]="csv-paste 'line-number;block-size=5;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[3]="csv-paste 'line-number;block-size=5;index' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[4]="csv-paste 'line-number;block-size=5;index;reverse' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[5]="csv-paste 'line-number;block-size=5;index;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[6]="csv-paste 'line-number;block-size=5;index;reverse;begin=4' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[7]="csv-paste 'line-number;block-size=5;index;reverse;begin=10' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/parametrized[8]="csv-paste 'line-number;block-size=5;index;reverse;begin=3' | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
 
 line_number/multiple[0]="csv-paste line-number 'line-number;begin=4' --begin=5 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/multiple[1]="csv-paste line-number 'line-number;size=5' --size=6 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
-line_number/multiple[2]="csv-paste line-number 'line-number;index' --size=5 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/multiple[1]="csv-paste line-number 'line-number;block-size=5' --block-size=6 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+line_number/multiple[2]="csv-paste line-number 'line-number;index' --block-size=5 | head | tr '\\n' ';'; comma_status_ok && exit 0 || exit 1"
+
+line_number/binary[0]="csv-paste 'line-number;binary=ui' | csv-from-bin ui | head -n4; comma_status_ok && exit 0 || exit 1"
+
+block_size/ascii[0]="csv-paste <( echo a; echo b )';block-size=4' <( echo 0; echo 1; echo 2; echo 3 )';block-size=2'"
+block_size/binary[0]="csv-paste <( { echo 0; echo 1; } | csv-to-bin ui )';size=4;block-size=4' <( { echo 0; echo 1; echo 2; echo 3; } | csv-to-bin ui )';size=4;block-size=2' | csv-from-bin 2ui"
+
+line_number/step[0]="csv-paste line-number --step 2 | head -n4; comma_status_ok && exit 0 || exit 1"
+line_number/step[1]="csv-paste "line-number;step=2" | head -n4; comma_status_ok && exit 0 || exit 1"
+line_number/step[2]="csv-paste "line-number;step=2" --step 3 | head -n4; comma_status_ok && exit 0 || exit 1"
+line_number/step[3]="csv-paste "line-number;block-size=5;step=2" | head; comma_status_ok && exit 0 || exit 1"
+line_number/step[4]="csv-paste "line-number;block-size=5;index;step=2" | head; comma_status_ok && exit 0 || exit 1"
+line_number/step[5]="csv-paste "line-number;block-size=5;index;reverse;step=2" | head; comma_status_ok && exit 0 || exit 1"
+line_number/step[6]="csv-paste "line-number;block-size=5;index;reverse;begin=20;step=2" | head; comma_status_ok && exit 0 || exit 1"
+line_number/step[7]="csv-paste "line-number;block-size=5;index;reverse;begin=4;step=2" | head; comma_status_ok && exit 0 || exit 1"
+
+head[0]="csv-paste 'line-number;size=10;index' --head=0"
+head[1]="csv-paste 'line-number;size=10;index' --head=1"
+head[2]="csv-paste 'line-number;size=10;index' --head=2"
+
+line_number/shape[0]="csv-paste 'line-number;shape=2,3' --head=12"
+line_number/shape[1]="csv-paste 'line-number;shape=2,3;binary=2ui' --head=12 | csv-from-bin 2ui"
+
+line_number/repeat[0]="csv-paste 'line-number' --repeat=3"
+line_number/repeat[1]="csv-paste 'line-number;repeat=3'"
+line_number/repeat[3]="csv-paste 'line-number;size=2' --repeat=2"
+line_number/repeat[4]="csv-paste 'line-number;size=2;repeat=3'"
+line_number/repeat[5]="csv-paste 'line-number;size=2;index;repeat=3'"
+line_number/repeat[6]="csv-paste 'line-number;size=2;index;reverse;repeat=3'"
+line_number/repeat[7]="csv-paste 'line-number;shape=2,3;repeat=2'"
diff --git a/csv/test/csv-repeat/append/all/expected b/csv/test/csv-repeat/append/all/expected
index 1f5958aeb..607742fc2 100644
--- a/csv/test/csv-repeat/append/all/expected
+++ b/csv/test/csv-repeat/append/all/expected
@@ -1,67 +1,89 @@
 ascii[0]/data=123
 ascii[0]/repeating=0
 ascii[0]/time=ascii[0]/timestamp +/- 0.01
+ascii[0]/count=0
 ascii[1]/data=456
 ascii[1]/repeating=0
 ascii[1]/time=ascii[1]/timestamp +/- 0.01
+ascii[1]/count=0
 ascii[2]/data=789
 ascii[2]/repeating=0
 ascii[2]/time=ascii[2]/timestamp +/- 0.01
+ascii[2]/count=0
 ascii[3]/data=789
 ascii[3]/repeating=1
 ascii[3]/time=ascii[3]/timestamp +/- 0.01
+ascii[3]/count=1
 ascii[4]/data=789
 ascii[4]/repeating=1
 ascii[4]/time=ascii[4]/timestamp +/- 0.01
+ascii[4]/count=2
 ascii[5]/data=789
 ascii[5]/repeating=1
 ascii[5]/time=ascii[5]/timestamp +/- 0.01
+ascii[5]/count=3
 ascii[6]/data=123
 ascii[6]/repeating=0
 ascii[6]/time=ascii[6]/timestamp +/- 0.01
+ascii[6]/count=0
 ascii[7]/data=456
 ascii[7]/repeating=0
 ascii[7]/time=ascii[7]/timestamp +/- 0.01
+ascii[7]/count=0
 ascii[8]/data=456
 ascii[8]/repeating=1
 ascii[8]/time=ascii[8]/timestamp +/- 0.01
+ascii[8]/count=1
 ascii[9]/data=456
 ascii[9]/repeating=1
 ascii[9]/time=ascii[9]/timestamp +/- 0.01
+ascii[9]/count=2
 ascii[10]/data=456
 ascii[10]/repeating=1
 ascii[10]/time=ascii[10]/timestamp +/- 0.01
+ascii[10]/count=3
 
 binary[0]/data=123
 binary[0]/repeating=0
 binary[0]/time=binary[0]/timestamp +/- 0.01
+binary[0]/count=0
 binary[1]/data=456
 binary[1]/repeating=0
 binary[1]/time=binary[1]/timestamp +/- 0.01
+binary[1]/count=0
 binary[2]/data=789
 binary[2]/repeating=0
 binary[2]/time=binary[2]/timestamp +/- 0.01
+binary[2]/count=0
 binary[3]/data=789
 binary[3]/repeating=1
 binary[3]/time=binary[3]/timestamp +/- 0.01
+binary[3]/count=1
 binary[4]/data=789
 binary[4]/repeating=1
 binary[4]/time=binary[4]/timestamp +/- 0.01
+binary[4]/count=2
 binary[5]/data=789
 binary[5]/repeating=1
 binary[5]/time=binary[5]/timestamp +/- 0.01
+binary[5]/count=3
 binary[6]/data=123
 binary[6]/repeating=0
 binary[6]/time=binary[6]/timestamp +/- 0.01
+binary[6]/count=0
 binary[7]/data=456
 binary[7]/repeating=0
 binary[7]/time=binary[7]/timestamp +/- 0.01
+binary[7]/count=0
 binary[8]/data=456
 binary[8]/repeating=1
 binary[8]/time=binary[8]/timestamp +/- 0.01
+binary[8]/count=1
 binary[9]/data=456
 binary[9]/repeating=1
 binary[9]/time=binary[9]/timestamp +/- 0.01
+binary[9]/count=2
 binary[10]/data=456
 binary[10]/repeating=1
 binary[10]/time=binary[10]/timestamp +/- 0.01
+binary[10]/count=3
diff --git a/csv/test/csv-repeat/append/all/input b/csv/test/csv-repeat/append/all/input
index a39a3c325..68fb9eadb 100644
--- a/csv/test/csv-repeat/append/all/input
+++ b/csv/test/csv-repeat/append/all/input
@@ -1,11 +1,11 @@
 timeout=0.3
 period=0.1
-append="repeating,time"
+append="repeating,time,count"
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.55
-123,0.01
-456,0.55
-"
+0.20,123
+0.01,456
+0.01,789
+0.55,123
+0.01,456
+0.55,999"
diff --git a/csv/test/csv-repeat/append/count/expected b/csv/test/csv-repeat/append/count/expected
new file mode 100644
index 000000000..35c6c3704
--- /dev/null
+++ b/csv/test/csv-repeat/append/count/expected
@@ -0,0 +1,45 @@
+ascii[0]/data=123
+ascii[0]/count=0
+ascii[1]/data=456
+ascii[1]/count=0
+ascii[2]/data=789
+ascii[2]/count=0
+ascii[3]/data=789
+ascii[3]/count=1
+ascii[4]/data=789
+ascii[4]/count=2
+ascii[5]/data=789
+ascii[5]/count=3
+ascii[6]/data=123
+ascii[6]/count=0
+ascii[7]/data=456
+ascii[7]/count=0
+ascii[8]/data=456
+ascii[8]/count=1
+ascii[9]/data=456
+ascii[9]/count=2
+ascii[10]/data=456
+ascii[10]/count=3
+
+binary[0]/data=123
+binary[0]/count=0
+binary[1]/data=456
+binary[1]/count=0
+binary[2]/data=789
+binary[2]/count=0
+binary[3]/data=789
+binary[3]/count=1
+binary[4]/data=789
+binary[4]/count=2
+binary[5]/data=789
+binary[5]/count=3
+binary[6]/data=123
+binary[6]/count=0
+binary[7]/data=456
+binary[7]/count=0
+binary[8]/data=456
+binary[8]/count=1
+binary[9]/data=456
+binary[9]/count=2
+binary[10]/data=456
+binary[10]/count=3
diff --git a/csv/test/csv-repeat/append/count/input b/csv/test/csv-repeat/append/count/input
new file mode 100644
index 000000000..35be3cee9
--- /dev/null
+++ b/csv/test/csv-repeat/append/count/input
@@ -0,0 +1,12 @@
+timeout=0.3
+period=0.1
+append="count"
+format=ui
+data="
+0.20,123
+0.01,456
+0.01,789
+0.55,123
+0.01,456
+0.55,999
+"
diff --git a/csv/test/csv-repeat/append/repeating/input b/csv/test/csv-repeat/append/repeating/input
index 49ada6517..ff35214a0 100644
--- a/csv/test/csv-repeat/append/repeating/input
+++ b/csv/test/csv-repeat/append/repeating/input
@@ -3,9 +3,10 @@ period=0.1
 append="repeating"
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.55
-123,0.01
-456,0.55
+0.20,123
+0.01,456
+0.01,789
+0.55,123
+0.01,456
+0.55,999
 "
diff --git a/csv/test/csv-repeat/append/time/input b/csv/test/csv-repeat/append/time/input
index 4710d985e..f301085f3 100644
--- a/csv/test/csv-repeat/append/time/input
+++ b/csv/test/csv-repeat/append/time/input
@@ -3,9 +3,9 @@ period=0.1
 append="time"
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.55
-123,0.01
-456,0.55
-"
+0.20,123
+0.01,456
+0.01,789
+0.55,123
+0.01,456
+0.55,999"
diff --git a/csv/test/csv-repeat/period/expected b/csv/test/csv-repeat/period/expected
index a233be089..2a51778fd 100644
--- a/csv/test/csv-repeat/period/expected
+++ b/csv/test/csv-repeat/period/expected
@@ -1,37 +1,49 @@
-ascii[0]/timestamp=0.00 +/- 0.03
+ascii[0]/timestamp=0 +/- 0.1
 ascii[0]/data=123
-ascii[1]/timestamp=0.01 +/- 0.03
+ascii[1]/timestamp=1 +/- 0.1
 ascii[1]/data=456
-ascii[2]/timestamp=0.02 +/- 0.03
+ascii[2]/timestamp=2 +/- 0.1
 ascii[2]/data=789
-ascii[3]/timestamp=0.32 +/- 0.03
+ascii[3]/timestamp=5 +/- 0.1
 ascii[3]/data=789
-ascii[4]/timestamp=0.42 +/- 0.03
+ascii[4]/timestamp=7 +/- 0.1
 ascii[4]/data=789
-ascii[5]/timestamp=0.50 +/- 0.03
+ascii[5]/timestamp=8 +/- 0.1
 ascii[5]/data=123
-ascii[6]/timestamp=0.51 +/- 0.03
+ascii[6]/timestamp=9 +/- 0.1
 ascii[6]/data=456
-ascii[7]/timestamp=0.81 +/- 0.03
+ascii[7]/timestamp=12 +/- 0.1
 ascii[7]/data=456
-ascii[8]/timestamp=0.91 +/- 0.03
+ascii[8]/timestamp=14 +/- 0.1
 ascii[8]/data=456
+ascii[9]/timestamp=16 +/- 0.1
+ascii[9]/data=456
+ascii[10]/timestamp=18 +/- 0.1
+ascii[10]/data=456
+ascii[11]/timestamp=19 +/- 0.1
+ascii[11]/data=999
 
-binary[0]/timestamp=0.00 +/- 0.03
+binary[0]/timestamp=0 +/- 0.1
 binary[0]/data=123
-binary[1]/timestamp=0.01 +/- 0.03
+binary[1]/timestamp=1 +/- 0.1
 binary[1]/data=456
-binary[2]/timestamp=0.02 +/- 0.03
+binary[2]/timestamp=2 +/- 0.1
 binary[2]/data=789
-binary[3]/timestamp=0.32 +/- 0.03
+binary[3]/timestamp=5 +/- 0.1
 binary[3]/data=789
-binary[4]/timestamp=0.42 +/- 0.03
+binary[4]/timestamp=7 +/- 0.1
 binary[4]/data=789
-binary[5]/timestamp=0.50 +/- 0.03
+binary[5]/timestamp=8 +/- 0.1
 binary[5]/data=123
-binary[6]/timestamp=0.51 +/- 0.03
+binary[6]/timestamp=9 +/- 0.1
 binary[6]/data=456
-binary[7]/timestamp=0.81 +/- 0.03
+binary[7]/timestamp=12 +/- 0.1
 binary[7]/data=456
-binary[8]/timestamp=0.91 +/- 0.03
+binary[8]/timestamp=14 +/- 0.1
 binary[8]/data=456
+binary[9]/timestamp=16 +/- 0.1
+binary[9]/data=456
+binary[10]/timestamp=18 +/- 0.1
+binary[10]/data=456
+binary[11]/timestamp=19 +/- 0.1
+binary[11]/data=999
diff --git a/csv/test/csv-repeat/period/input b/csv/test/csv-repeat/period/input
index 82f37d0f4..9919c34f2 100644
--- a/csv/test/csv-repeat/period/input
+++ b/csv/test/csv-repeat/period/input
@@ -1,10 +1,10 @@
-timeout=0.3
-period=0.1
+timeout=3
+period=2
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.48
-123,0.01
-456,0.49
-"
+0,123
+1,456
+1,789
+6,123
+1,456
+10,999"
diff --git a/csv/test/csv-repeat/test b/csv/test/csv-repeat/test
index 3f960c7ab..5976114e2 100755
--- a/csv/test/csv-repeat/test
+++ b/csv/test/csv-repeat/test
@@ -14,24 +14,24 @@ time_fields=t,$( csv-fields clear --except time <<< $output_fields )
 
 for mode in ascii binary; do
 
-    now=$( echo "1" | csv-time-stamp | csv-shuffle --fields=t, --output-fields=t | csv-time --to seconds )
+    csv_eval_expr="t-=init_t"
+    [[ $append =~ time ]] && csv_eval_expr+="; time-=init_t"
 
-    csv_eval_expr="t-=$now"
-    [[ $append =~ time ]] && csv_eval_expr+="; time-=$now"
-
-    while IFS=, read data pause; do
-        echo $data
+    while IFS=, read pause data; do
         sleep $pause
+        echo $data
     done <<< "$data" \
         | if [[ $mode == "binary" ]]; then
               csv-to-bin $format --flush \
                   | csv-repeat --timeout=$timeout $period_option $append_option --binary=$format \
-                  | csv-from-bin $output_format --flush
+                  | csv-time-stamp --binary $output_format \
+                  | csv-from-bin t,$output_format --flush
           else
-              csv-repeat --timeout=$timeout $period_option $append_option
+              csv-repeat --timeout=$timeout $period_option $append_option | csv-time-stamp
           fi \
-        | csv-time-stamp | csv-time --fields $time_fields --to seconds \
-        | csv-eval --fields=$time_fields "$csv_eval_expr" --flush \
+        | csv-time --fields $time_fields --to seconds \
+        | gawk 'BEGIN { FS="," } { if( init_t == 0 ) init_t=$1; print $0,init_t }' OFS=, \
+        | csv-eval --fields=$time_fields,init_t "$csv_eval_expr" --flush \
         | name-value-from-csv --fields=timestamp,$output_fields --line-number --prefix=$mode \
         | csv-quote -d = --unquote
 
diff --git a/csv/test/csv-repeat/timeout/input b/csv/test/csv-repeat/timeout/input
index 67127068f..197070675 100644
--- a/csv/test/csv-repeat/timeout/input
+++ b/csv/test/csv-repeat/timeout/input
@@ -1,9 +1,9 @@
 timeout=0.3
 format=ui
 data="
-123,0.01
-456,0.01
-789,0.48
-123,0.01
-456,0.49
-"
+0.20,123
+0.01,456
+0.01,789
+0.48,123
+0.01,456
+0.49,999"
diff --git a/csv/test/csv-repeat/timestamped/expected b/csv/test/csv-repeat/timestamped/expected
new file mode 100644
index 000000000..3e01a4129
--- /dev/null
+++ b/csv/test/csv-repeat/timestamped/expected
@@ -0,0 +1,53 @@
+timestamped[0]/output/line[0]="20200101T000010,a"
+timestamped[0]/output/line[1]="20200101T000010,a,"
+timestamped[0]/output/line[2]="20200101T000010,a,"
+timestamped[0]/output/line[3]="20200101T000010,a,"
+timestamped[0]/output/line[4]="20200101T000010,a,"
+timestamped[0]/output/line[5]="20200101T000020,b"
+timestamped[0]/status=0
+timestamped[1]/output/line[0]="20200101T000010,a,20200101T000010,0"
+timestamped[1]/output/line[1]="20200101T000010,a,20200101T000013,1"
+timestamped[1]/output/line[2]="20200101T000010,a,20200101T000016,1"
+timestamped[1]/output/line[3]="20200101T000010,a,20200101T000019,1"
+timestamped[1]/output/line[4]="20200101T000010,a,20200101T000020,1"
+timestamped[1]/output/line[5]="20200101T000020,b,20200101T000020,0"
+timestamped[1]/status=0
+timestamped[2]/output/line[0]="20200101T000010,a,20200101T000000,1"
+timestamped[2]/output/line[1]="20200101T000010,a,20200101T000003,1"
+timestamped[2]/output/line[2]="20200101T000010,a,20200101T000006,1"
+timestamped[2]/output/line[3]="20200101T000010,a,20200101T000009,1"
+timestamped[2]/output/line[4]="20200101T000010,a,20200101T000010,1"
+timestamped[2]/output/line[5]="20200101T000010,a,20200101T000010,0"
+timestamped[2]/output/line[6]="20200101T000010,a,20200101T000013,1"
+timestamped[2]/output/line[7]="20200101T000010,a,20200101T000016,1"
+timestamped[2]/output/line[8]="20200101T000010,a,20200101T000019,1"
+timestamped[2]/output/line[9]="20200101T000010,a,20200101T000020,1"
+timestamped[2]/output/line[10]="20200101T000020,b,20200101T000020,0"
+timestamped[2]/status=0
+timestamped[3]/output/line[0]="20200101T000010,a,20200101T000010,0"
+timestamped[3]/output/line[1]="20200101T000010,a,20200101T000013,1"
+timestamped[3]/output/line[2]="20200101T000010,a,20200101T000016,1"
+timestamped[3]/output/line[3]="20200101T000010,a,20200101T000019,1"
+timestamped[3]/output/line[4]="20200101T000010,a,20200101T000020,1"
+timestamped[3]/output/line[5]="20200101T000020,b,20200101T000020,0"
+timestamped[3]/output/line[6]="20200101T000020,b,20200101T000023,1"
+timestamped[3]/output/line[7]="20200101T000020,b,20200101T000026,1"
+timestamped[3]/output/line[8]="20200101T000020,b,20200101T000029,1"
+timestamped[3]/output/line[9]="20200101T000020,b,20200101T000030,1"
+timestamped[3]/status=0
+timestamped[4]/output/line[0]="20200101T000010,a,20200101T000000,1"
+timestamped[4]/output/line[1]="20200101T000010,a,20200101T000003,1"
+timestamped[4]/output/line[2]="20200101T000010,a,20200101T000006,1"
+timestamped[4]/output/line[3]="20200101T000010,a,20200101T000009,1"
+timestamped[4]/output/line[4]="20200101T000010,a,20200101T000010,1"
+timestamped[4]/output/line[5]="20200101T000010,a,20200101T000010,0"
+timestamped[4]/output/line[6]="20200101T000010,a,20200101T000013,1"
+timestamped[4]/output/line[7]="20200101T000010,a,20200101T000016,1"
+timestamped[4]/output/line[8]="20200101T000010,a,20200101T000019,1"
+timestamped[4]/output/line[9]="20200101T000010,a,20200101T000020,1"
+timestamped[4]/output/line[10]="20200101T000020,b,20200101T000020,0"
+timestamped[4]/output/line[11]="20200101T000020,b,20200101T000023,1"
+timestamped[4]/output/line[12]="20200101T000020,b,20200101T000026,1"
+timestamped[4]/output/line[13]="20200101T000020,b,20200101T000029,1"
+timestamped[4]/output/line[14]="20200101T000020,b,20200101T000030,1"
+timestamped[4]/status=0
diff --git a/csv/test/csv-repeat/timestamped/input b/csv/test/csv-repeat/timestamped/input
new file mode 100644
index 000000000..fcbfd69cc
--- /dev/null
+++ b/csv/test/csv-repeat/timestamped/input
@@ -0,0 +1,5 @@
+timestamped[0]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3"
+timestamped[1]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3 --append time,repeating"
+timestamped[2]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3 --append time,repeating --from 20200101T000000"
+timestamped[3]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3 --append time,repeating --to 20200101T000030"
+timestamped[4]="( echo 20200101T000010,a; echo 20200101T000020,b ) | csv-repeat --timestamped --period 3 --append time,repeating --to 20200101T000030 --from 20200101T000000"
diff --git a/csv/test/csv-repeat/timestamped/test b/csv/test/csv-repeat/timestamped/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/csv/test/csv-repeat/timestamped/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands
diff --git a/csv/test/csv-seek/data.bin b/csv/test/csv-seek/data.bin
new file mode 100644
index 000000000..2c6aacdec
Binary files /dev/null and b/csv/test/csv-seek/data.bin differ
diff --git a/csv/test/csv-seek/expected b/csv/test/csv-seek/expected
new file mode 100644
index 000000000..f6c826eff
--- /dev/null
+++ b/csv/test/csv-seek/expected
@@ -0,0 +1,33 @@
+index/in_bounds_single_lookup[0]/output="6"
+index/in_bounds_single_lookup[0]/status=0
+index/in_bounds_multi_lookup[0]/output/line[0]="0"
+index/in_bounds_multi_lookup[0]/output/line[1]="3"
+index/in_bounds_multi_lookup[0]/output/line[2]="5"
+index/in_bounds_multi_lookup[0]/output/line[3]="9"
+index/in_bounds_multi_lookup[0]/status=0
+index/binary_input_stream[1]/output/line[0]="0"
+index/binary_input_stream[1]/output/line[1]="3"
+index/binary_input_stream[1]/output/line[2]="5"
+index/binary_input_stream[1]/output/line[3]="9"
+index/binary_input_stream[1]/status=0
+index/multi_input_stream[2]/output/line[0]="0"
+index/multi_input_stream[2]/output/line[1]="3"
+index/multi_input_stream[2]/output/line[2]="5"
+index/multi_input_stream[2]/status=0
+index/multi_input_stream_binary[3]/output/line[0]="0"
+index/multi_input_stream_binary[3]/output/line[1]="3"
+index/multi_input_stream_binary[3]/output/line[2]="5"
+index/multi_input_stream_binary[3]/status=0
+index/out_of_bounds[4]/output=""
+index/out_of_bounds[4]/status=1
+index/out_of_bounds_permissive[5]/output=""
+index/out_of_bounds_permissive[5]/status=0
+offset[1]/output/line[0]="0"
+offset[1]/output/line[1]="3"
+offset[1]/output/line[2]="5"
+offset[1]/output/line[3]="9"
+offset[1]/status=0
+offset[2]/output/line[0]="0"
+offset[2]/output/line[1]="3"
+offset[2]/output/line[2]="5"
+offset[2]/status=0
diff --git a/csv/test/csv-seek/input b/csv/test/csv-seek/input
new file mode 100644
index 000000000..f3e93fe6a
--- /dev/null
+++ b/csv/test/csv-seek/input
@@ -0,0 +1,9 @@
+index/in_bounds_single_lookup[0]="( echo 6 ) | csv-seek 'data.bin;binary=ui' | csv-from-bin ui"
+index/in_bounds_multi_lookup[0]="( echo 0; echo 3; echo 5; echo 9 ) | csv-seek 'data.bin;binary=ui' | csv-from-bin ui"
+index/binary_input_stream[1]="( echo 0; echo 3; echo 5; echo 9 ) | csv-to-bin ui | csv-seek --binary=ui \'data.bin;binary=ui\' | csv-from-bin ui"
+index/multi_input_stream[2]="( echo a,0; echo b,3; echo c,5 ) | csv-seek --fields ,index 'data.bin;binary=ui' | csv-from-bin ui"
+index/multi_input_stream_binary[3]="( echo 0,0; echo 1,3; echo 2,5 ) | csv-to-bin 2ui | csv-seek --fields ,index --binary=2ui 'data.bin;binary=ui' | csv-from-bin ui"
+index/out_of_bounds[4]="( echo 200; ) | csv-seek 'data.bin;binary=ui' >/dev/null"
+index/out_of_bounds_permissive[5]="( echo 200; ) | csv-seek --permissive 'data.bin;binary=ui' >/dev/null"
+offset[1]="( echo 0; echo 0.30; echo 0.5; echo 0.9 ) | csv-seek --fields ratio 'data.bin;binary=ui' | csv-from-bin ui"
+offset[2]="( echo 0,0; echo 1,0.3; echo 2,0.5  ) | csv-to-bin ui,f | csv-seek --fields ,ratio --binary=ui,f 'data.bin;binary=ui' | csv-from-bin ui"
diff --git a/csv/test/csv-shape/repeat/expected b/csv/test/csv-shape/repeat/expected
new file mode 100644
index 000000000..972463d6e
--- /dev/null
+++ b/csv/test/csv-shape/repeat/expected
@@ -0,0 +1,17 @@
+ascii/output/line[0]="hello"
+ascii/output/line[1]="hello"
+ascii/output/line[2]="hello"
+ascii/output/line[3]="world"
+ascii/output/line[4]="world"
+ascii/output/line[5]="world"
+ascii/status=0
+binary/output/line[0]="1"
+binary/output/line[1]="1"
+binary/output/line[2]="1"
+binary/output/line[3]="2"
+binary/output/line[4]="2"
+binary/output/line[5]="2"
+binary/output/line[6]="3"
+binary/output/line[7]="3"
+binary/output/line[8]="3"
+binary/status=0
diff --git a/csv/test/csv-shape/repeat/input b/csv/test/csv-shape/repeat/input
new file mode 100644
index 000000000..9d2e8c57c
--- /dev/null
+++ b/csv/test/csv-shape/repeat/input
@@ -0,0 +1,2 @@
+ascii="( echo hello; echo; echo world ) | csv-shape repeat --size 3"
+binary="( echo 1; echo 2; echo 3 ) | csv-to-bin ui | csv-shape repeat --size 3 --binary ui | csv-from-bin ui"
diff --git a/csv/test/csv-shape/sliding-window/expected b/csv/test/csv-shape/sliding-window/expected
new file mode 100644
index 000000000..ee9d13b2d
--- /dev/null
+++ b/csv/test/csv-shape/sliding-window/expected
@@ -0,0 +1,26 @@
+basics[0]/output="a b c d e f "
+basics[1]/output="a b b c c d d e e f "
+basics[2]/output="a b c b c d c d e d e f "
+basics[3]/output="a b c d b c d e c d e f "
+step[0]/output="a b c d c d e f "
+step[1]/output="a b c d e f g h "
+block[0]/output="0,a 1,b 2,c 3,d 4,e 5,f "
+block[1]/output="0,a 0,b 1,b 1,c 2,c 2,d 3,d 3,e 4,e 4,f "
+block[2]/output="0,a 0,b 0,c 1,b 1,c 1,d 2,c 2,d 2,e 3,d 3,e 3,f "
+block[3]/output="0,a 0,b 0,c 0,d 1,b 1,c 1,d 1,e 2,c 2,d 2,e 2,f "
+block[4]/output="0,a 0,b 0,c 0,d 1,c 1,d 1,e 1,f "
+incremental/basic[0]/output="a b c d e f "
+incremental/basic[1]/output="a a b b c c d d e e f "
+incremental/basic[2]/output="a a b a b c b c d c d e d e f "
+incremental/basic[3]/output="a a b a b c a b c d b c d e c d e f "
+incremental/basic[4]/output="a b a b c d c d e f "
+incremental/block[0]/output="0,a 1,b 2,c 3,d 4,e 5,f "
+incremental/block[1]/output="0,a 1,a 1,b 2,b 2,c 3,c 3,d 4,d 4,e 5,e 5,f "
+incremental/block[2]/output="0,a 1,a 1,b 2,a 2,b 2,c 3,b 3,c 3,d 4,c 4,d 4,e 5,d 5,e 5,f "
+incremental/block[3]/output="0,a 1,a 1,b 2,a 2,b 2,c 3,a 3,b 3,c 3,d 4,b 4,c 4,d 4,e 5,c 5,d 5,e 5,f "
+incremental/block[4]/output="0,a 0,b 1,a 1,b 1,c 1,d 2,c 2,d 2,e 2,f "
+binary[0]/output="a b c d e f "
+binary[1]/output="a b c d b c d e c d e f "
+binary[2]/output="0,a 0,b 0,c 0,d 1,b 1,c 1,d 1,e 2,c 2,d 2,e 2,f "
+binary[3]/output="a a b a b c a b c d b c d e c d e f "
+binary[4]/output="0,a 1,a 1,b 2,a 2,b 2,c 3,a 3,b 3,c 3,d 4,b 4,c 4,d 4,e 5,c 5,d 5,e 5,f "
diff --git a/csv/test/csv-shape/sliding-window/input b/csv/test/csv-shape/sliding-window/input
new file mode 100644
index 000000000..b75549129
--- /dev/null
+++ b/csv/test/csv-shape/sliding-window/input
@@ -0,0 +1,30 @@
+basics[0]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 1 | tr '\\n' ' '"
+basics[1]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 2 | tr '\\n' ' '"
+basics[2]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 3 | tr '\\n' ' '"
+basics[3]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 | tr '\\n' ' '"
+
+step[0]="echo a b c d e f g | tr ' ' '\\n' | csv-shape sliding-window --size 4 --step 2 | tr '\\n' ' '"
+step[1]="echo a b c d e f g h i | tr ' ' '\\n' | csv-shape sliding-window --size 4 --step 4 | tr '\\n' ' '"
+
+block[0]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 1 --block | tr '\\n' ' '"
+block[1]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 2 --block | tr '\\n' ' '"
+block[2]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 3 --block | tr '\\n' ' '"
+block[3]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --block | tr '\\n' ' '"
+block[4]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --block --step 2 | tr '\\n' ' '"
+
+incremental/basic[0]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 1 --incremental | tr '\\n' ' '"
+incremental/basic[1]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 2 --incremental | tr '\\n' ' '"
+incremental/basic[2]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 3 --incremental | tr '\\n' ' '"
+incremental/basic[3]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --incremental | tr '\\n' ' '"
+incremental/basic[4]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --incremental --step 2 | tr '\\n' ' '"
+incremental/block[0]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 1 --incremental --block | tr '\\n' ' '"
+incremental/block[1]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 2 --incremental --block | tr '\\n' ' '"
+incremental/block[2]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 3 --incremental --block | tr '\\n' ' '"
+incremental/block[3]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --incremental --block | tr '\\n' ' '"
+incremental/block[4]="echo a b c d e f | tr ' ' '\\n' | csv-shape sliding-window --size 4 --incremental --block --step 2 | tr '\\n' ' '"
+
+binary[0]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 1 | csv-from-bin c | tr '\\n' ' '"
+binary[1]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 4 | csv-from-bin c | tr '\\n' ' '"
+binary[2]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 4 --block | csv-from-bin ui,c | tr '\\n' ' '"
+binary[3]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 4 --incremental | csv-from-bin c | tr '\\n' ' '"
+binary[4]="echo a,b,c,d,e,f | csv-to-bin 6c | csv-shape sliding-window --binary b --size 4 --incremental --block | csv-from-bin ui,c | tr '\\n' ' '"
diff --git a/csv/test/csv-shape/split/expected b/csv/test/csv-shape/split/expected
new file mode 100644
index 000000000..d2b7aa428
--- /dev/null
+++ b/csv/test/csv-shape/split/expected
@@ -0,0 +1,18 @@
+split[0]/output/line[0]="1,2"
+split[0]/output/line[1]="3,4,5,6"
+split[0]/status=0
+split[1]/output/line[0]="1,2,3"
+split[1]/output/line[1]="4,5,6"
+split[1]/status=0
+split[2]/output/line[0]="1,2,3,4"
+split[2]/output/line[1]="5,6"
+split[2]/status=0
+split[3]/output/line[0]="1,2"
+split[3]/output/line[1]="3,4"
+split[3]/output/line[2]="5,6"
+split[3]/status=0
+split[4]/output/line[0]="1,2"
+split[4]/output/line[1]="3"
+split[4]/output/line[2]="4,5"
+split[4]/output/line[3]="6"
+split[4]/status=0
diff --git a/csv/test/csv-shape/split/input b/csv/test/csv-shape/split/input
new file mode 100644
index 000000000..244e91155
--- /dev/null
+++ b/csv/test/csv-shape/split/input
@@ -0,0 +1,5 @@
+split[0]="echo 1,2,3,4,5,6 | csv-shape split -n 2"
+split[1]="echo 1,2,3,4,5,6 | csv-shape split -n 3"
+split[2]="echo 1,2,3,4,5,6 | csv-shape split -n 4"
+split[3]="echo 1,2,3,4,5,6 | csv-shape split -n 2 --repeat"
+split[4]="( echo 1,2,3; echo; echo 4,5,6 ) | csv-shape split -n 2 --repeat"
diff --git a/csv/test/csv-shuffle/expected b/csv/test/csv-shuffle/expected
new file mode 100644
index 000000000..baf7b61ad
--- /dev/null
+++ b/csv/test/csv-shuffle/expected
@@ -0,0 +1,31 @@
+ascii[0]/output="0"
+ascii[0]/status=0
+ascii[1]/output="0,0"
+ascii[1]/status=0
+ascii[2]/output="5"
+ascii[2]/status=0
+ascii[3]/output="5,4"
+ascii[3]/status=0
+ascii[4]/output="1,3,1,3"
+ascii[4]/status=0
+ascii[5]/output="0,1,2"
+ascii[5]/status=0
+ascii[6]/output=""
+ascii[6]/status=1
+ascii[7]/output="0,1,2,5"
+ascii[7]/status=0
+ascii[8]/output="0,1,2,5"
+ascii[8]/status=0
+
+binary[0]/output="0"
+binary[0]/status=0
+binary[1]/output="3,4,5,0,1,2"
+binary[1]/status=0
+binary[2]/output="4,5,2,3,0,1"
+binary[2]/status=0
+binary[3]/output="1,2,1,2,1,2"
+binary[3]/status=0
+binary[4]/output="0,1,2"
+binary[4]/status=0
+binary[5]/output="0,1,2,5"
+binary[5]/status=0
diff --git a/csv/test/csv-shuffle/input b/csv/test/csv-shuffle/input
new file mode 100644
index 000000000..c27c04380
--- /dev/null
+++ b/csv/test/csv-shuffle/input
@@ -0,0 +1,16 @@
+ascii[0]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 0"
+ascii[1]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 0,0"
+ascii[2]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 5"
+ascii[3]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 5,4"
+ascii[4]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,3,4,5 --output-fields 1,3,1,3"
+ascii[5]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2"
+ascii[6]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,,,5"
+ascii[7]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,,,5 --drop-empty"
+ascii[8]="echo 0,1,2,3,4,5 | csv-shuffle --fields 0,1,2,,,5 --output-fields 0,1,2,,,5 --drop-empty"
+
+binary[0]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 0 | csv-from-bin ui"
+binary[1]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 3,4,5,0,1,2 | csv-from-bin 3uw,3ui"
+binary[2]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 4,5,2,3,0,1 | csv-from-bin 2uw,ui,uw,2ui"
+binary[3]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,3,4,5 --output-fields 1,2,1,2,1,2 | csv-from-bin 6ui"
+binary[4]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2 | csv-from-bin 3ui"
+binary[5]="echo 0,1,2,3,4,5 | csv-to-bin 3ui,3uw | csv-shuffle --binary 3ui,3uw --fields 0,1,2,,,5 --drop-empty | csv-from-bin 3ui,uw"
diff --git a/csv/test/csv-sort/fixed_block_size/expected b/csv/test/csv-sort/fixed_block_size/expected
new file mode 100644
index 000000000..5b277ef74
--- /dev/null
+++ b/csv/test/csv-sort/fixed_block_size/expected
@@ -0,0 +1,46 @@
+fixed_block_size/ascii/block_field/output/line[0]="0,d"
+fixed_block_size/ascii/block_field/output/line[1]="0,e"
+fixed_block_size/ascii/block_field/output/line[2]="0,f"
+fixed_block_size/ascii/block_field/output/line[3]="1,a"
+fixed_block_size/ascii/block_field/output/line[4]="1,b"
+fixed_block_size/ascii/block_field/output/line[5]="1,c"
+fixed_block_size/ascii/block_field/status=0
+fixed_block_size/ascii/basic/output/line[0]="d"
+fixed_block_size/ascii/basic/output/line[1]="e"
+fixed_block_size/ascii/basic/output/line[2]="f"
+fixed_block_size/ascii/basic/output/line[3]="a"
+fixed_block_size/ascii/basic/output/line[4]="b"
+fixed_block_size/ascii/basic/output/line[5]="c"
+fixed_block_size/ascii/basic/status=0
+fixed_block_size/ascii/last_block/output/line[0]="x"
+fixed_block_size/ascii/last_block/output/line[1]="y"
+fixed_block_size/ascii/last_block/output/line[2]="z"
+fixed_block_size/ascii/last_block/output/line[3]="d"
+fixed_block_size/ascii/last_block/output/line[4]="e"
+fixed_block_size/ascii/last_block/output/line[5]="f"
+fixed_block_size/ascii/last_block/output/line[6]="x"
+fixed_block_size/ascii/last_block/output/line[7]="y"
+fixed_block_size/ascii/last_block/status=0
+fixed_block_size/binary/block_field/output/line[0]="0,d"
+fixed_block_size/binary/block_field/output/line[1]="0,e"
+fixed_block_size/binary/block_field/output/line[2]="0,f"
+fixed_block_size/binary/block_field/output/line[3]="1,a"
+fixed_block_size/binary/block_field/output/line[4]="1,b"
+fixed_block_size/binary/block_field/output/line[5]="1,c"
+fixed_block_size/binary/block_field/status=0
+fixed_block_size/binary/basic/output/line[0]="d"
+fixed_block_size/binary/basic/output/line[1]="e"
+fixed_block_size/binary/basic/output/line[2]="f"
+fixed_block_size/binary/basic/output/line[3]="a"
+fixed_block_size/binary/basic/output/line[4]="b"
+fixed_block_size/binary/basic/output/line[5]="c"
+fixed_block_size/binary/basic/status=0
+fixed_block_size/binary/last_block/output/line[0]="x"
+fixed_block_size/binary/last_block/output/line[1]="y"
+fixed_block_size/binary/last_block/output/line[2]="z"
+fixed_block_size/binary/last_block/output/line[3]="d"
+fixed_block_size/binary/last_block/output/line[4]="e"
+fixed_block_size/binary/last_block/output/line[5]="f"
+fixed_block_size/binary/last_block/output/line[6]="x"
+fixed_block_size/binary/last_block/output/line[7]="y"
+fixed_block_size/binary/last_block/status=0
diff --git a/csv/test/csv-sort/fixed_block_size/input b/csv/test/csv-sort/fixed_block_size/input
new file mode 100644
index 000000000..1c1e78f16
--- /dev/null
+++ b/csv/test/csv-sort/fixed_block_size/input
@@ -0,0 +1,7 @@
+fixed_block_size/ascii/block_field="( echo 0,f ; echo 0,e ; echo 0,d ; echo 1,c ; echo 1,b; echo 1,a ) | csv-sort --fields block,a"
+fixed_block_size/ascii/basic="( echo f ; echo e ; echo d ; echo c ; echo b; echo a ) | csv-sort --fields a --block-size 3"
+fixed_block_size/ascii/last_block="( echo z ; echo y ; echo x ; echo f ; echo e; echo d; echo y; echo x ) | csv-sort --fields a --block-size 3"
+
+fixed_block_size/binary/block_field="( echo 0,f ; echo 0,e ; echo 0,d ; echo 1,c ; echo 1,b; echo 1,a ) | csv-to-bin ui,c | csv-sort --fields block,a --binary=ui,c | csv-from-bin ui,c"
+fixed_block_size/binary/basic="( echo f ; echo e ; echo d ; echo c ; echo b; echo a ) | csv-to-bin c | csv-sort --fields a --block-size 3 --binary c | csv-from-bin c"
+fixed_block_size/binary/last_block="( echo z ; echo y ; echo x ; echo f ; echo e; echo d; echo y; echo x ) | csv-to-bin c | csv-sort --fields a --block-size 3 --binary c | csv-from-bin c"
diff --git a/csv/test/csv-sort/fixed_block_size/test b/csv/test/csv-sort/fixed_block_size/test
new file mode 100755
index 000000000..152895e63
--- /dev/null
+++ b/csv/test/csv-sort/fixed_block_size/test
@@ -0,0 +1,5 @@
+#!/bin/bash
+
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands
diff --git a/csv/test/csv-sort/sort/expected b/csv/test/csv-sort/sort/expected
index 15c7a5aec..5eadc99aa 100644
--- a/csv/test/csv-sort/sort/expected
+++ b/csv/test/csv-sort/sort/expected
@@ -17,3 +17,14 @@ numeric_keys_are_floats[1]/output/line[1]="3.1"
 numeric_keys_are_floats[1]/output/line[2]="4"
 numeric_keys_are_floats[1]/output/line[3]="5"
 numeric_keys_are_floats[1]/status=0
+
+strings[0]/output="a,z;b,y;b,z;"
+strings[1]/output="a,z;b,y;b,z;"
+strings[2]/output="a,z;b,z;b,y;"
+strings[3]/output="b,y;a,z;b,z;"
+strings[5]/output=",_a;,a_;,aa;"
+strings[6]/output=",_a;,a_;,aa;"
+strings[7]/output="x,aa;y,a_;z,_a;"
+strings[8]/output="x,aa;y,a_;z,_a;"
+strings[9]/output="x,aa;y,a_;z,_a;"
+strings[10]/output="z,_a;y,a_;x,aa;"
diff --git a/csv/test/csv-sort/sort/input b/csv/test/csv-sort/sort/input
index df6282f28..a9ae5a4ed 100644
--- a/csv/test/csv-sort/sort/input
+++ b/csv/test/csv-sort/sort/input
@@ -14,3 +14,15 @@ descending/block[2]="( echo 1,0; echo 0,0; echo 1,0 ; echo 1,1; echo 0,1; echo 1
 
 numeric_keys_are_floats[0]="( echo 5; echo 4; echo 3.1; echo 2 ) | csv-sort --fields a"
 numeric_keys_are_floats[1]="( echo 5; echo 4; echo 3.1; echo 2 ) | csv-sort --fields a --numeric-keys-are-floats"
+
+strings[0]="( echo a,z; echo b,z; echo b,y )     | csv-sort              | tr '\\n' ';'"
+strings[1]="( echo a,z; echo b,z; echo b,y )     | csv-sort --fields a,b | tr '\\n' ';'"
+strings[2]="( echo a,z; echo b,z; echo b,y )     | csv-sort --fields a   | tr '\\n' ';'"
+strings[3]="( echo a,z; echo b,z; echo b,y )     | csv-sort --fields ,a  | tr '\\n' ';'"
+strings[4]="( echo a_; echo aa; echo _a )        | csv-sort              | tr '\\n' ';'"
+strings[5]="( echo ,a_; echo ,aa; echo ,_a )     | csv-sort              | tr '\\n' ';'"
+strings[6]="( echo ,a_; echo ,aa; echo ,_a )     | csv-sort --fields ,a  | tr '\\n' ';'"
+strings[7]="( echo y,a_; echo x,aa; echo z,_a )  | csv-sort              | tr '\\n' ';'"
+strings[8]="( echo y,a_; echo x,aa; echo z,_a )  | csv-sort --fields a,b | tr '\\n' ';'"
+strings[9]="( echo y,a_; echo x,aa; echo z,_a )  | csv-sort --fields a   | tr '\\n' ';'"
+strings[10]="( echo y,a_; echo x,aa; echo z,_a ) | csv-sort --fields ,a  | tr '\\n' ';'"
\ No newline at end of file
diff --git a/csv/test/csv-split/size/expected b/csv/test/csv-split/size/expected
new file mode 100644
index 000000000..37d4bebf8
--- /dev/null
+++ b/csv/test/csv-split/size/expected
@@ -0,0 +1,8 @@
+fixed[0]/output/line[0]="8"
+fixed[0]/output/line[1]="8"
+fixed[0]/output/line[2]="8"
+fixed[0]/status=0
+
+variable[0]/output/line[0]="8"
+variable[0]/output/line[1]="16"
+variable[0]/status=0
diff --git a/csv/test/csv-split/size/input b/csv/test/csv-split/size/input
new file mode 100644
index 000000000..cc6a0066a
--- /dev/null
+++ b/csv/test/csv-split/size/input
@@ -0,0 +1,2 @@
+fixed[0]="( echo 111,0; echo 222,1; echo 333,2 ) | csv-to-bin 2ui | ( mkdir -p output && cd output && csv-split --fields ,id --binary 2ui && wc -c < 0.bin && wc -c < 1.bin && wc -c < 2.bin )"
+variable[0]="( echo 0,0 | csv-to-bin 2ui; echo 1,8,3,4 | csv-to-bin 4ui ) | ( mkdir -p output && cd output && csv-split --fields id,size --binary 2ui && wc -c < 0.bin && wc -c < 1.bin )"
\ No newline at end of file
diff --git a/csv/test/csv-strings/expected b/csv/test/csv-strings/expected
new file mode 100644
index 000000000..4c52e3e8b
--- /dev/null
+++ b/csv/test/csv-strings/expected
@@ -0,0 +1,278 @@
+basename/append[0]/output/line[0]="a,a"
+basename/append[0]/output/line[1]="a/b,b"
+basename/append[0]/output/line[2]="a/b/c,c"
+basename/append[1]/output/line[0]="a,a"
+basename/append[1]/output/line[1]="a/b,a/b"
+basename/append[1]/output/line[2]="a/b/c,b/c"
+basename/append[2]/output/line[0]="a,a"
+basename/append[2]/output/line[1]="a/b,a/b"
+basename/append[2]/output/line[2]="a/b/c,a/b/c"
+basename/append[3]/output/line[0]="a,a"
+basename/append[3]/output/line[1]="a/b,a/b"
+basename/append[3]/output/line[2]="a/b/c,a/b/c"
+basename/append[4]/output/line[0]="/,/"
+basename/append[4]/output/line[1]="/aaa,aaa"
+basename/append[4]/output/line[2]="/aaa/bbb,bbb"
+basename/append[5]/output/line[0]="/,/"
+basename/append[5]/output/line[1]="/aaa,/aaa"
+basename/append[5]/output/line[2]="/aaa/bbb,aaa/bbb"
+basename/append[6]/output/line[0]="/,/"
+basename/append[6]/output/line[1]="/aaa,/aaa"
+basename/append[6]/output/line[2]="/aaa/bbb,/aaa/bbb"
+basename/append[7]/output/line[0]="/,/"
+basename/append[7]/output/line[1]="/aaa,/aaa"
+basename/append[7]/output/line[2]="/aaa/bbb,/aaa/bbb"
+
+basename/emplace[0]/output/line[0]="a"
+basename/emplace[0]/output/line[1]="b"
+basename/emplace[0]/output/line[2]="c"
+basename/emplace[1]/output/line[0]="a"
+basename/emplace[1]/output/line[1]="a/b"
+basename/emplace[1]/output/line[2]="b/c"
+basename/emplace[2]/output/line[0]="a"
+basename/emplace[2]/output/line[1]="a/b"
+basename/emplace[2]/output/line[2]="a/b/c"
+basename/emplace[3]/output/line[0]="a"
+basename/emplace[3]/output/line[1]="a/b"
+basename/emplace[3]/output/line[2]="a/b/c"
+
+basename/binary/emplace[0]/output/line[0]="a"
+basename/binary/emplace[0]/output/line[1]="b"
+basename/binary/emplace[0]/output/line[2]="c"
+
+basename/head/append[0]/output/line[0]="a,"
+basename/head/append[0]/output/line[1]="a/b,b"
+basename/head/append[0]/output/line[2]="a/b/c,b/c"
+basename/head/append[1]/output/line[0]="a,"
+basename/head/append[1]/output/line[1]="a/b,"
+basename/head/append[1]/output/line[2]="a/b/c,c"
+basename/head/append[2]/output/line[0]="/,"
+basename/head/append[2]/output/line[1]="/aaa,aaa"
+basename/head/append[2]/output/line[2]="/aaa/bbb,aaa/bbb"
+basename/head/append[3]/output/line[0]="/,"
+basename/head/append[3]/output/line[1]="/aaa,"
+basename/head/append[3]/output/line[2]="/aaa/bbb,bbb"
+basename/head/append[4]/output/line[0]="/,"
+basename/head/append[4]/output/line[1]="/aaa,"
+basename/head/append[4]/output/line[2]="/aaa/bbb,"
+basename/head/append[5]/output/line[0]="/,"
+basename/head/append[5]/output/line[1]="/aaa,"
+basename/head/append[5]/output/line[2]="/aaa/bbb,"
+
+basename/head/emplace[0]/output/line[0]=""
+basename/head/emplace[0]/output/line[1]="b"
+basename/head/emplace[0]/output/line[2]="b/c"
+basename/head/emplace[1]/output/line[0]=""
+basename/head/emplace[1]/output/line[1]=""
+basename/head/emplace[1]/output/line[2]="c"
+
+basename/binary/head/emplace[0]/output/line[0]=""
+basename/binary/head/emplace[0]/output/line[1]="b"
+basename/binary/head/emplace[0]/output/line[2]="b/c"
+
+dirname/append[0]/output/line[0]="/,/"
+dirname/append[0]/output/line[1]="/a,/"
+dirname/append[0]/output/line[2]="/a/,/a"
+dirname/append[0]/output/line[3]="/a/b,/a"
+dirname/append[0]/output/line[4]="/a/b/c,/a/b"
+dirname/append[0]/output/line[5]="/aaa/bbb,/aaa"
+dirname/append[0]/output/line[6]="/aaa/bbb/ccc,/aaa/bbb"
+
+dirname/append[1]/output/line[0]="a,"
+dirname/append[1]/output/line[1]="a/,a"
+dirname/append[1]/output/line[2]="a/b,a"
+dirname/append[1]/output/line[3]="a/b/c,a/b"
+dirname/append[1]/output/line[4]="aaa/bbb,aaa"
+dirname/append[1]/output/line[5]="aaa/bbb/ccc,aaa/bbb"
+
+dirname/tail/append[0]/output/line[0]="a,"
+dirname/tail/append[0]/output/line[1]="a/b,a"
+dirname/tail/append[0]/output/line[2]="a/b/c,a/b"
+dirname/tail/append[1]/output/line[0]="a,"
+dirname/tail/append[1]/output/line[1]="a/b,"
+dirname/tail/append[1]/output/line[2]="a/b/c,a"
+dirname/tail/append[2]/output/line[0]="a,"
+dirname/tail/append[2]/output/line[1]="a/b,"
+dirname/tail/append[2]/output/line[2]="a/b/c,"
+dirname/tail/append[3]/output/line[0]="a,"
+dirname/tail/append[3]/output/line[1]="a/b,"
+dirname/tail/append[3]/output/line[2]="a/b/c,"
+dirname/tail/append[4]/output/line[0]="/,/"
+dirname/tail/append[4]/output/line[1]="/aaa,/"
+dirname/tail/append[4]/output/line[2]="/aaa/bbb,/aaa"
+dirname/tail/append[5]/output/line[0]="/,/"
+dirname/tail/append[5]/output/line[1]="/aaa,/"
+dirname/tail/append[5]/output/line[2]="/aaa/bbb,/"
+dirname/tail/append[6]/output/line[0]="/,/"
+dirname/tail/append[6]/output/line[1]="/aaa,/"
+dirname/tail/append[6]/output/line[2]="/aaa/bbb,/"
+dirname/tail/append[7]/output/line[0]="/,/"
+dirname/tail/append[7]/output/line[1]="/aaa,/"
+dirname/tail/append[7]/output/line[2]="/aaa/bbb,/"
+
+dirname/tail/emplace[0]/output/line[0]=""
+dirname/tail/emplace[0]/output/line[1]="a"
+dirname/tail/emplace[0]/output/line[2]="a/b"
+dirname/tail/emplace[1]/output/line[0]=""
+dirname/tail/emplace[1]/output/line[1]=""
+dirname/tail/emplace[1]/output/line[2]="a"
+dirname/tail/emplace[2]/output/line[0]=","
+dirname/tail/emplace[2]/output/line[1]=","
+dirname/tail/emplace[2]/output/line[2]=","
+dirname/tail/emplace[3]/output/line[0]=","
+dirname/tail/emplace[3]/output/line[1]=","
+dirname/tail/emplace[3]/output/line[2]=","
+
+dirname/binary/tail/emplace[0]/output/line[0]=""
+dirname/binary/tail/emplace[0]/output/line[1]="a"
+dirname/binary/tail/emplace[0]/output/line[2]="a/b"
+
+dirname/head/append[0]/output/line[0]="a,"
+dirname/head/append[0]/output/line[1]="a/b,a"
+dirname/head/append[0]/output/line[2]="a/b/c,a/b"
+dirname/head/append[1]/output/line[0]="a,a"
+dirname/head/append[1]/output/line[1]="a/b,a/b"
+dirname/head/append[1]/output/line[2]="a/b/c,a/b"
+dirname/head/append[2]/output/line[0]="a,a"
+dirname/head/append[2]/output/line[1]="a/b,a/b"
+dirname/head/append[2]/output/line[2]="a/b/c,a/b/c"
+dirname/head/append[3]/output/line[0]="a,a"
+dirname/head/append[3]/output/line[1]="a/b,a/b"
+dirname/head/append[3]/output/line[2]="a/b/c,a/b/c"
+dirname/head/append[4]/output/line[0]="/,/"
+dirname/head/append[4]/output/line[1]="/aaa,/"
+dirname/head/append[4]/output/line[2]="/aaa/bbb,/"
+dirname/head/append[5]/output/line[0]="/,/"
+dirname/head/append[5]/output/line[1]="/aaa,/aaa"
+dirname/head/append[5]/output/line[2]="/aaa/bbb,/aaa"
+dirname/head/append[6]/output/line[0]="/,/"
+dirname/head/append[6]/output/line[1]="/aaa,/aaa"
+dirname/head/append[6]/output/line[2]="/aaa/bbb,/aaa/bbb"
+dirname/head/append[7]/output/line[0]="/,/"
+dirname/head/append[7]/output/line[1]="/aaa,/aaa"
+dirname/head/append[7]/output/line[2]="/aaa/bbb,/aaa/bbb"
+
+dirname/head/emplace[0]/output/line[0]=""
+dirname/head/emplace[0]/output/line[1]="a"
+dirname/head/emplace[0]/output/line[2]="a/b"
+dirname/head/emplace[1]/output/line[0]="a"
+dirname/head/emplace[1]/output/line[1]="a/b"
+dirname/head/emplace[1]/output/line[2]="a/b"
+dirname/head/emplace[2]/output/line[0]="a"
+dirname/head/emplace[2]/output/line[1]="a/b"
+dirname/head/emplace[2]/output/line[2]="a/b/c"
+dirname/head/emplace[3]/output/line[0]="a,"
+dirname/head/emplace[3]/output/line[1]="a/b,"
+dirname/head/emplace[3]/output/line[2]="a/b/c,"
+
+dirname/binary/head/emplace[0]/output/line[0]=""
+dirname/binary/head/emplace[0]/output/line[1]="a"
+dirname/binary/head/emplace[0]/output/line[2]="a/b"
+
+delimiter[0]/output/line[0]="a.a"
+delimiter[0]/output/line[1]="a.b.a"
+delimiter[0]/output/line[2]="a.b/c.d/e.a"
+delimiter[1]/output/line[0]="a"
+delimiter[1]/output/line[1]="a.b"
+delimiter[1]/output/line[2]="a.b/c.d/e"
+delimiter[2]/output/line[0]="a."
+delimiter[2]/output/line[1]="a.b."
+delimiter[2]/output/line[2]="a.b/c.d/e."
+delimiter[3]/output/line[0]=""
+delimiter[3]/output/line[1]=".b"
+delimiter[3]/output/line[2]=".b/c.d/e"
+
+strict[0]/output="a/b/c,a/b/c"
+strict[0]/status=1
+strict[1]/output="a/b/c"
+strict[1]/status=1
+strict[2]/output="a/b/c,"
+strict[2]/status=1
+strict[3]/output=""
+strict[3]/status=1
+strict[4]/output="a/b/c,a/b/c"
+strict[4]/status=1
+strict[5]/output="a/b/c"
+strict[5]/status=1
+
+fields[0]/output/line[0]="k,,a,,x,a,x"
+fields[0]/output/line[1]="l,,a/b,,x/y,b,y"
+fields[0]/output/line[2]="m,,a/b/c,,x/y/z,c,z"
+fields[1]/output/line[0]="k,,a,,x"
+fields[1]/output/line[1]="l,,b,,y"
+fields[1]/output/line[2]="m,,c,,z"
+fields[2]/output/line[0]="k,,a,,x"
+fields[2]/output/line[1]="l,,a/b,,x/y"
+fields[2]/output/line[2]="m,,b/c,,y/z"
+fields[3]/output/line[0]="k,,a,,x,,"
+fields[3]/output/line[1]="l,,a/b,,x/y,a,x"
+fields[3]/output/line[2]="m,,a/b/c,,x/y/z,a/b,x/y"
+fields[4]/output/line[0]="k,,,,"
+fields[4]/output/line[1]="l,,a,,x"
+fields[4]/output/line[2]="m,,a/b,,x/y"
+fields[5]/output/line[0]="k,,,,"
+fields[5]/output/line[1]="l,,,,"
+fields[5]/output/line[2]="m,,a,,x"
+
+add[0]/output="a,b,xay,xby"
+add[1]/output="xay,xby"
+
+path_common/once[0]/output="a/b"
+path_common/once[1]/output="/"
+path_common/once[2]/output="a"
+path_common/once[3]/output="/a"
+path_common/once[4]/output="a/b,d/e,g/h"
+path_common/once[5]/output="g/h"
+path_common/once[6]/output="a/b,g/h"
+path_common/once[7]/output="abc"
+
+path_common/delimiter[0]/output="a-b,g-h"
+
+path_common/fields[0]/output/line[0]="a/b/c,d/e/f,g/h/i,a/b,d/e,g/h"
+path_common/fields[0]/output/line[1]="a/b/d,d/e,g/h/k,a/b,d/e,g/h"
+path_common/fields[0]/output/line[2]="a/b/z,d/e/x,g/h/y,a/b,d/e,g/h"
+path_common/fields[1]/output/line[0]="a/b/c,d/e/f,g/h/i,a/b,g/h"
+path_common/fields[1]/output/line[1]="a/b/d,d/e,g/h/k,a/b,g/h"
+path_common/fields[1]/output/line[2]="a/b/z,d/e/x,g/h/y,a/b,g/h"
+path_common/fields[2]/output/line[0]="a/b/c,d/e/f,g/h/i,g/h"
+path_common/fields[2]/output/line[1]="a/b/d,d/e,g/h/k,g/h"
+path_common/fields[2]/output/line[2]="a/b/z,d/e/x,g/h/y,g/h"
+
+path_common/dirname[0]/output="/"
+path_common/dirname[1]/output="/"
+path_common/dirname[2]/output="/"
+path_common/dirname[3]/output="/aaa"
+path_common/dirname[4]/output="/aaa"
+path_common/dirname[5]/output="/aaa/bbb"
+path_common/dirname[6]/output=""
+path_common/dirname[7]/output=""
+path_common/dirname[8]/output="aaa"
+path_common/dirname[9]/output="aaa"
+path_common/dirname[10]/output="aaa/bbb"
+
+path_common/dirname_on_single_record[0]/output="a/b"
+path_common/dirname_on_single_record[1]/output="a/b"
+
+path_common/dirname_on_single_record[2]/fields[0]/output="a/b,d/e,g/h"
+path_common/dirname_on_single_record[2]/fields[1]/output="a/b,d/e,g/h"
+
+path_common/dirname_on_single_record[2]/append[0]/output/line[0]="a/b/c,a/b"
+path_common/dirname_on_single_record[2]/append[0]/output/line[1]="a/b/d,a/b"
+path_common/dirname_on_single_record[2]/append[0]/output/line[2]="a/b/z,a/b"
+path_common/dirname_on_single_record[2]/append[1]/output/line[0]="a/b/c,d/e/f,g/h/i,a/b,d/e,g/h"
+path_common/dirname_on_single_record[2]/append[1]/output/line[1]="a/b/d,d/e,g/h/k,a/b,d/e,g/h"
+path_common/dirname_on_single_record[2]/append[1]/output/line[2]="a/b/z,d/e/x,g/h/y,a/b,d/e,g/h"
+
+path_common/dirname_on_full_match[0]/output="a/b"
+path_common/dirname_on_full_match[1]/output="a"
+
+path_common/dirname_on_full_match[2]/fields[0]/output=",abc,"
+
+path_common/dirname_on_full_match[3]/append[0]/output/line[0]="abc/def/ghi,"
+path_common/dirname_on_full_match[3]/append[0]/output/line[1]="abc/deg/hij,"
+path_common/dirname_on_full_match[3]/append[0]/output/line[2]="abc/dgh/ijk,"
+path_common/dirname_on_full_match[3]/append[0]/output/line[3]="abc,"
+path_common/dirname_on_full_match[3]/append[1]/output/line[0]="abc/def/ghi,abc/abc/abc,abc/def/abc,,abc,"
+path_common/dirname_on_full_match[3]/append[1]/output/line[1]="abc/deg/hij,abc/abc/abb,abc/def/hij,,abc,"
+path_common/dirname_on_full_match[3]/append[1]/output/line[2]="abc/dgh/ijk,abc/abc/xyz,abc/d/ijk,,abc,"
+path_common/dirname_on_full_match[3]/append[1]/output/line[3]="abc,abc/abc,abc,,abc,"
diff --git a/csv/test/csv-strings/input b/csv/test/csv-strings/input
new file mode 100644
index 000000000..3ace06be6
--- /dev/null
+++ b/csv/test/csv-strings/input
@@ -0,0 +1,128 @@
+basename/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename"
+basename/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 2"
+basename/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 3"
+basename/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 4"
+basename/append[4]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --tail 1"
+basename/append[5]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --tail 2"
+basename/append[6]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --tail 3"
+basename/append[7]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --tail 100"
+
+basename/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --emplace"
+basename/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 2 --emplace"
+basename/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 3 --emplace"
+basename/emplace[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --tail 4 --emplace"
+
+basename/binary/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-basename --emplace --binary s[6] | csv-from-bin s[6]"
+
+basename/head/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 1"
+basename/head/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 2"
+basename/head/append[2]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --head 1"
+basename/head/append[3]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --head 2"
+basename/head/append[4]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --head 3"
+basename/head/append[5]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-basename --head 100"
+
+basename/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 1 --emplace"
+basename/head/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-basename --head 2 --emplace"
+
+basename/binary/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-basename --head 1 --emplace --binary s[6] | csv-from-bin s[6]"
+
+dirname/append[0]="( echo /; echo /a; echo /a/; echo /a/b; echo /a/b/c; echo /aaa/bbb; echo /aaa/bbb/ccc; ) | csv-strings path-dirname"
+dirname/append[1]="( echo a; echo a/; echo a/b; echo a/b/c; echo aaa/bbb; echo aaa/bbb/ccc; ) | csv-strings path-dirname"
+
+dirname/tail/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
+dirname/tail/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2"
+dirname/tail/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 3"
+dirname/tail/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 4"
+dirname/tail/append[4]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --tail 1"
+dirname/tail/append[5]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --tail 2"
+dirname/tail/append[6]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --tail 3"
+dirname/tail/append[7]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --tail 100"
+
+dirname/tail/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
+dirname/tail/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --tail 2 --emplace"
+dirname/tail/emplace[2]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 3 --emplace"
+dirname/tail/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --tail 4 --emplace"
+
+dirname/binary/tail/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-dirname --emplace --binary s[6] | csv-from-bin s[6]"
+
+dirname/head/append[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname"
+dirname/head/append[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2"
+dirname/head/append[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3"
+dirname/head/append[3]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 4"
+dirname/head/append[4]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --head 1"
+dirname/head/append[5]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --head 2"
+dirname/head/append[6]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --head 3"
+dirname/head/append[7]="( echo /; echo /aaa; echo /aaa/bbb; ) | csv-strings path-dirname --head 100"
+
+dirname/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --emplace"
+dirname/head/emplace[1]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 2 --emplace"
+dirname/head/emplace[2]="( echo a; echo a/b; echo a/b/c ) | csv-strings path-dirname --head 3 --emplace"
+dirname/head/emplace[3]="( echo a,; echo a/b,; echo a/b/c, ) | csv-strings path-dirname --head 4 --emplace"
+
+dirname/binary/head/emplace[0]="( echo a; echo a/b; echo a/b/c ) | csv-to-bin s[6] | csv-strings path-dirname --emplace --binary s[6] | csv-from-bin s[6]"
+
+delimiter[0]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=."
+delimiter[1]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-basename --delimiter=. --emplace"
+delimiter[2]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-dirname --delimiter=."
+delimiter[3]="( echo a; echo a.b; echo a.b/c.d/e ) | csv-strings path-dirname --delimiter=. --emplace"
+
+strict[0]="( echo a/b/c; echo a/b ) | csv-strings path-basename --tail 3 --strict"
+strict[1]="( echo a/b/c; echo a/b ) | csv-strings path-basename --tail 3 --emplace --strict"
+strict[2]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --tail 3 --strict"
+strict[3]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --tail 3 --emplace --strict"
+strict[4]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --head 3 --strict"
+strict[5]="( echo a/b/c; echo a/b ) | csv-strings path-dirname --head 3 --emplace --strict"
+
+fields[0]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n"
+fields[1]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n --emplace"
+fields[2]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-basename --fields ,,m,,n --emplace --tail 2"
+fields[3]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n"
+fields[4]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n --emplace"
+fields[5]="( echo k,,a,,x; echo l,,a/b,,x/y; echo m,,a/b/c,,x/y/z ) | csv-strings path-dirname --fields ,,m,,n --emplace --tail 2"
+
+add[0]="echo a,b | csv-strings add --prefix x --suffix y --fields a,b"
+add[1]="echo a,b | csv-strings add --prefix x --suffix y --fields a,b --emplace"
+
+path_common/once[0]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --once"
+path_common/once[1]="{ echo /; } | csv-strings path-common --once"
+path_common/once[2]="{ echo a; } | csv-strings path-common --once"
+path_common/once[3]="{ echo /a; } | csv-strings path-common --once"
+path_common/once[4]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c --once"
+path_common/once[5]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields ,,c --once"
+path_common/once[6]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,,c --once"
+path_common/once[7]="{ echo abc/def/ghi; echo abc/deg/hij; echo abc/dgh/ijk; } | csv-strings path-common --once"
+
+path_common/delimiter[0]="{ echo a-b-c,d-e-f,g-h-i; echo a-b-d,d-e,g-h-k; echo a-b-z,d-e-x,g-h-y; } | csv-strings path-common --fields a,,c --once --path-delimiter -"
+
+path_common/fields[0]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c"
+path_common/fields[1]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,,c"
+path_common/fields[2]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields ,,c"
+
+path_common/dirname[0]="{ echo /; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[1]="{ echo /a; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[2]="{ echo /aaa; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[3]="{ echo /aaa/; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[4]="{ echo /aaa/bbb; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[5]="{ echo /aaa/bbb/ccc; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[6]="{ echo a; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[7]="{ echo aaa; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[8]="{ echo aaa/; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[9]="{ echo aaa/bbb; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname[10]="{ echo aaa/bbb/ccc; } | csv-strings path-common --dirname-on-single-record --once"
+
+path_common/dirname_on_single_record[0]="{ echo a/b/c; } | csv-strings path-common --dirname-on-single-record --once"
+path_common/dirname_on_single_record[1]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-single-record --once"
+
+path_common/dirname_on_single_record[2]/fields[0]="{ echo a/b/c,d/e/f,g/h/i; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
+path_common/dirname_on_single_record[2]/fields[1]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e/g,g/h/j; echo a/b/x,d/e/y,g/h/z; } | csv-strings path-common --dirname-on-single-record --once --fields a,b,c"
+
+path_common/dirname_on_single_record[2]/append[0]="{ echo a/b/c; echo a/b/d; echo a/b/z; } | csv-strings path-common --dirname-on-single-record"
+path_common/dirname_on_single_record[2]/append[1]="{ echo a/b/c,d/e/f,g/h/i; echo a/b/d,d/e,g/h/k; echo a/b/z,d/e/x,g/h/y; } | csv-strings path-common --fields a,b,c --dirname-on-single-record"
+
+path_common/dirname_on_full_match[0]="{ echo a/b/c; echo a/b/d; echo a/b/e; } | csv-strings path-common --dirname-on-full-match --once"
+path_common/dirname_on_full_match[1]="{ echo a/b/c; echo a/b/d; echo a/b/e; echo a/b; } | csv-strings path-common --dirname-on-full-match --once"
+
+path_common/dirname_on_full_match[2]/fields[0]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; echo abc,abc/abc,abc; } | csv-strings path-common --dirname-on-full-match --once --fields a,b,c"
+
+path_common/dirname_on_full_match[3]/append[0]="{ echo abc/def/ghi; echo abc/deg/hij; echo abc/dgh/ijk; echo abc; } | csv-strings path-common --dirname-on-full-match"
+path_common/dirname_on_full_match[3]/append[1]="{ echo abc/def/ghi,abc/abc/abc,abc/def/abc; echo abc/deg/hij,abc/abc/abb,abc/def/hij; echo abc/dgh/ijk,abc/abc/xyz,abc/d/ijk; echo abc,abc/abc,abc; } | csv-strings path-common --dirname-on-full-match --fields a,b,c"
diff --git a/csv/test/csv-thin/deterministic/expected b/csv/test/csv-thin/deterministic/expected
deleted file mode 100644
index fb91f8dbe..000000000
--- a/csv/test/csv-thin/deterministic/expected
+++ /dev/null
@@ -1,5 +0,0 @@
-output[0]/n="3"
-output[1]/n="7"
-output[2]/n="11"
-output[3]/n="15"
-output[4]/n="19"
diff --git a/csv/test/csv-thin/deterministic/test b/csv/test/csv-thin/deterministic/test
deleted file mode 100755
index 52bf9b4bc..000000000
--- a/csv/test/csv-thin/deterministic/test
+++ /dev/null
@@ -1,2 +0,0 @@
-csv-paste line-number | head -20 | csv-thin 0.25 --deterministic \
-    | name-value-from-csv --fields n --prefix output --line-number
diff --git a/csv/test/csv-thin/expected b/csv/test/csv-thin/expected
new file mode 100644
index 000000000..01b70a6eb
--- /dev/null
+++ b/csv/test/csv-thin/expected
@@ -0,0 +1,6 @@
+deterministic[0]/output="4,8,12,16,20,"
+deterministic[0]/status=0
+random/deterministic[0]/output="1,3,5,7,9,"
+random/deterministic[0]/status=0
+random/inverted[0]/output="1,2,3,4,5,6,7,8,9,10,"
+random/inverted[0]/status=0
diff --git a/csv/test/csv-thin/input b/csv/test/csv-thin/input
new file mode 100644
index 000000000..905183713
--- /dev/null
+++ b/csv/test/csv-thin/input
@@ -0,0 +1,3 @@
+deterministic[0]="seq 20 | csv-thin 0.25 --deterministic | tr '\\\n' ','"
+random/deterministic[0]="seq 10 | csv-thin 0.5 --invert --deterministic | tr '\\\n' ','"
+random/inverted[0]="( seq 10 | csv-thin 0.5; seq 10 | csv-thin 0.5 --invert ) | csv-sort --fields i | tr '\\\n' ','"
diff --git a/csv/test/csv-thin/period/ascii/expected b/csv/test/csv-thin/period/ascii/expected
index 768041874..b25ec4ecf 100644
--- a/csv/test/csv-thin/period/ascii/expected
+++ b/csv/test/csv-thin/period/ascii/expected
@@ -1,5 +1,5 @@
-output[0]/t="20180608T175915.180390703"
-output[0]/n="1"
+output[0]/t="20180608T175915.168851696"
+output[0]/n="0"
 output[1]/t="20180608T175915.271129830"
 output[1]/n="9"
 output[2]/t="20180608T175915.375231419"
diff --git a/csv/test/csv-thin/period/binary/expected b/csv/test/csv-thin/period/binary/expected
index 7f1c01d9b..27fa96e35 100644
--- a/csv/test/csv-thin/period/binary/expected
+++ b/csv/test/csv-thin/period/binary/expected
@@ -1,5 +1,5 @@
-output[0]/t="20180608T175915.180390"
-output[0]/n="1"
+output[0]/t="20180608T175915.168851"
+output[0]/n="0"
 output[1]/t="20180608T175915.271129"
 output[1]/n="9"
 output[2]/t="20180608T175915.375231"
diff --git a/csv/test/csv-thin/period/irregular/baseline/expected b/csv/test/csv-thin/period/irregular/baseline/expected
new file mode 100644
index 000000000..ddd2da28f
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/baseline/expected
@@ -0,0 +1,12 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.0"
+output[1]/n="10"
+output[2]/t="20210117T120002.0"
+output[2]/n="20"
+output[3]/t="20210117T120003.0"
+output[3]/n="30"
+output[4]/t="20210117T120004.0"
+output[4]/n="40"
+output[5]/t="20210117T120005.0"
+output[5]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/baseline/input b/csv/test/csv-thin/period/irregular/baseline/input
new file mode 100644
index 000000000..c1e23e235
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/baseline/input
@@ -0,0 +1,60 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.3,3
+20210117T120000.4,4
+20210117T120000.5,5
+20210117T120000.6,6
+20210117T120000.7,7
+20210117T120000.8,8
+20210117T120000.9,9
+20210117T120001.0,10
+20210117T120001.1,11
+20210117T120001.2,12
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.5,15
+20210117T120001.6,16
+20210117T120001.7,17
+20210117T120001.8,18
+20210117T120001.9,19
+20210117T120002.0,20
+20210117T120002.1,21
+20210117T120002.2,22
+20210117T120002.3,23
+20210117T120002.4,24
+20210117T120002.5,25
+20210117T120002.6,26
+20210117T120002.7,27
+20210117T120002.8,28
+20210117T120002.9,29
+20210117T120003.0,30
+20210117T120003.1,31
+20210117T120003.2,32
+20210117T120003.3,33
+20210117T120003.4,34
+20210117T120003.5,35
+20210117T120003.6,36
+20210117T120003.7,37
+20210117T120003.8,38
+20210117T120003.9,39
+20210117T120004.0,40
+20210117T120004.1,41
+20210117T120004.2,42
+20210117T120004.3,43
+20210117T120004.4,44
+20210117T120004.5,45
+20210117T120004.6,46
+20210117T120004.7,47
+20210117T120004.8,48
+20210117T120004.9,49
+20210117T120005.0,50
+20210117T120005.1,51
+20210117T120005.2,52
+20210117T120005.3,53
+20210117T120005.4,54
+20210117T120005.5,55
+20210117T120005.6,56
+20210117T120005.7,57
+20210117T120005.8,58
+20210117T120005.9,59
diff --git a/csv/test/csv-thin/period/irregular/gaps-01/expected b/csv/test/csv-thin/period/irregular/gaps-01/expected
new file mode 100644
index 000000000..ddd2da28f
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/gaps-01/expected
@@ -0,0 +1,12 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.0"
+output[1]/n="10"
+output[2]/t="20210117T120002.0"
+output[2]/n="20"
+output[3]/t="20210117T120003.0"
+output[3]/n="30"
+output[4]/t="20210117T120004.0"
+output[4]/n="40"
+output[5]/t="20210117T120005.0"
+output[5]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/gaps-01/input b/csv/test/csv-thin/period/irregular/gaps-01/input
new file mode 100644
index 000000000..28da4540f
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/gaps-01/input
@@ -0,0 +1,47 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.8,8
+20210117T120000.9,9
+20210117T120001.0,10
+20210117T120001.1,11
+20210117T120001.2,12
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.7,17
+20210117T120002.0,20
+20210117T120002.1,21
+20210117T120002.2,22
+20210117T120002.3,23
+20210117T120002.8,28
+20210117T120002.9,29
+20210117T120003.0,30
+20210117T120003.1,31
+20210117T120003.2,32
+20210117T120003.3,33
+20210117T120003.4,34
+20210117T120003.5,35
+20210117T120003.6,36
+20210117T120003.7,37
+20210117T120003.8,38
+20210117T120003.9,39
+20210117T120004.0,40
+20210117T120004.1,41
+20210117T120004.2,42
+20210117T120004.3,43
+20210117T120004.4,44
+20210117T120004.5,45
+20210117T120004.6,46
+20210117T120004.7,47
+20210117T120004.8,48
+20210117T120004.9,49
+20210117T120005.0,50
+20210117T120005.1,51
+20210117T120005.2,52
+20210117T120005.3,53
+20210117T120005.4,54
+20210117T120005.5,55
+20210117T120005.6,56
+20210117T120005.7,57
+20210117T120005.8,58
+20210117T120005.9,59
diff --git a/csv/test/csv-thin/period/irregular/gaps-02/expected b/csv/test/csv-thin/period/irregular/gaps-02/expected
new file mode 100644
index 000000000..1f56535f5
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/gaps-02/expected
@@ -0,0 +1,12 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.3"
+output[1]/n="13"
+output[2]/t="20210117T120002.0"
+output[2]/n="20"
+output[3]/t="20210117T120003.0"
+output[3]/n="30"
+output[4]/t="20210117T120004.4"
+output[4]/n="44"
+output[5]/t="20210117T120005.0"
+output[5]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/gaps-02/input b/csv/test/csv-thin/period/irregular/gaps-02/input
new file mode 100644
index 000000000..b390c96ad
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/gaps-02/input
@@ -0,0 +1,48 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.3,3
+20210117T120000.4,4
+20210117T120000.5,5
+20210117T120000.6,6
+20210117T120000.7,7
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.5,15
+20210117T120001.8,18
+20210117T120001.9,19
+20210117T120002.0,20
+20210117T120002.1,21
+20210117T120002.2,22
+20210117T120002.3,23
+20210117T120002.4,24
+20210117T120002.5,25
+20210117T120002.6,26
+20210117T120002.7,27
+20210117T120002.8,28
+20210117T120002.9,29
+20210117T120003.0,30
+20210117T120003.1,31
+20210117T120003.2,32
+20210117T120003.3,33
+20210117T120003.4,34
+20210117T120003.5,35
+20210117T120003.6,36
+20210117T120003.7,37
+20210117T120003.8,38
+20210117T120004.4,44
+20210117T120004.5,45
+20210117T120004.6,46
+20210117T120004.7,47
+20210117T120004.8,48
+20210117T120004.9,49
+20210117T120005.0,50
+20210117T120005.1,51
+20210117T120005.2,52
+20210117T120005.3,53
+20210117T120005.4,54
+20210117T120005.5,55
+20210117T120005.6,56
+20210117T120005.7,57
+20210117T120005.8,58
+20210117T120005.9,59
diff --git a/csv/test/csv-thin/period/irregular/jump-backward/expected b/csv/test/csv-thin/period/irregular/jump-backward/expected
new file mode 100644
index 000000000..b5667b240
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/jump-backward/expected
@@ -0,0 +1,6 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.0"
+output[1]/n="10"
+output[2]/t="20210117T120002.0"
+output[2]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/jump-backward/input b/csv/test/csv-thin/period/irregular/jump-backward/input
new file mode 100644
index 000000000..e35a4988a
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/jump-backward/input
@@ -0,0 +1,60 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.3,3
+20210117T120000.4,4
+20210117T120000.5,5
+20210117T120000.6,6
+20210117T120000.7,7
+20210117T120000.8,8
+20210117T120000.9,9
+20210117T120001.0,10
+20210117T120001.1,11
+20210117T120001.2,12
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.5,15
+20210117T120001.6,16
+20210117T120001.7,17
+20210117T120001.8,18
+20210117T120001.9,19
+20210117T110059.0,20
+20210117T110059.1,21
+20210117T110059.2,22
+20210117T110059.3,23
+20210117T110059.4,24
+20210117T110059.5,25
+20210117T110059.6,26
+20210117T110059.7,27
+20210117T110059.8,28
+20210117T110059.9,29
+20210117T120000.0,30
+20210117T120000.1,31
+20210117T120000.2,32
+20210117T120000.3,33
+20210117T120000.4,34
+20210117T120000.5,35
+20210117T120000.6,36
+20210117T120000.7,37
+20210117T120000.8,38
+20210117T120000.9,39
+20210117T120001.0,40
+20210117T120001.1,41
+20210117T120001.2,42
+20210117T120001.3,43
+20210117T120001.4,44
+20210117T120001.5,45
+20210117T120001.6,46
+20210117T120001.7,47
+20210117T120001.8,48
+20210117T120001.9,49
+20210117T120002.0,50
+20210117T120002.1,51
+20210117T120002.2,52
+20210117T120002.3,53
+20210117T120002.4,54
+20210117T120002.5,55
+20210117T120002.6,56
+20210117T120002.7,57
+20210117T120002.8,58
+20210117T120002.9,59
diff --git a/csv/test/csv-thin/period/irregular/jump-forward/expected b/csv/test/csv-thin/period/irregular/jump-forward/expected
new file mode 100644
index 000000000..1e319278e
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/jump-forward/expected
@@ -0,0 +1,12 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120001.0"
+output[1]/n="10"
+output[2]/t="20210117T120102.0"
+output[2]/n="20"
+output[3]/t="20210117T120103.0"
+output[3]/n="30"
+output[4]/t="20210117T120104.0"
+output[4]/n="40"
+output[5]/t="20210117T120105.0"
+output[5]/n="50"
diff --git a/csv/test/csv-thin/period/irregular/jump-forward/input b/csv/test/csv-thin/period/irregular/jump-forward/input
new file mode 100644
index 000000000..f98d8dc66
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/jump-forward/input
@@ -0,0 +1,60 @@
+20210117T120000.0,0
+20210117T120000.1,1
+20210117T120000.2,2
+20210117T120000.3,3
+20210117T120000.4,4
+20210117T120000.5,5
+20210117T120000.6,6
+20210117T120000.7,7
+20210117T120000.8,8
+20210117T120000.9,9
+20210117T120001.0,10
+20210117T120001.1,11
+20210117T120001.2,12
+20210117T120001.3,13
+20210117T120001.4,14
+20210117T120001.5,15
+20210117T120001.6,16
+20210117T120001.7,17
+20210117T120001.8,18
+20210117T120001.9,19
+20210117T120102.0,20
+20210117T120102.1,21
+20210117T120102.2,22
+20210117T120102.3,23
+20210117T120102.4,24
+20210117T120102.5,25
+20210117T120102.6,26
+20210117T120102.7,27
+20210117T120102.8,28
+20210117T120102.9,29
+20210117T120103.0,30
+20210117T120103.1,31
+20210117T120103.2,32
+20210117T120103.3,33
+20210117T120103.4,34
+20210117T120103.5,35
+20210117T120103.6,36
+20210117T120103.7,37
+20210117T120103.8,38
+20210117T120103.9,39
+20210117T120104.0,40
+20210117T120104.1,41
+20210117T120104.2,42
+20210117T120104.3,43
+20210117T120104.4,44
+20210117T120104.5,45
+20210117T120104.6,46
+20210117T120104.7,47
+20210117T120104.8,48
+20210117T120104.9,49
+20210117T120105.0,50
+20210117T120105.1,51
+20210117T120105.2,52
+20210117T120105.3,53
+20210117T120105.4,54
+20210117T120105.5,55
+20210117T120105.6,56
+20210117T120105.7,57
+20210117T120105.8,58
+20210117T120105.9,59
diff --git a/csv/test/csv-thin/period/irregular/test b/csv/test/csv-thin/period/irregular/test
new file mode 100755
index 000000000..5e645c4bc
--- /dev/null
+++ b/csv/test/csv-thin/period/irregular/test
@@ -0,0 +1 @@
+csv-thin --period 1 --fields t | name-value-from-csv --fields t,n --prefix output --line-number
diff --git a/csv/test/csv-thin/period/slow/expected b/csv/test/csv-thin/period/slow/expected
new file mode 100644
index 000000000..a894b6eaa
--- /dev/null
+++ b/csv/test/csv-thin/period/slow/expected
@@ -0,0 +1,24 @@
+output[0]/t="20210117T120000.0"
+output[0]/n="0"
+output[1]/t="20210117T120000.5"
+output[1]/n="5"
+output[2]/t="20210117T120001.0"
+output[2]/n="10"
+output[3]/t="20210117T120001.5"
+output[3]/n="15"
+output[4]/t="20210117T120002.0"
+output[4]/n="20"
+output[5]/t="20210117T120002.5"
+output[5]/n="25"
+output[6]/t="20210117T120003.0"
+output[6]/n="30"
+output[7]/t="20210117T120003.5"
+output[7]/n="35"
+output[8]/t="20210117T120004.0"
+output[8]/n="40"
+output[9]/t="20210117T120004.5"
+output[9]/n="45"
+output[10]/t="20210117T120005.0"
+output[10]/n="50"
+output[11]/t="20210117T120005.5"
+output[11]/n="55"
diff --git a/csv/test/csv-thin/period/slow/input b/csv/test/csv-thin/period/slow/input
new file mode 100644
index 000000000..041668da6
--- /dev/null
+++ b/csv/test/csv-thin/period/slow/input
@@ -0,0 +1,12 @@
+20210117T120000.0,0
+20210117T120000.5,5
+20210117T120001.0,10
+20210117T120001.5,15
+20210117T120002.0,20
+20210117T120002.5,25
+20210117T120003.0,30
+20210117T120003.5,35
+20210117T120004.0,40
+20210117T120004.5,45
+20210117T120005.0,50
+20210117T120005.5,55
diff --git a/csv/test/csv-thin/period/slow/test b/csv/test/csv-thin/period/slow/test
new file mode 100755
index 000000000..86cc14297
--- /dev/null
+++ b/csv/test/csv-thin/period/slow/test
@@ -0,0 +1 @@
+csv-thin --period 0.1 --fields t | name-value-from-csv --fields t,n --prefix output --line-number
diff --git a/csv/test/csv-time-join/realtime/simple/expected b/csv/test/csv-time-join/realtime/simple/expected
index 557a39cf2..ebc28fe03 100644
--- a/csv/test/csv-time-join/realtime/simple/expected
+++ b/csv/test/csv-time-join/realtime/simple/expected
@@ -1,2 +1,2 @@
-num_records="10"
-num_fields="4"
+num_records=10 +/- 1
+num_fields=4
diff --git a/csv/test/csv-time-join/realtime/timestamp-only/expected b/csv/test/csv-time-join/realtime/timestamp-only/expected
index df5c38113..373fa6438 100644
--- a/csv/test/csv-time-join/realtime/timestamp-only/expected
+++ b/csv/test/csv-time-join/realtime/timestamp-only/expected
@@ -1,2 +1,2 @@
-num_records="10"
-num_fields="3"
+num_records=10 +/- 1
+num_fields=3
diff --git a/csv/test/csv-time-join/test b/csv/test/csv-time-join/test
index 07f0ab933..2a0e3b47b 100755
--- a/csv/test/csv-time-join/test
+++ b/csv/test/csv-time-join/test
@@ -33,7 +33,8 @@ cat $input \
     | if [[ $options =~ --realtime ]]; then
           sed 's/[^,]//g' | wc -lc | tr -s ' ' | sed 's/^ //' | tr ' ' , \
               | csv-eval --fields=lines,chars "chars = chars / lines" \
-              | name-value-from-csv -f num_records,num_fields
+              | name-value-from-csv -f num_records,num_fields \
+              | csv-quote --unquote -d =
       else
           name-value-from-csv -f line -d : -n -p output
       fi
diff --git a/csv/test/csv-time-stamp/test b/csv/test/csv-time-stamp/test
index fd3691851..e10c00d8d 100755
--- a/csv/test/csv-time-stamp/test
+++ b/csv/test/csv-time-stamp/test
@@ -4,8 +4,6 @@ source $( type -p comma-application-util )
 
 comma_path_value_to_var < <( cat )
 
-now=$( date -u +%Y%m%dT%H%M%S.%N | csv-time --from iso --to seconds )
-
 input_fn=cat
 output_fn=cat
 if [[ $options =~ --binary|--size ]]; then
@@ -13,13 +11,22 @@ if [[ $options =~ --binary|--size ]]; then
     output_fn="csv-from-bin t,$format"
 fi
 
+function timestamper()
+{  # reads records on stdin, timestamps them with csv-time-stamp, and prints name=value lines under the "output" prefix
+    local now=$( date -u +%Y%m%dT%H%M%S.%N | csv-time --from iso --to seconds )  # UTC time in seconds, taken just before the pipeline runs
+    $input_fn \
+        | csv-time-stamp $options \
+        | $output_fn | csv-time --from iso --to seconds \
+        | csv-eval --fields=t "d=t-$now" \
+        | name-value-from-csv --prefix=output --line-number --fields=t,$fields,d \
+        | csv-quote --unquote --delimiter='='  # d is the record timestamp minus $now; values are unquoted on output
+}
+
+# prime the system: run the pipeline once on dummy input so that everything is loaded from disk and the timestamp comparison is more accurate
+
+echo "dummy" | timestamper >/dev/null 2>&1
+
 # put a small delay between the outputting of each line,
 # so the timestamps are different
 
-echo -e $input | while read line; do echo $line; sleep 0.1; done \
-    | $input_fn \
-    | csv-time-stamp $options \
-    | $output_fn | csv-time --from iso --to seconds \
-    | csv-eval --fields=t "d=t-$now" \
-    | name-value-from-csv --prefix=output --line-number --fields=t,$fields,d \
-    | csv-quote --unquote --delimiter='='
+echo -e $input | while read line; do echo $line; sleep 0.1; done | timestamper
diff --git a/csv/test/csv-time/expected b/csv/test/csv-time/expected
index 2b4551879..036aaea01 100644
--- a/csv/test/csv-time/expected
+++ b/csv/test/csv-time/expected
@@ -47,6 +47,57 @@ sql[1]/status=0
 sql[2]/output="1394060400"
 sql[2]/status=0
 
+tai_to_tai[0]/output="19700101T000000"
+tai_to_tai[0]/status=0
+tai_to_tai[1]/output="19711231T235959"
+tai_to_tai[1]/status=0
+tai_to_tai[2]/output="19720101T000010"
+tai_to_tai[2]/status=0
+tai_to_tai[3]/output="19720101T000011"
+tai_to_tai[3]/status=0
+tai_to_tai[4]/output="19720701T000009"
+tai_to_tai[4]/status=0
+tai_to_tai[5]/output="19720701T000011"
+tai_to_tai[5]/status=0
+tai_to_tai[6]/output="19720701T000012"
+tai_to_tai[6]/status=0
+tai_to_tai[7]/output="20170101T000035"
+tai_to_tai[7]/status=0
+tai_to_tai[8]/output="20170101T000037"
+tai_to_tai[8]/status=0
+tai_to_tai[9]/output="20170101T000038"
+tai_to_tai[9]/status=0
+tai_to_tai[10]/output="20240101T000037"
+tai_to_tai[10]/status=0
+
+tai_stream[0]/output/line[0]="20170101T000035"
+tai_stream[0]/output/line[1]="20170101T000037"
+tai_stream[0]/output/line[2]="20170101T000038"
+tai_stream[0]/status=0
+tai_stream[1]/output/line[0]="20240101T000037"
+tai_stream[1]/output/line[1]="20240101T000038"
+tai_stream[1]/output/line[2]="20240101T000039"
+tai_stream[1]/status=0
+
+tai_from_tai[0]/output="19720101T000000"
+tai_from_tai[0]/status=0
+tai_from_tai[1]/output="19720630T235959"
+tai_from_tai[1]/status=0
+tai_from_tai[2]/output="19720701T000000"
+tai_from_tai[2]/status=0
+tai_from_tai[3]/output="19720701T000000"
+tai_from_tai[3]/status=0
+tai_from_tai[4]/output="19720701T000001"
+tai_from_tai[4]/status=0
+tai_from_tai[5]/output="20170101T000000"
+tai_from_tai[5]/status=0
+tai_from_tai[6]/output="20170101T000000"
+tai_from_tai[6]/status=0
+tai_from_tai[7]/output="20170101T000001"
+tai_from_tai[7]/status=0
+tai_from_tai[8]/output="20240101T000000"
+tai_from_tai[8]/status=0
+
 xsd[0]/output="1394060400"
 xsd[0]/status=0
 xsd[1]/output="1394060400"
diff --git a/csv/test/csv-time/input b/csv/test/csv-time/input
index e5983b608..04a419ddc 100644
--- a/csv/test/csv-time/input
+++ b/csv/test/csv-time/input
@@ -28,6 +28,33 @@ sql[0]="echo '2014-03-05 23:00:00' | csv-time --from sql --to seconds"
 sql[1]="echo '2014-03-05 23:00:00' | csv-time --from posix --to seconds"
 sql[2]="echo '2014-03-05 23:00:00' | csv-time --from 'ieee-std-1003.1' --to seconds"
 
+# I'd like to test datetimes like 19720630T235960 (that was a leap-second) but
+# boost doesn't understand them. It treats them as identical to 19720701T000000
+tai_to_tai[0]="echo 19700101T000000 | csv-time --to tai"
+tai_to_tai[1]="echo 19711231T235959 | csv-time --to tai"
+tai_to_tai[2]="echo 19720101T000000 | csv-time --to tai"
+tai_to_tai[3]="echo 19720101T000001 | csv-time --to tai"
+tai_to_tai[4]="echo 19720630T235959 | csv-time --to tai"
+tai_to_tai[5]="echo 19720701T000000 | csv-time --to tai"
+tai_to_tai[6]="echo 19720701T000001 | csv-time --to tai"
+tai_to_tai[7]="echo 20161231T235959 | csv-time --to tai"
+tai_to_tai[8]="echo 20170101T000000 | csv-time --to tai"
+tai_to_tai[9]="echo 20170101T000001 | csv-time --to tai"
+tai_to_tai[10]="echo 20240101T000000 | csv-time --to tai"
+
+tai_stream[0]="echo -e '20161231T235959\\n20170101T000000\\n20170101T000001' | csv-time --to tai"
+tai_stream[1]="echo -e '20240101T000000\\n20240101T000001\\n20240101T000002' | csv-time --to tai"
+
+tai_from_tai[0]="echo 19720101T000010 | csv-time --from tai"
+tai_from_tai[1]="echo 19720701T000009 | csv-time --from tai"
+tai_from_tai[2]="echo 19720701T000010 | csv-time --from tai"
+tai_from_tai[3]="echo 19720701T000011 | csv-time --from tai"
+tai_from_tai[4]="echo 19720701T000012 | csv-time --from tai"
+tai_from_tai[5]="echo 20170101T000036 | csv-time --from tai"
+tai_from_tai[6]="echo 20170101T000037 | csv-time --from tai"
+tai_from_tai[7]="echo 20170101T000038 | csv-time --from tai"
+tai_from_tai[8]="echo 20240101T000037 | csv-time --from tai"
+
 xsd[0]="echo '2014-03-05T23:00:00.000Z' | csv-time --from xsd --to seconds"
 xsd[1]="echo '2014-03-05T23:00:00.000Z' | csv-time --from 'iso-8601-extended' --to seconds"
 
@@ -85,4 +112,3 @@ precision[6]="echo 19700101T000000.000001 | csv-time --from=iso --to=seconds | c
 
 format[0]="echo 20180102T123456 | csv-time --from 'format;%Y%m%dT%H%M%S'"
 format[1]="echo 10m23s | csv-time --from 'format;%Mm%S' --to seconds"
-
diff --git a/csv/test/csv-to-from-bin/expected b/csv/test/csv-to-from-bin/expected
new file mode 100644
index 000000000..2d2e0e82b
--- /dev/null
+++ b/csv/test/csv-to-from-bin/expected
@@ -0,0 +1,4 @@
+#python
+
+for n in range( number_of( test )):
+    expect test[n]/output == test[n]/input
diff --git a/csv/test/csv-to-from-bin/input b/csv/test/csv-to-from-bin/input
new file mode 100644
index 000000000..be15fceac
--- /dev/null
+++ b/csv/test/csv-to-from-bin/input
@@ -0,0 +1,8 @@
+b 0,64,127,-64,-127
+ub 0,64,127,128,255
+w 0,64,127,-64,-127,-1000,1000
+uw 0,64,127,128,255,1000,3000
+i 0,64,127,-64,-127,-1000,1000,-1000000000,1000000000
+ui 0,64,127,128,255,1000,3000,1000000000,3000000000
+l 0,64,127,-64,-127,-1000,1000,-1000000000,1000000000,-10000000000,10000000000
+ul 0,64,127,128,255,1000,3000,1000000000,3000000000,10000000000,30000000000
diff --git a/csv/test/csv-to-from-bin/test b/csv/test/csv-to-from-bin/test
new file mode 100755
index 000000000..25c74455f
--- /dev/null
+++ b/csv/test/csv-to-from-bin/test
@@ -0,0 +1,7 @@
+#!/bin/bash
+
+while read format data; do
+    for x in $( tr , ' ' <<< $data ); do
+        echo $format,$x,$( echo $x | csv-to-bin $format | csv-from-bin $format )
+    done
+done | name-value-from-csv format,input,output --prefix test --line-number
diff --git a/csv/test/format_test.cpp b/csv/test/format_test.cpp
index 97e3929ea..e3a08c7da 100644
--- a/csv/test/format_test.cpp
+++ b/csv/test/format_test.cpp
@@ -41,6 +41,14 @@ TEST( csv, format )
         try { comma::csv::format f( "%" ); EXPECT_TRUE( false ); } catch ( ... ) {}
         try { comma::csv::format f( "blah" ); EXPECT_TRUE( false ); } catch ( ... ) {}
     }
+    {
+        comma::csv::format f( "%ub" );
+        EXPECT_EQ( f.bin_to_csv( f.csv_to_bin( "64" ) ), "64" );
+    }
+    {
+        comma::csv::format f( "%b" );
+        EXPECT_EQ( f.bin_to_csv( f.csv_to_bin( "-64" ) ), "-64" );
+    }
     {
         comma::csv::format f( "%uw" );
         EXPECT_EQ( f.bin_to_csv( f.csv_to_bin( "1234" ) ), "1234" );
@@ -349,6 +357,7 @@ TEST( csv, unstructured )
     EXPECT_EQ( "l,l,l,l", comma::csv::impl::unstructured::guess_format( "1,2,3,4" ).string() );
     EXPECT_EQ( "l,d,t,s[1024]", comma::csv::impl::unstructured::guess_format( "1,2.1,20121212T000000,blah" ).string() );
     comma::csv::options csv;
+    csv.full_xpath = false;
     csv.fields = "a,,,b,,,c";
     csv.delimiter = ',';
     EXPECT_EQ( "l,s[1024],s[1024],s[1024],s[1024],s[1024],t", comma::csv::impl::unstructured::guess_format( "1,,,blah,,,20121212T000000" ).string() );
diff --git a/csv/test/names_test.cpp b/csv/test/names_test.cpp
index 07a41f975..26649b597 100644
--- a/csv/test/names_test.cpp
+++ b/csv/test/names_test.cpp
@@ -245,6 +245,14 @@ TEST( csv, names )
     EXPECT_EQ( join( names< test_struct >( ",,,,no-such-field,,," ), ',' ), ",,,,no-such-field,,," );
 }
 
+TEST( csv, leaves )
+{
+    {
+        std::unordered_map< std::string, std::string > m{ { "A", "D/A" }, { "X", "D/B/X" }, { "Y", "D/B/Y" } };
+        EXPECT_EQ( leaves< test_struct >( "D" ), m );
+    }
+}
+
 TEST( csv, names_optional_element )
 {
     EXPECT_EQ( join( names< struct_with_optional_element >(), ',' ), "x,nested/X,nested/Y" );
diff --git a/csv/test/options_test.cpp b/csv/test/options_test.cpp
index faf3f53ae..7d02c244b 100644
--- a/csv/test/options_test.cpp
+++ b/csv/test/options_test.cpp
@@ -28,6 +28,7 @@
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <gtest/gtest.h>
+#include "../../application/command_line_options.h"
 #include "../../csv/options.h"
 
 namespace comma {
@@ -36,6 +37,7 @@ TEST( options, has_paths )
 {
     {
         comma::csv::options csv;
+        csv.full_xpath = false;
         csv.fields = "a,b/c,d/e/f,p[0],q[0]/x,s/t/y[0],s/t/y[1]/z";
         EXPECT_TRUE( csv.has_paths( "a" ) );
         EXPECT_TRUE( csv.has_paths( "b" ) );
@@ -66,6 +68,7 @@ TEST( options, has_paths )
     }
     {
         comma::csv::options csv;
+        csv.full_xpath = false;
         csv.fields = "a,b/c,d/e/f,p[0],q[0]/x,s/t/y[0],s/t/y[1]/z";
         EXPECT_TRUE( csv.has_some_of_paths( "a" ) );
         EXPECT_TRUE( csv.has_some_of_paths( "a,blah" ) );
@@ -96,5 +99,38 @@ TEST( options, has_paths )
         EXPECT_FALSE( csv.has_some_of_paths( "c" ) );
     }
 }
-    
+
+TEST( options, aliases )
+{
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "" } ), std::unordered_map< std::string, std::string >() );
+        EXPECT_EQ( csv.fields, "" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "" } ), { { "b", "x/y/b" } }, "a,b,b" );
+        EXPECT_EQ( csv.fields, "a,x/y/b,x/y/b" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=a,b,c" } ), std::unordered_map< std::string, std::string >() );
+        EXPECT_EQ( csv.fields, "a,b,c" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=,b,c" } ), { { "b", "x/y/b" } } );
+        EXPECT_EQ( csv.fields, ",x/y/b,c" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=a,b," } ), { { "b", "x/y/b" } } );
+        EXPECT_EQ( csv.fields, "a,x/y/b," );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=a,,b" } ), { { "b", "x/y/b" } } );
+        EXPECT_EQ( csv.fields, "a,,x/y/b" );
+    }
+    {
+        comma::csv::options csv( comma::command_line_options( std::vector< std::string >{ "", "--fields=a,b,c" } ), { { "b", "x/y/b" } } );
+        EXPECT_EQ( csv.fields, "a,x/y/b,c" );
+    }
+    // todo: more tests
+}
+
 } // namespace comma {
diff --git a/csv/test/stream_test.cpp b/csv/test/stream_test.cpp
index 2322d3cde..04a788baf 100644
--- a/csv/test/stream_test.cpp
+++ b/csv/test/stream_test.cpp
@@ -94,14 +94,13 @@ namespace comma { namespace csv { namespace stream_test {
 TEST( csv, container )
 {
 	comma::csv::options csv;
-     csv.full_xpath = true;
 	{
         std::string s( "2,3,,,6" );
         std::istringstream iss( s );
         test_container sample; sample.vector = std::vector< int >( 5, 1 );
         comma::csv::input_stream< test_container > istream( iss, csv, sample );
         const test_container *c = istream.read();
-        EXPECT_EQ( c->vector.size(), 5 );
+        EXPECT_EQ( int( c->vector.size() ), 5 );
         std::string so = comma::join( c->vector, ',' );
         EXPECT_EQ( so, "2,3,1,1,6" );
     }
@@ -112,11 +111,33 @@ TEST( csv, container )
         c.vector[1] = 5;
         c.vector[2] = 3;
         ostream.write( c );
-        EXPECT_EQ( c.vector.size(), 5 );
+        EXPECT_EQ( int( c.vector.size() ), 5 );
         EXPECT_EQ( oss.str(), "1,5,3,1,1\n" );
     }
 }
 
+TEST( csv, passed_ascii )
+{
+    {
+        std::istringstream iss( "1,2\n3,4" );
+        comma::csv::input_stream< test_struct > is( iss );
+        std::ostringstream oss;
+        comma::csv::passed< test_struct > p( is, oss );
+        is.read();
+        p.write();
+        EXPECT_EQ( "1,2\n", oss.str() );
+        is.read();
+        p.write();
+        EXPECT_EQ( "1,2\n3,4\n", oss.str() );
+        is.read();
+        p.write( test_struct( 10, 20 ) );
+        EXPECT_EQ( "1,2\n3,4\n10,20\n", oss.str() );
+    }
+    {
+        // todo! binary test
+    }
+}
+
 } } } // namespace comma { namespace csv { namespace stream_test {
 
 namespace comma { namespace csv { namespace stream_test {
diff --git a/csv/traits.h b/csv/traits.h
index 0aeba617f..35cc0ce40 100644
--- a/csv/traits.h
+++ b/csv/traits.h
@@ -1,36 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_CSV_TRAITS_H_
-#define COMMA_CSV_TRAITS_H_
+#pragma once
 
 #include "../csv/options.h"
 #include "../visiting/traits.h"
@@ -45,12 +17,11 @@ template <> struct traits< comma::csv::options >
         v.apply( "filename", p.filename );
         v.apply( "delimiter", p.delimiter );
         v.apply( "fields", p.fields );
-        v.apply( "full-xpath", p.full_xpath );
         v.apply( "precision", p.precision );
         v.apply( "quote", p.quote ? std::string( 1, *p.quote ) : std::string() );
         v.apply( "flush", p.flush );
         if( p.binary() ) { v.apply( "binary", p.format().string() ); }
-        
+
     }
 
     template < typename Key, class Visitor >
@@ -59,7 +30,6 @@ template <> struct traits< comma::csv::options >
         v.apply( "filename", p.filename );
         v.apply( "delimiter", p.delimiter );
         v.apply( "fields", p.fields );
-        v.apply( "full-xpath", p.full_xpath );
         v.apply( "precision", p.precision );
         std::string quote = p.quote ? std::string( 1, *p.quote ) : std::string();
         v.apply( "quote", p.quote );
@@ -77,5 +47,3 @@ template <> struct traits< comma::csv::options >
 };
 
 } } // namespace comma { namespace visiting {
-
-#endif // COMMA_CSV_TRAITS_H_
diff --git a/debian/changelog b/debian/changelog
new file mode 100644
index 000000000..012c9b8de
--- /dev/null
+++ b/debian/changelog
@@ -0,0 +1,5 @@
+comma (1.1.0-0ppa0) jammy; urgency=low
+
+  * substantially more functionality and bug fixes in utilities like csv-paste, io-cat, etc
+
+ -- Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>  Mon, 5 Feb 2024 12:44:00 +1000
diff --git a/debian/control b/debian/control
new file mode 100644
index 000000000..5a3e13941
--- /dev/null
+++ b/debian/control
@@ -0,0 +1,14 @@
+Source: comma
+Standards-Version: 4.6.0.1
+Section: devel
+Priority: optional
+Maintainer: Vsevolod Vlaskine <vsevolod.vlaskine@gmail.com>
+Build-Depends: cmake, libc-dev, libboost-all-dev (>=1.65)
+Homepage: https://gitlab.com/orthographic/comma/-/wikis/home
+
+Package: comma
+Architecture: any
+Depends: libc-dev, libboost-all-dev (>=1.65), gawk, recode, socat
+Description: generic libraries and cli for csv and fixed-width data processing
+  comma, libraries and command line utilities for efficient streaming and
+  processing of comma-separated (csv) and fixed-width binary data
diff --git a/debian/copyright b/debian/copyright
new file mode 100644
index 000000000..e21faf1d4
--- /dev/null
+++ b/debian/copyright
@@ -0,0 +1,32 @@
+####################################################################
+#                              comma                               #
+####################################################################
+
+Copyright (c) 2011 The University of Sydney
+Copyright (c) 2018-2022 Vsevolod Vlaskine
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are met:
+1. Redistributions of source code must retain the above copyright
+   notice, this list of conditions and the following disclaimer.
+2. Redistributions in binary form must reproduce the above copyright
+   notice, this list of conditions and the following disclaimer in the
+   documentation and/or other materials provided with the distribution.
+3. Neither the name of the University of Sydney nor the
+   names of its contributors may be used to endorse or promote products
+   derived from this software without specific prior written permission.
+
+NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED
+WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
diff --git a/debian/rules b/debian/rules
new file mode 100755
index 000000000..22df25864
--- /dev/null
+++ b/debian/rules
@@ -0,0 +1,60 @@
+#!/usr/bin/make -f
+
+BUILDDIR=build_dir
+
+# debian multiarch triplet of the host, e.g. x86_64-linux-gnu; queried rather than
+# hard-coded, so that the package also builds on architectures other than amd64
+DEB_HOST_MULTIARCH ?= $(shell dpkg-architecture -qDEB_HOST_MULTIARCH)
+
+# secondly called by launchpad
+# configure and compile in $(BUILDDIR); installation prefix is debian/tmp/usr
+build:
+	mkdir -p $(BUILDDIR)
+	cd $(BUILDDIR) && cmake .. \
+		-DCMAKE_INSTALL_PREFIX=../debian/tmp/usr \
+		-DCMAKE_BUILD_TYPE=Release \
+		-DBUILD_SHARED_LIBS=ON \
+		-DBUILD_PYTHON_PACKAGES=OFF \
+		-DADD_PYTHON_PACKAGES_TO_RPM=OFF \
+		-DBUILD_TESTS=OFF \
+		-DINSTALL_BASH_COMPLETION=OFF \
+		-DINSTALL_TESTS=OFF \
+		-Dcomma_INSTALL_LIB_DIR=lib/$(DEB_HOST_MULTIARCH) \
+		-Dcomma_INSTALL_PACKAGE_DIR=lib/$(DEB_HOST_MULTIARCH)/cmake/comma \
+		-Dcomma_INSTALL_RUN_POST_INSTALL=OFF \
+		-Dcomma_BUILD_XML=OFF \
+		-Dcomma_BUILD_ZEROMQ=OFF \
+		-Dcomma_build_io_rabbit_cat=OFF
+	cd $(BUILDDIR) && $(MAKE)
+
+# thirdly called by launchpad
+binary: binary-indep binary-arch
+
+binary-indep:
+	# nothing to be done
+
+# todo
+#   ! try running rules with make locally
+#   - try cpack (which sucks)
+#   for now super quick and dirty:
+#       mkdir -p debian/tmp/usr/lib
+#       cp -r $(BUILDDIR)/lib/$(DEB_HOST_MULTIARCH) debian/tmp/usr/lib
+#   there seems to be a bug, most likely in generate_comma_config.cmake
+#   that installs libraries in build instead of debian/tmp
+#   (cannot reproduce it locally: locally, installation works,
+#   but on launchpad it does not)
+binary-arch:
+	cd $(BUILDDIR) && $(MAKE) install
+	mkdir -p debian/tmp/usr/lib
+	cp -r $(BUILDDIR)/lib/$(DEB_HOST_MULTIARCH) debian/tmp/usr/lib
+	mkdir -p debian/tmp/DEBIAN
+	dpkg-gencontrol -pcomma
+	dpkg --build debian/tmp ..
+
+# firstly called by launchpad
+clean:
+	rm -rf $(BUILDDIR)
+	rm -f debian/files
+
+# build is listed too: a file or directory named build must not make the target look up to date
+.PHONY: binary binary-arch binary-indep build clean
diff --git a/dispatch/test/CMakeLists.txt b/dispatch/test/CMakeLists.txt
index aae4ec058..25f6a18aa 100644
--- a/dispatch/test/CMakeLists.txt
+++ b/dispatch/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT dispatch )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# gtest executable for the dispatch kit, built from all test/*test.cpp files
+set( KIT dispatch )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} ${GTEST_BOTH_LIBRARIES} pthread )
+
+# register with ctest; the test is run from ${PROJECT_BINARY_DIR}/bin
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# installed only on request, into comma_CPP_TESTS_INSTALL_DIR
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/dynamic/CMakeLists.txt b/dynamic/CMakeLists.txt
new file mode 100644
index 000000000..c5d406906
--- /dev/null
+++ b/dynamic/CMakeLists.txt
@@ -0,0 +1,18 @@
+# header-only kit comma_dynamic: nothing is compiled here, the custom target only
+# carries the file list and is ordered after comma_base
+SET( PROJECT "dynamic" )
+SET( TARGET_NAME comma_${PROJECT} )
+
+FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp )
+FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h )
+SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
+# SOURCES keyword is required: bare arguments after the target name are taken as
+# the command to run, i.e. building the target would try to execute a header
+ADD_CUSTOM_TARGET( ${TARGET_NAME} SOURCES ${source} ${includes} )
+ADD_DEPENDENCIES( ${TARGET_NAME} comma_base )
+
+INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+
+IF( comma_BUILD_TESTS )
+    ADD_SUBDIRECTORY( test )
+ENDIF( comma_BUILD_TESTS )
diff --git a/dynamic/shared_library.h b/dynamic/shared_library.h
new file mode 100644
index 000000000..ac908cbb0
--- /dev/null
+++ b/dynamic/shared_library.h
@@ -0,0 +1,103 @@
+// Copyright (c) 2023 Mission Systems Pty Ltd
+
+/// @authors aspen eyers, vsevolod vlaskine
+
+#pragma once
+#include <dlfcn.h>
+#include <memory>
+#include <string>
+#include <utility>
+#include <vector>
+#include "../base/exception.h"
+
+namespace comma { namespace dynamic {
+
+/// owner of a shared library handle obtained with dlopen();
+/// the handle is released with dlclose() on destruction
+class shared_library
+{
+    public:
+        /// load shared library
+        /// @param lib library file name, e.g. libfoo.so
+        /// @param link_directories directories to try first, in the given order;
+        ///                         if the library cannot be loaded from any of them,
+        ///                         dlopen() is called on lib as is
+        /// throws comma::exception, if the library could not be loaded
+        shared_library( const std::string& lib, std::vector<std::string> link_directories={} );
+
+        /// handle has a single owner: copying would lead to dlclose() called twice
+        shared_library( const shared_library& ) = delete;
+        shared_library& operator=( const shared_library& ) = delete;
+
+        shared_library( shared_library&& rhs ) noexcept : handle_( rhs.handle_ ), lib_( std::move( rhs.lib_ ) ) { rhs.handle_ = nullptr; }
+        shared_library& operator=( shared_library&& rhs ) noexcept;
+
+        ~shared_library() { close_(); }
+
+        /// call a factory function exported by the library
+        /// @param library_symbol name of the function, which is expected to have
+        ///                       the signature T* f( Args... ); this cannot be checked
+        /// @param args arguments passed to the factory function
+        /// @return pointer returned by the factory function
+        /// throws comma::exception, if the symbol is not found
+        template < typename T, typename... Args >
+        T* make( const std::string& library_symbol, Args... args ) const;
+
+    private:
+        void* handle_{ nullptr };
+        std::string lib_;
+        bool open_( const std::string& path, std::string& errors );
+        void close_() { if( handle_ ) { dlclose( handle_ ); handle_ = nullptr; } }
+};
+
+inline bool shared_library::open_( const std::string& path, std::string& errors )
+{
+    dlerror(); // clear stale error state, so that the message below belongs to this attempt
+    handle_ = dlopen( path.c_str(), RTLD_LAZY );
+    if( handle_ ) { return true; }
+    const char* error = dlerror();
+    if( !errors.empty() ) { errors += "; "; }
+    errors += error ? error : "unknown error";
+    return false;
+}
+
+inline shared_library::shared_library( const std::string& lib, std::vector<std::string> link_directories )
+    : lib_( lib )
+{
+    std::string errors; // collected over all attempts, reported only if all of them fail
+    for( auto& dir: link_directories )
+    {
+        if( dir.empty() ) { continue; } // an empty entry is covered by the fallback below
+        if( dir.back() != '/' ) { dir += '/'; }
+        if( open_( dir + lib, errors ) ) { return; }
+    }
+    // fallback: let dlopen() apply its own search rules
+    if( open_( lib, errors ) ) { return; }
+    COMMA_ASSERT( handle_ != nullptr, "failed to load shared library \"" + lib + "\": " + errors );
+}
+
+inline shared_library& shared_library::operator=( shared_library&& rhs ) noexcept
+{
+    if( this == &rhs ) { return *this; }
+    close_();
+    handle_ = rhs.handle_;
+    lib_ = std::move( rhs.lib_ );
+    rhs.handle_ = nullptr;
+    return *this;
+}
+
+template < typename T, typename... Args >
+inline T* shared_library::make( const std::string& library_symbol, Args... args ) const
+{
+    dlerror(); // clear stale error state, so that the message below belongs to this dlsym() call
+    void* symbol = dlsym( handle_, library_symbol.c_str() );
+    if( symbol == nullptr )
+    {
+        const char* error = dlerror(); // may be null, thus never streamed or concatenated unchecked
+        COMMA_ASSERT( false, "Shared library loading failed: could not find "+library_symbol+" symbol; on library: \"" + lib_ + "\"" + ( error ? std::string( ": " ) + error : std::string() ) );
+    }
+    typedef T* ( *factory_t )( Args... );
+    return reinterpret_cast< factory_t >( symbol )( args... );
+}
+
+} } // namespace comma { namespace dynamic {
diff --git a/dynamic/test/CMakeLists.txt b/dynamic/test/CMakeLists.txt
new file mode 100644
index 000000000..1353ef27e
--- /dev/null
+++ b/dynamic/test/CMakeLists.txt
@@ -0,0 +1,16 @@
+set( KIT dynamic )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+
+# shared library with the factory functions that the tests load at run time
+add_library( comma_dynamic_test_classes SHARED shared_library_test_classes.cpp )
+target_compile_definitions( comma_dynamic_test_classes PRIVATE DYNAMICLIB_EXPORTS )
+
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread ${CMAKE_DL_LIBS} )
+# the library is not linked in, thus the build order has to be stated explicitly
+add_dependencies( ${test_name} comma_dynamic_test_classes )
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/dynamic/test/include_test.cpp b/dynamic/test/include_test.cpp
new file mode 100644
index 000000000..dbe7b6d29
--- /dev/null
+++ b/dynamic/test/include_test.cpp
@@ -0,0 +1,73 @@
+// Copyright (c) 2023 aspen eyers
+
+#include <dlfcn.h>
+#include <memory>
+#include <string>
+#include <vector>
+#include <gtest/gtest.h>
+#include "../shared_library.h"
+#include "../../base/exception.h"
+#include "shared_library_test_detail.h"
+
+namespace comma {
+
+namespace {
+
+const char* const library_name = "libcomma_dynamic_test_classes.so";
+
+// directories searched for the test library, relative to the working directory
+// of the test rather than to a developer's home directory
+// NOTE(review): assumes the test is run from <build>/bin and libraries are built
+// into <build>/lib -- confirm or pass the directory from cmake
+std::vector< std::string > library_directories() { return { "../lib", "lib", "." }; }
+
+} // namespace {
+
+TEST( initialise, no_args )
+{
+    comma::dynamic::shared_library library( library_name, library_directories() );
+    std::unique_ptr< comma::dynamic::test::simple > p( library.make< comma::dynamic::test::simple >( "comma_dynamic_test_create_simple" ) );
+    EXPECT_TRUE( p != nullptr );
+}
+
+TEST( initialise, args )
+{
+    comma::dynamic::shared_library library( library_name, library_directories() );
+    std::unique_ptr< comma::dynamic::test::point > p( library.make< comma::dynamic::test::point, float, float, float >( "comma_dynamic_test_create_point", 1.0, 2.0, 3.0 ) );
+    EXPECT_EQ( p->x, 1.0 );
+    EXPECT_EQ( p->y, 2.0 );
+    EXPECT_EQ( p->z, 3.0 );
+}
+
+TEST( initialise, polymorphic )
+{
+    comma::dynamic::shared_library library( library_name, library_directories() );
+    std::unique_ptr< comma::dynamic::test::polymorphic_point > p( library.make< comma::dynamic::test::polymorphic_point, float, float, float >( "comma_dynamic_test_create_polymorphic_point", 1.0, 2.0, 3.0 ) );
+    EXPECT_EQ( p->get_x(), 1.0 );
+    EXPECT_EQ( p->get_y(), 2.0 );
+    EXPECT_EQ( p->get_z(), 3.0 );
+}
+
+TEST( initialise, vector )
+{
+    std::vector< std::unique_ptr< comma::dynamic::shared_library > > libraries;
+    libraries.emplace_back( new comma::dynamic::shared_library( library_name, library_directories() ) );
+    std::unique_ptr< comma::dynamic::test::polymorphic_point > p( libraries.back()->make< comma::dynamic::test::polymorphic_point, float, float, float >( "comma_dynamic_test_create_polymorphic_point", 1.0, 2.0, 3.0 ) );
+    EXPECT_EQ( p->get_x(), 1.0 );
+    EXPECT_EQ( p->get_y(), 2.0 );
+    EXPECT_EQ( p->get_z(), 3.0 );
+}
+
+TEST( initialise, failure_case )
+{
+    comma::dynamic::shared_library library( library_name, library_directories() );
+    EXPECT_THROW({library.make< comma::dynamic::test::simple >( "non_existant_symbol" ); }, comma::exception);
+}
+
+} // namespace comma {
+
+int main( int argc, char* argv[] )
+{
+    ::testing::InitGoogleTest(&argc, argv);
+    return RUN_ALL_TESTS();
+}
diff --git a/dynamic/test/shared_library_test_classes.cpp b/dynamic/test/shared_library_test_classes.cpp
new file mode 100644
index 000000000..2f931c638
--- /dev/null
+++ b/dynamic/test/shared_library_test_classes.cpp
@@ -0,0 +1 @@
+#include "shared_library_test_classes.h"
diff --git a/dynamic/test/shared_library_test_classes.h b/dynamic/test/shared_library_test_classes.h
new file mode 100644
index 000000000..dbb456dc6
--- /dev/null
+++ b/dynamic/test/shared_library_test_classes.h
@@ -0,0 +1,7 @@
+#pragma once 
+#include "shared_library_test_detail.h"
+#define DYNAMICLIB_API
+
+extern "C" DYNAMICLIB_API comma::dynamic::test::simple* comma_dynamic_test_create_simple(){ return new comma::dynamic::test::simple(); }
+extern "C" DYNAMICLIB_API comma::dynamic::test::point* comma_dynamic_test_create_point(float x, float y, float z){ return new comma::dynamic::test::point(x, y, z); }
+extern "C" DYNAMICLIB_API comma::dynamic::test::polymorphic_point* comma_dynamic_test_create_polymorphic_point(float x, float y, float z){ return new comma::dynamic::test::polymorphic_point(x, y, z); }
diff --git a/dynamic/test/shared_library_test_detail.h b/dynamic/test/shared_library_test_detail.h
new file mode 100644
index 000000000..f8eadf39d
--- /dev/null
+++ b/dynamic/test/shared_library_test_detail.h
@@ -0,0 +1,34 @@
+#pragma once
+#include <string>
+
+namespace comma { namespace dynamic { namespace test {
+
+class simple{
+    std::string name{"hello world"};
+};
+
+class point{
+    public:
+        point() : x(0), y(0), z(0) {}
+        point(float x, float y, float z) : x(x), y(y), z(z) {}
+        float x;
+        float y;
+        float z;
+};
+
+class polymorphic_point {
+public:
+    polymorphic_point() : x(0), y(0), z(0) {}
+    polymorphic_point(float x, float y, float z) : x(x), y(y), z(z) {}
+    virtual ~polymorphic_point() {}
+    virtual float get_x() const { return x; }
+    virtual float get_y() const { return y; }
+    virtual float get_z() const { return z; }
+
+private:
+    float x;
+    float y;
+    float z;
+};
+
+} } } // namespace comma { namespace dynamic { namespace test {
diff --git a/etc/bash_completion.d/CMakeLists.txt b/etc/bash_completion.d/CMakeLists.txt
index 78be444a2..806af761c 100644
--- a/etc/bash_completion.d/CMakeLists.txt
+++ b/etc/bash_completion.d/CMakeLists.txt
@@ -1,9 +1,6 @@
 IF (UNIX)
-    OPTION( INSTALL_BASH_COMPLETION "Install the BASH completion scripts." ON )
-    SET( INSTALL_BASH_COMPLETION_DIR /etc/bash_completion.d
-         CACHE PATH "Location in which to install the bash completion scripts.")
+    SET( INSTALL_BASH_COMPLETION_DIR /etc/bash_completion.d CACHE PATH "Location in which to install the bash completion scripts.")
     IF( INSTALL_BASH_COMPLETION )
         INSTALL(FILES comma DESTINATION ${INSTALL_BASH_COMPLETION_DIR} )
     ENDIF()
 ENDIF()
-
diff --git a/etc/bash_completion.d/comma b/etc/bash_completion.d/comma
index 6dd9eec80..349dd15cf 100644
--- a/etc/bash_completion.d/comma
+++ b/etc/bash_completion.d/comma
@@ -1,5 +1,5 @@
 # This file is part of comma, a generic and flexible library
-# Copyright (c) 2011 The University of Sydney
+# Copyright (c) 2015 The University of Sydney
 # All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
@@ -36,7 +36,6 @@ _comma_opts()
 --delimiter
 --fields
 --flush
---full-xpath
 --help
 --output-fields
 --precision
@@ -114,7 +113,7 @@ complete -F _csv_time csv-time
 complete -F _csv_update csv-update
 
 # todo
-#     - add --bash-completion to csv-units, csv-update, comma-test-_comma_test_run
+#     - add --bash-completion to csv-update
 #     - install in the installation directory, if possible (if not, /etc is OK)
 
 _comma_bash_completion()
@@ -137,7 +136,9 @@ _comma_bash_completion()
 complete -F _comma_bash_completion comma-test-enforce
 complete -F _comma_bash_completion comma-test-run
 complete -F _comma_bash_completion csv-calc
+complete -F _comma_bash_completion csv-play
 complete -F _comma_bash_completion csv-repeat
 complete -F _comma_bash_completion csv-time-join
 complete -F _comma_bash_completion csv-units
 complete -F _comma_bash_completion io-bandwidth
+complete -F _comma_bash_completion io-topics
diff --git a/examples.md b/examples.md
new file mode 100644
index 000000000..e0c521e7b
--- /dev/null
+++ b/examples.md
@@ -0,0 +1,28 @@
+# csv
+
+## accumulate values
+
+### take velocities, calculate distance
+
+generate a sample file with the velocity in m/sec at each given time:
+
+```bash
+cat <<eof > velocities.csv
+20200101T000000,0.7
+20200101T000001,1.1
+20200101T000002,1.1
+20200101T000003,0.9
+20200101T000004,1.3
+eof
+
+```
+
+append distance travelled to each data point:
+
+```bash
+cat velocities.csv \
+    | csv-shuffle --fields t,v --output-fields t,t,v \
+    | csv-time --to seconds --fields ,t \
+    | csv-eval --init-values "prev=0;sum=0" --fields ,cur,v "sum+=(cur-prev)*(prev>0)*v;prev=cur" \
+    | csv-shuffle --fields t,,v,d --output-fields t,v,d
+```
diff --git a/io/CMakeLists.txt b/io/CMakeLists.txt
index 26997da0b..a7ddc3c63 100644
--- a/io/CMakeLists.txt
+++ b/io/CMakeLists.txt
@@ -1,7 +1,7 @@
 SET( PROJECT "io" )
 SET( TARGET_NAME comma_${PROJECT} )
 SET( dir ${SOURCE_CODE_BASE_DIR}/${PROJECT} )
-FILE( GLOB source   ${dir}/*.cpp) 
+FILE( GLOB source   ${dir}/*.cpp)
 FILE( GLOB includes ${dir}/*.h)
 FILE( GLOB impl_source   ${dir}/impl/*.cpp)
 FILE( GLOB impl_includes ${dir}/impl/*.h)
@@ -17,7 +17,7 @@ ELSE( comma_BUILD_ZEROMQ )
 ENDIF( comma_BUILD_ZEROMQ )
 
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_string )
+target_link_libraries( ${TARGET_NAME} ${Boost_LIBRARIES} ${ZeroMQ_LIBRARY} comma_base comma_name_value comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
@@ -32,7 +32,7 @@ INSTALL(
 if( comma_BUILD_APPLICATIONS )
     add_subdirectory( applications )
 endif( comma_BUILD_APPLICATIONS )
-                                           
+
 IF( comma_BUILD_TESTS )
     ADD_SUBDIRECTORY( test )
 ENDIF( comma_BUILD_TESTS )
diff --git a/io/applications/CMakeLists.txt b/io/applications/CMakeLists.txt
index da59b5f07..336357f5f 100644
--- a/io/applications/CMakeLists.txt
+++ b/io/applications/CMakeLists.txt
@@ -6,6 +6,7 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 IF( comma_BUILD_ZEROMQ )
 ADD_EXECUTABLE( zero-cat ${dir}/zero-cat.cpp )
 TARGET_LINK_LIBRARIES ( zero-cat ${ZeroMQ_LIBRARY} comma_io comma_application ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( zero-cat PROPERTIES LINK_FLAGS_RELEASE -s )
 INSTALL( TARGETS zero-cat
          RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR}
          COMPONENT Runtime )
@@ -13,43 +14,55 @@ ENDIF( comma_BUILD_ZEROMQ )
 
 add_executable( io-buffer ${dir}/io-buffer.cpp )
 target_link_libraries( io-buffer comma_application comma_io comma_csv comma_base ) # profiler )
+set_target_properties( io-buffer PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS io-buffer RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 if( NOT WIN32 )
     add_executable( io-bandwidth ${dir}/io-bandwidth.cpp )
     target_link_libraries( io-bandwidth comma_application comma_io )
+    set_target_properties( io-bandwidth PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-bandwidth RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
     add_executable( io-cat ${dir}/io-cat.cpp )
     target_link_libraries( io-cat comma_application comma_io comma_csv comma_base ) # profiler )
+    set_target_properties( io-cat PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-cat RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
     add_executable( io-line io-line.cpp )
     target_link_libraries ( io-line comma_application )
+    set_target_properties( io-line PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-line RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
     add_executable( io-ls ${dir}/io-ls.cpp )
     target_link_libraries( io-ls comma_application comma_csv comma_xpath )
+    set_target_properties( io-ls PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-ls RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
     add_executable( io-publish ${dir}/io-publish.cpp )
-    target_link_libraries( io-publish comma_base comma_io comma_application ) # profiler )
+    target_link_libraries( io-publish comma_base comma_io comma_application comma_xpath comma_name_value ) # profiler )
+    set_target_properties( io-publish PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-publish RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
     add_executable( io-tee ${dir}/io-tee.cpp )
     target_link_libraries( io-tee comma_application comma_io comma_csv comma_base ) # profiler )
+    set_target_properties( io-tee PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-tee RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
     add_executable( udp-client ${dir}/udp-client.cpp )
-    target_link_libraries( udp-client comma_application comma_io comma_csv comma_base ) # profiler )
+    target_link_libraries( udp-client comma_application comma_name_value comma_io comma_csv comma_base comma_string ) # profiler )
+    set_target_properties( udp-client PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS udp-client RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     
     add_executable( io-console ${dir}/io-console.cpp )
     target_link_libraries( io-console comma_base comma_io comma_application ) # profiler )
+    set_target_properties( io-console PROPERTIES LINK_FLAGS_RELEASE -s )
     install( TARGETS io-console RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 endif( NOT WIN32 )
 
 install( PROGRAMS io-topics DESTINATION ${comma_INSTALL_BIN_DIR})
-install( PROGRAMS rabbit-cat DESTINATION ${comma_INSTALL_BIN_DIR})
+option( comma_build_io_rabbit_cat "build rabbit-cat" ON )
+if( comma_build_io_rabbit_cat )
+    install( PROGRAMS rabbit-cat DESTINATION ${comma_INSTALL_BIN_DIR})
+endif( comma_build_io_rabbit_cat )
 install( PROGRAMS zero-publish DESTINATION ${comma_INSTALL_BIN_DIR})
 
diff --git a/io/applications/io-bandwidth.cpp b/io/applications/io-bandwidth.cpp
index 86ebfef73..6db3e413e 100644
--- a/io/applications/io-bandwidth.cpp
+++ b/io/applications/io-bandwidth.cpp
@@ -31,12 +31,13 @@
 
 #include <iostream>
 #include <numeric>
+#include <sstream>
 #include <boost/algorithm/string/replace.hpp>
 #include <boost/array.hpp>
 #include <boost/circular_buffer.hpp>
 #include <boost/thread.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
+#include "../../base/none.h"
 #include "../../io/select.h"
 #include "../../io/stream.h"
 
@@ -45,7 +46,7 @@ static const double default_window_resolution = 0.1f;
 static const double default_update_interval = 1.0f;
 static const char default_delimiter = ',';
 static const std::string standard_output_fields="timestamp,received_bytes,bytes_per_second/all_time,bytes_per_second/window";
-static const std::string extended_output_fields="timestamp,received_bytes,bytes_per_second/all_time,bytes_per_second/window,records_per_second/all_time,records_per_second/window";
+static const std::string extended_output_fields="timestamp,received_bytes,bytes_per_second/all_time,bytes_per_second/window,records_per_second/all_time,records_per_second/window,progress";
 
 static void bash_completion( unsigned const ac, char const * const * av )
 {
@@ -66,12 +67,17 @@ void usage( bool verbose = false )
     std::cerr << "usage: io-bandwidth [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
+    std::cerr << "    --delimiter,-d <delimiter>: default ','" << std::endl;
+    std::cerr << "    --output-fields: list output fields and exit" << std::endl;
+    std::cerr << "    --output-progress,--progress: output only progress indicator; todo: --fields=<output-fields>" << std::endl;
+    std::cerr << "    --porcelain: human-readable output" << std::endl;
+    std::cerr << "    --porcelain-title,--title=<title>; default=io-bandwidth: output will be prefixed with <title>" << std::endl;
+    std::cerr << "    --resolution,-r=[<n>]: sliding window resolution; default=" << default_window_resolution << "s" << std::endl;
     std::cerr << "    --size,-s=[<bytes>]: specify size of one record of input data" << std::endl;
-    std::cerr << "    --window,-w=[<n>]: sliding window; default=" << default_window << "s" << std::endl;
+    std::cerr << "    --total-count=[<n>]: total expected record count, if present, output progress in percent" << std::endl;
+    std::cerr << "    --total-size=[<bytes>]: total expected size in bytes, if present, output progress in percent" << std::endl;
     std::cerr << "    --update,-u=[<n>]: update interval; default=" << default_update_interval << "s" << std::endl;
-    std::cerr << "    --resolution,-r=[<n>]: sliding window resolution; default=" << default_window_resolution << "s" << std::endl;
-    std::cerr << "    --output-fields: list output fields and exit" << std::endl;
-    std::cerr << "    --delimiter,-d <delimiter>: default ','" << std::endl;
+    std::cerr << "    --window,-w=[<n>]: sliding window; default=" << default_window << "s" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    The sliding window consists of a number of buckets. The width of each" << std::endl;
     std::cerr << "    bucket is given by --resolution, and there are sufficient buckets to" << std::endl;
@@ -105,7 +111,15 @@ void usage( bool verbose = false )
     std::cerr << "            dd if=/dev/urandom bs=100 count=1 2> /dev/null; sleep 0.1" << std::endl;
     std::cerr << "        done | io-bandwidth 2> >( io-publish tcp:8888 ) | hexdump" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
+    std::cerr << "    show values in terminal title bar" << std::endl;
+    std::cerr << "        yes | csv-repeat --pace --period 0.001 | head -n10000 \\" << std::endl;
+    std::cerr << "            | io-bandwidth --total-count 10000 --size 2 \\" << std::endl;
+    std::cerr << "                           --porcelain --titlebar >/dev/null" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "    show progress indicator in terminal title bar" << std::endl;
+    std::cerr << "        yes | csv-repeat --pace --period 0.001 | head -n50000 \\" << std::endl;
+    std::cerr << "            | io-bandwidth --total-count 10000 --size 2 \\" << std::endl;
+    std::cerr << "                           --porcelain --titlebar --progress --title='counting yes' >/dev/null" << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
@@ -120,42 +134,47 @@ int main( int ac, char** av )
     {
         comma::command_line_options options( ac, av, usage );
         if( options.exists( "--bash-completion" ) ) bash_completion( ac, av );
-
         if( options.exists( "--output-fields" ))
         {
             if( options.exists( "--size,-s" )) { std::cout << extended_output_fields << std::endl; }
             else { std::cout << standard_output_fields << std::endl; }
             return 0;
         }
-
+        options.assert_mutually_exclusive( "--total-size", "--total-count" );
         // Functionally equivalent to boost::optional< std::size_t > record_size
         // but eliminates the gcc "maybe-uninitialized" warning
-        boost::optional< std::size_t > record_size = boost::make_optional< std::size_t >( false, 0 );
+        boost::optional< std::size_t > record_size = comma::silent_none< std::size_t >();
         if( options.exists( "--size,-s" )) { record_size = options.value< std::size_t >( "--size,-s" ); }
-
+        auto total_count = options.optional< std::uint64_t >( "--total-count" );
+        auto total_size = options.optional< std::uint64_t >( "--total-size" );
+        bool output_progress = options.exists( "--output-progress,--progress" ); // todo! --fields <output fields>
+        COMMA_ASSERT_BRIEF( !total_count || record_size, "--total-count given, please specify --size" );
+        COMMA_ASSERT_BRIEF( !output_progress || total_count || total_size, "--output-progress given; please specify --total-count or --total-size" );
         boost::posix_time::time_duration update_interval = boost::posix_time::microseconds( static_cast<unsigned int> (options.value< double >( "--update,-u", default_update_interval ) * 1000000) );
         double window = options.value< double >( "--window,-w", default_window );
         double bucket_width = options.value< double >( "--resolution,-r", default_window_resolution );
         boost::posix_time::time_duration bucket_duration = boost::posix_time::microseconds( static_cast<unsigned int> (bucket_width * 1000000) );
         char delimiter = options.value( "--delimiter,-d", default_delimiter );
-
+        bool porcelain = options.exists( "--porcelain" );
+        //std::pair< unsigned int, std::string > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? "-\\|/" : "" };
+        //std::pair< unsigned int, std::vector< std::string > > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? std::vector< std::string >{ "|<>       |", "| <>      |", "|  <>     |", "|   <>    |", "|    <>   |", "|     <>  |", "|      <> |", "|       <>|", "|      <> |", "|     <>  |", "|    <>   |", "|   <>    |", "|  <>     |", "| <>      |" } : std::vector< std::string >{} };
+        std::pair< unsigned int, std::vector< std::string > > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? std::vector< std::string >{ "[>________]", "[_>_______]", "[__>______]", "[___>_____]", "[____>____]", "[_____>___]", "[______>__]", "[_______>_]", "[________>]", "[________<]", "[_______<_]", "[______<__]", "[_____<___]", "[____<____]", "[___<_____]", "[__<______]", "[_<_______]", "[<________]" } : std::vector< std::string >{} };
+        //std::pair< unsigned int, std::vector< std::string > > porcelain_spinner{ 0, options.exists( "--porcelain-spinner,--spinner" ) ? std::vector< std::string >{ "\\/\\/\\/       ", " /\\/\\/\\      ", "  \\/\\/\\/     ", "   /\\/\\/\\    ", "  \\/\\/\\/   ", "     /\\/\\/\\  ", "    \\/\\/\\/   ", "   /\\/\\/\\    ", "  \\/\\/\\/     ", " /\\/\\/\\      " } : std::vector< std::string >{} };
+        std::string porcelain_title = options.value< std::string >( "--porcelain-title,--title", "io-bandwidth" ); // option name must match the spelling documented in usage()
+        if( porcelain ) { delimiter = ' '; }
         comma::io::select select;
         select.read().add( comma::io::stdin_fd );
         comma::io::istream is( "-", comma::io::mode::binary );
-
         unsigned long long total_bytes = 0;
         unsigned int bucket_bytes = 0;
         boost::circular_buffer< unsigned int > window_buckets( std::ceil( window / bucket_width ));
-
         boost::posix_time::ptime start_time = boost::posix_time::microsec_clock::universal_time();
         boost::posix_time::ptime next_update = start_time + update_interval;
         boost::posix_time::ptime next_bucket = start_time + bucket_duration;
-
         bool end_of_stream = false;
         boost::array< char, 65536 > buffer;
         std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
         std::cin.tie( NULL ); // std::cin is tied to std::cout by default
-        
         while( !end_of_stream )
         {
             select.wait( wait_interval );
@@ -170,9 +189,7 @@ int main( int ac, char** av )
                 std::cout.write( &buffer[0], size );
                 std::cout.flush();
             }
-
             boost::posix_time::ptime now = boost::posix_time::microsec_clock::universal_time();
-
             if( now >= next_bucket )
             {
                 window_buckets.push_back( bucket_bytes );
@@ -185,29 +202,35 @@ int main( int ac, char** av )
                     next_bucket = now + bucket_duration;
                 }
             }
-
             if( now >= next_update && !window_buckets.empty() )
             {
                 double elapsed_time = double( ( now - start_time ).total_milliseconds() ) / 1000.0f;
-                double bandwidth = (double)total_bytes / elapsed_time;
-                double window_bandwidth = (double)std::accumulate( window_buckets.begin()
-                                                                 , window_buckets.end()
-                                                                 , 0.0f )
-                                                  / window_buckets.size() / bucket_width;
-
-                std::cerr << boost::posix_time::to_iso_string( now )
-                          << std::fixed
-                          << delimiter << total_bytes
-                          << delimiter << bandwidth
-                          << delimiter << window_bandwidth;
-                std::cerr.unsetf( std::ios_base::floatfield );
-                if( record_size )
+                double bandwidth = double( total_bytes ) / elapsed_time;
+                double window_bandwidth = static_cast< double >( std::accumulate( window_buckets.begin(), window_buckets.end(), 0.0f ) ) / window_buckets.size() / bucket_width;
+                std::ostringstream oss;
+                if( porcelain ) { oss << porcelain_title << ": "; }
+                if( !output_progress )
                 {
-                    std::cerr << delimiter << bandwidth / *record_size
-                              << delimiter << window_bandwidth / *record_size;
+                    oss << ( porcelain ? "time: " : "" ) << boost::posix_time::to_iso_string( now )
+                        << std::fixed
+                        << delimiter << ( porcelain ? "bytes: " : "" ) << total_bytes
+                        << delimiter << ( porcelain ? "bandwidth: " : "" ) << bandwidth
+                        << delimiter << ( porcelain ? "window-bandwidth: " : "" ) << window_bandwidth;
+                    oss.unsetf( std::ios_base::floatfield );
+                    if( record_size )
+                    {
+                        oss << delimiter << ( porcelain ? "record-rate: " : "" ) << bandwidth / *record_size
+                            << delimiter << ( porcelain ? "window-rate: " : "" ) << window_bandwidth / *record_size;
+                    }
                 }
-                std::cerr << std::endl;
-
+                if( total_count ) { oss << delimiter << ( porcelain ? "complete: " : "" ) << ( total_bytes / *record_size * 100 / *total_count ) << ( porcelain ? "%" : "" ); }
+                if( total_size ) { oss << delimiter << ( porcelain ? "complete: " : "" ) << ( total_bytes * 100 / *total_size ) << ( porcelain ? "%" : "" ); }
+                if( output_progress )
+                {
+                    if( !porcelain_spinner.second.empty() ) { oss << " " << porcelain_spinner.second[porcelain_spinner.first++]; }
+                    if( porcelain_spinner.first == porcelain_spinner.second.size() ) { porcelain_spinner.first = 0; }
+                }
+                COMMA_TITLE_BARE( oss.str() );
                 next_update += update_interval;
                 // If there's been a large pause (for some reason), catch up
                 if( now > next_update ) { next_update = now + update_interval; }
diff --git a/io/applications/io-buffer.cpp b/io/applications/io-buffer.cpp
index f2901cfb4..4463bbd04 100644
--- a/io/applications/io-buffer.cpp
+++ b/io/applications/io-buffer.cpp
@@ -43,12 +43,10 @@
 #include <cctype>
 #include <vector>
 #include <fstream>
-#include <boost/filesystem/operations.hpp>
 #include <boost/interprocess/sync/file_lock.hpp>
 #include <boost/interprocess/sync/scoped_lock.hpp>
 #include <boost/algorithm/string.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../io/stream.h"
@@ -102,7 +100,6 @@ void usage( bool verbose = false )
     std::cerr << "          See 'out' operation, in this mode, the program write to standard output and exits when buffer is full." << std::endl;
     std::cerr << "          Call io-buffer multiple times to read more input data." << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/io/applications/io-cat.cpp b/io/applications/io-cat.cpp
index 0e85ec4e7..42064a87a 100644
--- a/io/applications/io-cat.cpp
+++ b/io/applications/io-cat.cpp
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -40,72 +41,107 @@
 #include <boost/scoped_ptr.hpp>
 #include <boost/thread.hpp>
 #include "../../application/command_line_options.h"
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
-#include "../../io/stream.h"
 #include "../../io/select.h"
+#include "../../io/server.h"
+#include "../../io/stream.h"
 #include "../../string/string.h"
 
 void usage( bool verbose = false )
 {
-    std::cerr << std::endl;
-    std::cerr << "read from one or a few sources, merge, and output to stdout" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: io-cat <address> [<address>] ... [<options>]" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<address>" << std::endl;
-    std::cerr << "    local:<path>: local socket" << std::endl;
-    std::cerr << "    tcp:<host>:<port>: tcp socket" << std::endl;
-    std::cerr << "    udp:<port>: udp socket" << std::endl;
-    std::cerr << "    zmp-<protocol>:<address>: zmq (todo)" << std::endl;
-    std::cerr << "    <filename>: file" << std::endl;
-    std::cerr << "    <fifo>: named pipe" << std::endl;
-    std::cerr << "    -: stdin" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --exit-on-first-closed,-e: exit, if one of the streams finishes" << std::endl;
-    std::cerr << "    --flush,--unbuffered,-u: flush output" << std::endl;
-    std::cerr << "    --round-robin=[<number of packets>]: todo: only for multiple inputs: read not more" << std::endl;
-    std::cerr << "                                         than <number of packets> from an input at once," << std::endl;
-    std::cerr << "                                         before checking other inputs" << std::endl;
-    std::cerr << "                                         if not specified, read from each input" << std::endl;
-    std::cerr << "                                         all available data" << std::endl;
-    std::cerr << "                                         ignored for udp streams, where one full udp" << std::endl;
-    std::cerr << "                                         packet at a time is always read" << std::endl;
-    std::cerr << "    --size,-s=[<size>]: packet size, if binary data (required only for multiple sources)" << std::endl;
-    std::cerr << "    --verbose,-v: more output" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "connect options" << std::endl;
-    std::cerr << "    --connect-max-attempts,--connect-attempts,--attempts,--max-attempts=<n>; default=1; number of attempts to reconnect or 'unlimited'" << std::endl;
-    std::cerr << "    --connect-period=<seconds>; default=1; how long to wait before the next connect attempt" << std::endl;
-    std::cerr << "    --permissive; run even if connection to some sources fails" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "supported address types: tcp, udp, local (unix) sockets, named pipes, files, zmq (todo)" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    single stream" << std::endl;
-    std::cerr << "        io-cat tcp:localhost:12345" << std::endl;
-    std::cerr << "        io-cat udp:12345" << std::endl;
-    std::cerr << "        io-cat local:/tmp/socket" << std::endl;
-    std::cerr << "        io-cat some/pipe" << std::endl;
-    std::cerr << "        io-cat some/file" << std::endl;
-    std::cerr << "        io-cat zmq-local:/tmp/socket (not implemented)" << std::endl;
-    std::cerr << "        io-cat zmq-tcp:localhost:12345 (not implemented)" << std::endl;
-    std::cerr << "        echo hello | io-cat -" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    multiple streams" << std::endl;
-    std::cerr << "        merge line-based input" << std::endl;
-    std::cerr << "            io-cat tcp:localhost:55555 tcp:localhost:88888" << std::endl;
-    std::cerr << "        merge binary input with packet size 100 bytes" << std::endl;
-    std::cerr << "            io-cat tcp:localhost:55555 tcp:localhost:88888 --size 100" << std::endl;
-    std::cerr << "        merge line-based input with stdin" << std::endl;
-    std::cerr << "            echo hello | io-cat tcp:localhost:55555 -" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
+    std::cerr << R"(
+read from one or a few sources, merge, and output to stdout
+
+usage: io-cat <address> [<address>] ... [<options>]
+
+<address>
+    local:<path>: local socket
+    tcp:<host>:<port>: tcp socket
+    tcp:<port>: tcp server socket (only partly implemented)
+    udp:<port>: udp socket
+    zmq-<protocol>:<address>: zmq (todo)
+    <filename>: file
+    <fifo>: named pipe
+    -: stdin
+
+options
+    --exit-on-first-closed,-e: exit, if one of the streams finishes
+    --flush,--unbuffered,-u: flush output
+    --verbose,-v: more output
+
+output order options
+    --blocking: blocking read on each source in order sources appear on command line
+                output modes
+                    default:     output all records from the first source, then all
+                                 records from the second source, etc
+                    round robin: output <n> records from the first source, then <n>
+                                 records from the second source, etc; note that if
+                                 the number of records in a source is not divisible by <n>
+                                 then the last records groups may contain fewer than <n>
+                                 records
+                attention: if you want full control over record ordering, use --blocking
+                           when using subshells or sockets as io-cat inputs)" << std::endl; // help continues below: verbose details or a pointer to --verbose
+    if( verbose )
+    {
+        std::cerr << R"(                           io-cat will open such inputs, but they may not be immediately
+                           ready for reading, which may lead to records being read from sources
+                           out of order;  use --blocking to avoid this problem
+                           e.g. in the following command without --blocking one subshell may
+                           start slightly earlier than the other and thus likely to output
+                           not what you expect or want - add --blocking to fix that:
+                               io-cat --round-robin=1 \
+                                      <( csv-paste line-number value=a | head -n100 ) \
+                                      <( csv-paste line-number value=b | head -n100 ))" << std::endl; // raw string: backslashes are literal, so a single one is the shell line continuation
+    }
+    else
+    {
+        std::cerr << "                           run io-cat --help --verbose for more details..." << std::endl;
+    }
+    std::cerr << R"(    --head=[<n>]; output first <n> records and exit without waiting for record n+1
+                  a workaround for sparse input fed into: io-cat ... | head -n10, which
+                  will not exit until io-cat receives record 11
+                  instead run: io-cat ... --head=10 (use --flush if you don't want buffering)
+    --repeat=[<n>]; read each stream, output <n> times
+                  e.g: run: io-cat my-file-1 my-file-2 --repeat=3
+                       instead of: cat my-file-1 my-file-2 my-file-1 my-file-2 my-file-1 my-file-2
+                  when using for large source, be aware that the sources get stored in memory first
+    --repeat-forever,--forever; same as --repeat, but forever
+    --round-robin=[<number of packets>]: only for multiple inputs: read not more
+                                         than <number of packets> from an input at once,
+                                         before checking other inputs
+                                         if not specified, read from each input
+                                         all available data
+                                         ignored for udp streams, where one full udp
+                                         packet at a time is always read
+    --size=[<bytes>]; on fixed-width binary records, size of the record in bytes, for --round-robin or --head
+    
+connect options
+    --connect-max-attempts,--connect-attempts,--attempts,--max-attempts=<n>; default=1; number of attempts to reconnect or 'unlimited'
+    --connect-period=<seconds>; default=1; how long to wait before the next connect attempt
+    --permissive; run even if connection to some sources fails
+    
+supported address types: tcp, udp, local (unix) sockets, named pipes, files, zmq (todo)
+    
+examples
+    single stream
+        io-cat tcp:localhost:12345
+        io-cat udp:12345
+        io-cat local:/tmp/socket
+        io-cat some/pipe
+        io-cat some/file
+        io-cat zmq-local:/tmp/socket (not implemented)
+        io-cat zmq-tcp:localhost:12345 (not implemented)
+        echo hello | io-cat -
+    multiple streams
+        merge line-based input
+            io-cat tcp:localhost:55555 tcp:localhost:88888
+        merge binary input with packet size 100 bytes
+            io-cat tcp:localhost:55555 tcp:localhost:88888 --size 100
+        merge line-based input with stdin
+            echo hello | io-cat tcp:localhost:55555 -
+)" << std::endl;
     exit( 0 );
 }
 
@@ -114,14 +150,18 @@ class stream
     public:
         stream( const std::string& address ): address_( address ) {}
         virtual ~stream() {}
-        virtual unsigned int read_available( std::vector< char >& buffer, unsigned int max_count ) = 0;
-        virtual comma::io::file_descriptor fd() const = 0;
+        virtual unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking ) = 0;
+        virtual comma::io::file_descriptor fd() const { return comma::io::invalid_file_descriptor; }
         virtual bool eof() const = 0;
         virtual bool empty() const = 0;
         virtual void close() = 0;
         virtual bool closed() const = 0;
         virtual bool connected() const = 0;
         virtual void connect() = 0;
+        virtual void add_to( comma::io::select& select ) const { select.read().add( fd() ); }
+        virtual void remove_from( comma::io::select& select ) const { select.read().remove( fd() ); }
+        virtual bool ready( comma::io::select& select ) const { return select.read().ready( fd() ); }
+        virtual void update( comma::io::select& select ) const {}
         const std::string& address() const { return address_; }
         
     protected:
@@ -148,7 +188,7 @@ class udp_stream : public stream
         
         comma::io::file_descriptor fd() const { return socket_->native_handle(); }
         
-        unsigned int read_available( std::vector< char >& buffer, unsigned int )
+        unsigned int read_available( std::vector< char >& buffer, unsigned int, bool )
         {
             boost::system::error_code error;
             std::size_t size = socket_->receive( boost::asio::buffer( buffer ), 0, error );
@@ -179,17 +219,17 @@ class udp_stream : public stream
         mutable boost::scoped_ptr< boost::asio::ip::udp::socket > socket_; // boost::asio::ip::udp::socket::fd() is non-const for some reason
 };
 
-class any_stream : public stream
+class client_stream : public stream
 {
     public:
-        any_stream( const std::string& address, unsigned int size, bool binary ): stream( address ), size_( size ), binary_( binary ), closed_( false ) {}
+        client_stream( const std::string& address, unsigned int size, bool binary ): stream( address ), size_( size ), binary_( binary ), closed_( false ) {}
         
         comma::io::file_descriptor fd() const { return ( *istream_ ).fd(); }
         
-        unsigned int read_available( std::vector< char >& buffer, unsigned int max_count )
+        unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking )
         {
             std::size_t available = available_();
-            if( available == 0 ) { return 0; }
+            if( !blocking && available == 0 ) { return 0; }
             if( binary_ )
             {
                 unsigned int count = size_ ? available / size_ : 0;
@@ -213,7 +253,7 @@ class any_stream : public stream
         
         bool empty() const { return !connected() || closed_ || available_() == 0; }
         
-        bool eof() const { return !( *istream_ )->good() || ( *istream_ )->eof(); }
+        bool eof() const { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
         
         void close() { closed_ = true; ( *istream_ ).close(); }
         
@@ -224,7 +264,8 @@ class any_stream : public stream
         void connect()
         {
             if( istream_ ) { return; }
-            istream_.reset( new comma::io::istream( address_, comma::io::mode::binary, comma::io::mode::non_blocking ) );
+            auto blocking_mode = false ? comma::io::mode::non_blocking : comma::io::mode::blocking; // todo? expose on command line?
+            istream_.reset( new comma::io::istream( address_, comma::io::mode::binary, blocking_mode ) );
             if( ( *istream_ )() != &std::cin ) { return; }
             std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
             std::cin.tie( NULL ); // std::cin is tied to std::cout by default
@@ -247,12 +288,105 @@ class any_stream : public stream
         }
 };
 
-static stream* make_stream( const std::string& address, unsigned int size, bool binary )
+class server_stream : public stream // todo! super-quick and dirty! get streams from the server instead and add/remove them to/from read methods
+{
+    public:
+        server_stream( const std::string& address, unsigned int size, bool binary, bool blocking )
+            : stream( address )
+            , _size( size )
+            , _binary( binary )
+            , _blocking( blocking )
+            , _server( address, binary ? comma::io::mode::binary : comma::io::mode::ascii, blocking )
+        {
+        }
+        // fill buffer from the server: binary mode reads up to max_count records of _size bytes, ascii mode reads one line and appends '\n'; returns the number of bytes placed in buffer, 0 if nothing was read
+        unsigned int read_available( std::vector< char >& buffer, unsigned int max_count, bool blocking )
+        {
+            COMMA_ASSERT_BRIEF( blocking == _blocking, "server stream is " << ( _blocking ? "blocking" : "non-blocking" ) << ", but asked to do " << ( blocking ? "blocking" : "non-blocking" ) << " read" );
+            unsigned int count{0};
+            char* p = &buffer[0];
+            while( true )
+            {
+                std::size_t available_at_least = _server.available_at_least();
+                if( !blocking && available_at_least == 0 ) { return 0; }
+                if( _binary )
+                {
+                    if( _server.read( p, _size ) != _size ) { return count * _size; } // short read: hand back the complete records already copied instead of dropping them; todo? more checks?
+                    ++count;
+                    p += _size;
+                    if( count >= max_count || count * _size >= available_at_least ) { return count * _size; }
+                }
+                else
+                {
+                    std::string line = _server.getline();
+                    if( line.empty() ) { return 0; }
+                    if( line.size() >= buffer.size() ) { buffer.resize( line.size() + 1 ); } // make room for the line plus the trailing '\n'
+                    ::memcpy( &buffer[0], &line[0], line.size() );
+                    buffer[ line.size() ] = '\n';
+                    return line.size() + 1;
+                }
+            }
+            return 0;
+        }
+        
+        bool empty() const { return _closed || _server.available_at_least() == 0; }
+        
+        bool eof() const { return closed(); } // { return bool( istream_ ) && ( !( *istream_ )->good() || ( *istream_ )->eof() ); }
+        
+        void close() { _closed = true; _server.close(); }
+        
+        bool closed() const { return _closed; }
+        
+        bool connected() const { return true; }
+        
+        void connect() {}
+        // register for reading every descriptor the server currently selects on (presumably its connected clients) plus the acceptor descriptor
+        void add_to( comma::io::select& select ) const
+        {
+            for( auto d: _server.select().read()() ) { select.read().add( d ); }
+            select.read().add( _server.acceptor_file_descriptor() ); // uber-quick and dirty
+        }
+        // unregister the same descriptors that add_to() registers, including the acceptor descriptor
+        void remove_from( comma::io::select& select ) const
+        {
+            for( auto d: _server.select().read()() ) {  select.read().remove( d ); }
+            select.read().remove( _server.acceptor_file_descriptor() ); // uber-quick and dirty; was add(), which left the acceptor registered after removal
+        }
+
+        void update( comma::io::select& select ) const
+        {
+            // todo
+        }
+
+        // todo!? use io::impl::receive()?
+        // todo! get streams from the server instead and add/remove them to/from read methods
+        // todo! test connecting/disconnecting clients
+        // todo! test multiple clients
+        // todo! cpu performance when there are no connections
+        // todo? for now, if server, don't allow multiple input streams
+        // todo! examples
+
+        bool ready( comma::io::select& select ) const
+        {
+            for( auto d: _server.select().read()() ) { if( select.read().ready( d ) ) { return true; } }
+            return false;
+        }
+        
+    private:
+        unsigned int _size{0};
+        bool _binary{false};
+        bool _blocking{false};
+        bool _closed{false};
+        comma::io::iserver _server;
+};
+
+static stream* make_stream( const std::string& address, unsigned int size, bool binary, bool blocking ) // factory: picks the stream implementation from the first ':'-separated field of address; returns a new'd stream that the caller takes ownership of
 {
     const std::vector< std::string >& v = comma::split( address, ':' );
     if( v[0] == "udp" ) { return new udp_stream( address ); }
-    if( v[0] == "zmq-local" || v[0] == "zero-local" || v[0] == "zmq-tcp" || v[0] == "zero-tcp" ) { COMMA_THROW( comma::exception, "io-cat: zmq support not implemented" ); }
-    return new any_stream( address, size, binary );
+    if( v[0] == "tcp" && v.size() == 2 ) { return new server_stream( address, size, binary, blocking ); } // todo: quick and dirty for now; a better check if tcp:<port>-like
+    COMMA_ASSERT_BRIEF( v[0] != "zmq-local" && v[0] != "zero-local" && v[0] != "zmq-tcp" && v[0] != "zero-tcp", "zmq support not implemented" ); // zmq-style addresses are rejected explicitly
+    return new client_stream( address, size, binary ); // every other address is read as a client stream; note that blocking is not passed on here
 }
 
 static bool verbose;
@@ -260,10 +394,19 @@ static unsigned int connect_max_attempts;
 static boost::posix_time::time_duration connect_period;
 static bool permissive;
 
-static bool ready( const boost::ptr_vector< stream >& streams, comma::io::select& select, bool connected_all_we_could )
+static bool ready( const boost::ptr_vector< stream >& streams, comma::io::select& select, bool connected_all_we_could, bool blocking )
 {
+    for( const auto& s: streams ) { s.update( select ); } // quick and dirty
+    if( blocking )
+    {
+        select.check();
+        bool r{connected_all_we_could};
+        for( unsigned int i = 0; i < streams.size() && r; ++i ) { r = streams[i].closed() || streams[i].ready( select ); }
+        if( !r ) { boost::this_thread::sleep( boost::posix_time::milliseconds( 10 ) ); } // quick and dirty
+        return r;
+    }
     for( unsigned int i = 0; i < streams.size(); ++i ) { if( !streams[i].empty() ) { select.check(); return true; } }
-    if( !select.read()().empty() ) { return select.wait( boost::posix_time::seconds( 1 ) ) > 0; }
+    if( !select.read()().empty() ) { return select.wait( boost::posix_time::milliseconds( 100 ) ) > 0; }
     if( connected_all_we_could ) { return true; }
     boost::this_thread::sleep( connect_period );
     return false;
@@ -285,32 +428,90 @@ static bool try_connect( boost::ptr_vector< stream >& streams, comma::io::select
         if( streams[i].connected() ) { continue; }
         try
         {
-            if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): connecting, attempt " << ( attempts + 1 ) << " of " << ( connect_max_attempts == 0 ? std::string( "unlimited" ) : boost::lexical_cast< std::string >( connect_max_attempts ) ) << "..." << std::endl; }
+            comma::saymore() << "stream " << i << " (" << streams[i].address() << "): connecting, attempt " << ( attempts + 1 ) << " of " << ( connect_max_attempts == 0 ? std::string( "unlimited" ) : boost::lexical_cast< std::string >( connect_max_attempts ) ) << "..." << std::endl;
             streams[i].connect();
-            if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): connected" << std::endl; }
-            select.read().add( streams[i] );
+            comma::saymore() << "stream " << i << " (" << streams[i].address() << "): connected" << std::endl;
+            streams[i].add_to( select );
             --unconnected_count;
             continue;
         }
         catch( std::exception& ex ) { what = ex.what(); }
         catch( ... ) { what = "unknown exception"; }
-        if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): failed to connect" << std::endl; }
+        comma::saymore() << "stream " << i << " (" << streams[i].address() << "): failed to connect" << std::endl;
     }
     ++attempts;
-    connected_all_we_could = unconnected_count == 0 || ( permissive && connect_max_attempts > 0 && attempts >= connect_max_attempts );
-    if( connected_all_we_could ) { return connected_all_we_could; }
-    if( connect_max_attempts == 0 || attempts < connect_max_attempts ) { return connected_all_we_could; }
-    std::cerr << "io-cat: fatal: after " << attempts << " attempt(s): " << what << std::endl;
+    if( unconnected_count == 0 ) { return true; }
+    if( connect_max_attempts == 0 ) { return false; }
+    if( attempts < connect_max_attempts ) { return false; }
+    if( permissive ) { return true; }
+    comma::say() << "fatal: after " << attempts << " attempt(s): " << what << std::endl;
     exit( 1 );
 }
 
+struct output_t // output sink: writes straight to stdout, or, with --repeat/--repeat-forever, accumulates per-stream data and replays it in finalise()
+{
+    unsigned int size{0};
+    bool forever{false};
+    std::vector< std::vector< char > > buffers; // todo: quick and dirty, watch performance on push back of large inputs
+
+    operator bool() const { return !buffers.empty(); }
+
+    output_t() = default;
+    output_t( const comma::command_line_options& options, unsigned int n )
+        : size( options.value( "--repeat", 0 ) )
+        , forever( options.exists( "--repeat-forever,--forever" ) )
+        , buffers( size > 0 || forever ? n : 0 )
+    {
+    }
+    // pass bytes_read bytes of buffer to stdout when not repeating; otherwise append them to the accumulated data of stream i
+    void write( unsigned int i, const std::vector< char >& buffer, unsigned int bytes_read )
+    {
+        if( buffers.empty() ) { std::cout.write( &buffer[0], bytes_read ); return; }
+        unsigned int s = buffers[i].size();
+        buffers[i].resize( s + bytes_read );
+        std::memcpy( &buffers[i][s], &buffer[0], bytes_read );
+    }
+    // replay the accumulated per-stream data to stdout: size times, or until shutdown or stdout failure when forever is set
+    void finalise( const comma::signal_flag& is_shutdown ) const
+    {
+        for( unsigned int i = 0; !is_shutdown && std::cout.good() && ( i < size || forever ); ++i ) // stop once stdout has failed, otherwise forever mode would spin doing nothing
+        {
+            for( unsigned int j = 0; !is_shutdown && j < buffers.size() && std::cout.good(); ++j )
+            {
+                if( !buffers[j].empty() ) { std::cout.write( buffers[j].data(), buffers[j].size() ); } // a stream may have produced no data: do not index into an empty vector
+            }
+        }
+    }
+};
+
+output_t output;
+
+static bool _write( unsigned int i, const comma::command_line_options& options, const std::vector< char >& buffer, unsigned int bytes_read )
+{
+    // --head and --size are looked up once, on the first call; returns false once the --head limit has been reached
+    static const unsigned int limit = options.value( "--head", 0 );
+    static const unsigned int record_size = options.value( "--size,-s", 0 );
+    static unsigned int emitted = 0;
+    if( limit == 0 ) { output.write( i, buffer, bytes_read ); return true; }
+    if( record_size > 0 )
+    {
+        const unsigned int records = std::min( bytes_read / record_size, limit - emitted );
+        output.write( i, buffer, records * record_size );
+        emitted += records;
+        return emitted < limit;
+    }
+    // no record size given: every call counts as one unit towards the limit
+    output.write( i, buffer, bytes_read );
+    ++emitted;
+    return emitted < limit;
+}
+
 int main( int argc, char** argv )
 {
     #ifdef WIN32
-    std::cerr << "io-cat: not implemented on windows" << std::endl;
+    comma::say() << "not implemented on windows" << std::endl;
     return 1;
     #endif
-    
     try
     {
         if( argc < 2 ) { usage(); }
@@ -318,53 +519,61 @@ int main( int argc, char** argv )
         comma::signal_flag is_shutdown;
         verbose = options.exists( "--verbose,-v" );
         unsigned int size = options.value( "--size,-s", 0 );
+        bool blocking = options.exists( "--blocking" );
         bool unbuffered = options.exists( "--flush,--unbuffered,-u" );
         bool exit_on_first_closed = options.exists( "--exit-on-first-closed,-e" );
+        options.assert_mutually_exclusive( "--blocking", "--permissive" );
         std::string connect_max_attempts_string = options.value< std::string >( "--connect-max-attempts,--connect-attempts,--attempts,--max-attempts", "1" );
         connect_max_attempts = connect_max_attempts_string == "unlimited" ? 0 : boost::lexical_cast< unsigned int >( connect_max_attempts_string );
         double connect_period_seconds = options.value( "--connect-period", 1.0 );
         connect_period = boost::posix_time::milliseconds( static_cast<unsigned int>(std::floor( connect_period_seconds * 1000 ) ));
         permissive = options.exists( "--permissive" );
-        const std::vector< std::string >& unnamed = options.unnamed( "--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
+        bool has_head = options.exists( "--head" );
+        const std::vector< std::string >& unnamed = options.unnamed( "--repeat-forever,--forever,--blocking,--permissive,--exit-on-first-closed,-e,--flush,--unbuffered,-u,--verbose,-v", "-.+" );
+        options.assert_mutually_exclusive( "--round-robin", "--repeat,--repeat-forever,--forever" );
         #ifdef WIN32
-        if( size || unnamed.size() == 1 ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        if( size || ( unnamed.size() == 1 && !has_head ) ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        //if( size ) { _setmode( _fileno( stdout ), _O_BINARY ); }
         #endif
-        if( unnamed.empty() ) { std::cerr << "io-cat: please specify at least one source" << std::endl; return 1; }
+        COMMA_ASSERT_BRIEF( !unnamed.empty(), "please specify at least one source" );
+        output = output_t( options, unnamed.size() );
         boost::ptr_vector< stream > streams;
         comma::io::select select;
-        for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size || unnamed.size() == 1 ) ); }
+        for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 || ( unnamed.size() == 1 && !has_head ), blocking ) ); }
+        //for( unsigned int i = 0; i < unnamed.size(); ++i ) { streams.push_back( make_stream( unnamed[i], size, size > 0 ) ); }
+        comma::saymore() << "created " << unnamed.size() << " stream" << ( unnamed.size() == 1 ? "" : "s" ) << std::endl;
         const unsigned int max_count = size ? ( size > 65536u ? 1 : 65536u / size ) : 0;
         std::vector< char > buffer( size ? size * max_count : 65536u );        
         unsigned int round_robin_count = unnamed.size() > 1 ? options.value( "--round-robin", 0 ) : 0;
         for( bool done = false; !done; )
         {
-            if( is_shutdown ) { std::cerr << "io-cat: received signal" << std::endl; break; }
+            if( is_shutdown ) { comma::saymore() << "received signal" << std::endl; break; }
             bool connected_all_we_could = try_connect( streams, select );
-            if( !ready( streams, select, connected_all_we_could ) ) { continue; }
+            if( !ready( streams, select, connected_all_we_could, blocking ) ) { continue; }
             done = true;
             for( unsigned int i = 0; i < streams.size(); ++i )
             {
                 if( !streams[i].connected() ) { done = connected_all_we_could; continue; }
                 if( streams[i].closed() ) { continue; }
-                bool ready = select.read().ready( streams[i].fd() );
+                bool ready = streams[i].ready( select );
                 bool empty = streams[i].empty();
-                if( empty && ( streams[i].eof() || ready ) )
-                { 
-                    if( verbose ) { std::cerr << "io-cat: stream " << i << " (" << unnamed[i] << "): closed" << std::endl; }
-                    select.read().remove( streams[i].fd() );
+                if( empty && ( ready || streams[i].eof() ) )
+                {
+                    comma::saymore() << "stream " << i << " (" << unnamed[i] << "): closed" << std::endl;
+                    streams[i].remove_from( select );
                     streams[i].close();
-                    if( exit_on_first_closed || ( connected_all_we_could && select.read()().empty() ) ) { return 0; }
+                    if( exit_on_first_closed || ( connected_all_we_could && select.read()().empty() ) ) { done = true; break; }
                     continue;
                 }
                 if( !ready && empty ) { done = false; continue; }
                 unsigned int countdown = round_robin_count;
                 while( !streams[i].eof() ) // todo? check is_shutdown here as well?
                 {
-                    unsigned int bytes_read = streams[i].read_available( buffer, countdown ? countdown : max_count );
+                    unsigned int bytes_read = streams[i].read_available( buffer, countdown ? countdown : max_count, blocking );
                     if( bytes_read == 0 ) { break; }
                     done = false;
-                    if( size && bytes_read % size != 0 ) { std::cerr << "io-cat: stream " << i << " (" << streams[i].address() << "): expected " << size << " byte(s), got only " << ( bytes_read % size ) << std::endl; return 1; }
-                    std::cout.write( &buffer[0], bytes_read );
+                    COMMA_ASSERT_BRIEF( !( size && bytes_read % size != 0 ), "stream " << i << " (" << streams[i].address() << "): expected " << size << " byte(s), got only " << ( bytes_read % size ) );
+                    if( !_write( i, options, buffer, bytes_read ) ) { done = true; break; }
                     if( !std::cout.good() ) { done = true; break; }
                     if( unbuffered ) { std::cout.flush(); }
                     if( round_robin_count )
@@ -375,9 +584,10 @@ int main( int argc, char** argv )
                 }
             }
         }
+        output.finalise( is_shutdown );
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << "io-cat: " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << "io-cat: unknown exception" << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }
diff --git a/io/applications/io-console.cpp b/io/applications/io-console.cpp
index 5ff2525d8..6076306e1 100644
--- a/io/applications/io-console.cpp
+++ b/io/applications/io-console.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <termios.h>
 #include <iostream>
@@ -34,6 +7,23 @@
 #include "../../application/signal_flag.h"
 #include "../select.h"
 
+class no_echo_term // scoped guard: turns off canonical mode and echo on stdin, restores the saved settings on destruction
+{
+    public:
+        no_echo_term()
+        {
+            if( ::tcgetattr( STDIN_FILENO, &_old ) != 0 ) { return; } // e.g. stdin is not a terminal: nothing was saved, so nothing to change or restore
+            termios t = _old;
+            t.c_lflag &= ~( ICANON | ECHO );
+            _changed = ::tcsetattr( STDIN_FILENO, TCSANOW, &t ) == 0;
+        }
+
+        ~no_echo_term() { if( _changed ) { ::tcsetattr( STDIN_FILENO, TCSANOW, &_old ); } }
+    private:
+        struct termios _old{};
+        bool _changed{false}; // true only if the terminal settings were actually modified
+};
+
 int main( int argc, char** argv )
 {
     try
@@ -44,22 +34,20 @@ int main( int argc, char** argv )
             ( "help,h", "display help message" )
             ( "heartbeat,b", "output byte with value 0x00 when key pressed" )
             ( "period,t", boost::program_options::value< double >( &period )->default_value( 0.1, "0.1" ), "period in seconds between heartbeats" );
-
         boost::program_options::variables_map vm;
         boost::program_options::store( boost::program_options::parse_command_line( argc, argv, description), vm );
         boost::program_options::notify( vm );
-
         if ( vm.count( "help" ) )
         {
-            std::cerr << "take arrow keys, output key numeric values to stdout" << std::endl;
+            std::cerr << std::endl;
+            std::cerr << "take key presses, output key numeric values to stdout" << std::endl;
             std::cerr << "usage: io-console [<options>]" << std::endl;
             std::cerr << description << std::endl;
-            return 1;
+            std::cerr << std::endl;
+            return 0;
         }
-
         boost::scoped_ptr< comma::io::select > select;
-        unsigned int seconds = 0;
-        unsigned int nanoseconds = 0;
+        unsigned int seconds{0}, nanoseconds{0};
         if ( vm.count( "heartbeat" ) )
         {
             select.reset( new comma::io::select() );
@@ -67,15 +55,7 @@ int main( int argc, char** argv )
             seconds = std::floor( period );
             nanoseconds = std::floor( double( seconds == 0 ? period : std::fmod( period, seconds ) ) * 1e9 );
         }
-        
-        // remove echo from the console
-        struct termios oldTerm;
-        struct termios newTerm;
-        ::tcgetattr( STDIN_FILENO, &oldTerm );
-        newTerm = oldTerm;
-        newTerm.c_lflag &= ~( ICANON | ECHO );
-        ::tcsetattr( STDIN_FILENO, TCSANOW, &newTerm );
-        
+        no_echo_term t;
         comma::signal_flag signal;
         while( !signal && std::cout.good() && !std::cout.bad() )
         {
@@ -88,7 +68,6 @@ int main( int argc, char** argv )
             std::cout.write( &c, 1 );
             std::cout.flush();
         }
-        ::tcsetattr( STDIN_FILENO, TCSANOW, &oldTerm ); // restore the console
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << argv[0] << ": " << ex.what() << std::endl; }
diff --git a/io/applications/io-line.cpp b/io/applications/io-line.cpp
index 3194ea6f9..7617634f0 100644
--- a/io/applications/io-line.cpp
+++ b/io/applications/io-line.cpp
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author mathew hounsell
 
@@ -38,13 +11,12 @@
 #include <string>
 #include <vector>
  
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 
 void usage( bool const verbose = false )
 {
-    static char const * const message =
+    std::cerr <<
         "\n"
         "\nA toolkit for quick access to ascii line-based input stream"
         "\n"
@@ -79,7 +51,6 @@ void usage( bool const verbose = false )
         "\n    ( echo xxx ; echo yy ; echo zzzz ) | io-line length | while true ; do echo 'read line:' ; io-line get || break ; done"
         "\n"
         "\n";
-    std::cerr << message << comma::contact_info << '\n' << std::endl;
     std::exit( 0 );
 }
 
diff --git a/io/applications/io-ls.cpp b/io/applications/io-ls.cpp
index 80c5b8308..916b8ad2e 100644
--- a/io/applications/io-ls.cpp
+++ b/io/applications/io-ls.cpp
@@ -1,3 +1,32 @@
+// This file is part of comma, a generic and flexible library
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
 #include "../../application/command_line_options.h"
 #include "../../application/verbose.h"
 #include "../../csv/stream.h"
@@ -140,12 +169,12 @@ void process_tcp(std::istream& is, const comma::csv::options& csv)
     comma::csv::output_stream<output_t> os(std::cout, csv);
     //first line is header
     std::getline(is,line);
-    comma::verbose<<line<<std::endl;
-    while(is.good())
+    comma::saymore() << line << std::endl;
+    while( is.good() )
     {
         std::getline(is,line);
-        comma::verbose<<line<<std::endl;
-        output.scan(line);
+        comma::saymore() << line << std::endl;
+        output.scan( line );
         if(port && output.local.port != *port) {continue;}
         if(state && output.state != *state) {continue;}
         os.write(output);
@@ -155,7 +184,7 @@ void usage(bool detail)
 {
     std::cerr << "    list tcp connections; reads and parses lines from /proc/net/tcp file and outputs them in csv format" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "usage:  " << comma::verbose.app_name() << " [ <options> ]" << std::endl;
+    std::cerr << "usage:  io-ls [ <options> ]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "options" << std::endl;
     std::cerr << "    --help,-h: show help" << std::endl;
@@ -172,7 +201,7 @@ void usage(bool detail)
     }
     else { std::cerr << "    see --help --verbose for more details" << std::endl<< std::endl; }
     std::cerr << "example" << std::endl;
-    std::cerr << "    (" << comma::verbose.app_name() << " --output-fields; "<<comma::verbose.app_name() << ") | column -ts, " << std::endl;
+    std::cerr << "    (io-ls --output-fields; io-ls | column -ts, " << std::endl;
     std::cerr << std::endl;
     std::cerr << "    io-ls --fields=local,state | csv-join --fields=,,state <(io-ls --enum-state)\";fields=state\"" << std::endl;
     std::cerr << std::endl;
@@ -192,14 +221,9 @@ int main( int ac, char** av )
         state=options.optional<unsigned int>("--state");
         std::fstream file("/proc/net/tcp", std::ios::in);
         process_tcp(file, csv);
+        return 0;
     }
-    catch( std::exception& ex )
-    {
-        std::cerr << comma::verbose.app_name() << ": " << ex.what() << std::endl; return 1;
-    }
-    catch( ... )
-    {
-        std::cerr << comma::verbose.app_name() << ": " << "unknown exception" << std::endl; return 1;
-    }
-    return 0;
+    catch( std::exception& ex ) { comma::say() << ": " << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << ": unknown exception" << std::endl; }
+    return 1;
 }
diff --git a/io/applications/io-publish.cpp b/io/applications/io-publish.cpp
index bda3ad29f..0f46d6d86 100644
--- a/io/applications/io-publish.cpp
+++ b/io/applications/io-publish.cpp
@@ -1,50 +1,16 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2020 Vsevolod Vlaskine
 
 /// @authors cedric wohlleber, vsevolod vlaskine, dave jennings
 
-#include <errno.h>
-#include <signal.h>
-#include <sys/wait.h>
-#include <unistd.h>
-
-#include <boost/bind.hpp>
-#include <boost/date_time/posix_time/posix_time.hpp>
-#include <boost/ptr_container/ptr_vector.hpp>
-#include <boost/scoped_ptr.hpp>
-#include <boost/thread.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../application/signal_flag.h"
 #include "../../base/last_error.h"
 #include "../../io/file_descriptor.h"
 #include "../../io/publisher.h"
+#include "../../io/impl/publish.h"
+#include "../../io/select.h"
+#include "../../name_value/map.h"
 #include "../../string/string.h"
 #include "../../sync/synchronized.h"
 
@@ -52,207 +18,91 @@
 
 static void usage( bool verbose = false )
 {
-    std::cerr << std::endl;
-    std::cerr << "read from standard input and write to given outputs (files, sockets, named pipes):" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "- the data is only written to the outputs that are ready for writing" << std::endl;
-    std::cerr << "- client can connect and disconnect at any time" << std::endl;
-    std::cerr << "- only full packets are written" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: io-publish [<options>] <outputs>" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "general options" << std::endl;
-    std::cerr << "    --help,-h: show this help" << std::endl;
-    std::cerr << "    --verbose,-v: more output to stderr" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "stream options" << std::endl;
-    std::cerr << "    --size,-s: binary input; packet size" << std::endl;
-    std::cerr << "    --multiplier,-m: multiplier for packet size, default is 1. The actual packet size will be m * s" << std::endl;
-    std::cerr << "    --no-discard: if present, do blocking write to every open stream" << std::endl;
-    std::cerr << "    --no-flush: if present, do not flush the output stream (use on high bandwidth sources)" << std::endl;
-    std::cerr << "    --exec=[<cmd>]: read from cmd rather than stdin" << std::endl;
-    std::cerr << "    -- [<cmd>]: alternate syntax for specifying a command (simplifies quoting)" << std::endl;
-    std::cerr << "    --on-demand: only run <cmd> when a client is connected" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "client options" << std::endl;
-    std::cerr << "    --exit-on-no-clients,-e: once the last client disconnects, exit" << std::endl;
-    std::cerr << "    --output-number-of-clients,--clients: output to stdout timestamped number of clients whenever it changes" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    attention: in the current implementation, the number of clients will be" << std::endl;
-    std::cerr << "               updated only on attempt to write a new record," << std::endl;
-    std::cerr << "               i.e. output number of clients will not change if there are no new" << std::endl;
-    std::cerr << "               records on stdin, even if the actual number of clients changes" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "    known problems: io::ostream or at least boost::asio::ostream does not mark" << std::endl;
-    std::cerr << "               stream as bad, if one tries to write to it first time after" << std::endl;
-    std::cerr << "               stream has been closed; the stream is marked as bad only after" << std::endl;
-    std::cerr << "               writing to it second time." << std::endl;
-    std::cerr << "               This problem is pretty benign: the worst thing that happens is" << std::endl;
-    std::cerr << "               writing to a closed stream, which will not cause grief unless you" << std::endl;
-    std::cerr << "               specifically rely on io-publish exiting on no clients for a" << std::endl;
-    std::cerr << "               rarely sent heartbeat." << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "               io-publish will not be very responsive in counting clients for" << std::endl;
-    std::cerr << "               low bandwidth streams. It immediately recognises new clients" << std::endl;
-    std::cerr << "               but might take a while to notice that a client has gone." << std::endl;
-    std::cerr << "               This affects --output-number-of-clients and --on-demand." << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "output streams" << std::endl;
-    std::cerr << "    tcp:<port>: e.g. tcp:1234" << std::endl;
-    std::cerr << "    udp:<port>: e.g. udp:1234 (todo)" << std::endl;
-    std::cerr << "    local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket" << std::endl;
-    std::cerr << "    <named pipe name>: named pipe, which will be re-opened, if client reconnects" << std::endl;
-    std::cerr << "    <filename>: a regular file" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "examples" << std::endl;
-    std::cerr << "    cat data | io-publish tcp:1234 --size 100" << std::endl;
-    std::cerr << "    io-publish tcp:1234 --size 24000 --on-demand --exec \"camera-cat arg1 arg2\"" << std::endl;
-    std::cerr << "    io-publish tcp:1234 --size 24000 --on-demand -- camera-cat arg1 arg2" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( 0 );
-}
+    std::cerr << R"(
+read from standard input and write to given outputs (files, sockets, named pipes):
 
-class publish
-{
-    public:
-        typedef comma::synchronized< boost::ptr_vector< comma::io::publisher > > publishers_t;
-        
-        typedef publishers_t::scoped_transaction transaction_t;
-        
-        publish( const std::vector< std::string >& filenames
-               , unsigned int packet_size
-               , bool discard
-               , bool flush
-               , bool output_number_of_clients
-               , bool report_no_clients )
-            : buffer_( packet_size, '\0' )
-            , packet_size_( packet_size )
-            , output_number_of_clients_( output_number_of_clients )
-            , report_no_clients_( report_no_clients )
-            , got_first_client_ever_( false )
-            , sizes_( filenames.size(), 0 )
-            , num_clients_( 0 )
-            , is_shutdown_( false )
-        {
-            struct sigaction new_action, old_action;
-            new_action.sa_handler = SIG_IGN;
-            sigemptyset( &new_action.sa_mask );
-            sigaction( SIGPIPE, NULL, &old_action );
-            sigaction( SIGPIPE, &new_action, NULL );
-            transaction_t t( publishers_ );
-            for( std::size_t i = 0; i < filenames.size(); ++i )
-            {
-                t->push_back( new comma::io::publisher( filenames[i]
-                                                      , is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii
-                                                      , !discard
-                                                      , flush ));
-            }
-            acceptor_thread_.reset( new boost::thread( boost::bind( &publish::accept_, boost::ref( *this ))));
-        }
-        
-        ~publish()
-        {
-            is_shutdown_ = true;
-            acceptor_thread_->join();
-            transaction_t t( publishers_ );
-            { for( std::size_t i = 0; i < t->size(); ++i ) { ( *t )[i].close(); } }
-        }
-        
-        bool read( std::istream& input )
-        {
-            if( is_binary_() )
-            {
-                input.read( &buffer_[0], buffer_.size() );
-                if( input.gcount() < int( buffer_.size() ) || !input.good() ) { return false; }
-            }
-            else
-            {
-                std::getline( input, buffer_ );
-                buffer_ += '\n';
-                if( !input.good() ) { return false; }
-            }
-            transaction_t t( publishers_ );
-            for( std::size_t i = 0; i < t->size(); ++i ) { ( *t )[i].write( &buffer_[0], buffer_.size(), false ); }
-            return handle_sizes_( t );
-        }
+- the data is only written to the outputs that are ready for writing
+- client can connect and disconnect at any time
+- only full packets are written
 
-        unsigned int num_clients() const { return num_clients_; }
+usage: io-publish [<options>] <outputs>
 
-    private:
-        bool is_binary_() const { return packet_size_ > 0; }
-        
-        bool handle_sizes_( transaction_t& t )
-        {
-            if( !output_number_of_clients_ && !report_no_clients_ ) { return true; }
-            unsigned int total = 0;
-            bool changed = false;
-            for( unsigned int i = 0; i < t->size(); ++i )
-            {
-                unsigned int size = ( *t )[i].size();
-                total += size;
-                if( sizes_[i] == size ) { continue; }
-                sizes_[i] = size;
-                changed = true;
-                num_clients_ = total;
-            }
-            if( !changed ) { return true; }
-            if( output_number_of_clients_ )
-            {
-                std::cout << boost::posix_time::to_iso_string( boost::posix_time::microsec_clock::universal_time() );
-                for( unsigned int i = 0; i < sizes_.size(); ++i ) { std::cout << ',' << sizes_[i]; }
-                std::cout << std::endl;
-            }
-            if( report_no_clients_ )
-            {
-                if( total > 0 ) { got_first_client_ever_ = true; }
-                else if( got_first_client_ever_ ) { std::cerr << "io-publish: the last client exited" << std::endl; return false; }
-            }
-            return true;
-        }
-        
-        void accept_()
-        {
-            comma::io::select select;
-            {
-                transaction_t t( publishers_ );
-                for( unsigned int i = 0; i < t->size(); ++i ) { if( ( *t )[i].acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i].acceptor_file_descriptor() ); } }
-            }
-            while( !is_shutdown_ )
-            {
-                select.wait( boost::posix_time::millisec( 100 ) ); // arbitrary timeout
-                transaction_t t( publishers_ );
-                for( unsigned int i = 0; i < t->size(); ++i )
-                {
-                    if( select.read().ready( ( *t )[i].acceptor_file_descriptor() ) ) { ( *t )[i].accept(); }
-                }
-                handle_sizes_( t );
-            }
-        }
-        
-        publishers_t publishers_;
-        std::string buffer_;
-        unsigned int packet_size_;
-        bool output_number_of_clients_;
-        bool report_no_clients_;
-        bool got_first_client_ever_;
-        std::vector< unsigned int > sizes_;
-        unsigned int num_clients_;
-        boost::scoped_ptr< boost::thread > acceptor_thread_;
-        bool is_shutdown_;
-};
+general options
+    --help,-h: show this help
+    --verbose,-v: more output to stderr
+
+stream options
+    --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects,
+                                         the cached records will be sent to it once connected
+    --size,-s: binary input; packet size
+    --multiplier,-m: multiplier for packet size, default is 1. The actual packet size will be m * s
+    --no-discard: if present, do blocking write to every open stream
+    --no-flush: if present, do not flush the output stream (use on high bandwidth sources)
+    --exec=[<command>]: read from <command> rather than stdin
+    -- [<command>]: alternate syntax for specifying a command (simplifies quoting)
+    --on-demand: only run <command> when a client is connected
+    --timeout-read,--read-timeout=<seconds>; exit or disconnect if no input data
+                                             for longer than <seconds>
+                                             limitation: if an input packet is half-read
+                                                         io-publish still will block on read
+    --timeout-reconnect,--reconnect-on-timeout; reconnect on read timeout only if --exec present
+    --timeout-is-error; exit with error on timeout
+
+client options
+    --exit-on-no-clients,-e: once the last client disconnects, exit
+    --output-number-of-clients,--clients: output to stdout timestamped number of clients whenever it changes
+
+    attention: in the current implementation, the number of clients will be
+               updated only on attempt to write a new record,
+               i.e. output number of clients will not change if there are no new
+               records on stdin, even if the actual number of clients changes
+
+    known problems: io::ostream or at least boost::asio::ostream does not mark
+               stream as bad, if one tries to write to it first time after
+               stream has been closed; the stream is marked as bad only after
+               writing to it second time.
+               This problem is pretty benign: the worst thing that happens is
+               writing to a closed stream, which will not cause grief unless you
+               specifically rely on io-publish exiting on no clients for a
+               rarely sent heartbeat.
+
+               io-publish will not be very responsive in counting clients for
+               low bandwidth streams. It immediately recognises new clients
+               but might take a while to notice that a client has gone.
+               This affects --output-number-of-clients and --on-demand.
+
+output streams: <address>[;<options>]
+    <address>
+        tcp:<port>: e.g. tcp:1234
+        udp:<port>: e.g. udp:1234 (todo)
+        local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket
+        <named pipe name>: named pipe, which will be re-opened, if client reconnects
+        <filename>: a regular file
+        -: stdout
+    <options>
+        primary (default): clients always can connect to the 'primary' stream
+        secondary: clients can connect to the 'secondary' stream, only if there are existing clients on a primary stream
+                   if a client connects to a 'primary' stream, 'secondary' streams will be opened
+                   if last client on a 'primary' stream disconnects, 'secondary' streams will be closed
+                   e.g: io-publish tcp:8888 'tcp:9999;secondary'
+
+examples
+    cat data | io-publish tcp:1234 --size 100
+    io-publish tcp:1234 --size 24000 --on-demand --exec "camera-cat arg1 arg2"
+    io-publish tcp:1234 --size 24000 --on-demand -- camera-cat arg1 arg2
+)";
+    exit( 0 ); // usage() never returns: the help text above is a raw string literal, so quotes in it are written unescaped
+}
 
 class command
 {
     public:
+        command( const std::string& command ): command_( command ), child_pid_( -1 )
-        command( const std::string& cmd )
-            : cmd_( cmd )
-            , child_pid_( -1 )
         {
-            comma::verbose << "launching " << cmd << std::endl;
+            comma::saymore() << "launching command: " << command << std::endl;
             int fd[2];
             if( ::pipe( fd ) == -1 ) { comma::last_error::to_exception( "couldn't open pipe" ); } // create a pipe to send the child stdout to the parent stdin
+            fd_ = fd[0]; // the parent keeps the read end of the pipe; callers obtain it through fd()
             pid_t pid = fork();
             if( pid == -1 ) { comma::last_error::to_exception( "failed to fork()" ); }
             if( pid == 0 )
@@ -261,93 +111,145 @@ class command
                 while( ( dup2( fd[1], STDOUT_FILENO ) == -1 ) && ( errno == EINTR ) ) {} // connect pipe input to stdout in child
                 ::close( fd[1] );     // no longer need fd[1], now that it's duped
                 ::close( fd[0] );     // don't need pipe output in the child
-                ::execlp( "bash", "bash", "-c", &cmd_[0], NULL );
-                std::cerr << "io-publish: failed to exec child: errno " << comma::last_error::value() << " - " << comma::last_error::to_string() << std::endl;
+                // quick and dirty as impl/publisher.cpp sets the SIGPIPE handler to ignore
+                // the clean way would be to handle it correctly in impl/publisher.cpp, but
+                // that might be too fiddly for now
+                //
+                // failure example:
+                //     io-publish tcp:1234 --exec "yes | csv-thin --period 0.1 | csv-time-stamp"
+                //     killall csv-time-stamp
+                //     then, if you comment the SIGPIPE-related code below, csv-thin
+                //     will ignore SIGPIPE as exec environment inherits the ignore SIGPIPE
+                //     handler
+                // also, all applications in comma and snark would benefit from setting
+                // the SIGPIPE handling explicitly to avoid similar problems in future
+                struct sigaction new_action = {}, old_action; // zero-initialise: sa_flags must not be indeterminate when passed to sigaction()
+                new_action.sa_handler = SIG_DFL;
+                sigemptyset( &new_action.sa_mask );
+                sigaction( SIGPIPE, NULL, &old_action );
+                sigaction( SIGPIPE, &new_action, NULL );
+                ::execlp( "bash", "bash", "-c", &command_[0], NULL );
+                comma::say() << "failed to exec child: errno " << comma::last_error::value() << " - " << comma::last_error::to_string() << std::endl;
                 exit( 1 );
             }
             child_pid_ = pid;
-            while( ( ::dup2( fd[0], STDIN_FILENO ) == -1 ) && ( errno == EINTR ) ) {} // connect pipe output to stdin in parent
-            ::close( fd[0] ); // no longer need fd[0], now that it's duped
+            comma::saymore() << "launched command with pid: " << pid << std::endl;
+            static bool stdin_closed = false; if( !stdin_closed ) { ::close( STDIN_FILENO ); stdin_closed = true; } // close the inherited stdin once only: on a relaunch descriptor 0 may have been re-used, e.g. by pipe() above for fd_
             ::close( fd[1] ); // don't need pipe input in the parent
         }
+        
+        int fd() const { return fd_; } // read end of the pipe connected to the child's stdout
 
         ~command()
         {
-            comma::verbose << "killing child pid " << child_pid_ << " for " << cmd_ << "..." << std::endl;
+            comma::saymore() << "closing file descriptor " << fd_ << " for " << comma::split( command_ )[0] << "..." << std::endl;
+            ::close( fd_ );
+            comma::saymore() << "sending SIGTERM to " << comma::split( command_ )[0] << " (pid " << child_pid_ << ")..." << std::endl;
             ::kill( -child_pid_, SIGTERM );
-            comma::verbose << "waiting for pid " << child_pid_ << "..." << std::endl;
-            if( ::waitpid( -child_pid_, NULL, 0 ) < 0 ) { comma::verbose << "warning: waiting for pid " << child_pid_ << " failed" << std::endl; }
-            while( std::getchar() >= 0 ); // todo: lame, but select or c-style reading produce bizarre results; investigate further
-            comma::verbose << "waiting for pid " << child_pid_ << " done" << std::endl;
+            comma::saymore() << "waiting for pid " << child_pid_ << "..." << std::endl;
+            if( ::waitpid( -child_pid_, NULL, 0 ) < 0 ) { comma::saymore() << "warning: waiting for pid " << child_pid_ << " failed" << std::endl; }
+            while( std::getchar() >= 0 ); // todo: lame, but select or c-style reading produce bizarre results; investigate sometime
+            comma::saymore() << "waiting for pid " << child_pid_ << " done" << std::endl;
         }
 
     private:
-        std::string cmd_;
+        std::string command_;
         pid_t child_pid_;
+        int fd_; // read end of the pipe from the child's stdout; closed in the destructor
 };
 
 int main( int ac, char** av )
 {
     try
     {
-        //comma::command_line_options options( ac, av, usage );
         std::vector< std::string > head, tail;
         for( int i = 0; i < ac && std::string( "--" ) != av[i]; ++i ) { head.push_back( av[i] ); }
         for( int i = head.size() + 1; i < ac; ++i ) { tail.push_back( av[i] ); }
         comma::command_line_options options( head, usage );
-        const std::vector< std::string >& names = options.unnamed( "--no-discard,--verbose,-v,--no-flush,--output-number-of-clients,--clients,--exit-on-no-clients,-e,--on-demand", "-.+" );
-        if( names.empty() ) { std::cerr << "io-publish: please specify at least one stream; use '-' for stdout" << std::endl; return 1; }
+        const std::vector< std::string >& names = options.unnamed( "--no-discard,--verbose,-v,--no-flush,--output-number-of-clients,--clients,--exit-on-no-clients,-e,--on-demand,--timeout-reconnect,--reconnect-on-timeout,--timeout-is-error", "-.+" );
+        if( names.empty() ) { comma::say() << "please specify at least one stream; use '-' for stdout" << std::endl; return 1; }
+        options.assert_mutually_exclusive( "--cache-size,--cache", "--on-demand" );
         const boost::array< comma::signal_flag::signals, 2 > signals = { { comma::signal_flag::sigint, comma::signal_flag::sigterm } };
         comma::signal_flag is_shutdown( signals );
         bool on_demand = options.exists( "--on-demand" );
         bool exit_on_no_clients = options.exists( "--exit-on-no-clients,-e" );
-        publish p( names
-                 , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
-                 , !options.exists( "--no-discard" )
-                 , !options.exists( "--no-flush" )
-                 , options.exists( "--output-number-of-clients,--clients" )
-                 , exit_on_no_clients || on_demand );
         std::string exec_command = options.value< std::string >( "--exec", "" );
+        bool reconnect_on_read_timeout = options.exists( "--timeout-reconnect,--reconnect-on-timeout" );
+        bool timeout_is_error = options.exists( "--timeout-is-error" );
+        boost::optional< double > read_timeout = options.optional< double >( "--timeout-read,--read-timeout" );
+        COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || read_timeout, "--reconnect-on-timeout requires --read-timeout <seconds>" );
+        COMMA_ASSERT_BRIEF( !reconnect_on_read_timeout || !exec_command.empty(), "--reconnect-on-timeout requires --exec <command>" );
+        COMMA_ASSERT_BRIEF( !timeout_is_error || read_timeout, "--timeout-is-error requires --read-timeout <seconds>" );
+        comma::io::impl::publish p( names
+                                  , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
+                                  , !options.exists( "--no-discard" )
+                                  , !options.exists( "--no-flush" )
+                                  , options.exists( "--output-number-of-clients,--clients" )
+                                  , exit_on_no_clients || on_demand
+                                  , options.value( "--cache-size,--cache", 0 )
+                                  , read_timeout );
         if( !tail.empty() )
         {
-            if( !exec_command.empty() ) { std::cerr << "io-publish: expected either --exec or --, got both" << std::endl; return 1; }
+            COMMA_ASSERT_BRIEF( exec_command.empty(), "expected either --exec or --, got both" );
             exec_command = comma::join( tail, ' ' );
         }
         //ProfilerStart( "io-publish.prof" ); {
         if( exec_command.empty() )
         {
-            while( std::cin.good() && !is_shutdown ) { if( !p.read( std::cin ) && exit_on_no_clients ) { break; } }
+            COMMA_ASSERT_BRIEF( !on_demand, "got --on-demand; please specify --exec <command> or -- <command>, or remove --on-demand" );
+            std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
+            std::cin.tie( NULL ); // std::cin is tied to std::cout by default
+            while( std::cin.good() && !is_shutdown && !p.is_timeout() )
+            {
+                if( !p.read( std::cin ) )
+                {
+                    if( exit_on_no_clients ) { break; }
+                    if( read_timeout && p.is_timeout() ) { comma::say() << "timeout: received no data after " << *read_timeout << " seconds" << std::endl; break; }
+                }
+            }
         }
         else
         {
+            COMMA_ASSERT_BRIEF( !read_timeout, "--read-timeout with --exec: implementing..." );
             bool done = false;
             while( !done && !is_shutdown )
             {
-                if( !on_demand || p.num_clients() > 0 )
-                {
-                    command cmd( exec_command );
-                    while( std::cin.good() && !is_shutdown && p.read( std::cin ) );
-                    if( !on_demand ) { done = true; }
-                }
-                else
+                // on-demand: poll for the first client before launching the command; ::sleep() takes whole
+                // seconds, so a 0.1 argument truncates to 0 and spins the loop: wait 100 milliseconds instead
+                if( on_demand && p.num_clients() == 0 ) { ::usleep( 100000 ); continue; } // todo? make timeout configurable?
+                comma::saymore() << "number of clients: " << p.num_clients() << std::endl;
+                command cmd( exec_command );
+                typedef boost::iostreams::file_descriptor_source fd_t;
+                boost::iostreams::stream< fd_t > is( fd_t( cmd.fd(), boost::iostreams::never_close_handle ) );
+                while( is.good() && !is_shutdown )
                 {
-                    ::sleep( 0.1 );
+                    if( p.read( is, cmd.fd() ) ) { continue; }
+                    //if( exit_on_no_clients ) { break; }
+                    if( read_timeout && p.is_timeout() )
+                    {
+                        comma::say() << "timeout: received no data after " << *read_timeout << " seconds" << std::endl;
+                        if( !reconnect_on_read_timeout ) { break; }
+                    }
+                    break;
                 }
+                if( !on_demand ) { break; }
+                p.disconnect_all();
             }
         }
         //ProfilerStop(); }
-        if( is_shutdown ) { std::cerr << "io-publish: interrupted by signal" << std::endl; }
+        if( p.is_timeout() ) { return timeout_is_error ? 1 : 0; }
+        if( is_shutdown ) { comma::say() << "interrupted by signal" << std::endl; }
         return 0;
     }
     catch( std::exception& ex )
     {
         if( comma::last_error::value() == EINTR || comma::last_error::value() == EBADF ) { return 0; }
-        std::cerr << "io-publish: " << ex.what() << std::endl;
+        comma::say() << ex.what() << std::endl;
     }
     catch( ... )
     {
         if( comma::last_error::value() == EINTR || comma::last_error::value() == EBADF ) { return 0; }
-        std::cerr << "io-publish: unknown exception" << std::endl;
+        comma::say() << "unknown exception" << std::endl;
     }
     return 1;
 }
diff --git a/io/applications/io-tee.cpp b/io/applications/io-tee.cpp
index c15efb20d..a0188585a 100644
--- a/io/applications/io-tee.cpp
+++ b/io/applications/io-tee.cpp
@@ -41,11 +41,9 @@
 #include "../../io/select.h"
 #include "../../io/stream.h"
 
-static const char *app_name = "io-tee";
-
 static void show_usage()
 {
-    std::cerr << "Usage: " << app_name << " <output file> [options ... --] <command ...>\n";
+    std::cerr << "Usage: io-tee <output file> [options ... --] <command ...>\n"; // one-line synopsis written to stderr; the application name is spelled out literally
 }
 
 static void show_help( bool verbose = false )
@@ -63,14 +61,14 @@ static void show_help( bool verbose = false )
         << "    --verbose,-v: more output" << std::endl
         << std::endl
         << "Note that only single commands are supported; to run multiple commands (or a pipeline), put them inside a bash function:" << std::endl
-        << "*** IMPORTANT *** use \"export -f function_name\" to make the function visible to " << app_name << "." << std::endl
-        << "Remember that " << app_name << " will not have access to the unexported variables, so pass any required values as function arguments." << std::endl
+        << "*** IMPORTANT *** use \"export -f function_name\" to make the function visible to io-tee." << std::endl
+        << "Remember that io-tee will not have access to the unexported variables, so pass any required values as function arguments." << std::endl
         << "On Ubuntu 16.04, io-tee might fail to discover a bash function even if it is exported." << std::endl
         << "In this case, comma_tee_function defined in comma-application-util should be used." << std::endl
         << std::endl
         << "If any options are used (such as --unbuffered), \"--\" must precede the command." << std::endl
         << std::endl
-        << "A note about using \"grep\": be aware grep returns 1 if the pattern is not found, which will make " << app_name << " think the command failed." << std::endl
+        << "A note about using \"grep\": be aware grep returns 1 if the pattern is not found, which will make io-tee think the command failed." << std::endl
         << "To avoid this, call grep inside a function like this: grep (pattern) || true." << std::endl
         << std::endl
         << "Example 1:" << std::endl
@@ -127,19 +125,19 @@ int main( int ac, char **av )
             else if ( av[n] == std::string( "--help" ) || av[n] == std::string( "-h" ) ) { show_help(); exit( 0 ); }
         }
         int command_offset = ( dashdash_pos == -1 ? 2 : dashdash_pos + 1 );
-        if ( command_offset >= ac ) { std::cerr << app_name << ": missing command; "; show_usage(); exit( 1 ); }
+        if ( command_offset >= ac ) { std::cerr << "io-tee: missing command; "; show_usage(); exit( 1 ); }
         // if there is no "--", there can be no command line options, just the output filename
         int options_ac = ( dashdash_pos == -1 ? 2 : dashdash_pos );
         if ( debug )
         {
-            std::cerr << app_name << ": options_ac=" << options_ac << "; command line: " << app_name;
+            std::cerr << "io-tee: options_ac=" << options_ac << "; command line: io-tee";
             for ( int m = 1; m < ac; ++m ) { std::cerr << ' ' << av[m]; }
             std::cerr << std::endl;
         }
         comma::command_line_options options( options_ac, av );
         const std::vector< std::string >& unnamed = options.unnamed( "--unbuffered,-u,--verbose,-v,--debug,--dry-run,--dry,--append,-a", "-.*" );
-        if( unnamed.empty() ) { std::cerr << app_name << ": please specify output file name" << std::endl; return 1; }
-        if( unnamed.size() > 1 ) { std::cerr << app_name << ": expected one output filename, got: " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
+        if( unnamed.empty() ) { std::cerr << "io-tee: please specify output file name" << std::endl; return 1; }
+        if( unnamed.size() > 1 ) { std::cerr << "io-tee: expected one output filename, got: " << comma::join( unnamed, ' ' ) << std::endl; return 1; }
         std::string outfile = unnamed[0];
         // bash -c only takes a single argument, so put the whole command in single quotes, then double quote each individual argument
         std::string command = "bash -c '" + escape_quotes( av[command_offset] );
@@ -147,24 +145,24 @@ int main( int ac, char **av )
         bool append_to_outfile = options.exists( "--append,-a" );
         if( append_to_outfile ) { command += " >> "; }
         else { command += " > "; }
-        command += outfile;
+        command += '"' + outfile + '"';
         command += "'";
         bool unbuffered = options.exists( "--unbuffered,-u" );
         bool verbose = options.exists( "--verbose,-v" );
         if ( debug ) { verbose = true; }
-        if( !file_is_writable( outfile, append_to_outfile ) ) { std::cerr << app_name << ": cannot write to " << outfile << std::endl; exit( 1 ); }
         if( options.exists( "--dry-run,--dry" ) ) { std::cout << command << std::endl; return 0; }
-        if( verbose ) { std::cerr << app_name << ": will run command: " << command << std::endl; }
+        if( verbose ) { std::cerr << "io-tee: will run command: " << command << std::endl; }
+        if( !file_is_writable( outfile, append_to_outfile ) ) { std::cerr << "io-tee: cannot write to " << outfile << std::endl; exit( 1 ); }
         std::cout.flush();
         pipe = ::popen( &command[0], "w" );
-        if( pipe == NULL ) { std::cerr << app_name << ": failed to open pipe; command: " << command << std::endl; return 1; }
+        if( pipe == NULL ) { std::cerr << "io-tee: failed to open pipe; command: " << command << std::endl; return 1; }
         boost::array< char, 0xffff > buffer;
-        if ( debug ) { std::cerr << app_name << ": created buffer" << std::endl; }
+        if ( debug ) { std::cerr << "io-tee: created buffer" << std::endl; }
         comma::io::select stdin_select;
-        if ( debug ) { std::cerr << app_name << ": constructed comma::io::select" << std::endl; }
-        if( unbuffered ) { stdin_select.read().add( 0 ); if ( debug ) { std::cerr << app_name << ": did initial unbuffered read" << std::endl; } }
+        if ( debug ) { std::cerr << "io-tee: constructed comma::io::select" << std::endl; }
+        if( unbuffered ) { stdin_select.read().add( 0 ); if ( debug ) { std::cerr << "io-tee: did initial unbuffered read" << std::endl; } }
         comma::io::istream is( "-", comma::io::mode::binary );
-        if ( debug ) { std::cerr << app_name << ": opened input stream" << std::endl; }
+        if ( debug ) { std::cerr << "io-tee: opened input stream" << std::endl; }
         if( unbuffered )
         {
             std::ios_base::sync_with_stdio( false ); // unsync to make rdbuf()->in_avail() working
@@ -172,51 +170,51 @@ int main( int ac, char **av )
         }
         while( std::cin.good() )
         {
-            if ( debug ) { std::cerr << app_name << ": loop" << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: loop" << std::endl; }
             std::size_t bytes_to_read = buffer.size();
             if( unbuffered )
             {
-                if ( debug ) { std::cerr << app_name << ": calling stdin_select.wait(1)" << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: calling stdin_select.wait(1)" << std::endl; }
                 if( stdin_select.wait( boost::posix_time::seconds( 1 ) ) == 0 ) { continue; }
-                if ( debug ) { std::cerr << app_name << ": after stdin_select.wait" << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: after stdin_select.wait" << std::endl; }
                 std::size_t available = is.available_on_file_descriptor();
-                if ( debug ) { std::cerr << app_name << ": " << available << " bytes available" << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: " << available << " bytes available" << std::endl; }
                 bytes_to_read = std::min( available, buffer.size() );
             }
-            if ( debug ) { std::cerr << app_name << ": bytes_to_read = " << bytes_to_read << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: bytes_to_read = " << bytes_to_read << std::endl; }
             std::cin.read( &buffer[0], bytes_to_read );
-            if ( debug ) { std::cerr << app_name << ": cin.gcount is " << std::cin.gcount() << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: cin.gcount is " << std::cin.gcount() << std::endl; }
             if( std::cin.gcount() <= 0 ) { break; }
             std::size_t gcount = std::cin.gcount();
-            if ( debug ) { std::cerr << app_name << ": writing " << gcount << " bytes to stdout" << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: writing " << gcount << " bytes to stdout" << std::endl; }
             std::cout.write( &buffer[0], gcount );
-            if ( debug ) { std::cerr << app_name << ": writing " << gcount << " bytes to pipe" << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: writing " << gcount << " bytes to pipe" << std::endl; }
             int r = ::fwrite( &buffer[0], sizeof( char ), gcount, pipe );
-            if ( debug ) { std::cerr << app_name << ": fwrite to pipe returned " << r << std::endl; }
+            if ( debug ) { std::cerr << "io-tee: fwrite to pipe returned " << r << std::endl; }
             if( r != (int) gcount )
             { 
-                std::cerr << app_name << ": error on pipe: " << std::strerror( errno ) <<  std::endl;
+                std::cerr << "io-tee: error on pipe: " << std::strerror( errno ) <<  std::endl;
                 ::pclose( pipe );
                 return 1;
             }
             if( unbuffered )
             { 
-                if ( debug ) { std::cerr << app_name << ": flushing stdout" << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: flushing stdout" << std::endl; }
                 std::cout.flush();
-                if ( debug ) { std::cerr << app_name << ": flushing pipe" << std::endl; }
-                if ( ::fflush( pipe ) != 0 ) { std::cerr << app_name << ": flushing pipe failed: " << std::strerror( errno ) << "; command was: " << command << std::endl; ::pclose( pipe ); exit( 1 ); }
-                if ( debug ) { std::cerr << app_name << ": flushed stdout and pipe " << std::endl; }
+                if ( debug ) { std::cerr << "io-tee: flushing pipe" << std::endl; }
+                if ( ::fflush( pipe ) != 0 ) { std::cerr << "io-tee: flushing pipe failed: " << std::strerror( errno ) << "; command was: " << command << std::endl; ::pclose( pipe ); exit( 1 ); }
+                if ( debug ) { std::cerr << "io-tee: flushed stdout and pipe " << std::endl; }
             }
         }
         std::cout.flush();
         ::fflush( pipe );
         int result = ::pclose( pipe );
-        if ( result == -1 ) { std::cerr << app_name << ": pipe error: " << std::strerror( errno ) << "; command was: " << command << std::endl; exit( 1 ); }
-        else if ( result != 0 ) { std::cerr << app_name << ": command failed: " << command << std::endl; return 1; }
+        if ( result == -1 ) { std::cerr << "io-tee: pipe error: " << std::strerror( errno ) << "; command was: " << command << std::endl; exit( 1 ); }
+        else if ( result != 0 ) { std::cerr << "io-tee: command failed: " << command << std::endl; return 1; }
         return 0;
     }
-    catch( std::exception& ex ) { std::cerr << app_name << ": " << ex.what() << std::endl; }
-    catch( ... ) { std::cerr << app_name << ": unknown exception" << std::endl; }
+    catch( std::exception& ex ) { std::cerr << "io-tee: " << ex.what() << std::endl; }
+    catch( ... ) { std::cerr << "io-tee: unknown exception" << std::endl; }
     if( pipe ) { ::pclose( pipe ); }
     return 1;
 }
diff --git a/io/applications/io-topics b/io/applications/io-topics
index 2ff6ad9e7..6f1f17218 100755
--- a/io/applications/io-topics
+++ b/io/applications/io-topics
@@ -1,5 +1,9 @@
 #!/bin/bash
 
+# Copyright (c) 2011 The University of Sydney
+# Copyright (c) 2020 Vsevolod Vlaskine
+# All rights reserved.
+
 scriptname=$( basename $0 )
 
 source $( type -p comma-application-util ) || { echo "io-topics: could not source 'comma-application-util'" >&2; exit 1; }
@@ -7,101 +11,178 @@ source $( type -p comma-process-util ) || { echo "io-topics: could not source 'c
 
 # todo: --master-config: default behaviour: first config; --guess-by command: all configs
 
+function bash_completion()
+{
+    echo "cat list log publish"
+    { common_options; log_options; } | comma_options_to_bash_completion
+}
+
 function common_options()
 {
     cat <<EOF
---help,-h; display help and exit
---config=[<config>]; <config>: <dir>[:<path>], where <dir> is path to a json or path-value file specifying topic attributes, <path>: path inside config, multiple --config options allowed, configs will be applied in the reverse order of --config options on command line (see examples)
---dry-run,--dry; print final command and exit
---topics-from-all-configs,--all; take topics from all configs and topic command values, default: take topics and topic command values only from the first config ("master config")
---topic-fields; output topic config fields and exit
---topic-fields-help; output topic config fields help and exit
---verbose,-v; print verbose information
+--help,-h;            display help and exit
+--config=[<config>];  <config>: <dir>[:<path>], where <dir> is path to a
+                      json or path-value file specifying topic attributes,
+                      <path>: path inside config, multiple --config options
+                      allowed, configs will be applied in the reverse order
+                      of --config options on command line (see examples)
+--dry-run,--dry;      print final command and exit
+--env=[<definitions>]; <definitions>: bash-style variable definitions that 
+                      will be used only for \${some-var} variable substitution
+                      in commands, see variable substitution in commands below
+                      e.g. --env="my_var=123;another_var='hello;world'"
+--topics-from-all-configs,--all; take topics from all configs and topic
+                      command values, default: take topics and topic command
+                      values only from the first config ("master config")
+--topic-fields;       output topic config fields and exit
+--topic-fields-help;  output topic config fields help and exit
+--verbose,-v;         print verbose information
 EOF
 }
 
 function usage()
 {
+    local verbose=$1
     cat >&2 <<eof
     
-a simple topic publisher supporting tcp, local sockets, and zero-mq (i.e. whatever io-publish supports)
+a simple topic publisher supporting tcp, local sockets, and zero-mq
+(i.e. whatever io-publish supports)
 
 usage: io-topics <operation> [<topics>] <options>
 
 todo: debug zero-mq support
 
 operations
-    cat: receive and handle data on given topics
-    
-    list: list topics
-    
-    log: log topics (todo)
-        options
-$( log_options | sed 's/^/            /g' )
-
-    play: play back logs, counterpart to log operation (todo)
-    
-    publish: start all the publishers listed on command line or in the config file (todo)
+    cat:     receive and handle data on given topics
+    list:    list topics
+    log:     log topics
+    play:    play back logs, counterpart to log operation (todo)
+    publish: start all the publishers listed on command line or config file
+
+variable substitution in commands
+    options can be passed to command and on_exit fields via variable substitution
+    examples
+        "command": "log-some-sensor \${log_dir}"
+        "on_exit": "save-to-dir \${log_dir}"
+    all command line options and values defined in --env are available
+        e.g:
+            --config -> \${config}
+            --log-dir -> \${log_dir}
+            --env="my_var=5" -> \${my_var}
+    see examples below for more detail
 
 common options
 $( common_options | sed 's/^/    /g' )
 
+log operation options
+$( log_options | sed 's/^/    /g' )
+
+eof
+    if (( verbose )); then
+        cat >&2 <<eof
 examples
-    publish
-        run publisher with topics a and b, with b on demand
-            > io-topics publish --config <( echo "a/command=csv-paste line-number"; echo "a/port=8888"; echo "b/command=csv-paste line-number"; echo "b/port=9999"; echo "b/on_demand=1" )
+    --- publish ---
+        run publisher with topics a and b, with b on demand:
+            $ io-topics publish --config <( sed 's/^ *//' <<EOF
+                  a/command=csv-paste line-number
+                  a/port=8888
+                  b/command=csv-paste line-number
+                  b/port=9999
+                  b/on_demand=1
+EOF
+)
             io-topics: will run 'comma_execute_and_wait --group' with commands:
-            io-topics:     io-publish tcp:8888   -- csv-paste line-number
-            io-topics:     io-publish tcp:9999  --on-demand -- csv-paste line-number
+            io-topics: io-publish tcp:8888   -- csv-paste line-number
+            io-topics: io-publish tcp:9999  --on-demand -- csv-paste line-number
         
-        in a different shell, observe that topic a keeps running even if no-one is listening, whereas topic b runs only if at least one client is connected:
-            > socat tcp:localhost:8888 | head -n5 # will output something like:
+        in a different shell, observe that topic a keeps running even if no-one
+        is listening, whereas topic b runs only if at least one client is
+        connected:
+            $ socat tcp:localhost:8888 - | head -n5    # outputs something like:
             16648534
             16648535
             16648536
             16648537
             16648538
-            
-            > socat tcp:localhost:9999 - | head -n5
+            $ socat tcp:localhost:9999 - | head -n5
             0
             1
             2
             3
             4
             
-    cat
-        run publisher
-            > io-topics publish --config <( echo "a/command=csv-paste line-number"; echo "a/port=12345"; echo "b/command=csv-paste line-number"; echo "b/port=12346"; echo "b/on_demand=1" )
-        
-        in a different shell, run clients
-            > io-topics cat --config <( echo "a/command=head -n5 | tee a.csv"; echo "a/address=tcp:localhost:12345"; echo "b/command=head -n5 | tee b.csv"; echo "b/address=tcp:localhost:12346" )
+        secondary address or port with --dry-run (try it without dry run):
+            $ io-topics publish --config <( sed 's/^ *//' <<EOF
+                  a/command=csv-paste line-number
+                  a/port=12345
+                  b/command=csv-paste line-number
+                  b/port=12346
+                  b/secondary/port=8888
+                  b/on_demand=1
+EOF
+) --dry-run
+            io-topics: publish: will run 'comma_execute_and_wait --group'
+                                with commands:
+            io-topics: publish: io-publish tcp:12345 -- csv-paste line-number
+            io-topics: publish: io-publish tcp:12346 tcp:8888;secondary
+                                           --on-demand -- csv-paste line-number
             
-        check output
-            > cat a.csv 
+    --- cat ---
+        run publisher:
+            $ io-topics publish --config <( sed 's/^ *//' <<EOF
+                  a/command=csv-paste line-number
+                  a/port=12345
+                  b/command=csv-paste line-number
+                  b/port=12346
+                  b/on_demand=1
+EOF
+)
+        in a different shell, run clients:
+            $ io-topics cat --config <( sed 's/^ *//' <<EOF
+                  a/command=head -n5 | tee a.csv
+                  a/address=tcp:localhost:12345
+                  b/command=head -n5 | tee b.csv
+                  b/address=tcp:localhost:12346
+EOF
+)
+        check output:
+            $ cat a.csv 
             203740462
             203740463
             203740464
             203740465
             203740466
-            > cat b.csv 
+            $ cat b.csv 
             0
             1
             2
             3
             4
             
-    log
-        run publisher as in previous examples and then run logging
-            > io-topics log --dir my-log --config <( echo "a/address=tcp:localhost:8888"; echo "b/address=tcp:localhost:9999" )
-            > ls -al my-log/a
-            > ls -al my-log/b
+    --- log ---
+        run publisher as in first example and then run logging:
+            $ io-topics log --dir my-log --config <(
+                  echo "a/address=tcp:localhost:8888"
+                  echo "b/address=tcp:localhost:9999" )
+            $ ls -al my-log/a
+            $ ls -al my-log/b
             
-        run publisher as in previous examples and then run logging with a custom command
-            > io-topics log --dir my-log --config <( echo "a/address=tcp:localhost:12345"; echo 'b/command=socat tcp:localhost:12346 - > log.csv' )
-            > ls -al my-log/a
-            > head my-log/b/log.csv
+        run publisher as in second example and then log with a custom command:
+            $ io-topics log --dir my-log --config <(
+                  echo "a/address=tcp:localhost:12345"
+                  echo 'b/command=socat tcp:localhost:12346 - > log.csv' )
+            $ ls -al my-log/a
+            $ head my-log/b/log.csv
+
+        trigger logging on a remote machine with templated command
+            $ io-topics log --dir my-log --config <(
+                  echo "a/command=curl 'http://remote:7000/log=start&name=\${log_dir}'" )
 
 eof
+    else
+        echo "use \"$scriptname --help --verbose\" for examples" >&2
+    fi
+    echo >&2
     exit 0
 }
 
@@ -112,172 +193,213 @@ function die() { say "$@"; exit 1; }
 
 function list_topic_fields() { :; }
 
-function publish_topic_fields()
+# todo: flush field? flush is default behaviour in io-publish, which is inconsistent with
+# log and cat operations and thus introducing flush in publish might be confusing
+function publish_topic_fields() { publish_topic_fields_help | grep -v '^ ' | cut -f1 -d';'; }
+
+function publish_topic_fields_help()
 {
     cat <<eof
-address
-binary
-command
-on_demand
-port
-size
+address;              passed verbatim to io-publish, port attribute will be ignored
+binary;               for binary data, binary format of data, overrides size
+cache_size;           same meaning as io-publish --cache-size
+command;              command for the publisher to run
+input;                input topic for publish command to read on stdin
+multiplier;           passed to io-publish
+on_demand;            same meaning as io-publish --on-demand
+on_exit;              command to run when publisher stops
+port;                 tcp port for publishing, unless address field is present
+reconnect_on_timeout; same meaning as io-publish --reconnect-on-timeout
+secondary/address;    passed verbatim to io-publish as '<address>;secondary',
+                      in this case port attribute ignored
+secondary/port;       secondary tcp port for publishing, unless address field is
+                      present, io-publish as 'tcp:<port>;secondary'
+size;                 for binary data, size of the binary record
+timeout;              same meaning as io-publish --timeout=<seconds>
 eof
 }
 
-function publish_topic_fields_help()
+function cat_topic_fields() { cat_topic_fields_help | grep -v '^ ' | cut -f1 -d';'; }
+
+function cat_topic_fields_help()
 {
     cat <<eof
-address; if present, passed verbatim to io-publish, in this case port attribute ignored
-binary; if publisher publishes binary data, the binary format of the data, overrides size
-command; command for the publisher to run
-on_demand; if present, same meaning as io-publish --on-demand
-port; tcp port for publishing, unless address field is present
-size; if publisher publishes binary data, size of the binary record, if no binary attribute given
+address;          passed verbatim to io-cat, port attribute will be ignored
+binary;           if data is binary, binary format of data, overrides size
+command;          command for the client to run
+connect_attempts; number of connect attempts
+connect_period;   time in seconds between connect attempts
+flush;            flush output on each record, default: buffer output
+host;             tcp host for publishing, unless address field is present
+on_exit;          command to run when output stops
+port;             tcp port for publishing, unless address field is present
+size;             if data is binary, size of the binary record
 eof
 }
 
-function cat_topic_fields()
+function log_topic_fields() { log_topic_fields_help | grep -v '^ ' | cut -f1 -d';'; }
+
+function log_topic_fields_help()
 {
     cat <<eof
-address
-binary
-command
-connect_attempts
-connect_period
-flush
-host
-port
-size
+address;          passed verbatim to io-cat, in this case port attribute ignored
+binary;           if data is binary, binary format of data, overrides size
+command;          optional command for logger to run instead of default logger
+connect_attempts; number of connect attempts
+connect_period;   time in seconds between connect attempts
+flush;            flush output on each record, default: buffer output
+header/binary;    only required for variable payload size
+                  value after the fixed-width data part is expected
+header/fields;    if binary and has 'size' field, variable payload of size field
+host;             tcp host for publishing, unless address field is present
+index;            optional command to generate index file, default: fixed-width
+                  binary index for each binary record, ascii: no index file
+on_exit;          command to run when logger stops
+path;             prefix path for log directory (to split logs across drives)
+period;           split log files at given number of seconds, overrides --period
+port;             tcp port for publishing, unless address field is present
+restart;          if data stream disconnects keep trying to reconnect
+size;             if data is binary, size of the binary record
+suffix;           optional log suffix, default: bin for binary, csv for ascii
 eof
 }
 
-function cat_topic_fields_help()
+function log_options()
 {
     cat <<eof
-address; if present, passed verbatim to io-publish, in this case port attribute ignored
-binary; if data is binary, the binary format of the data, overrides size
-command; command for the client to run
-connect_attempts; number of connect attemtps
-connect_period; time in seconds between connect attempts
-flush; flush output on each record, default: buffer output
-host; tcp host for publishing, unless address field is present
-port; tcp port for publishing, unless address field is present
-size; if if data is binary, size of the binary record, if no binary attribute given
+--log-dir,--dir=[<path>]; log directory, for each topic, actual log
+                          directory will be [<path>/]<dir>/<topic>,
+                          see io-topics log --topic-fields-help
+--period=<seconds>;       default=60; the log files will be split based
+                          on a given time period, settings for specific
+                          topic override this option
 eof
 }
 
-function log_topic_fields()
+function io_topics_restart_topic()
 {
-    cat <<eof
-address
-binary
-command
-connect_attempts
-connect_period
-flush
-host
-index
-path
-period
-port
-restart
-size
-suffix
-eof
+    local is_shutdown=0
+    trap "local is_shutdown=1" HUP INT TERM
+    while (( ! is_shutdown )) ; do bash -c "$@"; sleep 0.1; done # quick and dirty
 }
 
-function log_topic_fields_help()
+export -f io_topics_restart_topic
+
+function set_topic_address()
 {
-    cat <<eof
-address; if present, passed verbatim to io-publish, in this case port attribute ignored
-binary; if data is binary, the binary format of the data, overrides size
-command; optional command for the logger to run instead of default logger
-connect_attempts; number of connect attemtps
-connect_period; time in seconds between connect attempts
-flush; flush output on each record, default: buffer output
-host; tcp host for publishing, unless address field is present
-index; optional command to generate index file, default: fixed-width binary index for each binary record, ascii: no index file
-path; prefix path for log directory (e.g. if logs need to be split across multiple drives)
-period; split log files on a given number of seconds, overrides --period
-port; tcp port for publishing, unless address field is present
-restart; if data stream disconnects keep trying to reconnect
-size; if if data is binary, size of the binary record, if no binary attribute given
-suffix; optional log file suffix, default: bin for binary, csv for ascii
-eof
+    [[ -n "$topic_address" || ( -n "$topic_host" && -n "$topic_port" ) ]] || die "topic '$topic': neither address nor host/port specified in files ${configs[@]}"
+    [[ -n "$topic_address" ]] || topic_address="tcp:$topic_host:$topic_port"
+    [[ -n "$topic_address" ]] || die "topic: '$topic': failed to set topic address"
 }
 
-function log_options()
+function set_topic_variables()
 {
-    cat <<eof
---log-dir,--dir=[<path>]; log directory, for each topic, actual log directory will be [<path>/]<dir>/<topic>, see io-topics log --topic-fields-help
---period=<seconds>; default=60; the log files will be split based on a given time period, settings for specific topic override this option
-eof
+    local operation="$1"
+    local topic="$2"
+    eval "$( ${operation}_topic_fields | comma_path_mangle | sed 's#^#unset topic_#' )" # todo: quick and dirty, watch performance
+    eval "$( grep $topic <<< "$config" | grep -v "^$topic/command" | sed "s#^$topic/#topic/#" | comma_path_value_mangle )"
+    [[ -z "$topic_header_binary" || -z "$topic_binary" ]] || die "expected either header/binary or binary; got both"
+    [[ -z "$topic_header_binary" || -z "$topic_size" ]] || die "expected either header/binary or size; got both"
+    [[ -z "$topic_header_fields" || -n "$topic_header_binary" ]] || die "header/fields specified, but header/binary is not"
+    topic_command="$( grep ^$topic/command <<< "$master_config" | cut -d= -f1 --complement | sed -e 's#^"##' -e 's#"$##'  )" # quick and dirty
+    unset size_option binary_option fields_option
+    if [[ -n "$topic_binary" ]]; then size_option="--size=$( echo $topic_binary | csv-format size )"; binary_option="--binary=$topic_binary"
+    elif [[ -n "$topic_size" ]]; then size_option="--size=$topic_size"; fi
+    if [[ -n "$topic_header_fields" ]]; then fields_option="--fields=$topic_header_fields"; else unset fields_option; fi
+    if [[ -n "$topic_header_binary" ]]; then binary_option="--binary=$topic_header_binary"; fi
+}
+
+function expanded_command() # quick and dirty: print command $1 with each ${name} token replaced by the value of variable 'name'
+{
+    local cmd="$1"
+    {
+        grep "=" <<< "$options" | comma_path_value_mangle # only option lines containing '='; presumably mangled into bash assignments, since the inner script eval's them - TODO confirm
+        echo "$options_env" # contents of $options_env, eval'ed by the inner script as is
+        echo "$cmd" # must come last: the inner script treats only the last input line as the command
+    } \
+        | env -i $BASH -c 'input=$( cat )
+                           eval "$( head -n-1 <<< "$input" )"
+                           cmd=""
+                           while IFS="" read line; do
+                               if [[ $line =~ ^\$\{[a-zA-Z_][a-zA-Z0-9_]*\}$ ]]; then var="${line:2:-1}"; cmd+="${!var}"; else cmd+="$line"; fi
+                           done < <( tail -n1 <<< "$input" | sed -e "s#\${#\n\$\{#g" -e "s#}#}\n#g" )
+                           echo "$cmd"'
 }
 
 function publish_command()
 {
-    [[ -n "$topic_command" ]] || die "command not specified for topic '$topic' in files ${configs[@]}"
-    [[ -n "$topic_address" || -n "$topic_port" ]] || die "neither address nor port specified for topic '$topic' in files ${configs[@]}"
+    [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
+    [[ -n "$topic_address" || -n "$topic_port" ]] || die "topic '$topic': neither address nor port specified in files ${configs[@]}"
     [[ -n "$topic_address" ]] || topic_address="tcp:$topic_port"
-    if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
-    local cmd="io-publish $topic_address $size_option $on_demand -- $topic_command"
+    [[ -n "$topic_secondary_address" ]] || { [[ -z "$topic_secondary_port" ]] || topic_secondary_address="tcp:$topic_secondary_port"; }
+    [[ -z "$topic_secondary_address" ]] || topic_secondary_address="$topic_secondary_address;secondary"
+    if [[ -n "$topic_multiplier" ]]; then multiplier="--multiplier $topic_multiplier"; else unset multiplier; fi
+    if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi
+    if [[ -n "$topic_timeout" ]]; then timeout="--timeout=$topic_timeout"; else unset timeout; fi # timeout is a value in seconds, not a boolean flag
+    if [[ "$topic_reconnect_on_timeout" == 1 || "$topic_reconnect_on_timeout" == "true" ]]; then reconnect_on_timeout="--reconnect-on-timeout"; else unset reconnect_on_timeout; fi
+    if [[ -n "$topic_cache_size" ]]; then cache_size="--cache-size=$topic_cache_size"; else unset cache_size; fi
+    local cmd="io-publish $topic_address $topic_secondary_address $size_option $multiplier $on_demand $cache_size $timeout $reconnect_on_timeout -- "
+    verbose "publish topic_command: $topic_command"
+    local expanded_topic_command=$( expanded_command "$topic_command" )
+    verbose "publish expanded_topic_command: $expanded_topic_command"
+    if [[ -z "$topic_input" ]]; then cmd+="$expanded_topic_command"
+    else cmd+="$( set_topic_variables "cat" "$topic_input"; cat_command "$topic_input" 1 ) --flush --verbose | $expanded_topic_command" || die "topic '$topic': failed to configure input topic '$topic_input'"; fi
     verbose "$cmd"
     echo "$cmd"
 }
 
-function set_topic_address()
-{
-    [[ -n "$topic_address" || ( -n "$topic_host" && -n "$topic_port" ) ]] || die "neither address nor host/port specified for topic '$topic' in files ${configs[@]}"
-    [[ -n "$topic_address" ]] || topic_address="tcp:$topic_host:$topic_port"
-}
-
 function cat_command()
 {
-    [[ -n "$topic_command" ]] || die "command not specified for topic '$topic' in files ${configs[@]}"
+    local topic=$1
+    local ignore_command=$2
+    (( ignore_command )) || [[ -n "$topic_command" ]] || die "topic '$topic': command not specified in files ${configs[@]}"
     set_topic_address
-    if [[ -n "$topic_on_demand" ]]; then on_demand="--on-demand"; else unset on_demand; fi
+    if [[ "$topic_on_demand" == 1 || "$topic_on_demand" == "true" ]]; then on_demand="--on-demand"; else unset on_demand; fi # todo? remove? is it even used anywhere?
+    if [[ -n "$topic_timeout" ]]; then timeout="--timeout=$topic_timeout"; else unset timeout; fi # take the value from the topic config, not from the variable being assigned
+    if [[ "$topic_reconnect_on_timeout" == 1 || "$topic_reconnect_on_timeout" == "true" ]]; then reconnect_on_timeout="--reconnect-on-timeout"; else unset reconnect_on_timeout; fi
+    if [[ -n "$topic_cache_size" ]]; then cache_size=$topic_cache_size; else unset cache_size; fi
     if [[ -n "$topic_flush" ]]; then flush_option="--flush"; else unset flush_option; fi # todo! make flush default?!
     if [[ -n "$topic_connect_attempts" ]]; then connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
     if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
     if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
-    local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_command" # todo? comma_execute_and_wait?
+    if (( ignore_command )); then local cmd="io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option"
+    else
+        verbose "cat topic_command: $topic_command"
+        local expanded_topic_command=$( expanded_command "$topic_command" )
+        verbose "cat expanded_topic_command: $expanded_topic_command"
+        local cmd="bash -c io-cat $topic_address $size_option $flush_option $connect_attempts_option $connect_period_option $verbose_option | $expanded_topic_command"
+    fi # todo? comma_execute_and_wait?
     verbose "$cmd"
     echo "$cmd"
 }
 
-function io_topics_log_run_forever()
-{
-    local is_shutdown=0
-    trap "local is_shutdown=1" HUP INT TERM
-    while (( ! is_shutdown )) ; do bash -c "$@"; sleep 0.1; done # quick and dirty
-}
-
-export -f io_topics_log_run_forever
-
 function log_command()
 {
     [[ -n "$options_log_dir" ]] || die "please specify --log-dir"
     local topic=$1
     local cmd="$topic_command"
-    if [[ -z "$cmd" ]]; then
+    if [[ "$cmd" ]]; then
+        verbose "got $cmd"
+        cmd=$( expanded_command "$cmd" )
+        verbose "expanded to $cmd"
+    else
         set_topic_address
         [[ -n "$topic_index" ]] || topic_index="cat"
         local flush_option suffix_option
         (( topic_flush )) && flush_option="--flush"
         [[ -z "$topic_suffix" ]] || suffix_option="--suffix=$topic_suffix"
-        local period=$options_period
-        [[ -z "$topic_period" ]] || period=$topic_period
-        if [[ -n "$topic_connect_attempts" ]]; then connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
-        if [[ -n "$topic_connect_period" ]]; then connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
-        if [[ -n "$options_verbose" ]]; then verbose_option="--verbose"; else unset verbose_option; fi
-        #if [[ -n "$options_verbose" ]]; then say "--> verbose set"; else say "--> verbose not set"; fi
-        cmd="io-cat $topic_address $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_index | csv-split -t $period $size_option $suffix_option $flush_option"
+        if [[ -n "$topic_period" ]]; then local period=$topic_period; else local period=$options_period; fi
+        if [[ -n "$topic_connect_attempts" ]]; then local connect_attempts_option="--connect-attempts=$topic_connect_attempts"; else unset connect_attempts_option; fi
+        if [[ -n "$topic_connect_period" ]]; then local connect_period_option="--connect-period=$topic_connect_period"; else unset connect_period_option; fi
+        if [[ -n "$options_verbose" ]]; then local verbose_option="--verbose"; else unset verbose_option; fi
+        if [[ -n "$binary_option" ]]; then local format_option=$binary_option; else local format_option=$size_option; fi
+        cmd="io-cat $topic_address $flush_option $connect_attempts_option $connect_period_option $verbose_option | $topic_index | csv-split -t $period $fields_option $format_option $suffix_option $flush_option"
     fi
     local path
     [[ -z "$topic_path" ]] || path+="$topic_path/"
     path+="$options_log_dir/$topic"
-    [[ -z "$topic_restart" ]] || cmd="io_topics_log_run_forever \"$cmd\""
-    (( "$options_dry_run" )) || mkdir -p $path || die "failed to make directory $path for topic $topic"
+    [[ -z "$topic_restart" ]] || cmd="io_topics_restart_topic \"$cmd\""
+    (( "$options_dry_run" )) || mkdir -p $path || die "topic '$topic': failed to make directory $path"
     cmd="( cd $path && $cmd )"
     echo "bash -c $cmd"
 }
@@ -291,9 +413,14 @@ function cat_config()
 
 function topics_from_config() # quick and dirty
 {
-    if [[ -n "$options_topics_from_all_configs" ]]; then egrep -e "/address=|/port=|/command=" <<< "$config" | cut -d= -f1 | sed -e 's#/address$##' -e 's#/port$##' -e 's#/command$##' | uniq; return; fi
-    grep '=""' <<< "$master_config" | cut -d= -f1
-    for path in $( grep -v '=""' <<< "$master_config" | cut -d= -f1 ); do dirname $path; done | uniq # todo: don't do it just through the dirname? join with operation fields and filter by them instead
+    local expression="/address=|/host=|/port=|/command=|/secondary/address=|/secondary/host=|/secondary/port=|/header/fields=|/header/binary=" # config keys that mark a topic; every alternative ends with '=' so that only the exact key name matches
+    function grep_by_topic_config_fields() { egrep -e "$expression" | cut -d= -f1 | sed -e 's#/secondary/address$##' -e 's#/secondary/host$##' -e 's#/secondary/port$##' -e 's#/address$##' -e 's#/host$##' -e 's#/port$##' -e 's#/command$##'; }
+    [[ -z "$options_topics_from_all_configs" ]] || { grep_by_topic_config_fields <<< "$config" | sort --unique; return; }
+    {
+        grep '=""' <<< "$master_config" | cut -d= -f1
+        grep -v '=""' <<< "$master_config" | egrep -v -e "$expression" | cut -d= -f1 | csv-strings dirname --emplace # quick and dirty, is it even correct?
+        grep_by_topic_config_fields <<< "$master_config"
+    } | sort --unique
 }
 
 function read_configs()
@@ -309,9 +436,25 @@ function get_topics()
     topics=( ${unnamed[@]:1} )
     if (( ${#topics[@]} == 0 )); then topics=( $( topics_from_config ) ); fi
     (( ${#topics[@]} > 0 )) || die "no topics in config files ${configs[@]}"
+    verbose "topics: ${topics[@]}"
+}
+
+(( $( comma_options_has "--bash-completion" "$@" ) )) && { bash_completion; exit 0; } # "$@" quoted, as in the --help check below, so arguments containing spaces are not re-split
+
+if (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )); then
+    (( $( comma_options_has --verbose "$@" ) || $( comma_options_has -v "$@" ) )) && verbose=1 || verbose=0
+    usage $verbose
+fi
+
+on_exit_commands=()
+
+function on_exit() # reports and then runs the commands collected in on_exit_commands; registered with 'trap on_exit EXIT' when there are such commands and it is not a dry run
+{
+    say "running commands on exit:"
+    for cmd in "${on_exit_commands[@]}"; do say "    $cmd"; done # note: cmd is not declared local here, so the script-level cmd is overwritten
+    comma_execute_and_wait --group "${on_exit_commands[@]}" # presumably runs all the commands as one group and waits for them - confirm against comma_execute_and_wait
 }
 
-(( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )) && usage
 operation=$1
 [[ $( type -t ${operation}_topic_fields ) == "function" ]] || die "expected operation, got '$operation'" # quick and dirty
 (( $( comma_options_has --topic-fields "$@" ) )) && { ${operation}_topic_fields; exit 0; }
@@ -324,17 +467,17 @@ get_topics
 if [[ $operation == "list" ]]; then for topic in ${topics[@]}; do echo $topic; done; exit; fi
 commands=()
 for topic in ${topics[@]}; do
-    eval "$( ${operation}_topic_fields | comma_path_mangle | sed 's#^#unset topic_#' )" # todo: quick and dirty, watch performance
-    eval "$( grep $topic <<< "$config" | grep -v "^$topic/command" | sed "s#^$topic/#topic/#" | comma_path_value_mangle )"
-    topic_command="$( grep ^$topic/command <<< "$master_config" | cut -d= -f1 --complement | sed -e 's#^"##' -e 's#"$##'  )"
-    #[[ -n "$topic_command" ]] || die "command not specified for topic '$topic' in files ${configs[@]}"
-    if [[ -n "$topic_binary" ]]; then size_option="--size $( csv-size $topic_binary )"
-    elif [[ -n "$topic_size" ]]; then size_option="--size $topic_size"
-    else unset size_option; fi
-    cmd="$( ${operation}_command $topic )" || die "on topic $topic: making command failed"
+    set_topic_variables "$operation" "$topic"
+    cmd="$( ${operation}_command $topic )" || die "topic '$topic': making command failed"
     commands+=( "$cmd" )
+    [[ $topic_on_exit ]] && on_exit_commands+=( "$( expanded_command "$topic_on_exit" )" )
 done
 say "will run 'comma_execute_and_wait --group' with commands:"
 for cmd in "${commands[@]}"; do say "    $cmd"; done
+if (( ${#on_exit_commands[@]} > 0 )); then
+    say "on exit will run:"
+    for cmd in "${on_exit_commands[@]}"; do say "    $cmd"; done
+    [[ $options_dry_run ]] || trap on_exit EXIT
+fi
 [[ -z "$options_dry_run" ]] || exit
 comma_execute_and_wait --group "${commands[@]}"
diff --git a/io/applications/rabbit-cat b/io/applications/rabbit-cat
index 89362d50d..3a17a0275 100755
--- a/io/applications/rabbit-cat
+++ b/io/applications/rabbit-cat
@@ -1,33 +1,6 @@
-#!/usr/bin/python
+#!/usr/bin/env python3
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2018 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 import argparse
 import signal
@@ -44,11 +17,11 @@ import pika
 def command_line_options():
     global application_name
     description="""Rabbit MQ client: send/receive messages to/from rabbit mq server
-    
+
 rabbit-cat <operation> <connection_string> [ <options> ]
 
 operation:
-    send        read messages from stdin and send 
+    send        read messages from stdin and send
     listen      receive messages and write to stdout, or run command with --exec
 """
     #rpc-send    <<NOT IMPLEMENTED>> send request and wait for reply
@@ -58,7 +31,7 @@ operation:
 
     epilog="""
 
-sample connection string:    
+sample connection string:
 # Set the connection parameters to connect to rabbit-server1 on port 5672
 # on the / virtual host using the username "guest" and password "guest"
 "amqp://guest:guest@rabbit-server1:5672/%2F"
@@ -78,7 +51,7 @@ example 2: send message to work queue with multiple receivers (each message is r
 
 
 example 3: publish and subscribe
-    rabbit-cat listen localhost --fanout --exchange="exchange2" 
+    rabbit-cat listen localhost --fanout --exchange="exchange2"
     &
     rabbit-cat listen localhost --fanout --exchange="exchange2"
     &
@@ -110,7 +83,7 @@ example 5: topic
     #rabbit-cat rpc-listen localhost --queue="queue1" --exec="bc"
     #&
     #echo "2+3" | rabbit-cat rpc-send localhost --queue="queue1" --routing-key="queue1"
-    
+
 
     #"""
 
@@ -158,7 +131,7 @@ def run_send( channel, exchange_name ):
             if message: send_message( channel, exchange_name, message )
             return
         if args.end_of_message=='\n':
-            while True:            
+            while True:
                 line = sys.stdin.readline()
                 if not line: break
                 if line.endswith('\n'): send_message( channel, exchange_name, line[:-1] )
diff --git a/io/applications/udp-client.cpp b/io/applications/udp-client.cpp
index a72ea7b23..c523a93ee 100644
--- a/io/applications/udp-client.cpp
+++ b/io/applications/udp-client.cpp
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -27,102 +28,186 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
 #ifndef WIN32
 #include <stdlib.h>
 #endif
 #include <iostream>
+#include <sstream>
+#include <type_traits>
 #include <boost/array.hpp>
 #include <boost/asio/ip/udp.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/noncopyable.hpp>
-#include <boost/static_assert.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
+#include "../../application/signal_flag.h"
+#include "../../base/exception.h"
 #include "../../base/types.h"
 #include "../../csv/format.h"
+#include "../../csv/options.h"
+#include "../../string/string.h"
+#include "../../io/impl/publish.h"
 
-void usage()
+static void usage()
 {
-    std::cerr << "simple udp client: receives udp packets and outputs them on stdout" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "rationale: netcat and socat somehow do not work very well with udp" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "usage: udp-client <port> [<options>]" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "<options>" << std::endl;
-    std::cerr << "    --ascii: output timestamp as ascii; default: 64-bit binary" << std::endl;
-    std::cerr << "    --binary: output timestamp as 64-bit binary; default" << std::endl;
-    std::cerr << "    --delimiter=<delimiter>: if ascii and --timestamp, use this delimiter; default: ','" << std::endl;
-    std::cerr << "    --size=<size>: hint of maximum buffer size; default 16384" << std::endl;
-    std::cerr << "    --reuse-addr,--reuseaddr: reuse udp address/port" << std::endl;
-    std::cerr << "    --timestamp: output packet timestamp (currently just system time)" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
-    std::cerr << std::endl;
-    exit( 1 );
+    std::cerr << R"(
+simple udp client: receives udp packets and outputs them on stdout (default)
+                   or to given output streams
+
+rationale: netcat and socat somehow do not work very well with udp
+
+usage: udp-client <port> [<output-streams>] [<options>]
+
+attention! it is possible to receive several udp packets in a single
+           read from the udp socket; the way to deal with it:
+               - if fixed-width data is published on the UDP socket, use:
+                 udp-client ... --size=<expected-fixed-size>
+               - if variable-size data is published on the UDP socket, the data
+                 receiver will have to parse the packets depending on communication
+                 protocol or nature of the data
+               - if using udp-client --fields=size,data or --fields=t,size,data,
+                 size field will have the total size in bytes for all UDP packets
+                 read from the UDP socket in a single receive call
+
+options
+    --ascii; output timestamp as ascii; default: 64-bit binary
+    --cache-size,--cache=<n>; default=0; number of cached records; if a new client connects, the
+                                         cached records will be sent to it once connected
+    --delimiter=<delimiter>: if ascii and --timestamp, use this delimiter; default: ','
+    --discard: if not present, do blocking write to every open output stream
+    --endl; if --ascii, output '\n' after data
+    --fields=<fields>; default=data; choices (for now): 'data', 't,data', 't,size,data', 'size,data'
+                                                        't', 't,size', 'size' 
+        <fields>
+            t: utc timestamp, same as --timestamp
+            size: data size in bytes
+            data: udp packet data
+    --flush; flush stdout after each packet
+    --reuse-addr,--reuseaddr: reuse udp address/port
+    --size=<size>; default=16384; hint of maximum buffer size in bytes, if using timestamped
+                                  fixed-width data, use --size=<fixed-width-size>, otherwise
+                                  multiple packets may be read from the UDP socket at once
+    --timestamp: deprecated, use --fields; output packet timestamp; currently just system
+                 time as UTC; if binary, little endian uint64
+
+output streams: <address>
+    <address>
+        tcp:<port>: e.g. tcp:1234
+        udp:<port>: e.g. udp:1234 (todo)
+        local:<name>: linux/unix local server socket e.g. local:./tmp/my_socket
+        <named pipe name>: named pipe, which will be re-opened, if client reconnects
+        <filename>: a regular file
+        -: stdout
+
+examples
+    publishing on udp
+        ( echo a; echo b; echo c ) | socat - udp:localhost:12435
+    basics
+        udp-client 12435 > raw.bin
+        udp-client 12435 --fields=t,data > timestamped.bin
+        udp-client 12435 --fields=t,size,data > timestamp.size.bin
+        udp-client 12435 --fields=t,size,data --ascii > timestamp.size.csv
+    re-publishing
+        udp-client 12435 tcp:4567
+        udp-client 12435 tcp:4567 tcp:7890
+        udp-client 12435 tcp:4567 - > log.bin
+)" << std::endl;
+    exit( 0 );
 }
 
 int main( int argc, char** argv )
 {
-    comma::command_line_options options( argc, argv );
-    if( argc < 2 || options.exists( "--help,-h" ) ) { usage(); }
-    const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--reuse-addr,--reuseaddr,--timestamp", "--delimiter,--size" );
-    if( unnamed.empty() ) { std::cerr << "udp-client: please specify port" << std::endl; return 1; }
-    unsigned short port = boost::lexical_cast< unsigned short >( unnamed[0] );
-    bool timestamped = options.exists( "--timestamp" );
-    bool binary = !options.exists( "--ascii" );
-    char delimiter = options.value( "--delimiter", ',' );
-    std::vector< char > packet( options.value( "--size", 16384 ) );
-#if (BOOST_VERSION >= 106600)
-    boost::asio::io_context service;
-#else
-    boost::asio::io_service service;
-#endif
-    boost::asio::ip::udp::socket socket( service );
-    socket.open( boost::asio::ip::udp::v4() );
-    boost::system::error_code error;
-    socket.set_option( boost::asio::ip::udp::socket::broadcast( true ), error );
-    if( error ) { std::cerr << "udp-client: failed to set broadcast option on port " << port << std::endl; return 1; }
-    if( options.exists( "--reuse-addr,--reuseaddr" ) )
-    {
-        socket.set_option( boost::asio::ip::udp::socket::reuse_address( true ), error );
-        if( error ) { std::cerr << "udp-client: failed to set reuse address option on port " << port << std::endl; return 1; }
-    }
-    socket.bind( boost::asio::ip::udp::endpoint( boost::asio::ip::udp::v4(), port ), error );
-    if( error ) { std::cerr << "udp-client: failed to bind port " << port << std::endl; return 1; }
-
-    #ifdef WIN32
-    if( binary )
-    {
-        _setmode( _fileno( stdout ), _O_BINARY );        
-    }
-    #endif
-    
-    while( std::cout.good() )
+    try
     {
+        comma::command_line_options options( argc, argv );
+        if( argc < 2 || options.exists( "--help,-h" ) ) { usage(); }
+        const std::vector< std::string >& unnamed = options.unnamed( "--ascii,--binary,--discard,--endl,--flush,--reuse-addr,--reuseaddr,--timestamp", "-.+" );
+        COMMA_ASSERT_BRIEF( !unnamed.empty(), "please specify port" );
+        std::vector< std::string > output_streams( unnamed.size() > 1 ? unnamed.size() - 1 : 1 );
+        if( unnamed.size() == 1 ) { output_streams[0] = "-"; }
+        else { std::copy( unnamed.begin() + 1, unnamed.end(), output_streams.begin() ); }
+        unsigned short port = boost::lexical_cast< unsigned short >( unnamed[0] );
+        options.assert_mutually_exclusive( "--timestamp", "--fields" );
+        bool timestamped = options.exists( "--timestamp" );
+        if( timestamped ) { comma::say() << "--timestamp: deprecated (will be maintained for now); use --fields=t,data" << std::endl; } // warning only: --timestamp still selects the default fields t,data below
+        if( options.exists( "--binary" ) ) { comma::say() << "--binary: deprecated, please remove; data deemed binary anyway unless --ascii specified" << std::endl; }
+        bool binary = !options.exists( "--ascii" );
+        bool endl = options.exists( "--endl" );
+        comma::csv::options csv( options, timestamped ? "t,data" : "data" );
+        COMMA_ASSERT_BRIEF(    csv.fields == "data"
+                            || csv.fields == "t,data"
+                            || csv.fields == "t,size,data"
+                            || csv.fields == "size,data"
+                            || csv.fields == "t"
+                            || csv.fields == "t,size"
+                            || csv.fields == "size"
+                          , "unsupported fields: '" << csv.fields << "'" ); // uber-quick and dirty, shameful
+        bool has_time = csv.has_field( "t" ) || timestamped;
+        bool has_size = csv.has_field( "size" );
+        bool has_data = csv.has_field( "data" );
+        static_assert( sizeof( boost::posix_time::ptime ) == 8, "expected time of size 8" ); // quick and dirty: the binary record layout below reserves 8 bytes for the timestamp; message given so that it also compiles before c++17
+        unsigned max_size = options.value( "--size", 16384 );
+        std::vector< char > buffer( max_size + 12 ); // quick and dirty
+        #if BOOST_VERSION >= 106600
+            boost::asio::io_context service;
+        #else
+            boost::asio::io_service service;
+        #endif
+        boost::asio::ip::udp::socket socket( service );
+        socket.open( boost::asio::ip::udp::v4() );
         boost::system::error_code error;
-        std::size_t size = socket.receive( boost::asio::buffer( packet ), 0, error );
-        if( error || size == 0 ) { break; }
-        if( timestamped )
+        socket.set_option( boost::asio::ip::udp::socket::broadcast( true ), error );
+        COMMA_ASSERT_BRIEF( !bool( error ), "failed to set broadcast option on port " << port );
+        if( options.exists( "--reuse-addr,--reuseaddr" ) )
+        {
+            socket.set_option( boost::asio::ip::udp::socket::reuse_address( true ), error );
+            COMMA_ASSERT_BRIEF( !bool( error ), "failed to set reuse address option on port " << port );
+        }
+        socket.bind( boost::asio::ip::udp::endpoint( boost::asio::ip::udp::v4(), port ), error );
+        COMMA_ASSERT_BRIEF( !bool( error ), "failed to bind port " << port );
+        #ifdef WIN32
+        if( binary ) { _setmode( _fileno( stdout ), _O_BINARY ); }
+        #endif
+        static_assert( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ), "expected time of size 8" );
+        comma::io::impl::publish p( output_streams
+                                  , options.value( "-s,--size", 0 ) * options.value( "-m,--multiplier", 1 )
+                                  , options.exists( "--discard" )
+                                  , options.exists( "--flush" ) || !binary
+                                  , false
+                                  , false
+                                  , options.value( "--cache-size,--cache", 0 ) );
+        comma::signal_flag is_shutdown;
+        if( binary )
         {
-            boost::posix_time::ptime timestamp = boost::posix_time::microsec_clock::universal_time();
-            BOOST_STATIC_ASSERT( sizeof( boost::posix_time::ptime ) == sizeof( comma::uint64 ) );
-            if( binary )
-            { 
-                static char buf[ sizeof( comma::int64 ) ];
-                comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::to_bin( timestamp, buf );
-                std::cout.write( buf, sizeof( comma::int64 ) );
+            unsigned int offset = ( has_time ? 8 : 0 ) + ( has_size ? 4 : 0 ); // hyper-quick and dirty for now
+            while( !is_shutdown )
+            {
+                std::uint32_t size = socket.receive( boost::asio::buffer( &buffer[offset], max_size ), 0, error );
+                if( error || size == 0 ) { break; } // todo? throw on error?
+                if( has_time ) { comma::csv::format::traits< boost::posix_time::ptime, comma::csv::format::time >::to_bin( boost::posix_time::microsec_clock::universal_time(), &buffer[0] ); }
+                if( has_size ) { ::memcpy( &buffer[ has_time ? 8 : 0 ], reinterpret_cast< const char* >( &size ), 4 ); }
+                p.write( &buffer[0], offset + ( has_data ? size : 0 ) );
             }
-            else
+        }
+        else
+        {
+            std::string delimiter;
+            while( !is_shutdown )
             {
-                std::cout << boost::posix_time::to_iso_string( timestamp ) << delimiter;
+                std::size_t size = socket.receive( boost::asio::buffer( &buffer[0], max_size ), 0, error );
+                if( error || size == 0 ) { break; } // todo? throw on error?
+                std::ostringstream oss;
+                if( has_time ) { oss << boost::posix_time::to_iso_string( boost::posix_time::microsec_clock::universal_time() ); delimiter = csv.delimiter; }
+                if( has_size ) { oss << delimiter << size; delimiter = csv.delimiter; }
+                if( has_data ) { oss << delimiter; oss.write( &buffer[0], size ); if( endl ) { oss << std::endl; } }
+                const std::string& s = oss.str();
+                p.write( &s[0], s.size() );
             }
         }
-        std::cout.write( &packet[0], size );
-        std::cout.flush();
-   }
-   return 0;
+        return 0;
+    }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
+    return 1;
 }
diff --git a/io/applications/zero-cat.cpp b/io/applications/zero-cat.cpp
index fef48ef75..acec1baf2 100644
--- a/io/applications/zero-cat.cpp
+++ b/io/applications/zero-cat.cpp
@@ -41,7 +41,6 @@
 #include <boost/array.hpp>
 #include <boost/program_options.hpp>
 #include <boost/thread.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/signal_flag.h"
 #include "../../io/publisher.h"
 #include "../../string/string.h"
@@ -116,7 +115,6 @@ void usage( boost::program_options::options_description const & description, boo
                  "\n        If outputting messages to a single pipe it is better to keep zero-cat"
                  "\n        running to minimise load and maximise throughput."
                  "\n"
-                << comma::contact_info
                 << std::endl;
 }
 
@@ -272,7 +270,7 @@ int main(int argc, char* argv[])
                 else { socket.bind( &endpoints[i][0] ); }
             }
             // we convert to milliseconds as converting to second floors the number so 0.99 becomes 0
-            if( wait_after_connect > 0 ) { boost::this_thread::sleep(boost::posix_time::milliseconds(wait_after_connect * 1000.0)); }
+            if( wait_after_connect > 0 ) { boost::this_thread::sleep(boost::posix_time::milliseconds( static_cast< long >( wait_after_connect * 1000.0 ) ) ); }
             
             std::string buffer;
             if( binary ) { buffer.resize( size ); }
@@ -311,7 +309,7 @@ int main(int argc, char* argv[])
                 else { socket.connect( endpoints[i].c_str() ); }
             }
             socket.setsockopt( ZMQ_SUBSCRIBE, "", 0 );
-            if( wait_after_connect > 0 ) { boost::this_thread::sleep( boost::posix_time::milliseconds( wait_after_connect * 1000.0 ) ); }
+            if( wait_after_connect > 0 ) { boost::this_thread::sleep( boost::posix_time::milliseconds( static_cast< long >( wait_after_connect * 1000.0 ) ) ); }
             if( vm.count( "server" ) )
             {
                 comma::io::publisher publisher( server, comma::io::mode::binary, true, false );
diff --git a/io/applications/zero-publish b/io/applications/zero-publish
index e0c51def5..7fcef8c5c 100644
--- a/io/applications/zero-publish
+++ b/io/applications/zero-publish
@@ -1,5 +1,34 @@
 #!/bin/bash
 
+# This file is part of comma, a generic and flexible library
+# Copyright (c) 2011 The University of Sydney
+# All rights reserved.
+#
+# Redistribution and use in source and binary forms, with or without
+# modification, are permitted provided that the following conditions are met:
+# 1. Redistributions of source code must retain the above copyright
+#    notice, this list of conditions and the following disclaimer.
+# 2. Redistributions in binary form must reproduce the above copyright
+#    notice, this list of conditions and the following disclaimer in the
+#    documentation and/or other materials provided with the distribution.
+# 3. Neither the name of the University of Sydney nor the
+#    names of its contributors may be used to endorse or promote products
+#    derived from this software without specific prior written permission.
+#
+# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
 function usage()
 {
     echo "publish data on tcp in a packet-based manner"
diff --git a/io/impl/filesystem.h b/io/impl/filesystem.h
new file mode 100644
index 000000000..9a8d93804
--- /dev/null
+++ b/io/impl/filesystem.h
@@ -0,0 +1,37 @@
+// Copyright (c) 2024 Mission Systems Pty Ltd
+//
+// Allow selection of filesystem library from either boost or C++ standard library
+//
+// Can assist with interoperation with other libraries that require or conflict
+// with one or the other
+//
+// Usage:
+// #include "io/impl/filesystem.h"
+// ...
+// comma::filesystem::<some-op>
+//
+// Configuration:
+//   in CMake set comma_USE_BOOST_FILESYSTEM
+//     "ON" will use boost::filesystem
+//     "OFF" will use std::filesystem or std::experimental::filesystem
+//           if you're using gcc older than version 8.1
+
+#pragma once
+
+#ifdef COMMA_USE_BOOST_FILESYSTEM // presumably defined by the build when comma_USE_BOOST_FILESYSTEM is ON - confirm in the CMake files
+  #include <boost/filesystem.hpp>
+  namespace comma { namespace filesystem = boost::filesystem; }
+#else // use the standard library implementation
+  #if defined(__GNUC__)
+    #if __has_include (<filesystem>) // prefer <filesystem> whenever the header is available
+      #include <filesystem>
+      namespace comma { namespace filesystem = std::filesystem; }
+    #else // no <filesystem> header: fall back to the experimental implementation
+      #include <experimental/filesystem>
+      namespace comma { namespace filesystem = std::experimental::filesystem; }
+    #endif // __has_include (<filesystem>)
+  #else // __GNUC__ not defined: <filesystem> is included unconditionally
+    #include <filesystem>
+    namespace comma { namespace filesystem = std::filesystem; }
+  #endif // defined(__GNUC__)
+#endif // COMMA_USE_BOOST_FILESYSTEM
diff --git a/io/impl/publish.cpp b/io/impl/publish.cpp
new file mode 100644
index 000000000..e97a09d7a
--- /dev/null
+++ b/io/impl/publish.cpp
@@ -0,0 +1,293 @@
+// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2020 Vsevolod Vlaskine
+// All rights reserved.
+
+#include "../../name_value/map.h"
+#include "publish.h"
+
+namespace comma { namespace io { namespace impl {
+
+template < typename S > struct server_traits; // quick and dirty: per-server-type factory and output hooks used by multiserver
+
+template <> struct server_traits< io::iserver > // quick and dirty: input servers are never written to
+{
+    static io::iserver* make( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) { return new io::iserver( name, mode, blocking ); } // flush is accepted for signature parity only and is not forwarded
+    template < typename T > static void write( T&, const char*, unsigned int ) {} // no-op
+    template < typename T > static void flush( T& ) {} // no-op
+};
+
+template <> struct server_traits< io::oserver > // quick and dirty: output servers forward to the stream
+{
+    static io::oserver* make( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) { return new io::oserver( name, mode, blocking, flush ); } // raw owning pointer; multiserver stores it in a std::unique_ptr
+    template < typename T > static void write( T& s, const char* buf, unsigned int size ) { s.write( buf, size ); } // forwards to s.write()
+    template < typename T > static void flush( T& s ) { s.flush(); } // forwards to s.flush()
+};
+
+template < typename Server >
+multiserver< Server >::multiserver( const std::vector< std::string >& endpoints // one entry per server; at least one must be primary
+                                  , unsigned int packet_size // 0 means ascii (line-based), see is_binary_()
+                                  , bool discard // servers are created as blocking when discard is false
+                                  , bool flush
+                                  , bool output_number_of_clients
+                                  , bool update_no_clients
+                                  , unsigned int cache_size )
+    : discard_( discard )
+    , flush_( flush )
+    , buffer_( packet_size, '\0' )
+    , packet_size_( packet_size )
+    , output_number_of_clients_( output_number_of_clients )
+    , cache_size_( cache_size )
+    , update_no_clients_( update_no_clients )
+    , got_first_client_ever_( false )
+    , sizes_( endpoints.size(), 0 )
+    , num_clients_( 0 )
+    , is_shutdown_( false )
+{
+    bool has_primary_stream = false;
+    for( unsigned int i = 0; i < endpoints.size(); ++i )
+    {
+        comma::name_value::map m( endpoints[i], "address", ';', '=' ); // ';'-separated fields, '=' between name and value; "address" presumably names the unnamed leading field
+        bool secondary = !m.exists( "primary" ) && m.exists( "secondary" ); // "primary" wins if both are given
+        endpoints_.push_back( endpoint( m.value< std::string >( "address" ), secondary ) ); // todo? quick and dirty; better usage semantics?
+        if( !secondary ) { has_primary_stream = true; }
+    }
+    COMMA_ASSERT_BRIEF( has_primary_stream, "please specify at least one primary stream" );
+    struct sigaction new_action; // ignore SIGPIPE, whose default action would terminate the process
+    new_action.sa_handler = SIG_IGN;
+    sigemptyset( &new_action.sa_mask );
+    new_action.sa_flags = 0; // used to be left uninitialised, i.e. indeterminate flags were handed to sigaction()
+    sigaction( SIGPIPE, &new_action, NULL );
+    transaction_t t( servers_ );
+    t->resize( endpoints.size() );
+    for( std::size_t i = 0; i < endpoints.size(); ++i ) // only primary servers are created here; accept_() creates secondary ones once primary endpoints have clients
+    {
+        if( !endpoints_[i].secondary ) { ( *t )[i].reset( server_traits< Server >::make( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard, flush ) ); }
+    }
+    acceptor_thread_.reset( new boost::thread( boost::bind( &multiserver< Server >::accept_, boost::ref( *this ))));
+}
+
+template < typename Server >
+multiserver< Server >::~multiserver() // stops the acceptor thread, then closes every server
+{
+    is_shutdown_ = true; // asks the accept_() loop to exit; NOTE(review): plain bool shared with the acceptor thread - confirm whether it should be atomic
+    acceptor_thread_->join(); // accept_() re-checks is_shutdown_ after each select wait of up to 100ms
+    transaction_t t( servers_ );
+    for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->close(); } } // entries of secondary endpoints may be empty
+}
+
+template < typename Server >
+void multiserver< Server >::disconnect_all() // calls disconnect_all() on every existing server, then refreshes the client counts
+{
+    transaction_t t( servers_ );
+    for( auto& p: *t ) { if( p ) { p->disconnect_all(); } }
+    handle_sizes_( t ); // quick and dirty; the return value is not used here
+}
+
+template < typename Server >
+bool multiserver< Server >::handle_sizes_( typename multiserver< Server >::transaction_t& t ) // todo? why pass transaction? it does not seem to go out of scope at the point of call; remove?
+{
+    // always refresh the bookkeeping: accept_() reads has_primary_clients_ and num_clients() reads num_clients_ whether or not reporting is enabled
+    unsigned int total = 0;
+    bool changed = false;
+    has_primary_clients_ = false;
+    for( unsigned int i = 0; i < t->size(); ++i )
+    {
+        unsigned int size = ( *t )[i] ? ( *t )[i]->size() : 0; // a server that has not been created counts as no clients
+        total += size;
+        if( !endpoints_[i].secondary && size > 0 ) { has_primary_clients_ = true; }
+        if( sizes_[i] == size ) { continue; }
+        sizes_[i] = size;
+        changed = true;
+    }
+    num_clients_ = total; // the complete total; it used to be assigned inside the loop, i.e. from a partial sum and only when a count changed
+    if( !changed ) { return true; } // nothing to report
+    if( output_number_of_clients_ ) // print <iso timestamp>,<clients on endpoint 0>,<clients on endpoint 1>,... to stdout
+    {
+        std::cout << boost::posix_time::to_iso_string( boost::posix_time::microsec_clock::universal_time() );
+        for( unsigned int i = 0; i < sizes_.size(); ++i ) { std::cout << ',' << sizes_[i]; }
+        std::cout << std::endl;
+    }
+    if( update_no_clients_ ) // return false once the client count drops to zero after there has been at least one client
+    {
+        if( total > 0 ) { got_first_client_ever_ = true; }
+        else if( got_first_client_ever_ ) { return false; } // { comma::saymore() << "the last client exited" << std::endl; return false; }
+    }
+    return true;
+}
+
+template < typename Server >
+void multiserver< Server >::accept_() // body of acceptor_thread_: accepts clients and creates/destroys secondary servers until is_shutdown_ is set
+{
+    comma::io::select select;
+    { // register the acceptor descriptors of the servers that exist at this point
+        transaction_t t( servers_ );
+        for( unsigned int i = 0; i < t->size(); ++i )
+        {
+            if( !( *t )[i] ) { continue; }
+            if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
+        }
+    }
+    if( select.read()().empty() ) { return; } // no descriptor to wait on: the thread ends here
+    while( !is_shutdown_ )
+    {
+        select.wait( boost::posix_time::millisec( 100 ) ); // todo? make timeout configurable?
+        transaction_t t( servers_ );
+        for( unsigned int i = 0; i < t->size(); ++i )
+        {
+            if( ( *t )[i] && select.read().ready( ( *t )[i]->acceptor_file_descriptor() ) )
+            {
+                const auto& streams = ( *t )[i]->accept(); // presumably the streams of the clients just accepted - confirm against io/server.h
+                if( !cache_.empty() ) // replay the cached records to those streams
+                {
+                    for( auto& s: streams )
+                    {
+                        for( const auto& c: cache_ ) { server_traits< Server >::write( **s, &c[0], c.size() ); }
+                        if( flush_ ) { server_traits< Server >::flush( **s ); }
+                    }
+                }
+            }
+        }
+        handle_sizes_( t ); // return value is not used here
+        if( has_primary_clients_ ) // create the secondary servers that do not exist yet
+        {
+            for( unsigned int i = 0; i < t->size(); ++i )
+            {
+                if( !endpoints_[i].secondary || ( *t )[i] ) { continue; }
+                ( *t )[i].reset( server_traits< Server >::make( endpoints_[i].address, is_binary_() ? comma::io::mode::binary : comma::io::mode::ascii, !discard_, flush_ ) );
+                if( ( *t )[i]->acceptor_file_descriptor() != comma::io::invalid_file_descriptor ) { select.read().add( ( *t )[i]->acceptor_file_descriptor() ); }
+            }
+        }
+        else // no clients on primary endpoints: destroy the existing secondary servers
+        {
+            for( unsigned int i = 0; i < t->size(); ++i )
+            {
+                if( !endpoints_[i].secondary || !( *t )[i] ) { continue; }
+                select.read().remove( ( *t )[i]->acceptor_file_descriptor() ); // unregister before the server is destroyed
+                ( *t )[i].reset();
+            }
+        }
+    }
+}
+
+publish::publish( const std::vector< std::string >& endpoints
+                , unsigned int packet_size
+                , bool discard
+                , bool flush
+                , bool output_number_of_clients
+                , bool update_no_clients
+                , unsigned int cache_size
+                , const boost::optional< double >& timeout )
+    : multiserver< comma::io::oserver >( endpoints // all server options are passed through unchanged
+                                       , packet_size
+                                       , discard
+                                       , flush
+                                       , output_number_of_clients
+                                       , update_no_clients
+                                       , cache_size )
+    , _timeout( timeout ) // when set, read() waits on the input descriptor via select before reading
+{
+}
+
+bool publish::write( const std::string& s ) // writes s to every existing server; returns what handle_sizes_() returns
+{
+    transaction_t t( servers_ );
+    if( cache_size_ > 0 ) // keep the most recent cache_size_ records; accept_() replays them to newly accepted streams
+    {
+        cache_.push_back( s );
+        if( cache_.size() > cache_size_ ) { cache_.pop_front(); }
+    }
+    for( auto& p: *t ) { if( p ) { p->write( &s[0], s.size(), false ); } } // for( std::size_t i = 0; i < t->size(); ++i ) { if( ( *t )[i] ) { ( *t )[i]->write( &buffer_[0], buffer_.size(), false ); } }
+    return handle_sizes_( t );
+}
+
+bool publish::write( const char* buf, unsigned int size ) // convenience overload: copies size bytes from buf and forwards to write( const std::string& )
+{
+    return write( std::string( buf, size ) ); // todo: quick and dirty, watch performance
+}
+
+static bool _enough( std::istream& is, unsigned int size ) // true if the stream buffer already holds a packet: size bytes, or any data at all when size is 0
+{
+    const std::streamsize available = is.rdbuf()->in_avail(); // may be -1 when no further input is expected
+    return ( size == 0 && available > 0 ) || ( size > 0 && available >= static_cast< std::streamsize >( size ) ); // compare as signed, so that -1 is never converted to a huge unsigned value
+}
+
+bool publish::read( std::istream& is, io::file_descriptor fd ) // reads one packet or line from is and publishes it; false on timeout, on failed or final read, or when write() returns false
+{
+    if( _timeout )
+    {
+        _is_timeout = false;
+        if( !_enough( is, packet_size_ ) && !is.eof() ) // not enough buffered yet: wait on fd for up to *_timeout
+        {
+            if( _select.read()().empty() || *_select.read()().begin() != fd ) // (re)register fd only if it is not the one already watched
+            {
+                _select.read().clear(); // todo: quick and dirty, watch performance
+                _select.read().add( fd );
+            }
+            _select.wait( *_timeout );
+            _is_timeout = !_enough( is, packet_size_ ) && !_select.read().ready( fd );
+            if( _is_timeout ) { return false; } // callers can tell this case apart through is_timeout()
+        }
+    }
+    if( is_binary_() )
+    {
+        is.read( &buffer_[0], buffer_.size() );
+        if( is.gcount() < int( buffer_.size() ) || !is.good() || is.eof() ) { return false; } // a short packet is not published
+    }
+    else
+    {
+        std::getline( is, buffer_ );
+        buffer_ += '\n';
+        if( !is.good() || is.eof() ) { return false; } // note: a final line without a trailing newline sets eof and is therefore not published
+    }
+    return write( buffer_ );
+}
+
+receive::receive( const std::string& endpoint
+                , unsigned int packet_size
+                , bool flush
+                , bool output_number_of_clients
+                , bool update_no_clients )
+    : multiserver< comma::io::iserver >( std::vector< std::string >( 1, endpoint ) // a receiver has exactly one endpoint
+                                       , packet_size
+                                       , false // discard
+                                       , flush
+                                       , output_number_of_clients
+                                       , update_no_clients
+                                       , 0 ) // cache_size
+{
+}
+
+bool receive::read( char* buf, unsigned int size ) // true only if size bytes were read and handle_sizes_() does not ask to stop
+{
+    transaction_t t( servers_ );
+    auto count = ( *t )[0]->read( buf, size ); // NOTE(review): assumes iserver::read() returns the number of bytes read - confirm against io/server.h
+    return handle_sizes_( t ) && count == size; // was '|| count != size', which reported success on a short read; handle_sizes_() stays first so that it always runs
+}
+
+bool receive::getline( std::string& line ) // quick and dirty: stores the next line from the single server in line; returns what handle_sizes_() returns
+{
+    transaction_t t( servers_ );
+    line = ( *t )[0]->getline();
+    return handle_sizes_( t );
+}
+
+bool receive::write( std::ostream& output ) // reads one packet (binary) or one line (ascii) and copies it to output; false if reading or writing failed
+{
+    if( is_binary_() )
+    {
+        if( !read( &buffer_[0], buffer_.size() ) ) { return false; } // read() returns bool; it used to be compared with buffer_.size(), which could only match for 1-byte packets
+    }
+    else
+    {
+        if( !getline( buffer_ ) ) { return false; }
+        buffer_ += '\n'; // restore the line terminator before writing
+    }
+    output.write( &buffer_[0], buffer_.size() );
+    if( flush_ ) { output.flush(); }
+    return output.good();
+}
+
+template class multiserver< io::iserver >; // explicit instantiations: the member functions of multiserver are defined in this file
+template class multiserver< io::oserver >;
+
+} } } // namespace comma { namespace io { namespace impl {
diff --git a/io/impl/publish.h b/io/impl/publish.h
new file mode 100644
index 000000000..a21db620b
--- /dev/null
+++ b/io/impl/publish.h
@@ -0,0 +1,122 @@
+// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2020 Vsevolod Vlaskine
+// All rights reserved.
+
+#pragma once
+
+#include <errno.h>
+#include <signal.h>
+#include <sys/wait.h>
+#include <unistd.h>
+#include <deque>
+#include <memory>
+#include <boost/bind/bind.hpp>
+#include <boost/date_time/posix_time/posix_time.hpp>
+#include <boost/iostreams/device/file_descriptor.hpp>
+#include <boost/iostreams/stream.hpp>
+#include <boost/optional.hpp>
+#include <boost/thread.hpp>
+#include "../../base/none.h"
+#include "../../io/file_descriptor.h"
+#include "../../io/select.h"
+#include "../../io/server.h"
+#include "../../string/string.h"
+#include "../../sync/synchronized.h"
+
+namespace comma { namespace io { namespace impl {
+
+template < typename Server >
+class multiserver // owns one server per endpoint plus a thread that accepts clients on them
+{
+    public:
+        typedef comma::synchronized< std::vector< std::unique_ptr< Server > > > servers_t; // entries may be empty: secondary servers exist only while primary endpoints have clients
+        
+        typedef typename servers_t::scoped_transaction transaction_t;
+        
+        struct endpoint
+        {
+            std::string address;
+            bool secondary;
+            endpoint( const std::string& address = "", bool secondary = false ): address( address ), secondary( secondary ) {}
+        };
+        
+        multiserver( const std::vector< std::string >& endpoints
+                   , unsigned int packet_size
+                   , bool discard
+                   , bool flush
+                   , bool output_number_of_clients
+                   , bool update_no_clients
+                   , unsigned int cache_size );
+        
+        ~multiserver(); // joins the acceptor thread and closes the servers
+        
+        void disconnect_all();
+        
+        unsigned int num_clients() const { return num_clients_; } // value as of the last handle_sizes_() call
+
+    protected:
+        std::vector< endpoint > endpoints_;
+        bool discard_;
+        bool flush_;
+        servers_t servers_;
+        std::string buffer_; // packet_size_ bytes in binary mode, the current line in ascii mode
+        unsigned int packet_size_;
+        bool output_number_of_clients_;
+        unsigned int cache_size_;
+        bool update_no_clients_;
+        bool got_first_client_ever_;
+        std::vector< unsigned int > sizes_; // client count per endpoint as of the last handle_sizes_() call
+        bool has_primary_clients_{false}; // the constructor does not set it and accept_() reads it, so it needs a defined initial value
+        unsigned int num_clients_;
+        std::unique_ptr< boost::thread > acceptor_thread_;
+        bool is_shutdown_; // set by the destructor, polled by accept_()
+        std::deque< std::string > cache_; // most recent records, replayed to newly accepted streams
+
+        bool is_binary_() const { return packet_size_ > 0; }
+        bool handle_sizes_( transaction_t& t ); // todo? why pass transaction? it does not seem to go out of scope at the point of call; remove?
+        void accept_();
+};
+
+class publish : public multiserver< comma::io::oserver > // writes records to the clients of one or more output servers
+{
+    public:
+        publish( const std::vector< std::string >& endpoints
+               , unsigned int packet_size
+               , bool discard
+               , bool flush
+               , bool output_number_of_clients
+               , bool update_no_clients
+               , unsigned int cache_size
+               , const boost::optional< double >& timeout = comma::silent_none< double >() ); // when set, read() waits on the input descriptor via select before reading
+        
+        bool read( std::istream& input, io::file_descriptor fd = 0 ); // reads one packet/line from input and publishes it; fd is the descriptor waited on when a timeout is set
+
+        bool write( const std::string& s ); // writes s to every existing server, caching it if cache_size > 0
+
+        bool write( const char* buf, unsigned int size ); // same, for a raw buffer
+
+        bool is_timeout() const { return _is_timeout; } // true if the last read() with a timeout gave up waiting
+
+    protected:
+        comma::io::select _select;
+        boost::optional< double > _timeout;
+        io::file_descriptor _fd{0}; // NOTE(review): not referenced in publish.cpp; read() takes fd as a parameter
+        bool _is_timeout{false};
+};
+
+class receive : public multiserver< comma::io::iserver > // reads records from the clients of a single input server
+{
+    public: // was missing: all members, including the constructor, were private and the class could not be instantiated
+        receive( const std::string& endpoint
+               , unsigned int packet_size
+               , bool flush
+               , bool output_number_of_clients
+               , bool update_no_clients );
+
+        bool read( char* buf, unsigned int size ); // reads into buf from the server
+
+        bool getline( std::string& line ); // reads one line from the server into line
+        bool write( std::ostream& output ); // reads one packet/line and copies it to output
+};
+
+} } } // namespace comma { namespace io { namespace impl {
diff --git a/io/impl/publisher.cpp b/io/impl/publisher.cpp
deleted file mode 100644
index 5511ddbee..000000000
--- a/io/impl/publisher.cpp
+++ /dev/null
@@ -1,312 +0,0 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-
-/// @author cedric wohlleber
-
-#ifdef WIN32
-#include <io.h>
-#include <fcntl.h>
-#include <sys/stat.h>
-#include <sys/types.h>
-#endif
-
-#include <boost/asio/ip/tcp.hpp>
-#include <boost/asio/local/stream_protocol.hpp>
-#include <boost/bind.hpp>
-#include <boost/filesystem/operations.hpp>
-#include <boost/lexical_cast.hpp>
-#include "../../base/exception.h"
-#include "../../io/file_descriptor.h"
-#include "../../string/string.h"
-#include "publisher.h"
-
-namespace comma { namespace io { namespace impl {
-
-class file_acceptor : public acceptor
-{
-    public:
-        file_acceptor( const std::string& name, io::mode::value mode )
-            : name_( name )
-            , mode_( mode )
-            , closed_( true )
-            , fd_( io::invalid_file_descriptor )
-        {
-        }
-
-        ~file_acceptor()
-        {
-#ifndef WIN32
-            ::close( fd_ );
-#else
-            _close( fd_ );
-#endif
-        }
-
-        io::ostream* accept( boost::posix_time::time_duration )
-        {
-            if( !closed_ ) { return NULL; }
-#ifndef WIN32
-            fd_ = ::open( &name_[0], O_WRONLY | O_CREAT | O_NONBLOCK, S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH ); // quick and dirty
-#else
-            fd_ = _open( &name_[0], O_WRONLY | _O_CREAT, _S_IWRITE );
-#endif
-            if( fd_ == io::invalid_file_descriptor ) { return NULL; }
-            closed_ = false;
-            return new io::ostream( name_, mode_, io::mode::non_blocking ); // quick and dirty
-        }
-
-        void notify_closed() { closed_ = true; ::close( fd_ ); }
-        
-        io::file_descriptor fd() const { return fd_; }
-
-    private:
-        const std::string name_;
-        const io::mode::value mode_;
-        bool closed_;
-        io::file_descriptor fd_; // todo: make io::ostream non-throwing on construction
-};
-
-struct Tcp {};
-template < typename S > struct socket_traits {};
-
-template <> struct socket_traits< Tcp >
-{
-    typedef boost::asio::ip::tcp::endpoint endpoint_type;
-    typedef boost::asio::ip::tcp::acceptor acceptor;
-    typedef boost::asio::ip::tcp::iostream iostream;
-    typedef unsigned short name_type;
-    static endpoint_type endpoint( unsigned short port ) { return endpoint_type( boost::asio::ip::tcp::v4(), port ); }
-};
-
-#ifndef WIN32
-struct local {};
-template <> struct socket_traits< local >
-{
-    typedef boost::asio::local::stream_protocol::endpoint endpoint_type;
-    typedef boost::asio::local::stream_protocol::acceptor acceptor;
-    typedef boost::asio::local::stream_protocol::iostream iostream;
-    typedef std::string name_type;
-    static endpoint_type endpoint( const std::string& name ) { return endpoint_type( name ); }
-};
-#endif
-
-template < typename S >
-class socket_acceptor : public acceptor
-{
-    public:
-        socket_acceptor( const typename socket_traits< S >::name_type& name, io::mode::value mode )
-            : mode_( mode )
-            , acceptor_( m_service, socket_traits< S >::endpoint( name ) )
-        {
-#ifndef WIN32
-#if (BOOST_VERSION >= 106600)
-            select_.read().add( acceptor_.native_handle() );
-#else
-            select_.read().add( acceptor_.native() );
-#endif
-#else
-#if (BOOST_VERSION >= 106600)
-            SOCKET socket = acceptor_.native_handle();
-#else
-            SOCKET socket = acceptor_.native();
-#endif
-            select_.read().add( socket );
-#endif
-        }
-
-        io::ostream* accept( boost::posix_time::time_duration timeout )
-        {
-            select_.wait( timeout );
-#ifndef WIN32
-#if (BOOST_VERSION >= 106600)
-            if( !select_.read().ready( acceptor_.native_handle() ) ) { return NULL; }
-#else
-            if( !select_.read().ready( acceptor_.native() ) ) { return NULL; }
-#endif
-#else
-#if (BOOST_VERSION >= 106600)
-            SOCKET socket = acceptor_.native_handle();
-#else
-            SOCKET socket = acceptor_.native();
-#endif
-            if( !select_.read().ready( socket ) ) { return NULL; }
-#endif
-            typename socket_traits< S >::iostream* stream = new typename socket_traits< S >::iostream;
-            acceptor_.accept( *( stream->rdbuf() ) );
-#if (BOOST_VERSION >= 106600)
-            return new io::ostream( stream, stream->rdbuf()->native_handle(), mode_, boost::bind( &socket_traits< S >::iostream::close, stream ) );
-#else
-            return new io::ostream( stream, stream->rdbuf()->native(), mode_, boost::bind( &socket_traits< S >::iostream::close, stream ) );
-#endif
-        }
-
-        void close() { acceptor_.close(); }
-
-#ifndef WIN32
-#if (BOOST_VERSION >= 106600)
-        io::file_descriptor fd() const { return const_cast< typename socket_traits< S >::acceptor& >( acceptor_ ).native_handle(); }
-#else
-        io::file_descriptor fd() const { return const_cast< typename socket_traits< S >::acceptor& >( acceptor_ ).native(); }
-#endif
-#else
-        io::file_descriptor fd() const { return io::invalid_file_descriptor; }
-#endif
-
-    private:
-        io::mode::value mode_;
-        io::select select_;
-#if (BOOST_VERSION >= 106600)
-        boost::asio::io_context m_service;
-#else
-        boost::asio::io_service m_service;
-#endif
-        typename socket_traits< S >::acceptor acceptor_;
-};
-
-class zero_acceptor_ : public acceptor
-{
-    public:
-        zero_acceptor_( const std::string& name, io::mode::value mode ):
-            stream_( new io::ostream( name, mode ) ),
-            accepted_( false )
-        {
-        }
-
-        io::ostream* accept( boost::posix_time::time_duration )
-        {
-            if( accepted_ ) { return NULL; }
-            accepted_ = true;
-            return stream_;
-        }
-
-        void close() { stream_->close(); }
-        
-        io::file_descriptor fd() const { return io::invalid_file_descriptor; } // quick and dirty
-
-    private:
-        io::ostream* stream_;
-        bool accepted_;
-};
-
-publisher::publisher( const std::string& name, io::mode::value mode, bool blocking, bool flush )
-    : blocking_( blocking ),
-      flush_( flush )
-{
-    std::vector< std::string > v = comma::split( name, ':' );
-    if( v[0] == "tcp" )
-    {
-        if( v.size() != 2 ) { COMMA_THROW( comma::exception, "expected tcp server endpoint, got " << name ); }
-        acceptor_.reset( new socket_acceptor< Tcp >( boost::lexical_cast< unsigned short >( v[1] ), mode ) );
-    }
-    else if( v[0] == "udp" )
-    {
-        COMMA_THROW( comma::exception, "udp: todo" );
-    }
-    else if( v[0] == "local" )
-    {
-#ifndef WIN32
-        if( v.size() != 2 ) { COMMA_THROW( comma::exception, "expected local socket, got " << name ); }
-        acceptor_.reset( new socket_acceptor< local >( v[1], mode ) );
-#endif
-    }
-    else if( v[0].substr( 0, 4 ) == "zero" )
-    {
-        acceptor_.reset( new zero_acceptor_( name, mode ) );
-    }
-    else
-    {
-        if( name == "-" )
-        {
-            streams_.insert( boost::shared_ptr< io::ostream >( new io::ostream( name, mode ) ) );
-#ifndef WIN32
-            select_.write().add( 1 );
-#endif
-        }
-        else
-        {
-            acceptor_.reset( new file_acceptor( name, mode ) );
-            io::ostream* s = acceptor_->accept( boost::posix_time::time_duration() );
-            streams_.insert( boost::shared_ptr< io::ostream >( s ) ); // todo: should we simply abolish file_acceptor and do it in the same way as for stdout?
-            if( s->fd() == comma::io::invalid_file_descriptor ) { COMMA_THROW( comma::exception, "failed to open '" << name << "'" ); }
-#ifndef WIN32
-            select_.write().add( s->fd() );
-#endif
-        }
-    }
-}
-
-unsigned int publisher::write( const char* buf, std::size_t size, bool do_accept )
-{
-    if( do_accept ) { accept(); }
-    if( !blocking_ ) { select_.check(); } // todo: if slow, put all the files in one select
-    unsigned int count = 0;
-    for( streams::iterator i = streams_.begin(); i != streams_.end(); )
-    {
-        streams::iterator it = i++;
-        if( !blocking_ && !select_.write().ready( **it ) ) { continue; }
-        ( **it )->write( buf, size );
-        if( flush_ ) { ( **it )->flush(); }
-        if( ( **it )->good() ) { ++count; }
-        else { remove_( it ); }
-    }
-    return count;
-}
-
-void publisher::close()
-{
-    if( acceptor_ ) { acceptor_->close(); }
-    while( streams_.begin() != streams_.end() ) { remove_( streams_.begin() ); }
-}
-
-unsigned int publisher::accept()
-{
-    if( !acceptor_ ) { return 0; }
-    unsigned int count = 0;
-    while( true ) // while( streams_.size() < maxSize ?
-    {
-        io::ostream* s = acceptor_->accept();
-        if( s == NULL ) { return count; }
-        streams_.insert( boost::shared_ptr< io::ostream >( s ) );
-        select_.write().add( *s );
-        ++count;
-    }
-}
-
-void publisher::remove_( streams::iterator it )
-{
-    select_.write().remove( **it );
-    ( *it )->close();
-    if( acceptor_ ) { acceptor_->notify_closed(); }
-    streams_.erase( it );
-}
-
-std::size_t publisher::size() const { return streams_.size(); }
-
-} } } // namespace comma { namespace io { namespace impl {
diff --git a/io/impl/publisher.h b/io/impl/publisher.h
deleted file mode 100644
index 0e0e37d81..000000000
--- a/io/impl/publisher.h
+++ /dev/null
@@ -1,106 +0,0 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-
-/// @author cedric wohlleber
-
-#ifndef COMMA_IO_IMPL_PUBLISHER_H_
-#define COMMA_IO_IMPL_PUBLISHER_H_
-
-#include <set>
-#include <boost/scoped_ptr.hpp>
-#include <boost/shared_ptr.hpp>
-#include "../file_descriptor.h"
-#include "../select.h"
-#include "../stream.h"
-
-namespace comma { namespace io {
-    
-class publisher;
-
-} } // namespace comma { namespace io {
-
-namespace comma { namespace io { namespace impl {
-
-struct acceptor
-{
-    virtual ~acceptor() {}
-    virtual io::file_descriptor fd() const = 0;
-    virtual io::ostream* accept( boost::posix_time::time_duration timeout = boost::posix_time::seconds( 0 ) ) = 0;
-    virtual void notify_closed() {} // quick and dirty
-    virtual void close() {}
-};
-    
-class publisher
-{
-    public:
-        publisher( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
-
-        unsigned int write( const char* buf, std::size_t size, bool do_accept = true );
-
-        template < typename T >
-        impl::publisher& operator<<( const T& lhs ) // quick and dirty, inefficient, but then ascii is meant to be slow...
-        {
-            accept();
-            select_.check();
-            unsigned int count = 0;
-            for( streams::iterator i = streams_.begin(); i != streams_.end(); )
-            {
-                streams::iterator it = i++;
-                if( !blocking_ && !select_.write().ready( **it ) ) { continue; }
-                ( ***it ) << lhs;
-                if( flush_ ) { ( **it )->flush(); }
-                if( ( **it )->good() ) { ++count; }
-                else { remove_( it ); }
-            }
-            return *this;
-        }
-
-        void close();
-
-        std::size_t size() const;
-
-        unsigned int accept();
-        
-        const io::impl::acceptor& acceptor() const { return *acceptor_; }
-
-    private:
-        friend class comma::io::publisher;
-        bool blocking_;
-        bool flush_;
-        boost::scoped_ptr< io::impl::acceptor > acceptor_;
-        typedef std::set< boost::shared_ptr< io::ostream > > streams;
-        streams streams_;
-        io::select select_;
-        void remove_( streams::iterator it );
-};
-
-} } } // namespace comma { namespace io { namespace impl {
-
-#endif // #ifndef COMMA_IO_IMPL_PUBLISHER_H_
diff --git a/io/impl/server.cpp b/io/impl/server.cpp
new file mode 100644
index 000000000..d4266c4ed
--- /dev/null
+++ b/io/impl/server.cpp
@@ -0,0 +1,372 @@
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+
+/// @author cedric wohlleber
+
+#ifdef WIN32
+#include <io.h>
+#include <fcntl.h>
+#include <sys/stat.h>
+#include <sys/types.h>
+#endif
+
+#include <boost/asio/ip/tcp.hpp>
+#include <boost/asio/local/stream_protocol.hpp>
+#include <boost/bind/bind.hpp>
+#include <boost/lexical_cast.hpp>
+#include "../../base/exception.h"
+#include "../../io/file_descriptor.h"
+#include "../../string/string.h"
+#include "server.h"
+
+namespace comma { namespace io { namespace impl {
+
+template < typename Stream > struct stream_traits; // compile-time direction flags for the stream types; server uses them to choose the read and/or write select set
+
+template <> struct stream_traits< io::istream > // input only
+{
+    static constexpr bool is_input_stream{true};
+    static constexpr bool is_output_stream{false};
+};
+
+template <> struct stream_traits< io::ostream > // output only
+{
+    static constexpr bool is_input_stream{false};
+    static constexpr bool is_output_stream{true};
+};
+
+template <> struct stream_traits< io::iostream > // both directions
+{
+    static constexpr bool is_input_stream{true};
+    static constexpr bool is_output_stream{true};
+};
+
+template < typename Stream > class file_acceptor : public acceptor< Stream > // acceptor for a plain file: hands out at most one stream at a time
+{
+    public:
+        file_acceptor( const std::string& name, io::mode::value mode ): name_( name ), mode_( mode ), fd_( io::invalid_file_descriptor ) { this->_closed = true; }
+
+        ~file_acceptor() // close the descriptor only if it is still open: notify_closed() may have closed it already
+        {
+#ifndef WIN32
+            if( fd_ != io::invalid_file_descriptor ) { ::close( fd_ ); }
+#else
+            if( fd_ != io::invalid_file_descriptor ) { _close( fd_ ); }
+#endif
+        }
+
+        Stream* accept( boost::posix_time::time_duration ) // timeout is ignored; returns nullptr, if a stream is already handed out or the file cannot be opened
+        {
+            if( !this->_closed ) { return nullptr; }
+#ifndef WIN32
+            fd_ = ::open( &name_[0], O_WRONLY | O_CREAT | O_NONBLOCK, S_IRUSR | S_IWUSR | S_IRGRP | S_IROTH ); // quick and dirty
+#else
+            fd_ = _open( &name_[0], O_WRONLY | _O_CREAT, _S_IWRITE );
+#endif
+            if( fd_ == io::invalid_file_descriptor ) { return nullptr; }
+            this->_closed = false;
+            return new Stream( name_, mode_, io::mode::non_blocking ); // quick and dirty
+        }
+
+        void notify_closed() { this->_closed = true; if( fd_ != io::invalid_file_descriptor ) { ::close( fd_ ); fd_ = io::invalid_file_descriptor; } } // forget the descriptor once closed, so that it is never closed twice
+        
+        io::file_descriptor fd() const { return fd_; }
+
+        bool closed() const { COMMA_THROW( comma::exception, "todo" ); }
+
+    private:
+        const std::string name_;
+        const io::mode::value mode_;
+        io::file_descriptor fd_{0}; // todo: make io::istream, io::ostream non-throwing on construction
+};
+
+struct Tcp {}; // tag selecting the tcp specialisation of socket_traits
+template < typename S > struct socket_traits {}; // boost::asio types and endpoint factory per socket kind; specialised below
+
+template <> struct socket_traits< Tcp >
+{
+    typedef boost::asio::ip::tcp::endpoint endpoint_type;
+    typedef boost::asio::ip::tcp::acceptor acceptor;
+    typedef boost::asio::ip::tcp::iostream iostream;
+    typedef unsigned short name_type; // a tcp server is named by its port
+    static endpoint_type endpoint( unsigned short port ) { return endpoint_type( boost::asio::ip::tcp::v4(), port ); }
+};
+
+#ifndef WIN32
+struct local {}; // tag selecting the boost::asio::local::stream_protocol specialisation of socket_traits
+template <> struct socket_traits< local >
+{
+    typedef boost::asio::local::stream_protocol::endpoint endpoint_type;
+    typedef boost::asio::local::stream_protocol::acceptor acceptor;
+    typedef boost::asio::local::stream_protocol::iostream iostream;
+    typedef std::string name_type; // a local socket is named by a string passed to the endpoint
+    static endpoint_type endpoint( const std::string& name ) { return endpoint_type( name ); }
+};
+#endif
+
+template < typename Stream, typename S > class socket_acceptor : public acceptor< Stream > // acceptor listening on the socket kind selected by the tag S
+{
+    public:
+        socket_acceptor( const typename socket_traits< S >::name_type& name, io::mode::value mode )
+            : mode_( mode )
+            , _acceptor( m_service, socket_traits< S >::endpoint( name ) )
+        {
+#ifndef WIN32
+#if (BOOST_VERSION >= 106600)
+            select_.read().add( _acceptor.native_handle() ); // watch the listening socket, so that accept() can poll it
+#else
+            select_.read().add( _acceptor.native() ); // watch the listening socket, so that accept() can poll it
+#endif
+#else
+#if (BOOST_VERSION >= 106600)
+            SOCKET socket = _acceptor.native_handle();
+#else
+            SOCKET socket = _acceptor.native();
+#endif
+            select_.read().add( socket ); // watch the listening socket, so that accept() can poll it
+#endif
+        }
+
+        Stream* accept( boost::posix_time::time_duration timeout ) // wait up to timeout for a pending connection; returns nullptr, if the listening socket is not ready
+        {
+            select_.wait( timeout );
+#ifndef WIN32
+#if (BOOST_VERSION >= 106600)
+            if( !select_.read().ready( _acceptor.native_handle() ) ) { return nullptr; }
+#else
+            if( !select_.read().ready( _acceptor.native() ) ) { return nullptr; }
+#endif
+#else
+#if (BOOST_VERSION >= 106600)
+            SOCKET socket = _acceptor.native_handle();
+#else
+            SOCKET socket = _acceptor.native();
+#endif
+            if( !select_.read().ready( socket ) ) { return nullptr; }
+#endif
+            typename socket_traits< S >::iostream* stream = new typename socket_traits< S >::iostream; // NOTE(review): raw new; nothing here frees it, if the accept() call below throws
+            _acceptor.accept( *( stream->rdbuf() ) );
+#if (BOOST_VERSION >= 106600)
+            return new Stream( stream, stream->rdbuf()->native_handle(), mode_, boost::bind( &socket_traits< S >::iostream::close, stream ) ); // the bound close() is passed to Stream along with the socket stream
+#else
+            return new Stream( stream, stream->rdbuf()->native(), mode_, boost::bind( &socket_traits< S >::iostream::close, stream ) ); // the bound close() is passed to Stream along with the socket stream
+#endif
+        }
+
+        void close() { this->_closed = true; _acceptor.close(); }
+
+#ifndef WIN32
+#if (BOOST_VERSION >= 106600)
+        io::file_descriptor fd() const { return const_cast< typename socket_traits< S >::acceptor& >( _acceptor ).native_handle(); } // const_cast: native_handle() is called on a non-const acceptor
+#else
+        io::file_descriptor fd() const { return const_cast< typename socket_traits< S >::acceptor& >( _acceptor ).native(); } // const_cast: native() is called on a non-const acceptor
+#endif
+#else
+        io::file_descriptor fd() const { return io::invalid_file_descriptor; }
+#endif
+
+        bool closed() const { COMMA_THROW( comma::exception, "todo" ); }
+
+    private:
+        io::mode::value mode_{io::mode::binary};
+        io::select select_;
+#if (BOOST_VERSION >= 106600)
+        boost::asio::io_context m_service;
+#else
+        boost::asio::io_service m_service;
+#endif
+        typename socket_traits< S >::acceptor _acceptor; // declared after m_service, which it is constructed from
+};
+
+template < typename Stream >
+class zero_acceptor_ : public acceptor< Stream > // acceptor that creates its single stream up front and hands it out on the first accept()
+{
+    public:
+        zero_acceptor_( const std::string& name, io::mode::value mode ): _stream( new Stream( name, mode ) ), accepted_( false ) {}
+        ~zero_acceptor_() { if( !accepted_ ) { delete _stream; } } // never handed out: still ours to free
+        Stream* accept( boost::posix_time::time_duration )
+        {
+            if( accepted_ ) { return nullptr; }
+            accepted_ = true;
+            return _stream;
+        }
+
+        void close() { this->_closed = true; if( _stream != nullptr ) { _stream->close(); } }
+        void notify_closed() { _stream = nullptr; } // the server erases the stream right after notifying: drop the pointer rather than let it dangle
+        io::file_descriptor fd() const { return io::invalid_file_descriptor; } // quick and dirty
+
+        bool closed() const { return this->_closed || _stream == nullptr || ( *_stream )->eof(); } // _stream is a pointer to the io stream wrapper: go through it to reach eof()
+
+    private:
+        Stream* _stream{nullptr};
+        bool accepted_{false};
+};
+
+template < typename Stream > server< Stream >::server( const std::string& name, io::mode::value mode, bool blocking, bool flush ) // name ::= tcp:<port> | local:<path> | zero... | - | <filename>
+    : blocking_( blocking ),
+      flush_( flush )
+{
+    std::vector< std::string > v = comma::split( name, ':' );
+    if( v[0] == "tcp" )
+    {
+        if( v.size() != 2 ) { COMMA_THROW( comma::exception, "expected tcp server endpoint, got " << name ); }
+        _acceptor.reset( new socket_acceptor< Stream, Tcp >( boost::lexical_cast< unsigned short >( v[1] ), mode ) );
+    }
+    else if( v[0] == "udp" )
+    {
+        COMMA_THROW( comma::exception, "udp: todo" );
+    }
+    else if( v[0] == "local" )
+    {
+#ifndef WIN32
+        if( v.size() != 2 ) { COMMA_THROW( comma::exception, "expected local socket, got " << name ); }
+        _acceptor.reset( new socket_acceptor< Stream, local >( v[1], mode ) );
+#endif
+    }
+    else if( v[0].substr( 0, 4 ) == "zero" )
+    {
+        _acceptor.reset( new zero_acceptor_< Stream >( name, mode ) );
+    }
+    else
+    {
+        if( name == "-" ) // standard input/output: no acceptor, the single stream is registered right away
+        {
+            streams_.insert( std::unique_ptr< Stream >( new Stream( name, mode ) ) );
+#ifndef WIN32
+            if( stream_traits< Stream >::is_input_stream ) { select_.read().add( 0 ); }
+            if( stream_traits< Stream >::is_output_stream ) { select_.write().add( 1 ); }
+#endif
+        }
+        else
+        {
+            _acceptor.reset( new file_acceptor< Stream >( name, mode ) );
+            Stream* s = _acceptor->accept( boost::posix_time::time_duration() );
+            if( s != nullptr ) { streams_.insert( std::unique_ptr< Stream >( s ) ); } // todo: should we simply abolish file_acceptor and do it in the same way as for stdout?
+            if( s == nullptr || s->fd() == comma::io::invalid_file_descriptor ) { COMMA_THROW( comma::exception, "failed to open '" << name << "'" ); } // accept() returns nullptr, if the file cannot be opened: report it instead of dereferencing
+#ifndef WIN32
+            if( stream_traits< Stream >::is_input_stream ) { select_.read().add( s->fd() ); }
+            if( stream_traits< Stream >::is_output_stream ) { select_.write().add( s->fd() ); }
+#endif
+        }
+    }
+}
+
+template < typename Stream > void server< Stream >::close() // stop accepting, then disconnect every client
+{
+    if( _acceptor ) { _acceptor->close(); } // there is no acceptor, e.g. if the server was opened on "-"
+    disconnect_all();
+}
+
+template < typename Stream > void server< Stream >::disconnect_all() // close and forget every connected stream
+{
+    while( !streams_.empty() ) { _remove( streams_.begin() ); } // _remove() erases the element, so always take the new first one
+}
+
+/// accept every connection the acceptor currently offers and return the newly accepted streams
+template < typename Stream > std::vector< Stream* > server< Stream >::accept()
+{
+    std::vector< Stream* > accepted; // naked pointers: the streams themselves are owned by streams_
+    if( !_acceptor ) { return accepted; }
+    for( Stream* s = _acceptor->accept(); s != nullptr; s = _acceptor->accept() ) // while( streams_.size() < maxSize ?
+    {
+        accepted.emplace_back( s );
+        streams_.insert( std::unique_ptr< Stream >( s ) );
+        if( stream_traits< Stream >::is_input_stream ) { select_.read().add( s->fd() ); }
+        if( stream_traits< Stream >::is_output_stream ) { select_.write().add( s->fd() ); }
+    }
+    return accepted;
+}
+
+template < typename Stream > void server< Stream >::_remove( typename _streams_type::iterator it ) // close one stream and drop it from the select sets and from streams_
+{
+    if( stream_traits< Stream >::is_input_stream ) { select_.read().remove( **it ); } // stop watching the stream before it is closed
+    if( stream_traits< Stream >::is_output_stream ) { select_.write().remove( **it ); }
+    ( *it )->close();
+    if( _acceptor ) { _acceptor->notify_closed(); } // lets the acceptor react, e.g. file_acceptor closes its own descriptor
+    streams_.erase( it ); // invalidates it: callers must have advanced their own iterator already
+}
+
+template < typename Stream > std::size_t server< Stream >::size() const { return streams_.size(); }
+
+template < typename Stream > unsigned int server< Stream >::write( server< io::ostream >* s, const char* buf, std::size_t size, bool do_accept ) // returns the number of streams still good after the write
+{
+    if( do_accept ) { s->accept(); }
+    if( !s->blocking_ ) { s->select_.check(); } // todo: if slow, put all the files in one select
+    unsigned int written = 0;
+    auto next = s->streams_.begin();
+    while( next != s->streams_.end() )
+    {
+        const auto current = next++; // step first: _remove() below erases current
+        if( !( s->blocking_ || s->select_.write().ready( **current ) ) ) { continue; } // non-blocking: skip clients that are not ready
+        ( **current )->write( buf, size );
+        if( s->flush_ ) { ( **current )->flush(); }
+        if( ( **current )->good() ) { ++written; } else { s->_remove( current ); }
+    }
+    return written;
+}
+
+template < typename Stream > void server< Stream >::_remove_bad() // disconnect every stream that is no longer good
+{
+    for( auto i = streams_.begin(); i != streams_.end(); ) { auto it = i++; if( !( **it )->good() ) { _remove( it ); } } // advance before _remove(): it erases the element, and a good stream must not stall the loop
+}
+
+template < typename Stream > unsigned int server< Stream >::read( server< io::istream >* s, char* buf, std::size_t size, bool do_accept ) // read exactly size bytes from one client; returns size, or 0 if nothing was read
+{
+    while( !s->_acceptor || !s->_acceptor->closed() ) // there is no acceptor, e.g. when serving "-": do not dereference it, just keep serving the existing streams
+    {
+        if( do_accept ) { s->accept(); }
+        if( s->blocking_ ) { s->select_.wait( boost::posix_time::milliseconds( 100 ) ); } // todo? pass timeout as a parameter?
+        auto j = s->streams_.begin();
+        for( ; j != s->streams_.end() && ( *j )->fd() != s->_last_read; ++j ); // find the stream that served the previous read
+        if( j == s->streams_.end() ) { j = s->streams_.begin(); s->_last_read = io::invalid_file_descriptor; }
+        for( auto i = j; i != s->streams_.end(); ) // first pass: from that stream to the end
+        {
+            auto it = i++;
+            if( !s->blocking_ && !s->select_.read().ready( **it ) ) { continue; }
+            ( **it )->read( buf, size );
+            if( ( **it )->gcount() < int( size ) ) { continue; } // quick and dirty
+            s->_remove_bad();
+            s->_last_read = ( *it )->fd();
+            return size;
+        }
+        auto e = j == s->streams_.end() ? j : ++j;
+        for( auto i = s->streams_.begin(); i != e; ) // todo: remove code duplication: combine with the previous loop
+        {
+            auto it = i++;
+            if( !s->blocking_ && !s->select_.read().ready( **it ) ) { continue; }
+            ( **it )->read( buf, size );
+            if( ( **it )->gcount() < int( size ) ) { continue; } // quick and dirty
+            s->_remove_bad();
+            s->_last_read = ( *it )->fd();
+            return size;
+        }
+        if( !s->blocking_ ) { return 0; } // non-blocking: one sweep over the clients only
+    }
+    return 0;
+}
+
+template < typename Stream > std::string server< Stream >::getline( server< io::istream >* s, bool do_accept )
+{
+    COMMA_THROW( comma::exception, "todo..." );
+}
+
+
+template < typename Stream > std::size_t server< Stream >::available_at_least( const server< io::istream >* s ) // largest in_avail() over all connected streams
+{
+    std::size_t most = 0;
+    for( auto it = s->streams_.begin(); it != s->streams_.end(); ++it )
+    {
+        const auto buffered = ( **it )->rdbuf()->in_avail();
+        if( !( buffered <= int( most ) ) ) { most = buffered; }
+    }
+    return most;
+}
+
+template class acceptor< io::istream >; // class-key matches the declarations in server.h (both templates are declared with 'class')
+template class acceptor< io::ostream >;
+// todo: template class acceptor< io::iostream >;
+template class server< io::istream >;
+template class server< io::ostream >;
+// todo: template class server< io::iostream >;
+
+} } } // namespace comma { namespace io { namespace impl {
diff --git a/io/impl/server.h b/io/impl/server.h
new file mode 100644
index 000000000..9d6265015
--- /dev/null
+++ b/io/impl/server.h
@@ -0,0 +1,97 @@
+// Copyright (c) 2011 The University of Sydney
+// All rights reserved.
+
+/// @author cedric wohlleber
+
+#pragma once
+
+#include <set>
+#include <boost/scoped_ptr.hpp>
+#include <boost/shared_ptr.hpp>
+#include "../file_descriptor.h"
+#include "../select.h"
+#include "../stream.h"
+
+namespace comma { namespace io {
+
+template < typename Stream > class server;
+
+} } // namespace comma { namespace io {
+
+namespace comma { namespace io { namespace impl {
+
+template < typename Stream >
+class acceptor // interface of the objects that hand out new Stream connections to server
+{
+    public:
+        typedef Stream stream_type;
+
+        virtual ~acceptor() {}
+        virtual io::file_descriptor fd() const = 0;
+        virtual Stream* accept( boost::posix_time::time_duration timeout = boost::posix_time::seconds( 0 ) ) = 0; // default timeout is 0 seconds
+        virtual void notify_closed() {} // quick and dirty: hook with an empty default implementation
+        virtual void close() { _closed = true; }
+        bool closed() const { return _closed; } // not virtual: a call through acceptor< Stream > always reads _closed
+        
+    protected:
+        bool _closed{false};
+};
+
+template < typename Stream >
+class server // implementation behind comma::io::server: an optional acceptor plus the set of currently connected streams
+{
+    public:
+        typedef Stream stream_type;
+
+        server( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
+
+        void close();
+        
+        void disconnect_all();
+
+        std::size_t size() const;
+
+        std::vector< Stream* > accept(); // quick and dirty; return naked pointers for now
+        
+        const io::impl::acceptor< Stream >& acceptor() const { return *_acceptor; } // NOTE(review): dereferences _acceptor unchecked
+
+        static unsigned int write( server< io::ostream >* s, const char* buf, std::size_t size, bool do_accept = true );
+
+        /// accept pending clients, then stream lhs with operator<< to every connected client;
+        /// a client whose stream is not good afterwards is disconnected
+        template < typename T >
+        static void write( server< io::ostream >* s, const T& lhs ) // quick and dirty, inefficient, but then ascii is meant to be slow...
+        {
+            s->accept();
+            s->select_.check();
+            for( auto i = s->streams_.begin(); i != s->streams_.end(); ) // auto: the iterator type is that of s, not necessarily of server< Stream >
+            {
+                auto it = i++; // step first: _remove() below erases it
+                if( !s->blocking_ && !s->select_.write().ready( **it ) ) { continue; }
+                ( ***it ) << lhs;
+                if( s->flush_ ) { ( **it )->flush(); }
+                if( !( **it )->good() ) { s->_remove( it ); }
+            }
+        }
+
+        static unsigned int read( server< io::istream >* s, char* buf, std::size_t size, bool do_accept = true );
+
+        static std::string getline( server< io::istream >* s, bool do_accept = true );
+
+        static std::size_t available_at_least( const server< io::istream >* s );
+
+    protected:
+        template < typename > friend class comma::io::server;
+        template < typename > friend class comma::io::impl::server;
+        bool blocking_;
+        bool flush_;
+        boost::scoped_ptr< io::impl::acceptor< Stream > > _acceptor;
+        typedef std::set< std::unique_ptr< Stream > > _streams_type;
+        io::file_descriptor _last_read{io::invalid_file_descriptor}; // quick and dirty
+        _streams_type streams_;
+        io::select select_;
+        void _remove( typename _streams_type::iterator it );
+        void _remove_bad();
+};
+
+} } } // namespace comma { namespace io { namespace impl {
diff --git a/io/load.h b/io/load.h
new file mode 100644
index 000000000..b6e2599a1
--- /dev/null
+++ b/io/load.h
@@ -0,0 +1,43 @@
+// Copyright (c) 2022 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <fstream>
+#include <string>
+#include <vector>
+#include "impl/filesystem.h"
+#include "../base/exception.h"
+
+namespace comma { namespace io {
+
+/// convenience function to load a vector-like contiguous container from file
+template < typename T, template < typename S, typename A > class C = std::vector, typename A = std::allocator< T > >
+C< T, A >& load_array( C< T, A >& a, const std::string& path );
+    
+/// convenience function to load a vector-like contiguous container from file
+/// @note allocates and returns the container, thus it is up to the user to use move semantics
+template < typename T, template < typename S, typename A > class C = std::vector, typename A = std::allocator< T > >
+C< T, A > load_array( const std::string& path );
+
+
+template < typename T, template < typename S, typename A > class C, typename A >
+inline C< T, A >& load_array( C< T, A >& a, const std::string& path ) // resize a to hold the whole file as elements of T and read it in; throws comma::exception on failure
+{
+    std::ifstream ifs( path, std::ios::binary ); // binary: the raw element bytes must not go through text-mode translation
+    if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << path << "\"" ); }
+    a.resize( comma::filesystem::file_size( path ) / sizeof( T ) ); // todo? will file_size work on symlinks?
+    ifs.read( reinterpret_cast< char * >( a.data() ), std::streamsize( a.size() * sizeof( T ) ) ); // data(): well-defined for an empty container, unlike &a[0]
+    if( ifs.gcount() != std::streamsize( a.size() * sizeof( T ) ) ) { COMMA_THROW( comma::exception, "expected to read " << a.size() * sizeof( T ) << " bytes (" << a.size() << " elements " << sizeof( T ) << " byte(s) each) from \"" << path << "\"; got: " << ifs.gcount() << " byte(s)" ); } // streamsize, not int: files over 2GB must not be rejected
+    return a;
+}
+
+template < typename T, template < typename S, typename A > class C, typename A >
+inline C< T, A > load_array( const std::string& path ) // allocate a container, load path into it, and return it
+{
+    C< T, A > a;
+    load_array( a, path ); return a; // return the local by name: returning the reference from the call would copy the whole container
+}
+    
+} } // namespace comma { namespace io {
diff --git a/io/publisher.h b/io/publisher.h
index a40c45aac..ed18d842d 100644
--- a/io/publisher.h
+++ b/io/publisher.h
@@ -1,95 +1,14 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_IO_PUBLISHER_H_
-#define COMMA_IO_PUBLISHER_H_
+#pragma once
 
-#include <stdlib.h>
-#include <string>
-#include <boost/noncopyable.hpp>
-#include "stream.h"
-#include "impl/publisher.h"
+#include "server.h"
 
 namespace comma { namespace io {
 
-/// a simple publisher that opens and writes to using services (e.g. tcp, udp, etc)
-class publisher : public boost::noncopyable
-{
-    public:
-        /// constructor
-        /// @param name ::= tcp:<port> | udp:<port> | <filename>
-        ///     if tcp:<port>, create tcp server
-        ///     @todo if udp:<port>, broadcast on udp
-        ///     if <filename> is a regular file, just write to it
-        ///     @todo if <filename> is named pipe, keep reopening it, if closed
-        ///     if <filename> is Linux domain socket, create Linux domain socket server
-        /// @param mode ascii or binary, a hint for Windows
-        /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
-        publisher( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
-
-        /// destructor
-        ~publisher();
-
-        /// publish to all existing connections (blocking), return number of clients with successful write
-        std::size_t write( const char* buf, std::size_t size, bool do_accept = true );
-
-        /// publish to all existing connections (blocking)
-        /// @note data integrity is the user's responsibility
-        ///       i.e. if someone writes:
-        ///           publisher p( "tcp:localhost:1234" );
-        ///           p << 1 << "," << 2 << std::endl;
-        ///       and a client connects after "1" already
-        ///       has been output, this client will receive
-        ///       ",2", which most likely was not intended
-        template < typename T >
-        publisher& operator<<( const T& rhs ) { pimpl_->operator<<( rhs ); return *this; }
-
-        /// close
-        void close();
-
-        /// return current number of connected clients
-        std::size_t size() const;
-
-        /// accept waiting clients, non-blocking
-        /// @return number of clients accepted
-        unsigned int accept();
-        
-        /// return acceptor file descriptor
-        file_descriptor acceptor_file_descriptor() const;
-        
-    private:
-        impl::publisher* pimpl_;
-};
+typedef oserver publisher; // quick and dirty for backward compatibility
 
 } } // namespace comma { namespace io {
-
-#endif // #ifndef COMMA_IO_PUBLISHER_H_
diff --git a/io/select.cpp b/io/select.cpp
index f64de14cb..2ddc1c6ef 100755
--- a/io/select.cpp
+++ b/io/select.cpp
@@ -98,9 +98,12 @@ std::size_t select::wait( boost::posix_time::time_duration timeout )
 
 std::size_t select::check() { return wait( 0 ); }
 
-select::descriptors::descriptors()
+select::descriptors::descriptors() { reset_fds_(); }
+
+void select::descriptors::clear()
 {
-    reset_fds_();
+    FD_ZERO( &fd_set_ );
+    descriptors_.clear();
 }
 
 fd_set* select::descriptors::reset_fds_()
diff --git a/io/select.h b/io/select.h
index 7c9ed9a0a..516e89be0 100755
--- a/io/select.h
+++ b/io/select.h
@@ -94,15 +94,18 @@ class select
                 /// return true, if file descriptor found in descriptor list and ready
                 bool ready( file_descriptor fd ) const;
                 template < typename T > bool ready( const T& t ) const { return ready( t.fd() ); }
+
+                /// remove all descriptors
+                void clear();
                 
                 /// return set of descriptors
                 const std::set< file_descriptor >& operator()() const { return descriptors_; } //const boost::unordered_set< file_descriptor >& operator()() const { return descriptors_; }
 
             private:
                 friend class select;
-                fd_set* reset_fds_();
+                ::fd_set* reset_fds_();
                 std::set< file_descriptor > descriptors_; //boost::unordered_set< file_descriptor > descriptors_;
-                fd_set fd_set_;
+                ::fd_set fd_set_;
         };
 
         /// return read descriptors
diff --git a/io/serial.cpp b/io/serial.cpp
new file mode 100644
index 000000000..db9fcb6a3
--- /dev/null
+++ b/io/serial.cpp
@@ -0,0 +1,88 @@
+// Copyright (c) 2023 Mission Systems Pty Ltd
+// All rights reserved.
+
+/// @author dave jennings
+
+#include "serial.h"
+
+namespace comma { namespace io { namespace serial {
+
+port::port( const std::string& name ): _port( _service, name ) {}
+
+port::port( const port::properties& p ): port( p.name, p.baud_rate ) {}
+
+port::port( const std::string& name, unsigned int baud_rate ) // open the port; for non-zero baud_rate configure it as 8N1 without flow control
+    : _port( _service, name )
+{
+    if( baud_rate == 0 ) { return; } // quick and dirty for now: 0 means leave the port settings untouched
+    set_baud_rate( baud_rate );
+    set_character_size( 8 );
+    set_flow_control( boost::asio::serial_port_base::flow_control::none );
+    set_parity( boost::asio::serial_port_base::parity::none );
+    set_stop_bits( boost::asio::serial_port_base::stop_bits::one );
+}
+
+void port::set_baud_rate( unsigned int baud_rate ) { _port.set_option( boost::asio::serial_port_base::baud_rate( baud_rate )); }
+
+void port::set_character_size( unsigned int character_size ) { _port.set_option( boost::asio::serial_port_base::character_size( character_size )); }
+
+void port::set_flow_control( boost::asio::serial_port_base::flow_control::type flow_control ) { _port.set_option( boost::asio::serial_port_base::flow_control( flow_control )); }
+
+void port::set_parity( boost::asio::serial_port_base::parity::type parity ) { _port.set_option( boost::asio::serial_port_base::parity( parity )); }
+
+void port::set_stop_bits( boost::asio::serial_port_base::stop_bits::type stop_bits ) { _port.set_option( boost::asio::serial_port_base::stop_bits( stop_bits )); }
+
+std::size_t port::read_some( char* buf, std::size_t size ) { return read_some( reinterpret_cast< unsigned char* >( buf ), size ); }
+
+std::size_t port::read_some( unsigned char* buf, std::size_t buf_size )
+{
+    boost::system::error_code ec;
+    std::size_t count = _port.read_some( boost::asio::buffer( buf, buf_size ), ec );
+    COMMA_ASSERT( !ec, ec.message() );
+    return count;
+}
+
+std::size_t port::read_some( char* buf
+                           , std::size_t size
+                           , const boost::asio::deadline_timer::duration_type& timeout )
+{
+    return read_some( reinterpret_cast< unsigned char* >( buf ), size, timeout );
+}
+
+std::size_t port::read_some( unsigned char* buf
+                           , std::size_t buf_size
+                           , const boost::asio::deadline_timer::duration_type& timeout )
+// read at most buf_size bytes, cancelling the read once timeout expires; returns the byte count reported by the read handler; throws on any other read error
+{
+    boost::optional< boost::system::error_code > timer_result;
+    boost::asio::deadline_timer timer( _service );
+    timer.expires_from_now( timeout );
+    timer.async_wait( [&timer_result]( const boost::system::error_code& error ) { timer_result.reset( error ); });
+
+    boost::optional< boost::system::error_code > read_result;
+    std::size_t count = 0;
+    _port.async_read_some( boost::asio::buffer( buf, buf_size )
+                         , [&read_result, &count]( const boost::system::error_code& error, std::size_t count_ )
+                         {
+                             read_result.reset( error );
+                             count = count_;
+                         });
+    _service.reset();
+    while( _service.run_one() ) // run both handlers to completion: whichever finishes first cancels the other
+    {
+        if( read_result ) { timer.cancel(); }
+        if( timer_result ) { _port.cancel(); }
+    }
+    if( read_result && *read_result )
+    {
+        // a read cancelled by the timer is a timeout, not an error; asio reports it as operation_aborted, whose value equals ECANCELED on posix only
+        if( *read_result != boost::asio::error::operation_aborted ) { throw boost::system::system_error( *read_result ); }
+    }
+    return count;
+}
+
+std::size_t port::write( const char* buf, std::size_t to_write ) { return boost::asio::write( _port, boost::asio::buffer( buf, to_write )); }
+
+std::size_t port::write( const unsigned char* buf, std::size_t to_write ) { return boost::asio::write( _port, boost::asio::buffer( buf, to_write )); }
+
+} } } // namespace comma { namespace io { namespace serial {
diff --git a/io/serial.h b/io/serial.h
new file mode 100644
index 000000000..8f27814ae
--- /dev/null
+++ b/io/serial.h
@@ -0,0 +1,57 @@
+// Copyright (c) 2023 Mission Systems Pty Ltd
+// All rights reserved.
+
+/// @author dave jennings
+
+#pragma once
+
+#include "../base/exception.h"
+#include <boost/asio.hpp>
+#include <boost/optional.hpp>
+
+namespace comma { namespace io { namespace serial {
+
+class port // wrapper around boost::asio::serial_port with plain and timed reads
+{
+    public:
+        struct properties
+        {
+            std::string name;
+            unsigned int baud_rate{0}; // 0: port( name, baud_rate ) leaves the port settings untouched
+        };
+
+        port( const std::string& name );
+
+        /// open port as 8N1 without flow control; if baud_rate is 0, leave the port settings untouched
+        port( const std::string& name, unsigned int baud_rate );
+
+        port( const properties& p );
+
+        void set_baud_rate( unsigned int baud_rate );
+
+        void set_character_size( unsigned int character_size );
+
+        void set_flow_control( boost::asio::serial_port_base::flow_control::type flow_control );
+
+        void set_parity( boost::asio::serial_port_base::parity::type parity );
+
+        void set_stop_bits( boost::asio::serial_port_base::stop_bits::type stop_bits );
+
+        std::size_t read_some( char* buf, std::size_t buf_size ); // forwards to the unsigned char overload
+
+        std::size_t read_some( unsigned char* buf, std::size_t buf_size ); // returns the number of bytes read
+
+        std::size_t read_some( char* buf, std::size_t buf_size, const boost::asio::deadline_timer::duration_type& timeout ); // forwards to the unsigned char overload
+
+        std::size_t read_some( unsigned char* buf, std::size_t buf_size, const boost::asio::deadline_timer::duration_type& timeout ); // the read is cancelled when timeout expires
+
+        std::size_t write( const char* buf, std::size_t to_write );
+
+        std::size_t write( const unsigned char* buf, std::size_t to_write );
+
+    private:
+        boost::asio::io_service _service; // renamed as io_context in Boost 1.66 (io_service remains as typedef)
+        boost::asio::serial_port _port; // declared after _service, which it is constructed from
+};
+
+} } } // namespace comma { namespace io { namespace serial {
diff --git a/io/server.cpp b/io/server.cpp
new file mode 100644
index 000000000..5e323b981
--- /dev/null
+++ b/io/server.cpp
@@ -0,0 +1,65 @@
+// This file is part of comma, a generic and flexible library
+// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+/// @author vsevolod vlaskine
+
+#include "server.h"
+
+namespace comma { namespace io {
+
+template < typename Stream > server< Stream >::server( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) : pimpl_( new impl::server< Stream >( name, mode, blocking, flush ) ) {}
+// pimpl_ is a raw owning pointer allocated in the constructor, hence the explicit delete
+template < typename Stream > server< Stream >::~server() { delete pimpl_; }
+// the methods below forward to the implementation object
+template < typename Stream > std::vector< Stream* > server< Stream >::accept() { return pimpl_->accept(); }
+
+template < typename Stream > void server< Stream >::close() { pimpl_->close(); }
+
+template < typename Stream > void server< Stream >::disconnect_all() { pimpl_->disconnect_all(); }
+
+template < typename Stream > std::size_t server< Stream >::size() const { return pimpl_->size(); }
+// invalid_file_descriptor is returned when pimpl_->_acceptor is not set
+template < typename Stream > file_descriptor server< Stream >::acceptor_file_descriptor() const { return pimpl_->_acceptor ? pimpl_->acceptor().fd() : comma::io::invalid_file_descriptor; }
+
+template < typename Stream > const io::select& server< Stream >::select() const { return pimpl_->select_; }
+// oserver/iserver operations call static functions of impl::server, passing the implementation pointer
+std::size_t oserver::write( const char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::ostream >::write( pimpl_, buf, size, do_accept ); }
+
+std::size_t iserver::read( char* buf, std::size_t size, bool do_accept ) { return io::impl::server< io::istream >::read( pimpl_, buf, size, do_accept ); }
+
+std::string iserver::getline( bool do_accept ) { return io::impl::server< io::istream >::getline( pimpl_, do_accept ); }
+
+std::size_t iserver::available_at_least() const { return io::impl::server< io::istream >::available_at_least( pimpl_ ); }
+// member definitions live in this translation unit, so the supported specialisations are instantiated explicitly
+template class server< io::istream >;
+template class server< io::ostream >;
+// todo: template class server< io::iostream >;
+
+} } // namespace comma { namespace io {
diff --git a/io/server.h b/io/server.h
new file mode 100644
index 000000000..2fcf237d5
--- /dev/null
+++ b/io/server.h
@@ -0,0 +1,124 @@
+// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <stdlib.h>
+#include <memory>
+#include <string>
+#include "stream.h"
+#include "impl/server.h"
+
+namespace comma { namespace io {
+
+/// a simple server base class that opens and reads from or writes to streams using services (e.g. tcp, udp, etc)
+template < typename Stream >
+class server
+{
+    public:
+        /// constructor; all arguments are passed on to the impl::server< Stream > constructor
+        /// @param name ::= tcp:<port> | udp:<port> | <filename>
+        ///     if tcp:<port>, create tcp server
+        ///     @todo if udp:<port>, broadcast on udp
+        ///     if <filename> is a regular file, just write to it
+        ///     @todo if <filename> is named pipe, keep reopening it, if closed
+        ///     if <filename> is Linux domain socket, create Linux domain socket server
+        /// @param mode ascii or binary, a hint for Windows
+        /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
+        server( const std::string& name, io::mode::value mode, bool blocking = false, bool flush = true );
+
+        /// destructor; deletes the implementation object
+        ~server();
+
+        /// stop accepting clients, disconnect all existing clients
+        void close();
+        
+        /// disconnect all existing clients
+        void disconnect_all();
+
+        /// return current number of connected clients
+        std::size_t size() const;
+
+        /// return acceptor file descriptor, or invalid_file_descriptor if there is no acceptor
+        file_descriptor acceptor_file_descriptor() const;
+
+        /// accept clients; forwards to impl::server< Stream >::accept() and returns the stream pointers it yields
+        /// @note when publishing, data integrity is the user's responsibility
+        ///       i.e. if someone writes:
+        ///           server p( "tcp:localhost:1234" );
+        ///           p << 1 << "," << 2 << std::endl;
+        ///       and a client connects after "1" already
+        ///       has been output, this client will receive
+        ///       ",2", which most likely was not intended
+        std::vector< Stream* > accept(); // quick and dirty, use naked pointers for now
+
+        /// return reference to select on the existing streams
+        const io::select& select() const;
+        
+    protected:
+        server( const server& ); // declared only, no definition in server.cpp: presumably to disable copying (pimpl_ is deleted in the destructor)
+        server& operator=( const server& ); // declared only, see the copy constructor
+        impl::server< Stream >* pimpl_; // owning raw pointer: allocated in the constructor, deleted in the destructor
+};
+
+struct oserver: public io::server< io::ostream >
+{
+    /// @param name ::= tcp:<port> | udp:<port> | <filename>
+    ///     if tcp:<port>, create tcp server
+    ///     @todo if udp:<port>, broadcast on udp
+    ///     if <filename> is a regular file, just write to it
+    ///     @todo if <filename> is named pipe, keep reopening it, if closed
+    ///     if <filename> is Linux domain socket, create Linux domain socket server
+    /// @param mode ascii or binary, a hint for Windows
+    /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready
+    oserver( const std::string& name, comma::io::mode::value mode, bool blocking = false, bool flush = true ): io::server< io::ostream >( name, mode, blocking, flush ) {} // flush is handed to the base class; NOTE(review): its exact effect is defined in impl/server.h, not visible here
+
+    /// publish to all existing connections (blocking), return number of clients with successful write
+    std::size_t write( const char* buf, std::size_t size, bool do_accept = true ); // defined in server.cpp: forwards to impl::server< io::ostream >::write()
+
+    /// publish to all existing connections (blocking); forwards rhs to impl::server< io::ostream >::write()
+    /// @note data integrity is the user's responsibility
+    ///       i.e. if someone writes:
+    ///           server p( "tcp:localhost:1234" );
+    ///           p << 1 << "," << 2 << std::endl;
+    ///       and a client connects after "1" already
+    ///       has been output, this client will receive
+    ///       ",2", which most likely was not intended
+    template < typename T >
+    oserver& operator<<( const T& rhs ) { io::impl::server< io::ostream >::write( pimpl_, rhs ); return *this; }
+};
+
+struct iserver: public io::server< io::istream >
+{
+    /// @param name ::= tcp:<port> | udp:<port> | <filename>
+    ///     if tcp:<port>, create tcp server
+    ///     @todo if udp:<port>, broadcast on udp
+    ///     if <filename> is a regular file, just write to it (NOTE(review): wording copied from oserver; for an input server presumably "read from it" - confirm)
+    ///     @todo if <filename> is named pipe, keep reopening it, if closed
+    ///     if <filename> is Linux domain socket, create Linux domain socket server
+    /// @param mode ascii or binary, a hint for Windows
+    /// @param blocking if true, blocking write to a client, otherwise discard, if client not ready (NOTE(review): copied from oserver; meaning for reads to be confirmed in impl/server.h)
+    iserver( const std::string& name, comma::io::mode::value mode, bool blocking = false ): io::server< io::istream >( name, mode, blocking ) {} // flush is left at the base class default (true)
+
+    /// read <size> bytes to <buf> from first available client
+    /// return 0 if no clients have data
+    /// start from the next client on the next read to assure round-robin behaviour
+    std::size_t read( char* buf, std::size_t size, bool do_accept = true );
+
+    /// read eol-terminated string from first available client
+    /// NOTE(review): returns std::string, so presumably an empty string (not 0) if no clients have data - confirm in impl/server.h
+    /// start from the next client on the next read to assure round-robin behaviour
+    std::string getline( bool do_accept = true );
+
+    std::size_t available_at_least() const; // forwards to impl::server< io::istream >::available_at_least(), see server.cpp
+};
+
+// struct ioserver: public io::server< io::iostream >
+// {
+//     // todo
+// };
+
+} } // namespace comma { namespace io {
diff --git a/io/stream.cpp b/io/stream.cpp
index 74d63aae9..fab2b1ab1 100644
--- a/io/stream.cpp
+++ b/io/stream.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// All rights reserved
 
 /// @author vsevolod vlaskine
 
@@ -43,17 +16,16 @@
 
 #include <fcntl.h>
 #include <fstream>
-#include <vector>
+#include <sstream>
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/ip/udp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
-#include <boost/bind.hpp>
-#include <boost/filesystem.hpp>
-#include <boost/filesystem/operations.hpp>
+#include <boost/bind/bind.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include "../base/exception.h"
 #include "../string/string.h"
+#include "impl/filesystem.h"
 #include "file_descriptor.h"
 #include "select.h"
 #include "stream.h"
@@ -66,11 +38,9 @@ namespace comma { namespace io {
 
 namespace impl {
 
-template < typename S >
-struct traits {};
+template < typename S > struct traits {};
 
-template <>
-struct traits < std::istream >
+template <> struct traits < std::istream >
 {
     typedef std::ifstream file_stream;
     static bool is_standard( const std::istream* is ) { return is == &std::cin; }
@@ -96,8 +66,7 @@ struct traits < std::istream >
     #endif
 };
 
-template <>
-struct traits < std::ostream >
+template <> struct traits < std::ostream >
 {
     typedef std::ofstream file_stream;
     static bool is_standard( const std::ostream* is ) { return is == &std::cout || is == &std::cerr; }
@@ -131,12 +100,11 @@ struct traits < std::ostream >
     #endif
 };
 
-template <>
-struct traits < std::iostream >
+template <> struct traits < std::iostream >
 {
     typedef std::fstream file_stream; // quick and dirty, does not matter for now
     static bool is_standard( const std::iostream* ) { return false; }
-    static std::iostream* standard( comma::io::mode::value mode ) { (void) mode; return NULL; }
+    static std::iostream* standard( comma::io::mode::value mode ) { (void) mode; return nullptr; }
     static comma::io::file_descriptor standard_fd() { return comma::io::invalid_file_descriptor; }
     #ifdef WIN32
         static io::file_descriptor open( const std::string& name ) { return io::invalid_file_descriptor; }
@@ -157,28 +125,26 @@ template < typename S > void close_file_stream( typename traits< S >::file_strea
 
 } // namespace impl
 
-template < typename S >
-stream< S >::~stream()
+template < typename S > stream< S >::~stream()
 {
-    if( stream_ == NULL || impl::traits< S >::is_standard( stream_ ) ) { return; }
+    if( stream_ == nullptr || impl::traits< S >::is_standard( stream_ ) ) { return; }
     delete stream_;
-    stream_ = NULL;
+    stream_ = nullptr;
     close_ = NULL;
 }
 
-template < typename S >
-S* stream< S >::lazily_make_stream_()
+template < typename S > S* stream< S >::lazily_make_stream_()
 {
     #ifndef WIN32
-    if( stream_ == NULL ) // quick and dirty: if fstream, cannot open on construction, as pipe might block
+    if( stream_ == nullptr ) // quick and dirty: if fstream, cannot open on construction, as pipe might block
     {
-        if( !boost::filesystem::is_regular_file( name_ ) && !blocking_ ) // quick and dirty
+        if( !comma::filesystem::is_regular_file( name_ ) && !blocking_ ) // quick and dirty
         {
             io::select select;
             select.read().add( fd_ ); // todo: express via traits
             select.write().add( fd_ ); // todo: express via traits
-            select.check(); //if( !select.check() ) { return NULL; }
-            if( !select.read().ready( fd_ ) && !select.write().ready( fd_ ) ) { return NULL; }
+            select.check(); //if( !select.check() ) { return nullptr; }
+            if( !select.read().ready( fd_ ) && !select.write().ready( fd_ ) ) { return nullptr; }
         }
         typename impl::traits< S >::file_stream* s = new typename impl::traits< S >::file_stream( name_.c_str(), static_cast< std::ios::openmode >( mode_ ) );
         if( s->bad() ) { COMMA_THROW( comma::exception, "failed to open " << name_ ); }
@@ -212,8 +178,7 @@ static void set_non_blocking_flags_( io::file_descriptor fd )
 #endif // #ifndef WIN32
 }
 
-template < typename S >
-comma::io::file_descriptor stream< S >::fd() const
+template < typename S > comma::io::file_descriptor stream< S >::fd() const
 {
     #ifdef WIN32
     if( fd_ == io::invalid_file_descriptor )
@@ -227,8 +192,7 @@ comma::io::file_descriptor stream< S >::fd() const
     return fd_;
 }
 
-template < typename S >
-std::size_t stream< S >::available_on_file_descriptor() const
+template < typename S > std::size_t stream< S >::available_on_file_descriptor() const
 {
     int count = 0;
 #ifdef WIN32
@@ -242,11 +206,10 @@ std::size_t stream< S >::available_on_file_descriptor() const
 
 template < typename S > const std::string& stream< S >::name() const { return name_; }
 
-template < typename S >
-stream< S >::stream( const std::string& name, mode::value m, mode::blocking_value blocking )
+template < typename S > stream< S >::stream( const std::string& name, mode::value m, mode::blocking_value blocking )
     : name_( name )
     , mode_( m )
-    , stream_( NULL )
+    , stream_( nullptr )
     , fd_( comma::io::invalid_file_descriptor )
     , close_d( false )
     , blocking_( blocking )
@@ -382,11 +345,39 @@ stream< S >::stream( const std::string& name, mode::value m, mode::blocking_valu
 
         fd_ = impl::traits< S >::open( name );
         if( fd_ != io::invalid_file_descriptor ) { set_non_blocking_flags_( fd_ ); return; }
-        if( boost::filesystem::is_regular_file( name ) ) { COMMA_THROW( comma::exception, "failed to open \"" << name << "\"" ); }
+        if( comma::filesystem::is_regular_file( name ) ) { COMMA_THROW( comma::exception, "failed to open \"" << name << "\"" ); }
         #endif // #ifdef WIN32
     }
 }
 
+namespace impl {
+
+/// build the usage text of a stream command line argument
+/// @param what argument name shown in angle brackets, e.g. "input"; @param dash meaning of '-', e.g. "stdin"
+/// @param indent number of spaces put in front of each line; @param verbose if true, list the supported stream types
+static std::string usage( const std::string& what, const std::string& dash, unsigned int indent, bool verbose )
+{
+    std::string i( indent, ' ' );
+    std::ostringstream oss;
+    oss << i << "<" << what << ">" << std::endl;
+    if( verbose )
+    {
+        oss << i << "    '-'                  : " << dash << std::endl;
+        oss << i << "    <path>               : path to " << what << " file or named pipe" << std::endl; // was hard-coded "input", which is wrong for output streams
+        oss << i << "    local:<path>         : local linux socket" << std::endl;
+        oss << i << "    tcp:<address>:<port> : tcp socket" << std::endl;
+    }
+    else { oss << i << "    run --help --verbose for details" << std::endl; }
+    return oss.str();
+}
+
+} // namespace impl {
+
+std::string istream::usage( unsigned int indent, bool verbose ) { return impl::usage( "input", "stdin", indent, verbose ); } // '-' stands for stdin
+std::string ostream::usage( unsigned int indent, bool verbose ) { return impl::usage( "output", "stdout", indent, verbose ); } // '-' stands for stdout
+std::string iostream::usage( unsigned int indent, bool verbose ) { return impl::usage( "input/output", "n/a", indent, verbose ); } // '-' is reported as not applicable
+std::string istreams::usage( unsigned int indent, bool verbose ) { return impl::usage( "input", "stdin", indent, verbose ); } // todo: improve; kinda bogus: same text as for a single istream
+
 template class stream< std::istream >;
 template class stream< std::ostream >;
 template class stream< std::iostream >;
@@ -399,4 +390,46 @@ ostream::ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, boo
 ostream::ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close ) : stream< std::ostream >( s, fd, mode, blocking, close ) {}
 iostream::iostream( const std::string& name, mode::value mode , mode::blocking_value blocking ) : stream< std::iostream >( name, mode, blocking ) {}
 
+istreams::istreams( const std::vector< std::string >& names, mode::value mode, mode::blocking_value blocking )
+    : _istream( names.empty() ? std::unique_ptr< istream >() : std::make_unique< istream >( names[0], mode, blocking ) ) // names[0] on an empty vector is undefined behaviour, hence the guard
+    , _names( names )
+    , _index( 0 )
+    , _mode( mode ), _blocking( blocking )
+{
+    if( names.empty() ) { COMMA_THROW( comma::exception, "expected at least one input stream name, got none" ); } // fail loudly rather than leave _istream null
+}
+
+bool istreams::eof() const { return _index >= _names.size(); } // true once operator++ has moved past the last name; says nothing about the state of the current stream
+
+istreams& istreams::operator++() // move on to the next name in _names and open it as the current stream
+{
+    if( _index >= _names.size() ) { return *this; } // already past the last stream: nothing to do
+    ++_index;
+    if( _index < _names.size() ) { _istream.reset(); _istream.reset( new istream( _names[_index], _mode, _blocking ) ); } // the first reset() destroys the current stream before the next one is opened
+    return *this; // when the last name has been passed, _istream still holds the last stream and eof() becomes true
+}
+
+bool istreams::read( char* buf, std::size_t size ) // read exactly size bytes into buf, moving on to the next stream on end of file; return true if all size bytes have been read
+{
+    std::size_t s = size; // number of bytes still to read
+    for( char* p = buf; s > 0 && !eof(); )
+    {
+        auto& is = *( *_istream );
+        is.read( p, s );
+        if( is.gcount() > 0 ) { s -= is.gcount(); p += is.gcount(); }
+        if( is.eof() ) { ++( *this ); } else if( !is.good() ) { COMMA_THROW( comma::exception, "failed to read from \"" << _names[_index] << "\"" ); } // a failed stream that is not at eof would never make progress: throw instead of spinning forever
+    }
+    return s == 0;
+}
+
+std::string istreams::getline() // not implemented yet
+{
+    COMMA_THROW( comma::exception, "todo, just ask" ); // always throws, there is no return statement
+}
+
+void istreams::seek( std::uint64_t offset ) // not implemented yet; qualified as a member: without istreams:: this defined an unrelated free function and left the declared istreams::seek() undefined
+{
+    COMMA_THROW( comma::exception, "todo, just ask" ); // always throws; offset is not used yet
+}
+
 } } // namespace comma { namespace io {
diff --git a/io/stream.h b/io/stream.h
index 9948e9bf9..a86ac2e58 100644
--- a/io/stream.h
+++ b/io/stream.h
@@ -1,40 +1,15 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// All rights reserved
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_IO_STREAM_H_
-#define COMMA_IO_STREAM_H_
+#pragma once
 
+#include <cstdint>
 #include <iostream>
+#include <memory>
 #include <string>
+#include <vector>
 #include <boost/function.hpp>
 #include <boost/noncopyable.hpp>
 #include "file_descriptor.h"
@@ -92,6 +67,12 @@ class stream : boost::noncopyable
         /// @return stream name
         const std::string& name() const;
 
+        /// @return stream mode
+        io::mode::value mode() const { return mode_; }
+
+        /// @return true if stream is blocking
+        bool blocking() const { return blocking_; }
+
     protected:
         stream( const std::string& name, mode::value mode, mode::blocking_value blocking );
         template < typename T >
@@ -121,6 +102,7 @@ struct istream : public stream< std::istream >
     istream( const std::string& name, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
     istream( std::istream* s, io::file_descriptor fd, mode::value mode, boost::function< void() > close );
     istream( std::istream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close );
+    static std::string usage( unsigned int indent = 0, bool verbose = false );
 };
 
 /// output stream owner
@@ -129,14 +111,43 @@ struct ostream : public stream< std::ostream >
     ostream( const std::string& name, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
     ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, boost::function< void() > close );
     ostream( std::ostream* s, io::file_descriptor fd, mode::value mode, mode::blocking_value blocking, boost::function< void() > close );
+    static std::string usage( unsigned int indent = 0, bool verbose = false );
 };
 
 /// input/output stream owner
 struct iostream : public stream< std::iostream >
 {
     iostream( const std::string& name, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking );
+    static std::string usage( unsigned int indent = 0, bool verbose = false );
 };
 
-} } // namespace comma { namespace io {
+/// convenience class: multiple input streams read one by one
+/// use case
+///     - we have log files split by size, e.g. 1MB each: 0.bin, 1.bin, 2.bin, etc
+///     - we want to read records from those files seamlessly
+/// @todo currently, we assume a record never is split across two input files
+///       support for split records: todo, just ask
+/// @todo derive from std::istream (kinda super-fiddly, forwarding lots of methods...)
+/// @todo support constructing from a directory name
+class istreams
+{
+    public:
+        // todo: istreams( const std::string& dir...
+        istreams( const std::vector< std::string >& names, mode::value mode = mode::ascii, mode::blocking_value blocking = mode::blocking ); // opens names[0]; the remaining names are opened one by one by operator++
+        static std::string usage( unsigned int indent = 0, bool verbose = false ); // usage text for command line help
+        bool eof() const; // true once all names have been passed by operator++
+        bool read( char* buf, std::size_t size ); // returns true only if all size bytes have been read; moves on to the next stream on end of file
+        std::string getline(); // todo: currently always throws
+        void seek( std::uint64_t offset ); // todo: not implemented yet
+        stream< std::istream >& operator()() { return *_istream; } // the stream currently being read
+        const stream< std::istream >& operator()() const { return *_istream; }
+        istreams& operator++(); // move on to the next name, if any
+    protected:
+        std::unique_ptr< istream > _istream; // current stream
+        std::vector< std::string > _names; // names of all streams, in reading order
+        unsigned int _index{0}; // index in _names of the current stream; equal to _names.size() at eof
+        mode::value _mode; // mode and blocking flag are kept to open the subsequent streams the same way as the first
+        mode::blocking_value _blocking;
+};
 
-#endif
+} } // namespace comma { namespace io {
diff --git a/io/terminal.cpp b/io/terminal.cpp
new file mode 100644
index 000000000..ff1a63139
--- /dev/null
+++ b/io/terminal.cpp
@@ -0,0 +1,19 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#include "terminal.h"
+
+namespace comma { namespace io { namespace terminal { namespace controls {
+
+char end::value[] = { 0x07, 0 }; // 0x07 is ascii BEL; zero-terminated so that it can be streamed as a c-string
+
+char stderr::start[] = { 0 }; // empty string: nothing is written before text going to plain stderr
+
+char stderr::end[] = { '\n', 0 }; // quick and dirty
+
+char titlebar::start[] = { 0x1b, ']', '0', ';', 0 }; // ESC ] 0 ; - presumably the xterm "set window title" (OSC 0) sequence - TODO confirm
+
+char titlebar::end[] = { 0x07, 0 }; // ascii BEL, written after the titlebar text
+
+} } } } // namespace comma { namespace io { namespace terminal { namespace controls {
diff --git a/io/terminal.h b/io/terminal.h
new file mode 100644
index 000000000..bd38d6f5f
--- /dev/null
+++ b/io/terminal.h
@@ -0,0 +1,74 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <iostream>
+
+namespace comma { namespace io { namespace terminal {
+
+namespace controls {
+
+struct end { static char value[]; }; // tag type: streaming it into terminal::ostream ends the current sequence; value is defined in terminal.cpp
+
+struct stderr { static char start[]; static char end[]; }; // quick and dirty; NOTE(review): stderr is a macro in <cstdio>, so this name only compiles where the macro expands to the plain identifier (as with glibc) - consider renaming
+
+struct titlebar { static char start[]; static char end[]; }; // control sequences written before and after titlebar text
+
+template < unsigned int Colour >
+struct coloured; // todo
+
+// todo! combining multiple controls
+
+} // namespace controls {
+
+template < typename T > // T: a controls type with static start and end members, e.g. controls::titlebar
+void write_to( const std::string& s ) { std::cerr << T::start << s << T::end; } // write s to std::cerr, wrapped in the start and end sequences of T
+
+namespace impl {
+
+template < typename S > struct traits // generic case: S is ordinary output
+{
+    template < typename T > static bool output_if_end( bool started ) { return false; } // S is not the end marker: nothing to finish
+    static void output( const S& s ) { std::cerr << s; } // write the value to std::cerr as is
+};
+
+template <> struct traits< terminal::controls::end > // specialisation for the end marker
+{
+    template < typename T > static bool output_if_end( bool started ) { if( started ) { std::cerr << T::end; } return true; } // write T::end only if a sequence has been started; always report that the end marker was seen
+    static void output( const terminal::controls::end& s ) {} // the end marker itself is never printed
+};
+
+} // namespace impl {
+
+template < typename T > // T: a controls type with static start and end members, e.g. controls::titlebar
+class ostream // writes to std::cerr, putting T::start before the first output and T::end after the last
+{
+    public:
+        ~ostream() { if( _started ) { std::cerr << T::end; _started = false; } } // finish a sequence that was started but not explicitly ended
+        // usage: os << "text" << os.end(); streaming the end marker writes T::end if a sequence has been started
+        static terminal::controls::end end() { return terminal::controls::end(); } // convenience method
+        // output s to std::cerr; T::start is written first if no sequence is in progress
+        template < typename S >
+        ostream& operator<<( const S& s )
+        {
+            if( impl::traits< S >::template output_if_end< T >( _started ) ) // true only if S is controls::end
+            {
+                _started = false; // T::end has been written by output_if_end(), if needed
+            }
+            else
+            {
+                if( !_started ) { std::cerr << T::start; _started = true; }
+                impl::traits< S >::output( s );
+            }
+            return *this;
+        }
+
+    protected:
+        bool _started{false}; // true between writing T::start and writing T::end
+};
+
+typedef ostream< controls::titlebar > titlebar_ostream;
+
+} } } // namespace comma { namespace io { namespace terminal {
diff --git a/io/test/CMakeLists.txt b/io/test/CMakeLists.txt
index eaa86c42b..bf72a07db 100644
--- a/io/test/CMakeLists.txt
+++ b/io/test/CMakeLists.txt
@@ -1,16 +1,12 @@
-SET( KIT io )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base comma_string comma_io ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} pthread rt )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# googletest unit tests for comma_io: all io/test/*test.cpp sources are built into one executable
+# note: file( GLOB ) is evaluated at configure time only; re-run cmake after adding a new *test.cpp
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/io/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_io )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} PRIVATE comma_io ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# optionally install the test executable alongside the other c++ tests
+if( INSTALL_TESTS )
+    # install( TARGETS ... ) replaces the former install( FILES ... PERMISSIONS ... ) of the built binary
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/io/test/io-cat/repeat/expected b/io/test/io-cat/repeat/expected
new file mode 100644
index 000000000..fa9664e7c
--- /dev/null
+++ b/io/test/io-cat/repeat/expected
@@ -0,0 +1,29 @@
+repeat[0]/output/line[0]="1,2,3"
+repeat[0]/output/line[1]="4,5,6"
+repeat[0]/output/line[2]="1,2,3"
+repeat[0]/output/line[3]="4,5,6"
+repeat[0]/output/line[4]="1,2,3"
+repeat[0]/output/line[5]="4,5,6"
+repeat[0]/status=0
+repeat[1]/output/line[0]="1,2,3"
+repeat[1]/output/line[1]="4,5,6"
+repeat[1]/output/line[2]="1,2,3"
+repeat[1]/output/line[3]="4,5,6"
+repeat[1]/output/line[4]="1,2,3"
+repeat[1]/output/line[5]="4,5,6"
+repeat[1]/status=0
+repeat[2]/output/line[0]="1,2,3"
+repeat[2]/output/line[1]="4,5,6"
+repeat[2]/output/line[2]="1,2,3"
+repeat[2]/output/line[3]="4,5,6"
+repeat[2]/status=0
+repeat[3]/output/line[0]="0,0,0"
+repeat[3]/output/line[1]="1,1,1"
+repeat[3]/output/line[2]="2,2,2"
+repeat[3]/output/line[3]="0,0,0"
+repeat[3]/output/line[4]="1,1,1"
+repeat[3]/output/line[5]="2,2,2"
+repeat[3]/output/line[6]="0,0,0"
+repeat[3]/output/line[7]="1,1,1"
+repeat[3]/output/line[8]="2,2,2"
+repeat[3]/status=0
diff --git a/io/test/io-cat/repeat/input b/io/test/io-cat/repeat/input
new file mode 100644
index 000000000..850130f89
--- /dev/null
+++ b/io/test/io-cat/repeat/input
@@ -0,0 +1,4 @@
+repeat[0]="( echo 1,2,3; echo 4,5,6 ) | io-cat - --repeat=3"
+repeat[1]="( echo 1,2,3; echo 4,5,6 ) | csv-to-bin 3ui | io-cat - --repeat=3 | csv-from-bin 3ui"
+repeat[2]="( echo 1,2,3; echo 4,5,6 ) | io-cat - --repeat-forever | head -n4"
+repeat[3]="( echo 0,0,0; echo 1,1,1 ) | io-cat - <( echo 2,2,2 ) --repeat=3"
diff --git a/io/test/io-cat/single_feed/test b/io/test/io-cat/single_feed/test
index 52799eab8..f08a94b25 100755
--- a/io/test/io-cat/single_feed/test
+++ b/io/test/io-cat/single_feed/test
@@ -6,6 +6,8 @@ prefix=io-cat
 declare -A pids
 declare -A files
 
+type -p netstat >/dev/null || { echo "$0: netstat not found; to install run: sudo apt install net-tools" >&2; exit 1; }
+
 function bye
 {
     trap '' INT TERM HUP  # ignore signals
diff --git a/io/test/io-publish/on-demand/input b/io/test/io-publish/on-demand/input
index fd04a154e..4fdc5e2ab 100644
--- a/io/test/io-publish/on-demand/input
+++ b/io/test/io-publish/on-demand/input
@@ -13,25 +13,32 @@ export -f exec_cmd
 
 function read_port()
 {
-    echo "test: creating reader" >&2
+    echo "test: creating reader..." >&2
     socat tcp:localhost:$port -
+    echo "test: reader exited" >&2 # socat runs in the foreground, so this line is reached only after it has exited
 }
 
 function client_cmd()
 {
     sleep 5
+    echo "test: starting client 1 of 3..." >&2
     read_port &
     first_client_pid=$!
+    echo "test: started client 1 of 3 with pid $first_client_pid" >&2
     sleep 5
+    echo "test: starting client 2 of 3..." >&2
     read_port &
     second_client_pid=$!
+    echo "test: started client 2 of 3 with pid $second_client_pid" >&2
     sleep 5
     kill_pid_and_children $first_client_pid
     sleep 5
     kill_pid_and_children $second_client_pid
     sleep 5
+    echo "test: starting client 3 of 3..." >&2
     read_port &
     third_client_pid=$!
+    echo "test: started client 3 of 3 with pid $third_client_pid" >&2
     sleep 5
     kill_pid_and_children $third_client_pid
     sleep 5
diff --git a/io/test/io-publish/stdin/input b/io/test/io-publish/stdin/input
index 34d7c54f6..9e388eec8 100644
--- a/io/test/io-publish/stdin/input
+++ b/io/test/io-publish/stdin/input
@@ -1,12 +1,12 @@
 port=42641
 
 function stdin_cmd()
-{
+{ 
     yes
 }
 export -f stdin_cmd
 
 function client_cmd()
 {
-    socat tcp:localhost:$port - | head -10 > client.out
+    socat tcp:localhost:$port - | head -n10 > client.out
 }
diff --git a/io/test/io-publish/test b/io/test/io-publish/test
index f88757263..29b6582b6 100755
--- a/io/test/io-publish/test
+++ b/io/test/io-publish/test
@@ -15,11 +15,11 @@ function kill_pid_and_children()
 {
     pid=$1
     local child_pids=$( pgrep -P $pid )
-    echo "killing children: $child_pids" >&2
-    [[ $child_pids ]] && kill $child_pids
-    echo "killing $pid" >&2
+    if [[ -n "$child_pids" ]]; then echo "killing children with pid(s): $child_pids" >&2; kill $child_pids; fi
+    echo "test: killing $pid" >&2
     kill $pid 2> /dev/null
     wait $pid
+    echo "test: killed $pid" >&2
 }
 
 [[ -d output ]] || mkdir output
@@ -28,22 +28,23 @@ cd output
 [[ $( type -t exec_cmd ) == "function" ]] && options+=" --exec exec_cmd"
 
 if [[ $( type -t stdin_cmd ) == "function" ]]; then
-    stdin_cmd | io-publish tcp:$port $options &
+    stdin_cmd | io-publish tcp:$port $options --verbose &
 else
-    io-publish tcp:$port $options &
+    io-publish tcp:$port $options --verbose &
 fi
 io_publish_pid=$!
-echo "io_publish_pid=$io_publish_pid" >&2
+echo "test: io_publish_pid: $io_publish_pid port: $port" >&2
 
 if [[ $( type -t client_cmd ) == "function" ]]; then
     sleep 1                     # allow time for io-publish to open the port
+    echo "test: running client command..." >&2
     client_cmd > /dev/null &
     client_cmd_pid=$!
-    echo "client_cmd_pid=$client_cmd_pid" >&2
+    echo "test: client_cmd_pid=$client_cmd_pid" >&2
 fi
 
-[[ $test_duration ]] || test_duration=10
-[[ $report_interval ]] || report_interval=1
+[[ -n "$test_duration" ]] || test_duration=10
+[[ -n "$report_interval" ]] || report_interval=1
 
 loops=$( echo "$test_duration / $report_interval" | bc -l | sed 's/\.[0-9]*$//' )
 
@@ -57,12 +58,11 @@ done | sed 's/,$//;s/,[^,]* <defunct>//g' | grep -v ",bash$" | uniq \
 # when logging the processes above, we filter out lines with just bash at the
 # end, as they are in transition, with their children having just died
 
-if [[ $client_cmd_pid ]]; then
-    kill_pid_and_children $client_cmd_pid
-fi
-echo "killing io-publish: $io_publish_pid" >&2
+if [[ $client_cmd_pid ]]; then kill_pid_and_children $client_cmd_pid; fi
+echo "test: killing io-publish: $io_publish_pid" >&2
 kill_pid_and_children $io_publish_pid
 
 if [[ -f client.out ]]; then
+    echo "test: outputting $( realpath client.out )" >&2
     cat client.out | name-value-from-csv line --prefix output -n -d @
 fi
diff --git a/io/test/io-tee/comma_tee_function/expected b/io/test/io-tee/comma_tee_function/expected
index 9dfe99951..59c671aae 100644
--- a/io/test/io-tee/comma_tee_function/expected
+++ b/io/test/io-tee/comma_tee_function/expected
@@ -20,9 +20,9 @@ pipeline/stdout/matches="true"
 
 # commands (with quotes transformed to strings)
 
-basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > out(SQUOTE)"
-function_call_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > out(SQUOTE)"
-unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > out(SQUOTE)"
-unbuffered_fn_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > out(SQUOTE)"
-pipeline/command="bash -c (SQUOTE)grep (SQUOTE)\(SQUOTE)(SQUOTE)^t(SQUOTE)\(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > out(SQUOTE)"
+basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+function_call_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+unbuffered_fn_test/command="bash -c (SQUOTE)example_function (DQUOTE)two (DQUOTE) (DQUOTE)one(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+pipeline/command="bash -c (SQUOTE)grep (SQUOTE)(BSLASH)(SQUOTE)(SQUOTE)^t(SQUOTE)(BSLASH)(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
 
diff --git a/io/test/io-tee/comma_tee_function/test b/io/test/io-tee/comma_tee_function/test
index 510f80da4..954ac65c1 100755
--- a/io/test/io-tee/comma_tee_function/test
+++ b/io/test/io-tee/comma_tee_function/test
@@ -41,7 +41,7 @@ function run_test()
     local -r expected_file="$test_name.expected"
     if [[ -z "$expected" ]]; then > $expected_file; else echo -e "$expected" > $expected_file; fi
     echo "test: $test_name: command is: $@" >&2
-    echo "$test_name/command=\"$( io-tee --dry $options out -- "$@" | sed 's/"/(DQUOTE)/g'"; s/'/(SQUOTE)/g" )\""
+    echo "$test_name/command=\"$( io-tee --dry $options out -- "$@" | sed -e 's/"/(DQUOTE)/g' -e "s/'/(SQUOTE)/g" -e 's/\\/(BSLASH)/g' )\""
     cat $input | comma_tee_function $options $tee_file $dashdash "$@" > $stdout_file
     if [[ $? != 0 ]]; then
         echo "test: io-tee call failed" >&2
diff --git a/io/test/io-tee/simple/expected b/io/test/io-tee/simple/expected
index 6b47dcb31..6e9d6d841 100644
--- a/io/test/io-tee/simple/expected
+++ b/io/test/io-tee/simple/expected
@@ -12,7 +12,7 @@ pipeline/stdout/matches="true"
 
 # commands (with quotes transformed to strings)
 
-basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > out(SQUOTE)"
-unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > out(SQUOTE)"
-pipeline/command="bash -c (SQUOTE)grep (SQUOTE)\(SQUOTE)(SQUOTE)^t(SQUOTE)\(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > out(SQUOTE)"
+basic_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+unbuffered_test/command="bash -c (SQUOTE)grep (DQUOTE)one two(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
+pipeline/command="bash -c (SQUOTE)grep (SQUOTE)(BSLASH)(SQUOTE)(SQUOTE)^t(SQUOTE)(BSLASH)(SQUOTE)(SQUOTE) | grep (DQUOTE)o$(DQUOTE) > (DQUOTE)out(DQUOTE)(SQUOTE)"
 
diff --git a/io/test/io-tee/simple/test b/io/test/io-tee/simple/test
index 21d6e0513..2b1cadefe 100755
--- a/io/test/io-tee/simple/test
+++ b/io/test/io-tee/simple/test
@@ -41,7 +41,7 @@ function run_test()
     local -r expected_file="$test_name.expected"
     if [[ -z "$expected" ]]; then > $expected_file; else echo -e "$expected" > $expected_file; fi
     echo "test: $test_name: command is: $@" >&2
-    echo "$test_name/command=\"$( io-tee --dry $options out -- "$@" | sed 's/"/(DQUOTE)/g'"; s/'/(SQUOTE)/g" )\""
+    echo "$test_name/command=\"$( io-tee --dry $options out -- "$@" | sed -e 's/"/(DQUOTE)/g' -e "s/'/(SQUOTE)/g" -e 's/\\/(BSLASH)/g' )\""
     cat $input | io-tee $options $tee_file $dashdash "$@" > $stdout_file
     if [[ $? != 0 ]]; then
         echo "test: io-tee call failed" >&2
diff --git a/io/test/io-topics/commands/substitution/config.json b/io/test/io-topics/commands/substitution/config.json
new file mode 100644
index 000000000..106acde84
--- /dev/null
+++ b/io/test/io-topics/commands/substitution/config.json
@@ -0,0 +1,7 @@
+{
+    "topic1":
+    {
+        "command": "echo command: echo ${log_dir} ${my_var} ${another_var}",
+        "on_exit": "echo on_exit: echo ${log_dir}"
+    }
+}
diff --git a/io/test/io-topics/commands/substitution/expected b/io/test/io-topics/commands/substitution/expected
new file mode 100644
index 000000000..d80b50e68
--- /dev/null
+++ b/io/test/io-topics/commands/substitution/expected
@@ -0,0 +1,9 @@
+log/dir/output/line[0]="command: echo my-dir"
+log/dir/output/line[1]="on_exit: echo my-dir"
+log/dir/status=0
+log/log_dir/output/line[0]="command: echo my-log-dir"
+log/log_dir/output/line[1]="on_exit: echo my-log-dir"
+log/log_dir/status=0
+log/evn/output/line[0]="command: echo my-dir hello world"
+log/evn/output/line[1]="on_exit: echo my-dir"
+log/evn/status=0
diff --git a/io/test/io-topics/commands/substitution/input b/io/test/io-topics/commands/substitution/input
new file mode 100644
index 000000000..d48192f35
--- /dev/null
+++ b/io/test/io-topics/commands/substitution/input
@@ -0,0 +1,3 @@
+log/dir="io-topics log --config config.json --dir my-dir --verbose"
+log/log_dir="io-topics log --config config.json --log-dir my-log-dir --verbose"
+log/evn="io-topics log --config config.json --dir my-dir --env 'my_var=hello;another_var=world' --verbose"
diff --git a/io/test/io-topics/commands/test b/io/test/io-topics/commands/test
new file mode 100755
index 000000000..152895e63
--- /dev/null
+++ b/io/test/io-topics/commands/test
@@ -0,0 +1,5 @@
+#!/bin/bash
+
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands
diff --git a/io/test/stream_test.cpp b/io/test/stream_test.cpp
index 388702229..30adc818e 100644
--- a/io/test/stream_test.cpp
+++ b/io/test/stream_test.cpp
@@ -1,46 +1,21 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <cstdio>
 #include <fstream>
 #include <gtest/gtest.h>
+#include <boost/asio/io_service.hpp>
 #include <boost/asio/ip/tcp.hpp>
 #include <boost/asio/local/stream_protocol.hpp>
-#include <boost/filesystem/operations.hpp>
+#include "../impl/filesystem.h"
+#include "../load.h" // just to make sure it compiles
 #include "../select.h"
 #include "../stream.h"
 
 TEST( io, file_stream )
 {
     {
-        boost::filesystem::remove( "./test.pipe" );
-        boost::filesystem::remove( "./test.file" );
+        comma::filesystem::remove( "./test.pipe" );
+        comma::filesystem::remove( "./test.file" );
         comma::io::ostream ostream( "./test.file" );
         comma::io::istream istream( "./test.file" );
         std::string line;
@@ -50,19 +25,108 @@ TEST( io, file_stream )
         EXPECT_EQ( line, "hello, world" );
         ostream.close();
         istream.close();
-        boost::filesystem::remove( "./test.file" );
+        comma::filesystem::remove( "./test.file" );
     }
     // todo: more testing?
-    system( "mkfifo test.pipe" );
-    EXPECT_TRUE( boost::filesystem::exists( "./test.pipe" ) );
-    EXPECT_TRUE( !boost::filesystem::is_regular_file( "./test.pipe" ) );
+    EXPECT_EQ( system( "mkfifo test.pipe" ), 0 );
+    EXPECT_TRUE( comma::filesystem::exists( "./test.pipe" ) );
+    EXPECT_TRUE( !comma::filesystem::is_regular_file( "./test.pipe" ) );
     EXPECT_TRUE( ::open( "./test.pipe", O_RDONLY | O_NONBLOCK ) > 0 );
     comma::io::ostream os( "./test.pipe" );
     EXPECT_TRUE( os() != NULL );
     EXPECT_TRUE( os->good() );
-    system( "rm ./test.pipe" );
+    EXPECT_EQ( system( "rm ./test.pipe" ), 0 );
 }
 
+TEST(io, istreams) { // comma::io::istreams: fixed-size reads from one file and across a list of files
+    std::vector<std::string> files = { "./file1.txt" }; // created in the current directory, removed at the end of the test
+
+    // --- single file ---
+    {
+        std::ofstream os1(files[0]);
+        os1 << "abc";
+        os1.close();
+
+        comma::io::istreams single(files);
+
+        char buf1[4] = {0};
+
+        // partial read
+        bool ok = single.read(buf1, 2);
+        EXPECT_TRUE(ok);
+        EXPECT_EQ(buf1[0], 'a');
+        EXPECT_EQ(buf1[1], 'b');
+        EXPECT_FALSE(single.eof()); // not at EOF yet
+
+        // read the remainder
+        ok = single.read(buf1 + 2, 1);
+        EXPECT_TRUE(ok);
+        EXPECT_EQ(buf1[2], 'c');
+        EXPECT_FALSE(single.eof()); // EOF not flagged until next attempt
+
+        // attempt to read past EOF
+        ok = single.read(buf1, 1);
+        EXPECT_FALSE(ok);
+        EXPECT_TRUE(single.eof());
+
+        // edge case: zero-size read should succeed and not change EOF
+        ok = single.read(buf1, 0);
+        EXPECT_TRUE(ok);
+        EXPECT_TRUE(single.eof());
+    }
+
+    // --- multiple files (file1.txt written in the previous section is reused) ---
+    {
+        files.emplace_back("./file2.txt");
+        std::ofstream os2(files[1]);
+        os2 << "def";
+        os2.close();
+
+        files.emplace_back("./file3.txt");
+        std::ofstream os3(files[2]);
+        os3 << "ghi";
+        os3.close();
+
+        comma::io::istreams multi(files);
+
+        char buf2[10] = {0};
+
+        // read the first file in full (3 of its 3 bytes)
+        bool ok = multi.read(buf2, 3);
+        EXPECT_TRUE(ok);
+        EXPECT_EQ(buf2[0], 'a');
+        EXPECT_EQ(buf2[1], 'b');
+        EXPECT_EQ(buf2[2], 'c');
+        EXPECT_FALSE(multi.eof());
+
+        // read across files: all of file 2 and the first two bytes of file 3
+        ok = multi.read(buf2 + 3, 5);
+        EXPECT_TRUE(ok);
+        EXPECT_EQ(buf2[3], 'd');
+        EXPECT_EQ(buf2[4], 'e');
+        EXPECT_EQ(buf2[5], 'f');
+        EXPECT_EQ(buf2[6], 'g');
+        EXPECT_EQ(buf2[7], 'h');
+        EXPECT_FALSE(multi.eof());
+
+        // read remainder, but request too many
+        ok = multi.read(buf2 + 8, 3); // only 'i' available
+        EXPECT_FALSE(ok);             // not enough to fill request
+        EXPECT_EQ(buf2[8], 'i');
+        EXPECT_EQ(buf2[9], '\0');     // untouched
+        EXPECT_TRUE(multi.eof());
+
+        // edge case: further reads must stay at EOF
+        ok = multi.read(buf2, 1);
+        EXPECT_FALSE(ok);
+        EXPECT_TRUE(multi.eof());
+    }
+
+    // cleanup
+    for (const auto& f : files) { comma::filesystem::remove(f); }
+}
+
+
 TEST( io, std_stream )
 {
     comma::io::istream istream( "-" );
@@ -115,7 +179,7 @@ TEST( io, local_stream )
 {
     #ifndef WIN32
     {
-        boost::filesystem::remove( "./test.localsocket" );
+        comma::filesystem::remove( "./test.localsocket" );
         boost::asio::local::stream_protocol::endpoint endpoint( "test.localsocket" );
         EXPECT_TRUE( !boost::asio::local::stream_protocol::iostream( endpoint ) );
         boost::asio::io_service service;
@@ -127,17 +191,17 @@ TEST( io, local_stream )
         ostream.close();
         acceptor.close();
         EXPECT_TRUE( !boost::asio::local::stream_protocol::iostream( endpoint ) );
-        EXPECT_TRUE( !boost::filesystem::is_regular_file( "./test.localsocket" ) );
-        boost::filesystem::remove( "./test.localsocket" );
+        EXPECT_TRUE( !comma::filesystem::is_regular_file( "./test.localsocket" ) );
+        comma::filesystem::remove( "./test.localsocket" );
     }
     {
-        boost::filesystem::remove( "./test.file" );
+        comma::filesystem::remove( "./test.file" );
         comma::io::ostream ostream( "./test.file" );
         ostream.close();
         boost::asio::io_service service;
         boost::asio::local::stream_protocol::endpoint endpoint( "test.file" );
         try { boost::asio::local::stream_protocol::acceptor acceptor( service, endpoint ); EXPECT_TRUE( false ); } catch( ... ) {}
-        boost::filesystem::remove( "./test.file" );
+        comma::filesystem::remove( "./test.file" );
     }
     #endif
 }
@@ -146,4 +210,5 @@ int main( int argc, char* argv[] )
 {
     ::testing::InitGoogleTest(&argc, argv);
     return RUN_ALL_TESTS();
-}
\ No newline at end of file
+}
+
diff --git a/io/test/test b/io/test/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/io/test/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands
diff --git a/io/traits.h b/io/traits.h
new file mode 100644
index 000000000..40d92a7f9
--- /dev/null
+++ b/io/traits.h
@@ -0,0 +1,28 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include "../visiting/traits.h"
+#include "serial.h"
+
+namespace comma { namespace visiting {
+/// visiting traits for serial port properties: each overload presents the fields name and baud_rate to the visitor; the key argument is unused
+template <> struct traits< comma::io::serial::port::properties >
+{
+    template< typename K, typename V > static void visit( const K&, comma::io::serial::port::properties& t, V& v )
+    {
+        v.apply( "name", t.name );
+        v.apply( "baud_rate", t.baud_rate );
+    }
+    /// overload for const properties, applying the same two fields
+    template< typename K, typename V > static void visit( const K&, const comma::io::serial::port::properties& t, V& v )
+    {
+        v.apply( "name", t.name );
+        v.apply( "baud_rate", t.baud_rate );
+    }
+};
+
+} } // namespace comma { namespace visiting { 
diff --git a/math/compare.h b/math/compare.h
index b55b62600..d87951abb 100644
--- a/math/compare.h
+++ b/math/compare.h
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
diff --git a/math/exponential_moving_average.h b/math/exponential_moving_average.h
new file mode 100644
index 000000000..c38792a54
--- /dev/null
+++ b/math/exponential_moving_average.h
@@ -0,0 +1,55 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include "../base/exception.h"
+#include "../base/none.h"
+#include "../base/types.h"
+
+namespace comma { namespace math {
+/// exponential moving average over samples of type T, fed one at a time with operator+=
+template < typename T >
+class exponential_moving_average
+{
+    public:
+        typedef T value_type;
+        /// @param alpha weight given to each new sample once initial_count samples have been added
+        exponential_moving_average( double alpha = 0.5, comma::uint64 initial_count = 1 );
+        /// add a sample; it is converted to T with T( sample ) before being used
+        template < typename S >
+        exponential_moving_average& operator+=( const S& lhs );
+        /// @return current average; raises comma::exception through COMMA_THROW if no sample has been added yet
+        const T& operator()() const { if( _count > 0 ) { return _value; } COMMA_THROW( comma::exception, "no values provided yet" ); }
+        /// @return number of samples added so far
+        comma::uint64 count() const { return _count; }
+
+    private:
+        double _alpha{0.5}; // weight of a new sample in the exponential update
+        comma::uint64 _initial_count{1}; // while fewer samples than this have been added, a plain running mean is used instead
+        comma::uint64 _count{0}; // number of samples added so far
+        T _value; // current average; read only when _count > 0
+};
+/// store the weight alpha and the warm-up sample count; neither value is validated here
+template < typename T >
+inline exponential_moving_average< T >::exponential_moving_average( double alpha, comma::uint64 initial_count )
+    : _alpha( alpha )
+    , _initial_count( initial_count )
+{
+}
+/// add sample t: the first sample initialises the average, samples up to initial_count extend a running mean, later ones are blended in with weight alpha
+// todo! better casting, otherwise it does not work well on integral-like values (e.g. integers or boost::posix_time::time_duration)
+template < typename T >
+template < typename S >
+inline exponential_moving_average< T >& exponential_moving_average< T >::operator+=( const S& t )
+{
+    if( _count == 0 ) { _value = T( t ); } // first sample becomes the average as is
+    else if( _count < _initial_count ) { _value = ( _value * _count + T( t ) ) * 1. / ( _count + 1 ); } // warm-up: arithmetic mean of the _count + 1 samples seen so far
+    else { _value = _value * ( 1. - _alpha ) + T( t ) * _alpha; } // exponential update: old * ( 1 - alpha ) + sample * alpha
+    ++_count;
+    return *this;
+}
+
+} } // namespace comma { namespace math {
diff --git a/math/interval.h b/math/interval.h
index 23f491601..5fbec8d23 100644
--- a/math/interval.h
+++ b/math/interval.h
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
diff --git a/math/test/CMakeLists.txt b/math/test/CMakeLists.txt
index 4eed24bae..96c00afbc 100644
--- a/math/test/CMakeLists.txt
+++ b/math/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT math )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+set( KIT math ) # kit whose unit tests are built here
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} ) # single name shared by the executable target, the ctest entry and the install rule
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_base ${GTEST_BOTH_LIBRARIES} pthread )
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin ) # COMMAND names the executable target, so ctest runs the built binary
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+    #INSTALL (
+    #    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
+    #    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
+    #    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
+endif( INSTALL_TESTS )
diff --git a/name_value/CMakeLists.txt b/name_value/CMakeLists.txt
index b1b30b945..c61830fed 100644
--- a/name_value/CMakeLists.txt
+++ b/name_value/CMakeLists.txt
@@ -7,12 +7,20 @@ FILE( GLOB impl_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/impl/*.h )
 SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} ${impl_includes} )
 #ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} ${impl_includes} comma_application comma_string comma_xpath )
 
+if( comma_BUILD_NAME_VALUE_YAML ) # optional yaml support: adds a preprocessor definition and one extra source file
+    # find_package( yaml REQUIRED ) # todo
+    set( CMAKE_CXX_FLAGS "-Dcomma_BUILD_NAME_VALUE_YAML ${CMAKE_CXX_FLAGS}" ) # todo? move to the main CMakeLists.txt?
+    list( APPEND source "${SOURCE_CODE_BASE_DIR}/${PROJECT}/impl/yaml.cpp" ) # list( APPEND ) leaves no empty element if source is empty
+endif( comma_BUILD_NAME_VALUE_YAML )
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
 INSTALL( FILES ${impl_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/impl )
 
 ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
 SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
-TARGET_LINK_LIBRARIES( ${TARGET_NAME} comma_application comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} )
+target_link_libraries( ${TARGET_NAME} comma_string comma_xpath ${comma_ALL_EXTERNAL_LIBRARIES} ) # comma_application
+if( comma_BUILD_NAME_VALUE_YAML )
+    target_link_libraries( ${TARGET_NAME} yaml )
+endif( comma_BUILD_NAME_VALUE_YAML )
 INSTALL(
     TARGETS ${TARGET_NAME}
     RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
diff --git a/name_value/applications/CMakeLists.txt b/name_value/applications/CMakeLists.txt
index 48ec29ad5..76611190c 100644
--- a/name_value/applications/CMakeLists.txt
+++ b/name_value/applications/CMakeLists.txt
@@ -12,16 +12,28 @@ TARGET_LINK_LIBRARIES( name-value-get comma_application comma_string comma_xpath
 TARGET_LINK_LIBRARIES( name-value-eval-preparse comma_application comma_name_value )
 TARGET_LINK_LIBRARIES( name-value-permute comma_application comma_string comma_xpath comma_name_value )
 
-INSTALL( TARGETS name-value-convert name-value-get name-value-eval-preparse name-value-permute
-         RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR}
-         COMPONENT Runtime )
+set_target_properties( name-value-convert
+                       name-value-get
+                       name-value-eval-preparse
+                       name-value-permute PROPERTIES LINK_FLAGS_RELEASE -s ) # same release link flag on all four tools
 
-install( PROGRAMS name-value-eval name-value-calc name-value-apply DESTINATION ${comma_INSTALL_BIN_DIR} )
+INSTALL( TARGETS name-value-convert
+                 name-value-get
+                 name-value-eval-preparse
+                 name-value-permute
+                 RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
          
 add_executable( name-value-from-csv ${dir}/name-value-from-csv.cpp )
 target_link_libraries( name-value-from-csv comma_application comma_string )
+set_target_properties( name-value-from-csv PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS name-value-from-csv RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 add_executable( name-value-to-csv ${dir}/name-value-to-csv.cpp )
 target_link_libraries( name-value-to-csv comma_application comma_string )
+set_target_properties( name-value-to-csv PROPERTIES LINK_FLAGS_RELEASE -s )
 install( TARGETS name-value-to-csv RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+
+install( PROGRAMS name-value-apply DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS name-value-calc DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS name-value-eval DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS name-value-forms DESTINATION ${comma_INSTALL_BIN_DIR} )
diff --git a/name_value/applications/name-value-apply b/name_value/applications/name-value-apply
index 2b064142b..a5f540966 100755
--- a/name_value/applications/name-value-apply
+++ b/name_value/applications/name-value-apply
@@ -3,7 +3,7 @@
 
 source $( type -p comma-application-util )
 
-function say() { echo "$scriptname: $@" >&2; }
+function say() { echo "name-value-apply: $@" >&2; }
 function die() { say "$@"; exit 1; }
 function bye() { say "$@"; exit 0; }
 function mangle_options() { comma-options-to-name-value "$@" | { grep '='; :; } | comma_path_value_mangle | sed 's/^/local options_/g'; comma_status_ok; }
@@ -11,8 +11,9 @@ function mangle_options() { comma-options-to-name-value "$@" | { grep '='; :; }
 function description()
 {
     cat <<EOF
---help,-h; output instructions for using this program and exit.
---source; for each name, show the source config instead of its value.
+--help,-h; output instructions for using this program and exit
+--source; for each name, show the source config instead of its value
+--unquote-numbers,-u; unquote numbers
 EOF
 }
 
@@ -22,23 +23,26 @@ function usage()
 {
     cat >&2 <<EOF
 
-Derive a config from multiple input configs.
+take multiple path-value inputs, apply on top of each other
+    
+e.g: assume we have a default config file and then the user would like to set just some values and leave
+     the rest as default; then we simply apply the user's config on top of default as in examples below
 
-Usage:
-    $scriptname [<options>] <files...>
+usage
+    name-value-apply [<options>] <files...>
 
-Options:
+options
 $( description | sed 's/^/    /' )
 
-Example:
+example
     > ( echo a=5; echo b=7 ) > cfg1.pv; ( echo a=6; echo c=8 ) > cfg2.pv
 
-    > $scriptname cfg1.pv cfg2.pv
+    > name-value-apply cfg1.pv cfg2.pv
     a="6"
     b="7"
     c="8"
 
-    > $scriptname --source cfg*
+    > name-value-apply --source cfg*
     a="cfg2.pv"
     b="cfg1.pv"
     c="cfg2.pv"
@@ -51,23 +55,18 @@ function combine_files() { for ff in "${files[@]}"; do cat "$ff" | name-value-co
 
 function execute()
 {
-    local -r scriptname=$( basename "$0" )
-
     (( $( comma_options_has --bash-completion $@ ) )) && { bash_completion; exit 0; }
     (( $( comma_options_has --help $@ ) || $( comma_options_has -h $@ ) )) && usage
-
     local mangle_text ff
     local -a files
     mangle_text=$( description | mangle_options "$@"; comma_status_ok ) || die "Invalid arguments."; eval "$mangle_text"
     mangle_text="files=( $( description | comma-options-to-name-value "$@" | grep '^"' ) )"; eval "$mangle_text"; unset mangle_text
-
-    for ff in "${files[@]}"
-    do
-        { name-value-convert < "$ff" |
-            { [[ -z $options_source ]] &&  cat - || cut -d = -f1 |  sed "s~$~=\"$ff\"~g";}
-        }
-    done | name-value-convert --take-last
+    local unquote_numbers_option
+    (( !options_unquote_numbers )) || unquote_numbers_option="--unquote-numbers"
+    
+    for ff in "${files[@]}"; do
+        name-value-convert < "$ff" | { [[ -z $options_source ]] &&  cat - || cut -d = -f1 |  sed "s~$~=\"$ff\"~g"; }
+    done | name-value-convert --take-last $unquote_numbers_option
 }
 
 [[ $( basename $0 ) != "name-value-apply" ]] || execute "$@"
-
diff --git a/name_value/applications/name-value-calc b/name_value/applications/name-value-calc
index 638c11719..3db8ce4ab 100755
--- a/name_value/applications/name-value-calc
+++ b/name_value/applications/name-value-calc
@@ -1,51 +1,22 @@
 #!/bin/bash
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 name=$( basename $0 )
 
-source $( which comma-application-util ) || { echo "$name: cannot source 'comma-application-util'" >&2; exit 1; }
+source $( type -p comma-application-util )
 
 simple_usage()
 {
-    cat <<EOF
-Usage: $name <file1> <file2> ... [--add|--sub|--other-operations] [-h|--help]
-       ${name//?/ } [--json] [--strict] [--details] [--exclude path]
-EOF
-    if [[ $# != 0 ]]; then exit $1; fi
+    cat <<eof >&2
+Usage: name-value-calc <file1> <file2> ... [--add|--sub|--other-operations] [-h|--help] [--json] [--strict] [--details] [--exclude <path>]
+eof
 }
 
 usage()
 {
     simple_usage
-    cat >&2 <<EOF
+    cat <<eof >&2
 
 Perform simple calculations on corresponding values in multiple name=value or .json input files.
 
@@ -89,40 +60,36 @@ Notes on comparison:
 
 Examples:
 
-    $name f1 f2 f3 --add
+    name-value-calc f1 f2 f3 --add
         -- add all values in f1, f2 and f3
 
-    $name f1.json --sub f2.json --json
+    name-value-calc f1.json --sub f2.json --json
         -- subtract all values in f2.json from f1.json (output in .json format)
 
-    $name f1.json f2.json --sub --json
+    name-value-calc f1.json f2.json --sub --json
         -- same as above; placement of the operation option does not matter
 
-    v=\$( $name f1 f2 --less )
+    v=\$( name-value-calc f1 f2 --less )
         -- capture the comparison result in a variable; v is 1 if comparison is true
 
-    (( $($name f1 --less f2) == 1 )) && echo "f1 < f2" || echo "f1 is not < f2"
+    (( \$( name-value-calc f1 --less f2 ) == 1 )) && echo "f1 < f2" || echo "f1 is not < f2"
         -- compares values in f1 and f2 and reports the outcome
 
-    $name f1 f2 --sub --strict > outfile
-    (( $? == 0 )) || exit 1
+    name-value-calc f1 f2 --sub --strict > outfile
+    (( \$? == 0 )) || exit 1
         -- will fail if the first input file contains string data (operation '-' is not
            defined for strings)
 
-    $name f1 f2 --sub --strict --exclude "path/to/string" > outfile
+    name-value-calc f1 f2 --sub --strict --exclude "path/to/string" > outfile
         -- specifically exclude a specified data path from the operation, e.g., because
            the '-' operation is not defined for strings
 
-EOF
-    if [[ $# != 0 ]]; then exit $1; fi
+eof
+    exit
 }
 
-function bye()
-{
-    if [[ -z $1 ]] ; then exit 1 ; else exit $1; fi
-}
+function bye() { [[ -n "$1" ]] || exit 1; exit $1; } # exit with the given status; with no argument, exit 1
 
-# arguments are an error message to print
 function die()
 {
     echo "$name: $*" >&2
@@ -134,12 +101,7 @@ function inlist()
 {
     local value="$1"
     local list="$2"
-    local c
-    for c in $list ; do
-        if [[ "$c" == "$value" ]]; then
-            return 0
-        fi
-    done
+    for c in $list ; do [[ "$c" != "$value" ]] || return 0; done
     return 1
 }
 
@@ -156,7 +118,10 @@ function logical_op()
 function python_converter()
 {
     # todo? python2 -c "import operator...
-    python -c "import operator
+    python3 -c "
+from __future__ import division
+from __future__ import print_function
+import operator
 from sys import stdin
 filesep = '$file_separator'
 what = '$operation'
@@ -174,11 +139,12 @@ operands = {
              '==' : operator.eq,
              '<>' : operator.ne,
              '!=' : operator.ne,
-             '/'  : operator.div,
+             '/'  : operator.truediv,
+             '//' : operator.floordiv,
              '*'  : operator.mul,
            }
 
-arithmetic = [ '+', '-', '/', '*' ]
+arithmetic = [ '+', '-', '/', '//', '*' ]
 
 names = {}
 ordered_names = []
@@ -216,7 +182,7 @@ while True:
             names[n] = ( False, v )
             ordered_names.append( n )
     else:
-        if names.has_key( n ):
+        if n in names:
             try:
                 names[n] = ( True, op(names[n][1], v) )
             except TypeError:
@@ -225,7 +191,7 @@ while True:
 
 for n in ordered_names:
     v = names[n]
-    print '%s=\"%s\"' % ( n, str(output(v[0], v[1], logical)) )
+    print( '%s=\"%s\"' % ( n, str(output(v[0], v[1], logical)) ) )
 "
 }
 
@@ -237,7 +203,7 @@ function invert_grep()
     echo $?
 }
 
-if [[ $# == 0 ]]; then simple_usage 1; fi
+(( $# > 0 )) || { simple_usage; exit 1; } # arithmetic test: inside [[ ]], > compares strings, not numbers
 
 input_files=()
 operation=
@@ -249,34 +215,35 @@ debug=1
 
 while [[ $# -gt 0 ]]; do
     case "$1" in
-        -h|--help)               usage 0;;
-        --add)                   operation="+";;
-        --sub|--subtract)        operation="-";;
-        --mul|--mult|--multiply) operation="*";;
-        --div|--divide)          operation="/";;
-        --less)                  operation="<";;
-        --less-or-equal)         operation="<=";;
-        --more)                  operation=">";;
-        --more-or-equal)         operation=">=";;
-        --equal)                 operation="==";;
-        --non-equal)             operation="!=";;
-        --not-equal)             operation="!=";;
-        --json)                  json_format=1;;
-        --strict)                strict=1;;
-        --detailed)              detailed=1;;
-        --debug)                 debug=1;;
-        --no-debug)              debug=0;;
-        --exclude)               shift; if [[ $# == 0 ]] ; then echo "$name: --exclude lack argument" >&2; exit 1; fi; excluded+=( "$1" );;
-        -*)                      echo "$name: unrecognized option '$1'" >&2; exit 1;;
-        *)                       input_files+=( "$1" );;
+        -h|--help)                usage;;
+        --add)                    operation="+";;
+        --sub|--subtract)         operation="-";;
+        --mul|--mult|--multiply)  operation="*";;
+        --div|--divide|--truediv) operation="/";;
+        --floordiv)               operation="//";;
+        --less)                   operation="<";;
+        --less-or-equal)          operation="<=";;
+        --more)                   operation=">";;
+        --more-or-equal)          operation=">=";;
+        --equal)                  operation="==";;
+        --non-equal)              operation="!=";;
+        --not-equal)              operation="!=";;
+        --json)                   json_format=1;;
+        --strict)                 strict=1;;
+        --detailed)               detailed=1;;
+        --debug)                  debug=1;;
+        --no-debug)               debug=0;;
+        --exclude)                shift; if [[ $# == 0 ]] ; then echo "$name: --exclude lack argument" >&2; exit 1; fi; excluded+=( "$1" );;
+        -*)                       echo "$name: unrecognized option '$1'" >&2; exit 1;;
+        *)                        input_files+=( "$1" );;
     esac
     shift
 done
 
-binary_operands=( "-" "/" "<" "<=" ">" ">=" "==" "!=" )
+binary_operands=( "-" "/" "//" "<" "<=" ">" ">=" "==" "!=" )
 logical_operands=( "<" "<=" ">" ">=" "==" "!=" )
 
-if [[ ${#input_files[@]} == 0 ]]; then simple_usage 1; fi
+[[ ${#input_files[@]} != 0 ]] || { simple_usage; exit 1; }
 if [[ ${#input_files[@]} == 1 ]]; then echo "$name: at least two input files required" >&2; exit 1; fi
 if [[ -z "$operation" ]]; then echo "$name: operation must be specified (e.g. --subtract)" >&2; exit 1; fi
 if binary_op "$operation" && [[ ${#input_files[@]} > 2 ]]; then echo "$name: only two input files permitted with $operation operation"; exit 1; fi
diff --git a/name_value/applications/name-value-convert.cpp b/name_value/applications/name-value-convert.cpp
index 6c0ac8d18..4c80d0d1d 100644
--- a/name_value/applications/name-value-convert.cpp
+++ b/name_value/applications/name-value-convert.cpp
@@ -1,38 +1,10 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
+#include <fstream>
 #include <iostream>
-#include <boost/bind.hpp>
-#include <boost/function.hpp>
+#include <map>
 #include <boost/property_tree/info_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
 #include <boost/property_tree/json_parser.hpp>
@@ -40,10 +12,10 @@
 #include <boost/regex.hpp>
 #include <boost/version.hpp>
 #include "../../base/exception.h"
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../name_value/ptree.h"
 #include "../../name_value/serialize.h"
+#include "../../string/split.h"
 #include "../../xpath/xpath.h"
 
 static void usage( bool verbose = false )
@@ -54,31 +26,43 @@ static void usage( bool verbose = false )
     std::cerr << "usage: cat data.xml | name-value-convert [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "data options" << std::endl;
-    std::cerr << "    --from <format>: input format; if this options is omitted, input format will be guessed (only for json, xml, and path-value)" << std::endl;
-    std::cerr << "    --to <format>: output format; default path-value" << std::endl;
+    std::cerr << "    --from <format>: input format; if this option is omitted, input format will be guessed; formats: json, xml, path-value/pv" << std::endl;
+    std::cerr << "    --to <format>: output format; formats: ini, json, xml, path-value (pv), dot; default: path-value" << std::endl;
+    std::cerr << "    --path=[[<filename>:]<path>]; output data at a given path in the input" << std::endl;
+    std::cerr << "                                  multiple instances of --path supported" << std::endl;
+    std::cerr << "                                  <filename> supported only for a single --path" << std::endl;
+    std::cerr << "                                  e.g. --path path/inside/json/file" << std::endl;
+    std::cerr << "                                       --path my-config.json:path/inside/json/file" << std::endl;
+    std::cerr << "                                  regex expression support: todo" << std::endl;
+    std::cerr << "    --strict: return error if path specified in --path not found" << std::endl;
     std::cerr << std::endl;
     std::cerr << "formats" << std::endl;
-    std::cerr << "    info: info data (see boost::property_tree)" << std::endl;
-    std::cerr << "    ini: ini data" << std::endl;
-    std::cerr << "    json: json data" << std::endl;
-    std::cerr << "    xml: xml data" << std::endl;
-    std::cerr << "    path-value: path=value-style data; e.g. x/a=1,x/b=2,y=3" << std::endl;
+    std::cerr << "    dot        : as graphviz dot language, see: https://graphviz.org/doc/info/lang.html" << std::endl;
+    std::cerr << "    info       : info data (see boost::property_tree)" << std::endl;
+    std::cerr << "    ini        : ini data" << std::endl;
+    std::cerr << "    json       : json data" << std::endl;
+    std::cerr << "    path-value : path=value-style data; e.g. x/a=1,x/b=2,y=3" << std::endl;
+    std::cerr << "    xml        : xml data" << std::endl;
+    std::cerr << "    yaml       : implementing..." << std::endl;
     std::cerr << std::endl;
-    std::cerr << "name/path-value options:" << std::endl;
+    std::cerr << "name/path-value options" << std::endl;
     std::cerr << "    --equal-sign,-e=<equal sign>: default '='" << std::endl;
     std::cerr << "    --delimiter,-d=<delimiter>: default ','" << std::endl;
     std::cerr << "    --no-brackets: show indices as path elements e.g. y/0/x/z/1=\"a\"" << std::endl;
-    std::cerr << "          by default array items will be shown with index e.g. y[0]/x/z[1]=\"a\"" << std::endl;
+    std::cerr << "                   by default array items will be shown with index e.g. y[0]/x/z[1]=\"a\"" << std::endl;
+    std::cerr << "    --unquote-numbers,--unquote: unquote the numbers and booleans" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "path-value options:" << std::endl;
+    std::cerr << "path-value output options" << std::endl;
     std::cerr << "    --take-last: if paths are repeated, take last path=value" << std::endl;
     std::cerr << "    --verify-unique,--unique-input: ensure that all input paths are unique (takes precedence over --take-last)" << std::endl;
-    std::cerr << "    --unquote-numbers,--unquote: unquote the numbers and booleans" << std::endl;
     std::cerr << std::endl;
     std::cerr <<      "warning: if paths are repeated, output value selected from these inputs in not deterministic" << std::endl;
     std::cerr << std::endl;
     std::cerr << "json options" << std::endl;
     std::cerr << "    --minify: if present, output minified json" << std::endl;
+    std::cerr << "    --quote-numbers,--quote: force quoting the numbers and booleans" << std::endl;
+    std::cerr << "                             unfortunately, historically path-value and xml quote numbers by default and json unquotes numbers by default" << std::endl;
+    std::cerr << "                             this default behaviour is left unchanged to keep backward compatibility" << std::endl;
     std::cerr << std::endl;
     std::cerr << "xml options" << std::endl;
     std::cerr << "    --indented: if present, output indented xml" << std::endl;
@@ -88,24 +72,35 @@ static void usage( bool verbose = false )
     std::cerr << "    --linewise,-l: if present, treat each input line as a record" << std::endl;
     std::cerr << "                   if absent, treat all of the input as one record" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
+    std::cerr << "examples" << std::endl;
+    if( verbose )
+    {
+        std::cerr << "dot" << std::endl;
+        std::cerr << "    sudo apt install graphviz" << std::endl;
+        std::cerr << "    { echo a/b/c=hello; echo a/c/d=world; } | name-value-convert --to dot | dot -Tsvg > test.svg" << std::endl;
+        std::cerr << "    eog test.svg" << std::endl;
+    }
+    else
+    {
+        std::cerr << "    run: name-value-convert --help --verbose for more..." << std::endl;
+    }
     std::cerr << std::endl;
-    exit( 1 );
+    exit( 0 );
 }
 
 static comma::property_tree::xml_writer_settings_t xml_writer_settings;
-
 static char equal_sign;
 static char path_value_delimiter;
 static bool linewise;
 static bool minify_json;
 static bool unquote_numbers;
+static bool quote_numbers;
 typedef comma::property_tree::path_mode path_mode;
 static path_mode indices_mode = comma::property_tree::disabled;
 static bool use_index = true;
 static comma::property_tree::path_value::check_repeated_paths check_type( comma::property_tree::path_value::no_check );
 
-enum Types { ini, info, json, xml, path_value, void_t };
+enum Types { ini, info, json, xml, yaml, path_value, dot, void_t };
 
 template < Types Type > struct traits {};
 
@@ -129,19 +124,19 @@ template <> struct traits< info >
 template <> struct traits< json >
 {
     static void input( std::istream& is, boost::property_tree::ptree& ptree ) { boost::property_tree::read_json( is, ptree ); }
-    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode ) { comma::name_value::impl::write_json( os, ptree, !minify_json ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode ) { comma::name_value::impl::write_json( os, ptree, !minify_json, !quote_numbers ); }
+};
+
+template <> struct traits< yaml >
+{
+    static void input( std::istream& is, boost::property_tree::ptree& ptree ) { comma::property_tree::read_yaml( is, ptree ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode ) { comma::property_tree::write_yaml( os, ptree ); }
 };
 
 template <> struct traits< xml >
 {
-    static void input( std::istream& is, boost::property_tree::ptree& ptree ) 
-    { 
-        comma::property_tree::read_xml( is, ptree ); 
-    }
-    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode )
-    {
-        comma::property_tree::write_xml( os, ptree, xml_writer_settings);
-    }
+    static void input( std::istream& is, boost::property_tree::ptree& ptree ) { comma::property_tree::read_xml( is, ptree ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode ) { comma::property_tree::write_xml( os, ptree, xml_writer_settings ); }
 };
 
 template <> struct traits< path_value > // quick and dirty
@@ -160,6 +155,34 @@ template <> struct traits< path_value > // quick and dirty
     }
 };
 
+template <> struct traits< dot > // graphviz dot: output only; one node per path prefix, labelled with its last path element (plus the value for leaves)
+{
+    static void input( std::istream& is, boost::property_tree::ptree& ptree ) { COMMA_THROW_BRIEF( comma::exception, "--from dot: not implemented (and most likely never will)" ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const path_mode mode )
+    { 
+        const auto& pv = comma::property_tree::to_path_value( ptree, comma::xpath(), mode ); // todo: optional root
+        std::map< std::string, std::pair< std::string, std::string > > nodes; // full path -> ( label, value ); value is empty for non-leaf nodes
+        std::set< std::string > edges; // super-quick and dirty; ordered set: slower, but neater (sorted, deduplicated) output
+        os << "digraph callgraph {" << std::endl;
+        for( const auto& p: pv )
+        {
+            if( p.first.elements.empty() ) { continue; } // a value at the root has no path element to name a node after; elements[0] would be out of bounds
+            std::string q = p.first.elements[0].to_string(); // q accumulates the full path of the current node
+            nodes.insert( std::make_pair( q, std::make_pair( q, p.first.elements.size() == 1 ? p.second : std::string() ) ) );
+            for( unsigned int i = 1; i < p.first.elements.size(); ++i )
+            {
+                auto s = p.first.elements[i].to_string();
+                edges.insert( "\"" + q + "\" -> \"" + q + "/" + s + "\"" ); // edge from parent path to child path
+                q += "/" + s;
+                nodes.insert( std::make_pair( q, std::make_pair( s, i + 1 == p.first.elements.size() ? p.second : std::string() ) ) ); // only the last element carries the value
+            }
+        }
+        for( const auto& n: nodes ) { os << "    \"" << n.first << "\" [label=\"" << n.second.first << ( n.second.second.empty() ? std::string() : ( ":\n" + n.second.second ) ) << "\"]" << std::endl; }
+        for( const auto& e: edges ) { os << "    " << e << std::endl; }
+        os << "}" << std::endl;
+    }
+};
+
 void ( * input )( std::istream& is, boost::property_tree::ptree& ptree );
 void ( * output )( std::ostream& is, const boost::property_tree::ptree& ptree, const path_mode );
 
@@ -173,31 +196,57 @@ int main( int ac, char** av )
         equal_sign = options.value( "--equal-sign,-e", '=' );
         linewise = options.exists( "--linewise,-l" );
         minify_json = options.exists( "--minify" );
+        options.assert_mutually_exclusive( "--unquote-numbers,--unquote", "--quote-numbers,--quote" );
+        options.assert_mutually_exclusive( "--path", "--linewise,-l" ); // include the -l alias accepted for --linewise above
         unquote_numbers = options.exists( "--unquote-numbers,--unquote" );
+        quote_numbers = options.exists( "--quote-numbers,--quote" ) && !unquote_numbers; // todo: quick and dirty, combine logic, it sucks now that there is different logic for json and everything else
         if ( options.exists( "--take-last" ) ) check_type = comma::property_tree::path_value::take_last;
         if ( options.exists( "--verify-unique,--unique-input" ) ) check_type = comma::property_tree::path_value::unique_input;
         xml_writer_settings.indent_count = options.value( "--indent", options.exists( "--indented" ) ? 4 : 0 );
         boost::optional< char > delimiter = options.optional< char >( "--delimiter,-d" );
         path_value_delimiter = delimiter ? *delimiter : ( linewise ? ',' : '\n' );
+        auto paths = options.values< std::string >( "--path" );
+        std::string filename;
+        std::ifstream ifs;
+        if( !paths.empty() )
+        {
+            const auto& s = comma::split_tail( paths[0], 2, ':' );
+            COMMA_ASSERT_BRIEF( paths.size() == 1 || s.size() == 1, "<filename>:<path>: currently supported only for a single --path option" );
+            if( s.size() == 2 )
+            {
+                filename = s[0];
+                paths[0] = s[1];
+                ifs.open( filename );
+                COMMA_ASSERT_BRIEF( ifs.is_open(), "failed to open '" << filename << "'" );
+            }
+        }
+        std::istream& istream = filename.empty() ? static_cast< std::istream& >( std::cin ) : static_cast< std::istream& >( ifs );
+        bool strict = options.exists( "--strict" );
+        bool output_line_breaks = ( to == "path-value" || to == "pv" ) && path_value_delimiter != '\n'; // hyper-quick and dirty; "pv" is an accepted alias of "path-value"
         if( from )
         {
             if( *from == "ini" ) { input = &traits< ini >::input; }
             else if( *from == "info" ) { input = &traits< info >::input; }
             else if( *from == "json" ) { input = &traits< json >::input; }
             else if( *from == "xml" ) { input = &traits< xml >::input; }
-            else if( *from == "path-value" ) { input = &traits< path_value >::input; }
-            else { std::cerr << "name-value-convert: expected --from format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
+            else if( *from == "yaml" ) { input = &traits< yaml >::input; }
+            else if( *from == "path-value" || *from == "pv" ) { input = &traits< path_value >::input; }
+            else if( *from == "dot" ) { input = &traits< dot >::input; }
+            else { comma::say() << "expected --from format to be ini, info, json, xml, yaml, or path-value (pv), got " << *from << std::endl; return 1; }
         }
         else
         {
-            if( linewise ) {  std::cerr << "name-value-convert: if --linewise is present, --from must be given" << std::endl; return 1; }
+            if( linewise ) {  comma::say() << "if --linewise is present, --from must be given" << std::endl; return 1; }
             input = &traits< void_t >::input;
         }
         if( to == "ini" ) { output = &traits< ini >::output; }
         else if( to == "info" ) { output = &traits< info >::output; }
         else if( to == "json" ) { output = &traits< json >::output; }
+        else if( to == "yaml" ) { output = &traits< yaml >::output; }
         else if( to == "xml" ) { output = &traits< xml >::output; }
-        else { output = &traits< path_value >::output; }
+        else if( to == "path-value" || to == "pv" ) { output = &traits< path_value >::output; }
+        else if( to == "dot" ) { output = &traits< dot >::output; }
+        else { comma::say() << "expected --to format to be ini, info, json, yaml, xml, path-value (pv), or dot, got " << to << std::endl; return 1; } // report the rejected --to value; 'from' may be unset here
         if( use_index )
         {
             if( options.exists( "--no-brackets" ) ) { indices_mode = comma::property_tree::without_brackets; }
@@ -208,8 +257,8 @@ int main( int ac, char** av )
             while( std::cout.good() )
             {
                 std::string line;
-                std::getline( std::cin, line );
-                if( !std::cin.good() || std::cin.eof() ) { break; }
+                std::getline( istream, line );
+                if( !istream.good() || istream.eof() ) { break; }
                 std::istringstream iss( line );
                 boost::property_tree::ptree ptree;
                 input( iss, ptree );
@@ -237,31 +286,40 @@ int main( int ac, char** av )
         else
         {
             boost::property_tree::ptree ptree;
-            input( std::cin, ptree );
-            output( std::cout, ptree, indices_mode );
+            input( istream, ptree );
+            if( paths.empty() )
+            {
+                output( std::cout, ptree, indices_mode );
+            }
+            else
+            {
+                std::string eol;
+                for( const auto& path: paths )
+                {
+                    auto child = comma::property_tree::get_tree( ptree, path ); // paths[i] = boost::property_tree::ptree::path_type( path_strings[i], '/' )
+                    if( !child ) { if( strict ) { comma::say() << "path \"" << path << "\" not found" << std::endl; return 1; } else { continue; } }
+                    boost::optional< std::string > value = child->get_optional< std::string >( "" );
+                    std::cout << eol;
+                    if( value && !value->empty() ) // todo? output empty values?
+                    {
+                        boost::property_tree::ptree t;
+                        t.add_child( comma::split( path, '/' ).back(), boost::property_tree::ptree() ).put_value( *value ); // quick and dirty; lame...
+                        output( std::cout, t, indices_mode );
+                    }
+                    else
+                    {
+                        output( std::cout, *child, indices_mode );
+                    }
+                    if( output_line_breaks ) { eol = std::string( 1, path_value_delimiter ); } // quick and dirty
+                }
+            }
         }
         return 0;
     }
-    catch( boost::property_tree::ptree_bad_data& ex )
-    {
-        std::cerr << "name-value-convert: bad data: " << ex.what() << std::endl;
-    }
-    catch( boost::property_tree::ptree_bad_path& ex )
-    {
-        std::cerr << "name-value-convert: bad path: " << ex.what() << std::endl;
-    }
-    catch( boost::property_tree::ptree_error& ex )
-    {
-        boost::regex e( "<unspecified file>" );
-        std::cerr << "name-value-convert: parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl;
-    }
-    catch( std::exception& ex )
-    {
-        std::cerr << "name-value-convert: " << ex.what() << std::endl;
-    }
-    catch( ... )
-    {
-        std::cerr << "name-value-convert: unknown exception" << std::endl;
-    }
+    catch( boost::property_tree::ptree_bad_data& ex ) { comma::say() << "bad data: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_bad_path& ex ) { comma::say() << "bad path: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_error& ex ) { boost::regex e( "<unspecified file>" ); comma::say() << "parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl; }
+    catch( std::exception& ex ) { comma::say() << ex.what() << std::endl; }
+    catch( ... ) { comma::say() << "unknown exception" << std::endl; }
     return 1;
 }
diff --git a/name_value/applications/name-value-eval b/name_value/applications/name-value-eval
index d1eb5709d..5e190eb6b 100755
--- a/name_value/applications/name-value-eval
+++ b/name_value/applications/name-value-eval
@@ -73,7 +73,7 @@ Options:
 Examples:
 
     $name --variables=vars.pv commands.py
-    
+
     cat commands.py | $name --variables=vars.pv
 
     cat vars.pv | $name commands.py
@@ -134,7 +134,8 @@ output_vars_option=
 input=
 tmpdir="."
 # python_cmd="python2"
-python_cmd="python"
+# python_cmd="python"
+python_cmd="python3"
 
 while [[ $# -gt 0 ]]; do
     arg="${1#*=}"
@@ -191,11 +192,15 @@ else name-value-eval-preparse --assign > $tmp_vars; fi
 preparse_options=$output_vars_option
 if (( test_option )); then preparse_options+=" --test"; fi
 
-( cat "$tmp_vars";
+( echo "from __future__ import print_function" # uber quick and dirty
+  cat "$tmp_vars";
   if [[ -n "$input" ]]; then name-value-eval-preparse $preparse_options "$input"
   else name-value-eval-preparse $preparse_options; fi ) > $python_input
-  
+
 if (( debug )); then cat $python_input | sed 's/^/debug: /g' > /dev/tty; fi
+
+#cat "$python_input" > ./python_input
+
 $python_cmd $python_input 2> $err > $out
 
 exit_code=0
@@ -211,4 +216,3 @@ else
 fi
 
 exit $exit_code
-
diff --git a/name_value/applications/name-value-eval-preparse.cpp b/name_value/applications/name-value-eval-preparse.cpp
index f1f72db67..068824190 100644
--- a/name_value/applications/name-value-eval-preparse.cpp
+++ b/name_value/applications/name-value-eval-preparse.cpp
@@ -43,7 +43,7 @@
 static const char *exec_name = "";
 static std::string kwd_expect = "expect";
 
-void usage()
+void usage(bool)
 {
     std::cerr << "Usage: " << exec_name << " [-h|--help] [-a|--assign] [-t|--test] [-o|--output-variables=<file>] [-d|--demangle] [<input_file>]\n"
 "\n"
@@ -133,6 +133,7 @@ void usage()
 "    rules. Normally all variables that are assigned any value in the rules are output, but this can be\n"
 "    restricted to the variables listed in a file (one per line) using --output-variables.\n"
 "\n";
+exit( 0 );
 }
 
 // command line options
@@ -935,7 +936,7 @@ void process_test(std::vector<Token> &tokens, const std::string &original_line,
 
     std::cout << "# SRCLINE " << line_num << " " << input_line_prefix << input_line << '\n'
         << spaces(leading_spaces) << "_result_ = (" << tokens << ")\n"
-        << spaces(leading_spaces) << "if __builtin__.type(_result_) != bool: err_expr_not_bool()\n"
+        << spaces(leading_spaces) << "if builtins_module.type(_result_) != bool: err_expr_not_bool()\n"
         << spaces(leading_spaces) << "elif not _result_:\n";
 
     if (vars.size() != 0)
@@ -957,22 +958,22 @@ void process_test(std::vector<Token> &tokens, const std::string &original_line,
 
             std::cout
                 << spaces(leading_spaces)
-                << "    print '" << i->first << "/expected=" << quote(expr_str, '"') << "'\n"
+                << "    print( '" << i->first << "/expected=" << quote(expr_str, '"') << "' )\n"
                 << spaces(leading_spaces)
                 << "    sys.stdout.write('" << i->first << "/actual=\"')\n"
                 << spaces(leading_spaces)
-                << "    if __builtin__.type(" << i->second << ") == __builtin__.type({}): print dict_str(" << i->second << ")+'\"'\n"
+                << "    if builtins_module.type(" << i->second << ") == builtins_module.type({}): print( dict_str(" << i->second << ")+'\"' )\n"
                 << spaces(leading_spaces)
                 // use a Python trick to force repr() to use double quotes instead of single
                 // (for an explanation, see: http://www.gossamer-threads.com/lists/python/python/157285
                 // -- search that page for "Python delimits a string it by single quotes preferably")
-                << "    else: print repr(\"'\\0\"+str(" << i->second << "))[6:]\n";
+                << "    else: print( repr(\"'\\0\"+str(" << i->second << "))[6:] )\n";
         }
     }
     else
     {
         std::cout << spaces(leading_spaces)
-            << "    print 'false=" << quote(input_line, '\"') << "'\n";
+            << "    print( 'false=" << quote(input_line, '\"') << "' )\n";
     }
 }
 
@@ -999,7 +1000,9 @@ void process_command(const std::vector<Token> &tokens, Varmap &assigned_vars, co
 void print_header()
 {
     std::cout
-        << "import sys, re, inspect, math, __builtin__\n"
+        << "import sys, re, inspect, math\n"
+        << "if sys.version_info.major == 2: import __builtin__; builtins_module=__builtin__\n"
+        << "else: import builtins; builtins_module=builtins\n"
         << "def near(x, y, eps): return abs(x - y) <= eps\n"
         << "def near_percent(x, y, percent): return abs(x - y) <= abs(x) * percent * 0.01\n"
         << "def max_index(dict) : return max(dict.keys())\n"
@@ -1023,8 +1026,8 @@ void print_header()
         << "    res_val = math.sin(lat_delta / 2.0) * math.sin(lat_delta / 2.0) + math.cos(phi1) * math.cos(phi2) * math.sin(lon_delta / 2.0) * math.sin(lon_delta / 2.0)\n"
         << "    return 6366.70702 * 2.0 * math.atan2(math.sqrt(res_val), math.sqrt(1.0 - res_val))\n"
         << "def sphere_distance_nm(lat1, lon1, lat2, lon2): return km_to_nm(sphere_distance_km(lat1, lon1, lat2, lon2))\n"
-        << "def err_expr_not_bool(): print >> sys.stderr, 'File \"?\", line ' + str(inspect.currentframe().f_back.f_lineno) + '\\nTypeError: expected a true or false expression'\n"
-        << "def err_var_is_obj(v_name): print >> sys.stderr, 'TypeError: variable \"' + v_name + '\" is used in an expression but is an object (example: \"a/b = 3; a < 0\")'\n"
+        << "def err_expr_not_bool(): print( 'File \"?\", line ' + str(inspect.currentframe().f_back.f_lineno) + '\\nTypeError: expected a true or false expression', file = sys.stderr )\n"
+        << "def err_var_is_obj(v_name): print( 'TypeError: variable \"' + v_name + '\" is used in an expression but is an object (example: \"a/b = 3; a < 0\")', file = sys.stderr )\n"
         << "def dict_str(d): return \"<array of size \" + str(len(d.keys())) + \">\"\n";
         // note: err_expr_not_bool() imitates standard Python error printing:
         // 'File "name", line n' on one line, followed by the error message
@@ -1039,7 +1042,7 @@ void print_assigned_variables(const Varmap &assigned_vars)
     {
         // i->first is the demangled (original) name, i->second is the mangled name
         // (repr() puts single quotes around strings; replace with double quotes)
-        std::cout << "print '" << i->first << "='+repr(" << i->second << ").replace(\"'\", '\"')\n";
+        std::cout << "print( '" << i->first << "='+repr(" << i->second << ").replace(\"'\", '\"') )\n";
     }
 }
 
@@ -1123,49 +1126,32 @@ void process(const std::string &filename, const Options &opt, const std::set<std
 void read_restrict_vars(const std::string &filename, std::set<std::string> &restrict_vars)
 {
     std::ifstream file(filename.c_str());
-
-    if (!file)
-    {
-        std::cerr << exec_name << ": cannot open " << filename << '\n';
-        exit(1);
-    }
-
+    if (!file.is_open()) { std::cerr << exec_name << ": cannot open " << filename << '\n'; exit(1); }
     std::string line;
     while (std::getline(file, line))
     {
         std::string var_name = trim_spaces(line);
         if (!var_name.empty()) { restrict_vars.insert(mangle_id(var_name)); }
     }
-
-    if (restrict_vars.size() == 0)
-    {
-        std::cerr << exec_name << ": empty --output-variables file: " << filename << '\n';
-        exit(1);
-    }
+    if(restrict_vars.size() == 0) { std::cerr << exec_name << ": empty --output-variables file: " << filename << '\n'; exit(1); }
 }
 
 int main(int argc, char* argv[])
 {
     exec_name = argv[0];
-    comma::command_line_options options(argc, argv);
-    if (options.exists("-h,--help")) { usage(); return 0; }
-
-    // get flags
+    comma::command_line_options options(argc, argv, usage);
     Options opt;
     opt.assign = options.exists("-a,--assign");
     opt.test = options.exists("-t,--test");
     opt.restrict_vars = options.exists("-o,--output-variables");
     opt.command = !(opt.assign || opt.test);
     opt.demangle = options.exists("-d,--demangle");
-
     if (opt.test)
     {
         if (opt.assign) { std::cerr << exec_name << ": cannot have --assign and --test\n"; exit(1); }
         if (opt.restrict_vars) { std::cerr << exec_name << ": cannot have --output-variables and --test\n"; exit(1); }
     }
-
-    if (opt.demangle && (opt.assign || opt.test))
-    { std::cerr << exec_name << ": cannot use --demangle with --assign or --test\n"; exit(1); }
+    if (opt.demangle && (opt.assign || opt.test)) { std::cerr << exec_name << ": cannot use --demangle with --assign or --test\n"; exit(1); }
 
     // get unnamed options
     const char *valueless_options = "-a,--assign,-t,--test,-d,--demangle";
@@ -1173,21 +1159,19 @@ int main(int argc, char* argv[])
     std::vector<std::string> unnamed = options.unnamed(valueless_options, options_with_values);
     std::set<std::string> restrict_vars;
     std::string filename;
-
     for (size_t i = 0;i < unnamed.size();++i)
     {
         if (unnamed[i][0] == '-') { std::cerr << exec_name << ": unknown option \"" << unnamed[i] << "\"\n"; exit(1); }
         else if (filename.empty()) { filename = unnamed[i]; }
         else { std::cerr << exec_name << ": unexpected argument \"" << unnamed[i] << "\"\n"; exit(1); }
     }
-
+    
     if (opt.restrict_vars)
     {
         std::string restrict_filename = options.value<std::string> ("-o,--output-variables");
         if (restrict_filename.empty()) { std::cerr << exec_name << ": expected filename for --output-variables\n"; exit(1); }
         read_restrict_vars(restrict_filename, restrict_vars);
     }
-
     if (!opt.assign && !opt.demangle) { print_header(); }
     process(filename, opt, restrict_vars);
     return 0;
diff --git a/name_value/applications/name-value-forms b/name_value/applications/name-value-forms
new file mode 100755
index 000000000..cb7b645c4
--- /dev/null
+++ b/name_value/applications/name-value-forms
@@ -0,0 +1,88 @@
+#!/bin/bash
+
+# Copyright (c) 2024 Vsevolod Vlaskine
+
+type -p zenity >/dev/null || { echo "$0: please install zenity (zenity is great!): sudo apt install zenity" >&2; exit 1; } # the form itself is rendered by zenity
+source "$( type -p comma-application-util )" || { echo "$0: you need to install comma and snark to run this utility" >&2; exit 1; } # quoted: an empty lookup fails cleanly instead of calling source with no argument
+source "$( type -p comma-name-value-util )" || { echo "$0: you need to install comma and snark to run this utility" >&2; exit 1; } # same check as above; previously a missing file was not handled
+
+function prologue() # print the one-paragraph description and input syntax to stdout; not called in this file, presumably looked up by comma-application-init for --help (confirm)
+{
+    cat <<eof
+read name-value pairs on stdin, display form, output initialised
+name-value pairs to stdout
+
+usage: cat <input> | name-value-forms
+
+<input>     : <name>[=<value>]
+<value>     : [<default>][<delimiter><combo list values>]
+<delimiter> : value of --delimiter option (default: ',')
+eof
+}
+
+function epilogue() # print runnable usage examples to stdout; not called in this file, presumably looked up by comma-application-init for --help (confirm)
+{
+    cat <<eof
+examples (try them)
+    plain vanilla
+        { echo "hello"; echo "world"; } | name-value-forms
+    form title
+        { echo "hello"; echo "world"; } | name-value-forms --title "HELLO"
+    default values
+        { echo "hello"; echo "world=XXX"; } | name-value-forms
+    combo lists
+        { echo "hello"; echo "world=,a,b,c"; } | name-value-forms
+    combo lists with defaults
+        { echo "hello"; echo "world=b,a,b,c"; } | name-value-forms
+    dry run
+        { echo "hello"; echo "world"; } | name-value-forms --dry
+eof
+}
+
+function options-description() # print the option specification, one option per line; its output is fed to comma-application-init on stdin at the bottom of this script
+{
+    cat <<eof
+--delimiter=<character>; default=,; value delimiter
+--dry-run,--dry; print zenity command and exit
+--height=[<pixels>]
+--title=[<title>]
+--verbose,-v
+--width=[<pixels>]
+eof
+}
+
+function _run() # read <name>[=<value>] lines on stdin, show them as a zenity form, print name="value" lines on stdout
+{
+    local command="zenity --forms" # built up as a string and eval'ed below, hence the embedded single quotes
+    [[ -z "$options_width" ]] || command+=" --width='$options_width'" # todo? adaptive width
+    [[ -z "$options_height" ]] || command+=" --height='$options_height'" # todo? adaptive height
+    [[ -z "$options_title" ]] || command+=" --text='$options_title'"
+    local input=$( cat | grep -v '^#' ) # drop comment lines from the input
+    local label name value default_value combo_list stripped i names=() defaults=() values=()
+    function _strip() { sed -e 's#^"##' -e "s#^'##" -e 's#"$##' -e "s#'\$##"; } # todo: handle trailing whitespaces and alike
+    #local max_len=$( while IFS== read name value; do echo "${#name}"; done <<< "$input" | sort | tail -n1 )
+    while IFS== read name value; do
+        stripped="$( _strip <<< "$value" )" # remove one leading and one trailing quote, if any
+        IFS="$options_delimiter" read default_value combo_list <<< "$stripped" # first field is the default, the remainder is the combo list
+        label="$name"
+        names+=( "$name" )
+        defaults+=( "$default_value" )
+        #[[ -z "$default_value" ]] || { n=$(( max_len - ${#name} + 2 )) label+="$( printf ".%.0s" $( seq 1 $n ) )default: $default_value"; }
+        [[ -z "$default_value" ]] || { label+=" (default: $default_value)"; } # todo? zenity does not support markup for items
+        if [[ -n "$combo_list" ]]; then
+            [[ -z "$default_value" ]] || combo_list="$default_value$options_delimiter$combo_list" # default goes first in the list; honour --delimiter rather than a hard-coded comma
+            command+=" --add-combo='$label' --combo-values='${combo_list//"$options_delimiter"/|}'" # combo values are passed to zenity '|'-separated
+        else
+            command+=" --add-entry='$label'"
+        fi
+    done <<< "$input"
+    (( ! options_dry_run )) || { echo "$command"; exit; }
+    while read value; do values+=( "$value" ); done < <( eval "$command" 2> >( if (( options_verbose )); then cat; else cat >/dev/null; fi ) | tr '|' '\n' )
+    for (( i = 0; i < ${#names[@]}; ++i )); do # keeping it plain vanilla; todo? use comma utilities
+        if [[ -n "${values[$i]}" ]]; then echo "${names[$i]}=\"${values[$i]}\""; else echo "${names[$i]}=\"${defaults[$i]}\""; fi
+    done
+    comma_status_ok || die "failed"
+}
+
+comma-application-init "$@" < <( options-description )
+_run
\ No newline at end of file
diff --git a/name_value/applications/name-value-from-csv.cpp b/name_value/applications/name-value-from-csv.cpp
index a6302d60a..eddcd99cd 100644
--- a/name_value/applications/name-value-from-csv.cpp
+++ b/name_value/applications/name-value-from-csv.cpp
@@ -31,7 +31,6 @@
 
 #include <iostream>
 #include <boost/lexical_cast.hpp>
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../string/split.h"
 
@@ -82,7 +81,6 @@ static void usage( bool verbose = false )
     std::cerr << "    a[1]/foo/bar/baz[\"aa\"]/c=3" << std::endl;
     std::cerr << "    a[4]/foo/bar/baz[\"bb\"]/c=6" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
@@ -107,7 +105,7 @@ int main( int ac, char** av )
         
         if( fields.empty() )
         { 
-            const std::vector< std::string >& unnamed = options.unnamed( "--strict,--no-brackets,--output-line-number,--line-number,-n,--indices", "-.*" );
+            const std::vector< std::string >& unnamed = options.unnamed( "--strict,--no-brackets,--output-line-number,--line-number,-n,--indices,--unquote-numbers", "-.*" );
             if( unnamed.empty() || unnamed[0].empty() ) { std::cerr << "name-value-from-csv: please specify fields" << std::endl; return 1; }
             fields = unnamed[0];
         }
diff --git a/name_value/applications/name-value-get.cpp b/name_value/applications/name-value-get.cpp
index 17600b684..745992e9a 100644
--- a/name_value/applications/name-value-get.cpp
+++ b/name_value/applications/name-value-get.cpp
@@ -1,48 +1,20 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
+#include <fstream>
 #include <iostream>
-#include <boost/bind.hpp>
-#include <boost/function.hpp>
 #include <boost/property_tree/info_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/regex.hpp>
-#include "../../base/exception.h"
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
+#include "../../base/exception.h"
+#include "../../base/none.h"
 #include "../../name_value/ptree.h"
 #include "../../name_value/serialize.h"
+#include "../../string/split.h"
 #include "../../xpath/xpath.h"
 
 static const std::string regex_characters_ =  ".{}()\\*+?|^$";
@@ -53,6 +25,7 @@ static void usage( bool verbose = false )
     std::cerr << "take json, xml, or path-value formatted data on stdin and output value at given path on stdout" << std::endl;
     std::cerr << std::endl;
     std::cerr << "usage: cat data.xml | name-value-get <paths> [<options>]" << std::endl;
+    std::cerr << "       name-value-get data.xml:<paths> [<options>]" << std::endl;
     std::cerr << std::endl;
     std::cerr << "<paths>: x-path, e.g. \"command/type\" or posix regular expressions" << std::endl;
     std::cerr << "    if <paths> doesn't contain any of regex characters: \"" << regex_characters_ << "\" it will be treated as x-path" << std::endl;
@@ -72,24 +45,27 @@ static void usage( bool verbose = false )
     std::cerr << "    xml: xml data" << std::endl;
     std::cerr << "    path-value: path=value-style data; e.g. x/a=1,x/b=2,y=3" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "name/path-value options:" << std::endl;
+    std::cerr << "name/path-value options" << std::endl;
     std::cerr << "    --equal-sign,-e=<equal sign>: default '='" << std::endl;
     std::cerr << "    --delimiter,-d=<delimiter>: default ','" << std::endl;
-    std::cerr << "    --output-path: if path-value, output path (for regex)" << std::endl;
+    std::cerr << "    --minify: if present, output minified json" << std::endl;
     std::cerr << "    --no-brackets: show indices as path elements e.g. y/0/x/z/1=\"a\"" << std::endl;
-    std::cerr << "          by default array items will be shown with index e.g. y[0]/x/z[1]=\"a\"" << std::endl;
+    std::cerr << "                   by default array items will be shown with index e.g. y[0]/x/z[1]=\"a\"" << std::endl;
+    std::cerr << "    --output-path: if path-value, output path (for regex)" << std::endl;
+    std::cerr << "    --quote-numbers,--quote: force quoting the numbers and booleans" << std::endl;
+    std::cerr << "                             unfortunately, historically path-value and xml quote numbers by default and json unquotes numbers by default" << std::endl;
+    std::cerr << "                             this default behaviour is left unchanged to keep backward compatibility" << std::endl;
+    std::cerr << "    --unquote-numbers,--unquote: unquote the numbers and booleans" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "path-value options:" << std::endl;
+    std::cerr << "path-value output options" << std::endl;
     std::cerr << "    --take-last: if paths are repeated, take last path=value" << std::endl;
     std::cerr << "    --verify-unique,--unique-input: ensure that all input paths are unique (takes precedence over --take-last)" << std::endl;
-    std::cerr << "    --unquote-numbers,--unquote: unquote the numbers and booleans" << std::endl;
-    std::cerr << "warning: if paths are repeated, output value selected from these inputs in not deterministic" << std::endl;
+    std::cerr << "    warning: if paths are repeated, output value selected from these inputs is not deterministic" << std::endl;
     std::cerr << std::endl;
     std::cerr << "data flow options:" << std::endl;
     std::cerr << "    --linewise,-l: if present, treat each input line as a record" << std::endl;
     std::cerr << "                   if absent, treat all of the input as one record" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 1 );
 }
@@ -97,9 +73,11 @@ static void usage( bool verbose = false )
 static char equal_sign;
 static char path_value_delimiter;
 static bool linewise;
+static bool minify;
 static bool option_regex;
 static bool output_path;
 static bool unquote_numbers;
+static bool quote_numbers;
 typedef comma::property_tree::path_mode path_mode;
 static path_mode indices_mode = comma::property_tree::disabled;
 static comma::property_tree::path_value::check_repeated_paths check_type( comma::property_tree::path_value::no_check );
@@ -128,7 +106,7 @@ template <> struct traits< info >
 template <> struct traits< json >
 {
     static void input( std::istream& is, boost::property_tree::ptree& ptree ) { boost::property_tree::read_json( is, ptree ); }
-    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const std::string& ) { comma::name_value::impl::write_json( os, ptree ); }
+    static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const std::string& ) { comma::name_value::impl::write_json( os, ptree, minify, !quote_numbers ); }
 };
 
 template <> struct traits< xml >
@@ -147,7 +125,7 @@ template <> struct traits< path_value > // quick and dirty
         ptree = comma::property_tree::from_path_value_string( line, equal_sign, path_value_delimiter, check_type, true );
     }
     static void output( std::ostream& os, const boost::property_tree::ptree& ptree, const std::string& path )
-    { 
+    {
         static bool first = true; // todo: will not work linewise, fix
         if( !first ) { std::cout << path_value_delimiter; }
         first = false;
@@ -160,30 +138,36 @@ static std::vector< boost::property_tree::ptree::path_type > paths;
 static std::vector< boost::optional< boost::regex > > path_regex;
 static void ( * input )( std::istream& is, boost::property_tree::ptree& ptree );
 static void ( * output )( std::ostream& is, const boost::property_tree::ptree& ptree, const std::string& );
+static bool output_last_line_break = false;
 
 static void match_( std::ostream& os, const boost::property_tree::ptree& ptree )
 {
     static const boost::property_tree::ptree::path_type empty;
+    bool found = false;
     for( std::size_t i = 0; i < paths.size(); ++i )
     {
         boost::optional< const boost::property_tree::ptree& > child = comma::property_tree::get_tree(ptree, path_strings[i]);
         if( !child ) { continue; }
         boost::optional< std::string > value = child->get_optional< std::string >( empty );
-        if( value && !value->empty() )
-        { 
+        if( value && !value->empty() ) // todo! homogenise single values with path-value pairs; currently the following example will output junk: ( echo x/z=0; echo y=1 ) | name-value-get x y
+        {
+            if( found ) { os << path_value_delimiter; }
             if( output_path ) { os << path_strings[i] << equal_sign; }
-            os << *value << std::endl;
+            os << *value;
         }
         else
-        { 
+        {
             output( os, *child, path_strings[i] );
         }
+        found = true;
     }
+    if( found && output_last_line_break ) { os << std::endl; }
 }
 
-static void traverse_( std::ostream& os, const boost::property_tree::ptree& ptree, boost::property_tree::ptree::const_iterator it, comma::xpath& path )
+static bool traverse_( std::ostream& os, const boost::property_tree::ptree& ptree, boost::property_tree::ptree::const_iterator it, comma::xpath& path )
 {
     static const boost::property_tree::ptree::path_type empty;
+    static bool found = false;
     path /= it->first;
     const std::string& s = path.to_string( '/' ); // quick and dirty
     for( std::size_t i = 0; i < paths.size(); ++i ) // todo: quick and dirty: can prune much earlier, i guess...
@@ -193,38 +177,40 @@ static void traverse_( std::ostream& os, const boost::property_tree::ptree& ptre
         boost::optional< const boost::property_tree::ptree& > child = ptree.get_child_optional( path.to_string( '.' ) ); // quick and dirty, watch performance
         if( !child ) { continue; }
         boost::optional< std::string > value = child->get_optional< std::string >( empty );
-        if( value && !value->empty() )
-        { 
+        if( value && !value->empty() ) // todo! homogenise single values with path-value pairs; currently the following example will output junk: ( echo x/z=0; echo y=1 ) | name-value-get x y
+        {
+            if( found ) { os << path_value_delimiter; }
             if( output_path ) { os << s << equal_sign; }
-            os << *value << std::endl;
+            os << *value;
         }
         else
         {
             output( os, *child, s );
         }
+        found = true;
     }
-    for( boost::property_tree::ptree::const_iterator j = it->second.begin(); j != it->second.end(); ++j )
-    {
-        traverse_( os, ptree, j, path );
-    }
-    if( !(it->first.empty()) ) { path = path.head(); }
+    for( boost::property_tree::ptree::const_iterator j = it->second.begin(); j != it->second.end(); ++j ) { traverse_( os, ptree, j, path ); }
+    if( !( it->first.empty() ) ) { path = path.head(); }
+    return found; // todo! aweful!
 }
 
 void match_regex_( std::ostream& os, const boost::property_tree::ptree& ptree )
 {
+    bool found = false;
     for( boost::property_tree::ptree::const_iterator i = ptree.begin(); i != ptree.end(); ++i )
     {
         comma::xpath path;
-        traverse_( os, ptree, i, path );
+        found = traverse_( os, ptree, i, path ) || found;
     }
+    if( found && output_last_line_break ) { os << std::endl; }
 }
 
 static bool is_regex_(const std::string& s)
 {
     std::string regex_characters = regex_characters_;
-    if (option_regex) { regex_characters += "[]"; }
+    if( option_regex ) { regex_characters += "[]"; }
     for( unsigned int k = 0; k < regex_characters.size(); ++k )
-    { 
+    {
         if( s.find_first_of( regex_characters[k] ) != std::string::npos ) { return true; }
     }
     return false;
@@ -235,41 +221,45 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
-        path_strings = options.unnamed( "--linewise,-l,--output-path,--use-buffer,--regex", "--from,--to,--equal-sign,-e,--delimiter,-d" );
-        if( path_strings.empty() ) { std::cerr << std::endl << "name-value-get: xpath missing" << std::endl; usage(); }
+        path_strings = options.unnamed( "--linewise,-l,--minify,--output-path,--use-buffer,--regex,--quote-numbers,--quote,--unquote-numbers,--unquote", "-.*" );
+        if( path_strings.empty() ) { std::cerr << std::endl << "name-value-get: please specify at least one path" << std::endl; usage(); }
         path_regex.resize( path_strings.size() );
         paths.resize( path_strings.size() );
         bool has_regex = false;
         option_regex = options.exists( "--regex" );
+        std::string filename;
+        if( !option_regex ) // <filename>:<path> is parsed only when --regex is absent
+        {
+            const auto& s = comma::split_tail( path_strings[0], 2, ':' ); // a two-element result is treated as <filename>, <path> below
+            COMMA_ASSERT_BRIEF( s.size() == 1 || path_strings.size() == 1, "<filename>:<path> syntax is supported only for a single query path" ); // the former leading '!option_regex ||' was always true inside this branch, so the check never fired
+            if( s.size() == 2 ) { filename = s[0]; path_strings[0] = s[1]; }
+        }
         for( std::size_t i = 0; i < path_strings.size(); ++i )
         {
-            if ( is_regex_(path_strings[i]) )
-            {
-                path_regex[i] = boost::regex( path_strings[i], boost::regex::extended );
-                has_regex = true;
-            }
-            else
-            { 
-                paths[i] = boost::property_tree::ptree::path_type( path_strings[i], '/' ); 
-            }
+            if( is_regex_( path_strings[i] ) ) { path_regex[i] = boost::regex( path_strings[i], boost::regex::extended ); has_regex = true; }
+            else { paths[i] = boost::property_tree::ptree::path_type( path_strings[i], '/' ); }
         }
         boost::optional< std::string > from = options.optional< std::string >( "--from" );
         std::string to = options.value< std::string >( "--to", "path-value" );
         equal_sign = options.value( "--equal-sign,-e", '=' );
         linewise = options.exists( "--linewise,-l" );
+        minify = options.exists( "--minify" );
+        options.assert_mutually_exclusive( "--unquote-numbers,--unquote", "--quote-numbers,--quote" );
         unquote_numbers = options.exists( "--unquote-numbers,--unquote" );
+        quote_numbers = options.exists( "--quote-numbers,--quote" ) && !unquote_numbers; // todo: quick and dirty, combine logic, it sucks now that there is different logic for json and everything else
         if ( options.exists( "--take-last" ) ) check_type = comma::property_tree::path_value::take_last;
         if ( options.exists( "--verify-unique,--unique-input" ) ) check_type = comma::property_tree::path_value::unique_input;
         boost::optional< char > delimiter = options.optional< char >( "--delimiter,-d" );
         path_value_delimiter = delimiter ? *delimiter : ( linewise ? ',' : '\n' );
         output_path = options.exists( "--output-path" );
+        if( output_path && to != "path-value" ) { std::cerr << "name-value-get: --output-path is compatible only with --to=path-value; got: --to=" << to << std::endl; return 1; }
         if( from )
         {
             if( *from == "ini" ) { input = &traits< ini >::input; }
             else if( *from == "info" ) { input = &traits< info >::input; }
             else if( *from == "json" ) { input = &traits< json >::input; }
             else if( *from == "xml" ) { input = &traits< xml >::input; }
-            else if( *from == "path-value" ) { input = &traits< path_value >::input; }
+            else if( *from == "path-value" ) { input = &traits< path_value >::input; } // super-quick and dirty!
             else { std::cerr << "name-value-get: expected --from format to be ini, info, json, xml, or path-value, got " << *from << std::endl; return 1; }
         }
         else
@@ -281,16 +271,24 @@ int main( int ac, char** av )
         else if( to == "info" ) { output = &traits< info >::output; }
         else if( to == "json" ) { output = &traits< json >::output; }
         else if( to == "xml" ) { output = &traits< xml >::output; }
-        else if( to == "path-value" ) { output = &traits< path_value >::output; }
+        else if( to == "path-value" ) { output = &traits< path_value >::output; output_last_line_break = true; }
         else { std::cerr << "name-value-get: expected --to format to be ini, info, json, xml, or path-value, got " << to << std::endl; return 1; }
         indices_mode = options.exists( "--no-brackets" ) ? comma::property_tree::without_brackets : comma::property_tree::with_brackets;
+        //auto ifstream = comma::silent_none< std::ifstream >();
+        std::ifstream ifs;
+        if( !filename.empty() )
+        {
+            ifs.open( filename );
+            COMMA_ASSERT_BRIEF( ifs.is_open(), "failed to open '" << filename << "'" );
+        }
+        std::istream& istream = filename.empty() ? static_cast< std::istream& >( std::cin ) : static_cast< std::istream& >( ifs );
         if( linewise )
         {
             while( std::cout.good() )
             {
                 std::string line;
-                std::getline( std::cin, line );
-                if( !std::cin.good() || std::cin.eof() ) { break; }
+                std::getline( istream, line );
+                if( !istream.good() || istream.eof() ) { break; }
                 std::istringstream iss( line );
                 boost::property_tree::ptree ptree;
                 input( iss, ptree );
@@ -310,7 +308,6 @@ int main( int ac, char** av )
                         case '"' : quoted = !quoted; break;
                         case '\n': if( !quoted ) { s[i] = ' '; } break;
                     }
-
                 }
                 std::cout << s << std::endl;
             }
@@ -318,32 +315,15 @@ int main( int ac, char** av )
         else
         {
             boost::property_tree::ptree ptree;
-            input( std::cin, ptree );
+            input( istream, ptree );
             if( has_regex ) { match_regex_( std::cout, ptree ); } else { match_( std::cout, ptree ); }
         }
+        return 0;
     }
-    catch( boost::property_tree::ptree_bad_data& ex )
-    {
-        std::cerr << "name-value-convert: bad data: " << ex.what() << std::endl;
-    }
-    catch( boost::property_tree::ptree_bad_path& ex )
-    {
-        std::cerr << "name-value-convert: bad path: " << ex.what() << std::endl;
-    }
-    catch( boost::property_tree::ptree_error& ex )
-    {
-        boost::regex e( "<unspecified file>" );
-        std::cerr << "name-value-convert: parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl;
-    }
-    catch( std::exception& ex )
-    {
-        std::cerr << std::endl << "name-value-get: " << ex.what() << std::endl << std::endl;
-        return 1;
-    }
-    catch( ... )
-    {
-        std::cerr << std::endl << "name-value-get: unknown exception" << std::endl << std::endl;
-        return 1;
-    }
-    return 0;
+    catch( boost::property_tree::ptree_bad_data& ex ) { std::cerr << "name-value-get: bad data: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_bad_path& ex ) { std::cerr << "name-value-get: bad path: " << ex.what() << std::endl; }
+    catch( boost::property_tree::ptree_error& ex ) { boost::regex e( "<unspecified file>" ); std::cerr << "name-value-get: parsing error: " << boost::regex_replace( std::string( ex.what() ), e, "line" ) << std::endl; } // the "<unspecified file>" placeholder in the message is replaced with "line"
+    catch( std::exception& ex ) { std::cerr << std::endl << "name-value-get: " << ex.what() << std::endl << std::endl; }
+    catch( ... ) { std::cerr << std::endl << "name-value-get: unknown exception" << std::endl << std::endl; }
+    return 1;
 }
diff --git a/name_value/applications/name-value-permute.cpp b/name_value/applications/name-value-permute.cpp
index bd845f266..743e39e6d 100644
--- a/name_value/applications/name-value-permute.cpp
+++ b/name_value/applications/name-value-permute.cpp
@@ -31,8 +31,8 @@
 #include <fstream>
 #include <boost/lexical_cast.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
+#include <boost/math/special_functions.hpp>
 #include "../../base/exception.h"
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../string/split.h"
 
@@ -68,7 +68,6 @@ static void usage( bool verbose = false )
     std::cerr << "          string=\"a,\";b;c" << std::endl;
     std::cerr << "          unchanged=unchanged' | name-value-permute --stdout --delimiter=';'" << std::endl;
     std::cerr << std::endl;
-    std::cerr << comma::contact_info << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
diff --git a/name_value/applications/name-value-to-csv.cpp b/name_value/applications/name-value-to-csv.cpp
index b9d678e65..5133a5120 100644
--- a/name_value/applications/name-value-to-csv.cpp
+++ b/name_value/applications/name-value-to-csv.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// Copyright (c) 2019 Vsevolod Vlaskine
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2020 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
@@ -37,7 +10,8 @@
 #include <unordered_set>
 #include <boost/optional.hpp>
 #include "../../application/command_line_options.h"
-#include "../../string.h"
+#include "../../base/none.h"
+#include "../../string/string.h"
 #include "../../xpath/xpath.h"
 
 static void usage( bool )
@@ -51,13 +25,18 @@ static void usage( bool )
     std::cerr << "    --delimiter,-d=<delimiter>; default=','; csv delimiter" << std::endl;
     std::cerr << "    --equal-sign,-e=<equal_sign>; default='='; equal sign" << std::endl;
     std::cerr << "    --fields,-f=<fields>; fields to output" << std::endl;
+    std::cerr << "    --map,--dict; prefixed paths are a map, not list; expects input sorted by path" << std::endl;
+    std::cerr << "                  run example below to make sense of it" << std::endl;
     std::cerr << "    --prefix,--path,-p=[<prefix>]; optional prefix" << std::endl;
     std::cerr << "    --unindexed-fields=<fields>; if no --fields specified, output unindexed fields once, if --fields specified, append given unindexed fields to all records" << std::endl;
+    std::cerr << "    --unindexed-stream,--stream; read a stream of key-value pairs, on every input record output csv record with the field value set and other fields empty, see example below" << std::endl;
+    std::cerr << "    --unindexed-stream-update,--update; read a stream of key-value pairs, on every input record output all up-to-date values of fields present in --unindexed-fields, see example below" << std::endl;
+    std::cerr << "    --unquote; unquote string values" << std::endl;
     std::cerr << "    --unsorted; the input data is not sorted by index" << std::endl;
     std::cerr << std::endl;
     std::cerr << "examples" << std::endl;
     std::cerr << "    indexed data" << std::endl;
-    std::cerr << "        cat <<EOF | $scriptname --fields=name,value,status --prefix=my/test" << std::endl;
+    std::cerr << "        cat <<EOF | name-value-to-csv --fields=name,value,status --prefix=my/test" << std::endl;
     std::cerr << "        my/test[0]/name=a" << std::endl;
     std::cerr << "        my/test[0]/value=10" << std::endl;
     std::cerr << "        my/test[0]/status=0" << std::endl;
@@ -67,24 +46,47 @@ static void usage( bool )
     std::cerr << "        EOF" << std::endl;
     std::cerr << std::endl;
     std::cerr << "        yields:" << std::endl;
+    std::cerr << "            a,10,0" << std::endl;
+    std::cerr << "            b,20,1" << std::endl;
     std::cerr << std::endl;
-    std::cerr << "        a,10,0" << std::endl;
-    std::cerr << "        b,20,1" << std::endl;
+    std::cerr << "        cat <<EOF | name-value-to-csv --map --fields=name,value,status --prefix=my/test" << std::endl;
+    std::cerr << "        my/test/x/name=a" << std::endl;
+    std::cerr << "        my/test/x/value=10" << std::endl;
+    std::cerr << "        my/test/x/status=0" << std::endl;
+    std::cerr << "        my/test/y/name=b" << std::endl;
+    std::cerr << "        my/test/y/status=1" << std::endl;
+    std::cerr << "        EOF" << std::endl;
+    std::cerr << std::endl;
+    std::cerr << "        yields:" << std::endl;
+    std::cerr << "            x,a,10,0" << std::endl;
+    std::cerr << "            y,b,,1" << std::endl;
     std::cerr << std::endl;
     std::cerr << "    unindexed fields" << std::endl;
     std::cerr << "        todo" << std::endl;
+    std::cerr << "    unindexed fields with --unindexed-stream" << std::endl;
+    std::cerr << "        > ( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream" << std::endl;
+    std::cerr << "        1," << std::endl;
+    std::cerr << "        ,3" << std::endl;
+    std::cerr << "        2," << std::endl;
+    std::cerr << "        ,4" << std::endl;
+    std::cerr << "    unindexed fields with --unindexed-stream-update" << std::endl;
+    std::cerr << "        > ( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream-update" << std::endl;
+    std::cerr << "        1," << std::endl;
+    std::cerr << "        1,3" << std::endl;
+    std::cerr << "        2,3" << std::endl;
+    std::cerr << "        2,4" << std::endl;
     std::cerr << std::endl;
     exit( 0 );
 }
 
 typedef std::unordered_map< std::string, std::string > values_t;
 
-static std::string join( const std::vector< std::string >& fields, values_t& values, char delimiter )
+static std::string join( const std::vector< std::string >& fields, values_t& values, char delimiter, bool clear = true )
 {
     std::ostringstream oss;
     std::string comma;
     for( const auto& f: fields ) { oss << comma << values[f]; comma = delimiter; } // quick and dirty as everything else
-    values.clear();
+    if( clear ) { values.clear(); }
     return oss.str();
 }
 
@@ -93,10 +95,13 @@ int main( int ac, char** av )
     try
     {
         comma::command_line_options options( ac, av, usage );
+        options.assert_mutually_exclusive( "--fields", "--unindexed-stream,--stream,--unindexed-stream-update,--update" );
         std::string fs = options.value< std::string >( "--fields,-f", "" );
         std::vector< std::string > fields = comma::split( fs, ',' );
         std::vector< std::string > unindexed_fields;
         std::string ufs = options.value< std::string >( "--unindexed-fields", "" );
+        bool unindexed_stream_update = options.exists( "--unindexed-stream-update,--update" );
+        bool unindexed_stream = options.exists( "--unindexed-stream,--stream" ) || unindexed_stream_update;
         std::unordered_set< std::string > unindexed_fields_set;
         if( !ufs.empty() )
         { 
@@ -106,43 +111,66 @@ int main( int ac, char** av )
         if( fields[0].empty() && unindexed_fields.empty() ) { std::cerr << "name-value-to-csv: please specify --fields or --unindexed-fields" << std::endl; return 1; }
         bool unindexed = fields[0].empty();
         values_t unindexed_values;
-        options.assert_mutually_exclusive( "--unsorted", "--unindexed,--no-index" );
-        options.assert_mutually_exclusive( "--unindexed,--no-index", "--unindexed-fields" );
+        bool unquote = options.exists( "--unquote" );
         bool unsorted = options.exists( "--unsorted" );
         char delimiter = options.value( "--delimiter,-d", ',' );
         char equal_sign = options.value( "--equal-sign,-e", '=' );
         std::string prefix = options.value< std::string >( "--prefix,--path,-p", "" );
         values_t values; // quick and dirty; watch performance?
         std::map< unsigned int, values_t > map;
-        boost::optional< unsigned int > index;
+        boost::optional< unsigned int > index{ comma::silent_none< unsigned int >() };
+        std::string key;
+        bool is_map = options.exists( "--dict,--map" );
+        if( is_map && unsorted ) { comma::say() << "combination of --map and --unsorted: todo, just ask" << std::endl; return 1; }
+        std::string::size_type e = std::string::npos;
+        auto value = [&]( const std::string& s ) { const std::string& t = s.substr( e + 1 ); return unquote && t.size() >= 2 ? comma::strip( t, "\"" ) : t; };
         while( std::cin.good() && !std::cin.eof() )
         {
             std::string s;
             std::getline( std::cin, s );
             if( comma::strip( s, " \t" ).empty() || comma::strip( s, " \t" )[0] == '#' ) { continue; }
-            auto e = s.find_first_of( equal_sign ); // todo: use boost::spirit
+            e = s.find_first_of( equal_sign ); // todo: use boost::spirit
             if( e == std::string::npos ) { std::cerr << "name-value-to-csv: expected path-value pair; got: '" << s << "'" << std::endl; return 1; }
             std::string name = s.substr( 0, e );
-            if( unindexed_fields_set.find( name ) != unindexed_fields_set.end() ) { unindexed_values[name] = s.substr( e + 1 ); continue; }
+            if( unindexed_fields_set.find( name ) != unindexed_fields_set.end() )
+            {
+                unindexed_values[name] = value( s );
+                if( unindexed_stream ) { std::cout << join( unindexed_fields, unindexed_values, delimiter, !unindexed_stream_update ) << std::endl; }
+                continue;
+            }
             if( name.substr( 0, prefix.size() ) != prefix ) { continue; }
             if( unindexed )
             {
-                if( prefix.empty() ) { values[name] = s.substr( e + 1 ); }
-                else if( name[ prefix.size() ] == '/' ) { values[ name.substr( prefix.size() + 1 ) ] = s.substr( e + 1 ); }
+                if( prefix.empty() ) { values[name] = value( s ); }
+                else if( name[ prefix.size() ] == '/' ) { values[ name.substr( prefix.size() + 1 ) ] = value( s ); }
                 continue;
             }
-            if( name[prefix.size()] != '[' ) { continue; }
-            auto b = s.find_first_of( ']', prefix.size() );
-            if( b == std::string::npos ) { std::cerr << "name-value-to-csv: expected path-value pair with valid indices; got: '" << s << "'" << std::endl; return 1; }
-            if( s[ b + 1 ] != '/' ) { continue; }
-            unsigned int current_index = boost::lexical_cast< unsigned int >( name.substr( prefix.size() + 1, b - prefix.size() - 1 ) );
-            if( unsorted || !unindexed_fields.empty() ) { map[current_index][name.substr( b + 2 )] = s.substr( e + 1 ); continue; }
-            if( index && current_index < *index ) { std::cerr << "name-value-to-csv: expected sorted index, got index " << current_index << " after " << *index << " in line: '" << comma::strip( s ) << "'" << std::endl; return 1; }
-            if( index && current_index > *index ) { std::cout << join( fields, values, delimiter ) << std::endl; }
-            values[name.substr( b + 2 )] = s.substr( e + 1 );
-            index = current_index;
+            if( is_map )
+            {
+                if( name[prefix.size()] != '/' ) { continue; }
+                auto b = s.find_first_of( '/', prefix.size() + 1 );
+                if( b == std::string::npos ) { std::cerr << "name-value-to-csv: with prefix \"" << prefix << "\" expected path-value pair with valid keys; got: '" << s << "'" << std::endl; return 1; }
+                std::string current_key = name.substr( prefix.size() + 1, b - prefix.size() - 1 );
+                if( unsorted ) {} // todo
+                if( !key.empty() && current_key != key ) { std::cout << key << delimiter << join( fields, values, delimiter ) << std::endl; }
+                values[name.substr( b + 1 )] = value( s );
+                key = current_key;
+            }
+            else
+            {
+                if( name[prefix.size()] != '[' ) { continue; }
+                auto b = s.find_first_of( ']', prefix.size() );
+                if( b == std::string::npos ) { std::cerr << "name-value-to-csv: with prefix \"" << prefix << "\" expected path-value pair with valid indices; got: '" << s << "'" << std::endl; return 1; }
+                if( s[ b + 1 ] != '/' ) { continue; }
+                unsigned int current_index = boost::lexical_cast< unsigned int >( name.substr( prefix.size() + 1, b - prefix.size() - 1 ) );
+                if( unsorted || !unindexed_fields.empty() ) { map[current_index][name.substr( b + 2 )] = value( s ); continue; }
+                if( index && current_index < *index ) { std::cerr << "name-value-to-csv: expected sorted index, got index " << current_index << " after " << *index << " in line: '" << comma::strip( s ) << "'" << std::endl; return 1; }
+                if( index && current_index > *index ) { std::cout << join( fields, values, delimiter ) << std::endl; }
+                values[name.substr( b + 2 )] = value( s );
+                index = current_index;
+            }
         }
-        if( unindexed )
+        if( unindexed && !unindexed_stream )
         { 
             std::cout << join( unindexed_fields, unindexed_values, delimiter ) << std::endl;
         }
@@ -161,6 +189,10 @@ int main( int ac, char** av )
         {
             std::cout << join( fields, values, delimiter ) << std::endl;
         }
+        else if( is_map && !key.empty() )
+        {
+            std::cout << key << delimiter << join( fields, values, delimiter ) << std::endl;
+        }
         return 0;
     }
     catch( std::exception& ex ) { std::cerr << "name-value-to-csv: " << ex.what() << std::endl; }
diff --git a/name_value/examples/name-value-forms/menu.json b/name_value/examples/name-value-forms/menu.json
new file mode 100644
index 000000000..5263bcc7b
--- /dev/null
+++ b/name_value/examples/name-value-forms/menu.json
@@ -0,0 +1,20 @@
+{
+    "breakfast":
+    {
+        "number_of_people": 1,
+        "food": "toast,egg,poached egg,poached rhino",
+        "drink": "coffee,tea"
+    },
+    "lunch":
+    {
+        "number_of_people": 20,
+        "food": "",
+        "drink": "water,beer"
+    },
+    "dinner":
+    {
+        "number_of_people": 2,
+        "food": "spam,spam,spam,lovely spam",
+        "drink": "wine"
+    }
+}
diff --git a/name_value/examples/name-value-forms/run b/name_value/examples/name-value-forms/run
new file mode 100755
index 000000000..97531d8cd
--- /dev/null
+++ b/name_value/examples/name-value-forms/run
@@ -0,0 +1,8 @@
+#!/bin/bash
+
+echo "======== example 1: hello world =========================="
+( echo hello; echo world; echo star=sun,antares,betelgeuse ) | name-value-forms --title "hello world"
+
+echo "======== example 2: json ================================="
+cat menu.json | name-value-convert | name-value-forms --title menu | name-value-convert --to json
+
diff --git a/name_value/impl/from_name_value.h b/name_value/impl/from_name_value.h
index 2da37b876..a88b18117 100644
--- a/name_value/impl/from_name_value.h
+++ b/name_value/impl/from_name_value.h
@@ -27,14 +27,16 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author cedric wohlleber
 
-#ifndef COMMA_APPLICATION_FROM_NAME_VALUE_H
-#define COMMA_APPLICATION_FROM_NAME_VALUE_H
+#pragma once
 
 #include <deque>
 #include <map>
+#include <memory>
+#if __cplusplus >= 201703L
+#include <optional>
+#endif // #if __cplusplus >= 201703L
 #include <boost/date_time/posix_time/posix_time.hpp>
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
@@ -59,35 +61,34 @@ class from_name_value
     /// constructor
     /// @param values values to read from
     /// @param full_path_as_name use full path as name
-    from_name_value( const map_type& values, bool full_path_as_name = true ):
-        m_values( values ), m_full_path_as_name(full_path_as_name){};
+    from_name_value( const map_type& values, bool full_path_as_name = true ): _values( values ), _full_path_as_name( full_path_as_name ) {};
+
+    template < typename K, typename T > void apply( const K& name, boost::optional< T >& value ) { _apply_optional< K, T >( name, value ); }
 
-    /// apply
-    template < typename K, typename T > void apply( const K& name, boost::optional< T >& value );
+    #if __cplusplus >= 201703L
+    template < typename K, typename T > void apply( const K& name, std::optional< T >& value ) { _apply_optional< K, T >( name, value ); }
+    #endif // #if __cplusplus >= 201703L
     
-    /// apply
-    template < typename K, typename T > void apply( const K& name, boost::scoped_ptr< T >& value );
+    template < typename K, typename T > void apply( const K& name, boost::scoped_ptr< T >& value ) { _apply_ptr< K, T >( name, value ); }
     
-    /// apply
-    template < typename K, typename T > void apply( const K& name, boost::shared_ptr< T >& value );
+    template < typename K, typename T > void apply( const K& name, boost::shared_ptr< T >& value ) { _apply_ptr< K, T >( name, value ); }
+
+    template < typename K, typename T > void apply( const K& name, std::unique_ptr< T >& value ) { _apply_ptr< K, T >( name, value ); }
         
-    /// apply
     template < typename K, typename T > void apply( const K& name, T& value );
 
-    /// apply to non-leaf elements
     template < typename K, typename T > void apply_next( const K& name, T& value );
 
-    /// apply to leaf elements
     template < typename K, typename T > void apply_final( const K& name, T& value );
 
 private:
-    const map_type& m_values;
-    bool m_full_path_as_name;
-    xpath m_xpath;
-    std::deque< bool > m_empty;
-    static void lexical_cast( bool& v, const std::string& s ) { v = s == "" || boost::lexical_cast< bool >( s ); }
-    static void lexical_cast( boost::posix_time::ptime& v, const std::string& s ) { v = boost::posix_time::from_iso_string( s ); }
-    static void lexical_cast( boost::posix_time::time_duration& v, const std::string& s )
+    const map_type& _values;
+    bool _full_path_as_name;
+    xpath _xpath;
+    std::deque< bool > _empty;
+    static void _lexical_cast( bool& v, const std::string& s ) { v = s == "" || boost::lexical_cast< bool >( s ); }
+    static void _lexical_cast( boost::posix_time::ptime& v, const std::string& s ) { v = boost::posix_time::from_iso_string( s ); }
+    static void _lexical_cast( boost::posix_time::time_duration& v, const std::string& s )
     {
         std::vector< std::string > t = comma::split( s, '.' );
         if( t.size() > 2 ) { COMMA_THROW_STREAM( comma::exception, "expected duration in seconds, got " << s ); }
@@ -98,65 +99,49 @@ class from_name_value
         if( seconds < 0 ) { microseconds = -microseconds; }
         v = boost::posix_time::seconds( seconds ) + boost::posix_time::microseconds( microseconds );
     }
-    template < typename T > static void lexical_cast( T& v, const std::string& s ) { v = boost::lexical_cast< T >( s ); }
+    template < typename T > static void _lexical_cast( T& v, const std::string& s ) { v = boost::lexical_cast< T >( s ); }
+    template < typename K, typename T, template < typename > class Optional > void _apply_optional( const K& name, Optional< T >& value );
+    template < typename K, typename T, template < typename > class Ptr > void _apply_ptr( const K& name, Ptr< T >& value );
 };
 
-template < typename K, typename T >
-inline void from_name_value::apply( const K& name, boost::optional< T >& value )
-{
-    if( value ) { apply( name, *value ); return; }
-    T t;
-    m_empty.push_back( true );
-    apply( name, t );
-    if( !m_empty.back() ) { value = t; }
-    m_empty.pop_back();
-}
-
-template < typename K, typename T >
-inline void from_name_value::apply( const K& name, boost::scoped_ptr< T >& value )
+template < typename K, typename T, template < typename > class Optional > inline void from_name_value::_apply_optional( const K& name, Optional< T >& value )
 {
     if( value ) { apply( name, *value ); return; }
     T t;
-    m_empty.push_back( true );
+    _empty.push_back( true );
     apply( name, t );
-    if( !m_empty.back() ) { value.reset( new T( t ) ); }
-    m_empty.pop_back();
+    if( !_empty.back() ) { value = t; }
+    _empty.pop_back();    
 }
 
-template < typename K, typename T >
-inline void from_name_value::apply( const K& name, boost::shared_ptr< T >& value )
+template < typename K, typename T, template < typename > class Ptr > inline void from_name_value::_apply_ptr( const K& name, Ptr< T >& value )
 {
     if( value ) { apply( name, *value ); return; }
     T t;
-    m_empty.push_back( true );
+    _empty.push_back( true );
     apply( name, t );
-    if( !m_empty.back() ) { value.reset( new T( t ) ); }
-    m_empty.pop_back();
+    if( !_empty.back() ) { value.reset(); value.reset( new T( t ) ); } // todo? emplace? 
+    _empty.pop_back();
 }
 
-template < typename K, typename T >
-inline void from_name_value::apply( const K& name, T& value )
+template < typename K, typename T > inline void from_name_value::apply( const K& name, T& value )
 {
-    m_xpath /= xpath::element( name );
+    _xpath /= xpath::element( name );
     visiting::do_while<    !boost::is_fundamental< T >::value
                         && !boost::is_same< T, boost::posix_time::ptime >::value
                         && !boost::is_same< T, boost::posix_time::time_duration >::value
                         && !boost::is_same< T, std::string >::value >::visit( name, value, *this );
-    m_xpath = m_xpath.head();
+    _xpath = _xpath.head();
 }
 
-template < typename K, typename T >
-inline void from_name_value::apply_next( const K& name, T& value ) { comma::visiting::visit( name, value, *this ); }
+template < typename K, typename T > inline void from_name_value::apply_next( const K& name, T& value ) { comma::visiting::visit( name, value, *this ); }
 
-template < typename K, typename T >
-inline void from_name_value::apply_final( const K& key, T& value )
+template < typename K, typename T > inline void from_name_value::apply_final( const K& key, T& value )
 {
-    map_type::const_iterator iter = m_values.find( m_full_path_as_name ? m_xpath.to_string() : m_xpath.elements.back().to_string() );
-    if( iter == m_values.end() ) { return; }
-    lexical_cast( value, iter->second );
-    for( std::size_t i = 0; i < m_empty.size(); ++i ) { m_empty[i] = false; }
+    map_type::const_iterator iter = _values.find( _full_path_as_name ? _xpath.to_string() : _xpath.elements.back().to_string() );
+    if( iter == _values.end() ) { return; }
+    _lexical_cast( value, iter->second );
+    for( std::size_t i = 0; i < _empty.size(); ++i ) { _empty[i] = false; }
 }
 
 } } } // namespace comma { namespace name_value { namespace impl {
-
-#endif // COMMA_APPLICATION_FROM_NAME_VALUE_H
diff --git a/name_value/impl/json_writer.h b/name_value/impl/json_writer.h
index 619c5cb05..a1a33ae9b 100644
--- a/name_value/impl/json_writer.h
+++ b/name_value/impl/json_writer.h
@@ -1,77 +1,53 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_NAME_VALUE_JSON_WRITER_H_
-#define COMMA_NAME_VALUE_JSON_WRITER_H_
+#pragma once
 
+#include <algorithm>
 #include <iostream>
 #include <sstream>
 #include <string>
-#include <algorithm>
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/lexical_cast.hpp>
+#include <boost/regex.hpp>
 #include "../../base/exception.h"
 
-
 namespace comma { namespace name_value { namespace impl {
 
-// NOTE: assume valid json.
-template< typename C > void json_remove_quotes( std::basic_string< C >& json_text )
+template< typename C > inline void json_remove_quotes( std::basic_string< C >& json_text, bool pretty = true ) // assuming valid json
 {
     using string_type = std::basic_string< C >;
-
-    string_type const true_str( std::initializer_list< C >{ 't', 'r', 'u', 'e' } );
-    string_type const false_str( std::initializer_list< C >{ 'f', 'a', 'l', 's', 'e' } );
-
+    static string_type const true_str( std::initializer_list< C >{ 't', 'r', 'u', 'e' } );
+    static string_type const false_str( std::initializer_list< C >{ 'f', 'a', 'l', 's', 'e' } );
+    static boost::regex number_like_string( "^0[0-9][0-9]*$" );
     auto source = json_text.begin();
     auto target = json_text.cbegin();
-
     while( target != json_text.cend() )
     {
         auto value_begin = std::find( target, json_text.cend(), '"' );
         while( target != value_begin ) { *source++ = *target++; }
         if( json_text.cend() == value_begin ) { break; }
-
         auto value_end = value_begin;
-        do { value_end = std::find( value_end + 1, json_text.cend(), '"' ); } while( '\\' == *( value_end - 1 ) );
+        //do { value_end = std::find( value_end + 1, json_text.cend(), '"' ); } while( '\\' == *( value_end - 1 ) );
+        while( true )
+        {
+            value_end = std::find( value_end + 1, json_text.cend(), '"' );
+            unsigned int backslash_count = 0;
+            for( auto i = value_end - 1; *i == '\\'; ++backslash_count, --i );
+            if( backslash_count % 2 == 0 ) { break; } // hyper quick and dirty fix, sigh
+        }
         auto next_token = std::find_if_not( value_end + 1, json_text.cend(), []( C ch ) { return ' ' == ch || '\t' == ch || '\n' == ch; } );
-
         bool quoted = true;
         if( ':' != *next_token )
         {
-            auto const value = std::string( value_begin + 1, value_end );
+            auto value = std::string( value_begin + 1, value_end );
+            for( char& c: value ) { c = static_cast< char >( std::tolower( static_cast< unsigned char >( c ) ) ); } // quick and dirty, watch performance; go through unsigned char: std::tolower is undefined for negative char values (e.g. utf-8 bytes)
             if( true_str == value || false_str == value ) { quoted = false; }
-            else { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} }
+            else if( value == "nan" || value == "inf" ) { quoted = true; } // lexical cast thinks it's a number
+            else if( !boost::regex_match( value, number_like_string ) ) { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} } // values matching number_like_string (leading zero followed by digits) stay quoted; anything else that parses as double is unquoted; todo? try to avoid lexical_cast+exception to improve performance?
         }
-
         if( !quoted ) { value_begin++; }
         while( value_begin != value_end ) { *source++ = *value_begin++; }
         if( !quoted ) { value_end++; } 
@@ -79,75 +55,25 @@ template< typename C > void json_remove_quotes( std::basic_string< C >& json_tex
         *source++ = *next_token++;
         target = next_token;
     }
-    json_text.erase( source, json_text.cend() );
+    json_text.erase( pretty ? source : ( source - 1 ), json_text.end() );
 }
 
-inline void remove_quotes( std::string& s )
+template< class PTree > void write_json( std::basic_ostream< typename PTree::key_type::value_type > &stream, const PTree &ptree, bool const pretty = true, bool unquote_numbers = true ) // write ptree to stream as json via boost, optionally passing the text through json_remove_quotes(); always flushes
 {
-    unsigned int size = 0;
-    char* end = &s[0] + s.length();
-    char* target = &s[0];
-    std::string value;
-    struct looking_for { enum what { first_quote, second_quote, escaped, colon }; };
-    looking_for::what state = looking_for::first_quote;
-
-    for( char* source = &s[0]; source != end; ++source )
+    std::basic_ostringstream< typename PTree::key_type::value_type > oss;
+    boost::property_tree::write_json( oss, ptree, pretty );
+    if( unquote_numbers )
     {
-        switch( state )
-        {
-            case looking_for::first_quote:
-                if( *source == '"' ) { state = looking_for::second_quote; } else { *target++ = *source; ++size; }
-                break;
-            case looking_for::second_quote:
-                if( *source == '"' ) { state = looking_for::colon; }
-                else { value += *source; if( *source == '\\' ) { state = looking_for::escaped; } }
-                break;
-            case looking_for::escaped:
-                value += *source;
-                state = looking_for::second_quote;
-                break;
-            case looking_for::colon:
-            {
-                bool quoted = true;
-                bool skip = false;
-                switch( *source )
-                {
-                    case ' ': case '\t': case '\n':
-                        skip=true;
-                        // todo
-                        break;
-                    case ':':
-                        break;
-                    default:
-                        try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} // hyper quick and dirty for now
-                        
-                }
-                if( skip ) { break; }
-                if( quoted ) { *target++ = '"'; ++size; }
-                ::memcpy( target, &value[0], value.size() );
-                target += value.size();
-                size += value.size();
-                if( quoted ) { *target++ = '"'; ++size; }
-                *target++ = *source;
-                ++size;
-                value.clear();
-                state = looking_for::first_quote;
-                break;
-            }
-        }
+        auto s = oss.str(); // string of the tree's own character type, which is not necessarily std::string
+        json_remove_quotes( s, pretty );
+        stream << s;
     }
-    s.resize( size );
-}
-
-template<class Ptree> void write_json(std::basic_ostream< typename Ptree::key_type::value_type > &stream, const Ptree &ptree, bool const pretty = true )
-{
-    std::basic_ostringstream< typename Ptree::key_type::value_type > string_stream;
-    boost::property_tree::write_json( string_stream, ptree, pretty );
-    auto json_text = string_stream.str();
-    json_remove_quotes( json_text );
-    stream << json_text << std::flush;
+    else
+    {
+        if( pretty ) { stream << oss.str(); }
+        else { const auto s = oss.str(); stream << s.substr( 0, s.size() - 1 ); } // unfortunately, boost adds trailing end of line, which we don't want in minified mode
+    }
+    stream << std::flush;
 }
  
 } } }
-
-#endif //COMMA_NAME_VALUE_JSON_WRITER_H_
diff --git a/name_value/impl/to_name_value.h b/name_value/impl/to_name_value.h
index d57c6c2e6..de6fa961f 100644
--- a/name_value/impl/to_name_value.h
+++ b/name_value/impl/to_name_value.h
@@ -1,39 +1,15 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2022 Vsevolod Vlaskine
 
+/// @authors cedric wohlleber, vsevolod vlaskine
 
-/// @author cedric wohlleber
-
-#ifndef COMMA_APPLICATION_TO_NAME_VALUE_H
-#define COMMA_APPLICATION_TO_NAME_VALUE_H
+#pragma once
 
 #include <map>
+#include <memory>
+#if __cplusplus >= 201703L
+#include <optional>
+#endif // #if __cplusplus >= 201703L
 #include <boost/lexical_cast.hpp>
 #include <boost/optional.hpp>
 #include <boost/scoped_ptr.hpp>
@@ -53,97 +29,38 @@ class to_name_value
     /// constructor
     /// @param delimiter delimiter between name and value
     /// @param full_path_as_name use full path as name
-    to_name_value( char delimiter = '=', bool full_path_as_name = true ):
-        m_delimiter(delimiter), m_full_path_as_name(full_path_as_name){};
-
-    /// apply
-    template < typename K, typename T > void apply( const K& name, const boost::optional< T >& value );
-    
-    /// apply
-    template < typename K, typename T > void apply( const K& name, const boost::scoped_ptr< T >& value );
-    
-    /// apply
-    template < typename K, typename T > void apply( const K& name, const boost::shared_ptr< T >& value );        
-        
-    /// apply
-    template < typename K, typename T >
-    void apply( const K& name, const T& value );
-
-    /// apply to non-leaf elements
-    template < typename K, typename T >
-    void apply_next( const K& name, const T& value );
-
-    /// apply to leaf elements
-    template < typename K, typename T >
-    void apply_final( const K& name, const T& value );
-
-    /// return named values as strings
-    const std::vector< std::string >& strings() const { return m_strings; }
+    to_name_value( char delimiter = '=', bool full_path_as_name = true ): _delimiter(delimiter), _full_path_as_name( full_path_as_name ) {};
+    template < typename K, typename T > void apply( const K& name, const boost::optional< T >& value ) { if( value ) { apply( name, *value ); } }
+    #if __cplusplus >= 201703L
+    template < typename K, typename T > void apply( const K& name, const std::optional< T >& value ) { if( value ) { apply( name, *value ); } }
+    #endif // #if __cplusplus >= 201703L
+    template < typename K, typename T > void apply( const K& name, const boost::scoped_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
+    template < typename K, typename T > void apply( const K& name, const boost::shared_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
+    template < typename K, typename T > void apply( const K& name, const std::unique_ptr< T >& value ) { if( value ) { apply( name, *value ); } }
+    template < typename K, typename T > void apply( const K& name, const T& value );
+    template < typename K, typename T > void apply_next( const K& name, const T& value ) { comma::visiting::visit( name, value, *this ); }
+    template < typename K, typename T > void apply_final( const K& name, const T& value );
+    const std::vector< std::string >& strings() const { return _strings; }
 
 private:
-    template < typename T >
-        std::string as_string( T v )
-        {
-            std::ostringstream oss;
-            oss << v;
-            return oss.str();
-        }
-        
-    char m_delimiter;
-    bool m_full_path_as_name;
-    std::vector< std::string > m_strings;
-    xpath m_xpath;
-     
-};
+    char _delimiter;
+    bool _full_path_as_name;
+    std::vector< std::string > _strings;
+    xpath _xpath;
 
-template < typename K, typename T >
-inline void to_name_value::apply( const K& name, const boost::optional< T >& value )
-{
-    if( value ) { apply( name, *value ); }
-}
-
-template < typename K, typename T >
-inline void to_name_value::apply( const K& name, const boost::scoped_ptr< T >& value )
-{
-    if( value ) { apply( name, *value ); }
-}
-
-template < typename K, typename T >
-inline void to_name_value::apply( const K& name, const boost::shared_ptr< T >& value )
-{
-    if( value ) { apply( name, *value ); }
-}
+    template < typename T > std::string _as_string( T v ) { std::ostringstream oss; oss << v; return oss.str(); } 
+};
 
 template < typename K, typename T >
 inline void to_name_value::apply( const K& name, const T& value )
 {
-    m_xpath /= xpath::element( name );
+    _xpath /= xpath::element( name ); // extend the current path with this element for the duration of the visit
     visiting::do_while<    !boost::is_fundamental< T >::value
                         && !boost::is_same< T, std::string >::value >::visit( name, value, *this );
-    m_xpath = m_xpath.head();
+    _xpath = _xpath.head(); // restore the path; presumably head() is the path without its last element - TODO confirm
 }
 
-
-
-template < typename K, typename T >
-inline void to_name_value::apply_next( const K& name, const T& value ) { comma::visiting::visit( name, value, *this ); }
-
 template < typename K, typename T >
-inline void to_name_value::apply_final( const K&, const T& value )
-{
-    std::string string;
-    if( m_full_path_as_name )
-    {
-        string += m_xpath.to_string();
-    }
-    else
-    {
-        string += m_xpath.elements.back().to_string();
-    }
-    string += m_delimiter + as_string( value );
-    m_strings.push_back( string );
-}
+inline void to_name_value::apply_final( const K&, const T& value ) { const std::string name = _full_path_as_name ? _xpath.to_string() : _xpath.elements.back().to_string(); _strings.push_back( name + _delimiter + _as_string( value ) ); } // leaf: store "<name><delimiter><value>", name being the full path or only its last element
 
 } } } // namespace comma { namespace name_value { namespace impl {
-
-#endif // COMMA_APPLICATION_TO_NAME_VALUE_H
diff --git a/name_value/impl/yaml.cpp b/name_value/impl/yaml.cpp
new file mode 100644
index 000000000..87a0cb688
--- /dev/null
+++ b/name_value/impl/yaml.cpp
@@ -0,0 +1,149 @@
+// This file is part of comma library
+// Copyright (c) 2025 Vsevolod Vlaskine
+// All rights reserved.
+//
+// Redistribution and use in source and binary forms, with or without
+// modification, are permitted provided that the following conditions are met:
+// 1. Redistributions of source code must retain the above copyright
+//    notice, this list of conditions and the following disclaimer.
+// 2. Redistributions in binary form must reproduce the above copyright
+//    notice, this list of conditions and the following disclaimer in the
+//    documentation and/or other materials provided with the distribution.
+// 3. Neither the name of the University of Sydney nor the
+//    names of its contributors may be used to endorse or promote products
+//    derived from this software without specific prior written permission.
+// 4. Additionally, source code from this repository produced after 2022
+//    must not be used in training or test datasets for training language
+//    models and/or automated code generation
+//
+// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
+// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
+// HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED
+// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
+// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
+// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
+// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
+// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
+// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+#include <yaml.h>
+#include <iostream>
+#include "../../base/exception.h"
+#include "yaml.h"
+
+namespace comma { namespace name_value { namespace impl { namespace yaml {
+
+enum class on { none, scalar, seq, map }; // kind of yaml node parse() is currently filling; none: nothing has been opened yet
+
+const char* event_to_string( yaml_event_type_e e ) // human-readable name of a libyaml event type, for diagnostics
+{
+    switch( e )
+    {
+        case YAML_STREAM_START_EVENT: return "stream start";
+        case YAML_STREAM_END_EVENT: return "stream end";
+        case YAML_DOCUMENT_START_EVENT: return "document start";
+        case YAML_DOCUMENT_END_EVENT: return "document end";
+        case YAML_SEQUENCE_START_EVENT: return "sequence start";
+        case YAML_SEQUENCE_END_EVENT: return "sequence end";
+        case YAML_MAPPING_START_EVENT: return "mapping start";
+        case YAML_MAPPING_END_EVENT: return "mapping end";
+        case YAML_SCALAR_EVENT: return "scalar";
+        case YAML_ALIAS_EVENT: return "alias";
+        case YAML_NO_EVENT: return "no";
+        default: return "unknown"; // value outside the enumeration; never expected
+    }
+}
+
+// Recursively consume libyaml events from parser and fill the property tree t with them.
+// what is the kind of yaml node t is being filled from; is_name tells, inside a mapping, whether the next scalar is a key.
+// Sequence elements, and mappings or sequences nested in a sequence, are stored as children with an empty name.
+// Returns the type of the event that ended this call; throws via COMMA_ASSERT if libyaml fails and comma::exception on a scalar outside of a mapping or sequence.
+static yaml_event_type_e parse( yaml_parser_t *parser, boost::property_tree::ptree& t, on what = on::none, bool is_name = false )
+{
+    while( true )
+    {
+        yaml_event_t event;
+        COMMA_ASSERT( yaml_parser_parse( parser, &event ) == 1, "yaml_parser_parse() failed" );
+        const auto event_type = event.type;
+        // copy the scalar with its explicit length (it may contain '\0') before the event is released
+        const std::string scalar = event_type == YAML_SCALAR_EVENT ? std::string( reinterpret_cast< const char* >( event.data.scalar.value ), event.data.scalar.length ) : std::string();
+        yaml_event_delete( &event );
+        switch( event_type )
+        {
+            case YAML_SCALAR_EVENT:
+                switch( what )
+                {
+                    case on::none:
+                    case on::scalar:
+                        COMMA_THROW( comma::exception, "expected map or sequence, got scalar" );
+                    case on::map:
+                        // a key opens a child that the nested call fills with the key's value; a value ends this call
+                        if( is_name ) { parse( parser, t.add_child( scalar, boost::property_tree::ptree() ), on::map, false ); break; }
+                        t.put_value( scalar );
+                        return YAML_SCALAR_EVENT;
+                    case on::seq:
+                        // sequence element: append an unnamed child holding the scalar
+                        t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second.put_value( scalar );
+                        break;
+                }
+                break;
+            case YAML_SEQUENCE_START_EVENT:
+                // a sequence nested in a sequence gets its own unnamed child, so that the outer sequence carries on after it
+                if( what == on::seq ) { parse( parser, t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second, on::seq ); break; }
+                parse( parser, t, on::seq );
+                return YAML_SEQUENCE_START_EVENT;
+            case YAML_SEQUENCE_END_EVENT:
+                // the sequence being filled is complete: hand control back to the caller
+                return YAML_SEQUENCE_END_EVENT;
+            case YAML_MAPPING_START_EVENT:
+                // a mapping inside a sequence gets its own unnamed child; otherwise it fills t itself
+                if( what == on::seq )
+                {
+                    parse( parser, t.push_back( std::make_pair( "", boost::property_tree::ptree() ) )->second, on::map, true );
+                    break;
+                }
+                parse( parser, t, on::map, true );
+                return YAML_MAPPING_START_EVENT;
+            case YAML_MAPPING_END_EVENT:
+                // the mapping being filled is complete: hand control back to the caller
+                return YAML_MAPPING_END_EVENT;
+            // end of stream or document, or no event at all: report it to the caller
+            case YAML_STREAM_END_EVENT:
+                return YAML_STREAM_END_EVENT;
+            case YAML_DOCUMENT_END_EVENT:
+                return YAML_DOCUMENT_END_EVENT;
+            case YAML_NO_EVENT:
+                return YAML_NO_EVENT;
+            // nothing to store for these events: keep reading
+            case YAML_DOCUMENT_START_EVENT:
+            case YAML_STREAM_START_EVENT:
+            case YAML_ALIAS_EVENT:
+                break; // todo? handle? note: aliases are currently dropped silently
+        }
+    }
+}
+
+// parse yaml text s into property tree t and return t; whatever parse() throws is propagated
+boost::property_tree::ptree& to_ptree( const std::string& s, boost::property_tree::ptree& t )
+{
+    yaml_parser_t parser;
+    COMMA_ASSERT( yaml_parser_initialize( &parser ) == 1, "yaml_parser_initialize() failed" );
+    yaml_parser_set_input_string( &parser, reinterpret_cast< const unsigned char* >( s.data() ), s.size() );
+    try { parse( &parser, t ); }
+    catch( ... ) { yaml_parser_delete( &parser ); throw; } // parse() throws on bad input: release the parser before propagating
+    yaml_parser_delete( &parser );
+    return t;
+}
+
+std::string from_ptree( const boost::property_tree::ptree& )
+{
+    // todo: serialisation to yaml is not implemented yet
+    // the tree is ignored and an empty string is returned
+    return std::string();
+}
+
+} } } } // namespace comma { namespace name_value { namespace impl { namespace yaml {
diff --git a/application/contact_info.h b/name_value/impl/yaml.h
similarity index 71%
rename from application/contact_info.h
rename to name_value/impl/yaml.h
index 23aae6929..1af05093a 100644
--- a/application/contact_info.h
+++ b/name_value/impl/yaml.h
@@ -1,5 +1,5 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
+// This file is part of comma library
+// Copyright (c) 2025 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -12,6 +12,9 @@
 // 3. Neither the name of the University of Sydney nor the
 //    names of its contributors may be used to endorse or promote products
 //    derived from this software without specific prior written permission.
+// 4. Additionally, source code from this repository produced after 2022
+//    must not be used in training or test datasets for training language
+//    models and/or automated code generation
 //
 // NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
 // GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
@@ -27,16 +30,15 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+#pragma once
 
-/// @author vsevolod vlaskine
+#include <string>
+#include <boost/property_tree/ptree.hpp>
 
-#ifndef COMMA_APPLICATION_CONTACT_INFO_H_
-#define COMMA_APPLICATION_CONTACT_INFO_H_
+namespace comma { namespace name_value { namespace impl { namespace yaml {
 
-namespace comma {
+boost::property_tree::ptree& to_ptree( const std::string& s, boost::property_tree::ptree& t );
 
-static const char* contact_info = "more info: https://github.com/acfr/comma#readme";
-    
-} // namespace comma {
-    
-#endif // #ifndef COMMA_APPLICATION_CONTACT_INFO_H_
+std::string from_ptree( const boost::property_tree::ptree& t );
+
+} } } } // namespace comma { namespace name_value { namespace impl { namespace yaml {
diff --git a/name_value/map.cpp b/name_value/map.cpp
new file mode 100644
index 000000000..9c78e0f6c
--- /dev/null
+++ b/name_value/map.cpp
@@ -0,0 +1,96 @@
+// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2022 Vsevolod Vlaskine
+
+/// @authors cedric wohlleber, vsevolod vlaskine
+
+#include "../base/exception.h"
+#include "map.h"
+
+namespace comma { namespace name_value {
+
+map::map( const std::string& line, char delimiter, char value_delimiter, bool unique, const std::string& allowed_names ): _line( line ) { init_( impl::options( delimiter, value_delimiter ), unique, allowed_names ); } // keeps a copy of line and parses it with options built from the two delimiters
+
+map::map( const std::string& line, const std::string& fields, char delimiter, char value_delimiter, bool unique, const std::string& allowed_names ): _line( line ) { init_( impl::options( fields, delimiter, value_delimiter ), unique, allowed_names ); } // same, with fields also passed to impl::options
+map::map( const std::string& line, const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names ): _line( line ) { init_( options, unique, allowed_names ); } // same, with caller-supplied options
+
+static std::vector< std::string > get_named_values( const std::string& line, const comma::name_value::impl::options& options )
+{
+    std::vector< std::string > fields = split_escaped( line, options.m_delimiter, &( options.m_quotes[0] ), options.m_escape ); // delimiter-separated fields of the line
+    for( std::size_t k = 0; k < fields.size() && k < options.m_names.size(); ++k ) // leading fields may take their names from options
+    {
+        const auto& name = options.m_names[k];
+        if( !name.empty() && split( fields[k], options.m_value_delimiter ).size() != 1U ) { COMMA_THROW( comma::exception, "expected unnamed value for " << name << ", got: " << fields[k] ); }
+        if( !name.empty() ) { fields[k] = name + options.m_value_delimiter + fields[k]; } // turn the bare value into "name<value_delimiter>value"
+    }
+    return fields;
+}
+
+void map::init_( const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names ) // fill _map from _line; if unique, reject repeated names; if allowed_names (comma-separated) is not empty, reject any other name
+{
+    std::unordered_set< std::string > allowed;
+    for( const auto& name: comma::split( allowed_names, ',', true ) ) { allowed.insert( name ); }
+    for( const auto& named_value: get_named_values( _line, options ) )
+    {
+        const std::vector< std::string > pair = split_escaped( named_value, options.m_value_delimiter, &( options.m_quotes[0] ), options.m_escape );
+        const bool has_name = !pair.empty(); // guards every pair[0] access below; an empty pair is rejected by the switch
+        if( has_name && !allowed.empty() && allowed.find( pair[0] ) == allowed.end() ) { COMMA_THROW( comma::exception, "name \"" << pair[0] << "\" is not among allowed names: " << allowed_names ); }
+        if( has_name && unique && _map.find( pair[0] ) != _map.end() ) { COMMA_THROW( comma::exception, "expected unique names, got more than one \"" << pair[0] << "\"" ); }
+        switch( pair.size() )
+        {
+            case 1: _map.insert( std::make_pair( pair[0], std::string() ) ); break; // name without a value: store an empty value
+            case 2: _map.insert( std::make_pair( pair[0], pair[1] ) ); break;
+            default: { COMMA_THROW( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
+        }
+    }
+}
+
+std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( delimiter, value_delimiter ) ); }
+
+std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, const std::string& fields, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( fields, delimiter, value_delimiter ) ); }
+
+// split line into named values and return them as (name, value) pairs in input order; a name without a value gets an empty value
+std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, const impl::options& options )
+{
+    std::vector< std::pair< std::string, std::string > > result;
+    for( const auto& named_value: get_named_values( line, options ) )
+    {
+        const std::vector< std::string > pair = split_escaped( named_value, options.m_value_delimiter, &( options.m_quotes[0] ), options.m_escape );
+        switch( pair.size() )
+        {
+            case 1: result.emplace_back( pair[0], std::string() ); break; // quick and dirty
+            case 2: result.emplace_back( pair[0], pair[1] ); break;
+            default: { COMMA_THROW( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); } // COMMA_THROW as in the rest of this file
+        }
+    }
+    return result;
+}
+
+bool map::exists( const std::string& name ) const { return _map.count( name ) > 0; } // true if at least one value is stored under name
+
+void map::assert_mutually_exclusive( const std::string& f ) { const auto names = comma::split( f, ',' ); assert_mutually_exclusive( names ); } // f: comma-separated names
+
+void map::assert_mutually_exclusive( const std::string& f, const std::string& g ) { const auto first = comma::split( f, ',' ); const auto second = comma::split( g, ',' ); assert_mutually_exclusive( first, second ); } // f, g: comma-separated names
+
+void map::assert_mutually_exclusive( const std::vector< std::string >& f ) // throw if more than one of the names in f is present in the map
+{
+    std::string first; // first name of f seen in the map so far; empty while there is none
+    for( const auto& name: f )
+    {
+        if( _map.count( name ) == 0 ) { continue; }
+        if( !first.empty() ) { COMMA_THROW( comma::exception, first << " and " << name << " are mutually exclusive" ); }
+        first = name;
+    }
+}
+
+void map::assert_mutually_exclusive( const std::vector< std::string >& f, const std::vector< std::string >& g ) // throw if a name from f and a name from g are both present in the map
+{
+    std::string first; // first name of f present in the map; stays empty if there is none
+    for( const auto& name: f ) { if( _map.count( name ) > 0 ) { first = name; break; } }
+    if( first.empty() ) { return; }
+    for( const auto& name: g )
+    {
+        if( _map.count( name ) > 0 ) { COMMA_THROW( comma::exception, first << " and " << name << " are mutually exclusive" ); }
+    }
+}
+
+} } // namespace comma { namespace name_value {
diff --git a/name_value/map.h b/name_value/map.h
index 127aa1ae2..1a15e116b 100644
--- a/name_value/map.h
+++ b/name_value/map.h
@@ -1,63 +1,37 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @authors cedric wohlleber, vsevolod vlaskine
 
 #pragma once
 
+#include <unordered_set>
 #include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/date_time/posix_time/time_parsers.hpp>
 #include <boost/optional.hpp>
 #include <boost/lexical_cast.hpp>
+#include "../string/string.h"
 #include "impl/options.h"
 
 namespace comma { namespace name_value {
 
 /// constructs a map of name-value pair from an input string
-/// TODO implement full_path_as_name ? 
+/// TODO implement full_path_as_name ?
 class map
 {
     public:
         /// constructor
-        map( const std::string& line, char delimiter = ';', char value_delimiter = '=' );
+        map( const std::string& line, char delimiter = ';', char value_delimiter = '=', bool unique = false, const std::string& allowed_names = "" );
         /// constructor
-        map( const std::string& line, const std::string& fields, char delimiter = ';', char value_delimiter = '=' );
+        map( const std::string& line, const std::string& fields, char delimiter = ';', char value_delimiter = '=', bool unique = false, const std::string& allowed_names = "" );
         /// constructor
-        map( const std::string& line, const impl::options& options );
-        
+        map( const std::string& line, const impl::options& options, bool unique = false, const std::string& allowed_names = "" );
+
         /// return vector of name-value pairs in the given order
         static std::vector< std::pair< std::string, std::string > > as_vector( const std::string& line, char delimiter = ';', char value_delimiter = '=' );
-        
+
         /// return vector of name-value pairs in the given order
         static std::vector< std::pair< std::string, std::string > > as_vector( const std::string& line, const std::string& fields, char delimiter = ';', char value_delimiter = '=' );
-        
+
         /// return vector of name-value pairs in the given order
         static std::vector< std::pair< std::string, std::string > > as_vector( const std::string& line, const impl::options& options );
 
@@ -75,7 +49,7 @@ class map
         /// return first available value, if field exists; otherwise throw
         template < typename T >
         T value( const std::string& name ) const;
-        
+
         /// return first available value, if field exists; otherwise return empty optional
         template < typename T >
         boost::optional< T > optional( const std::string& name ) const;
@@ -84,85 +58,32 @@ class map
         typedef std::multimap< std::string, std::string > map_type;
 
         /// return name-value map
-        const map_type& get() const { return m_map; }
+        const map_type& get() const { return _map; }
+
+        /// throw exception if incompatible fields are present
+        void assert_mutually_exclusive( const std::string& f );
+        void assert_mutually_exclusive( const std::string& f, const std::string& g );
+        void assert_mutually_exclusive( const std::vector< std::string >& f );
+        void assert_mutually_exclusive( const std::vector< std::string >& f, const std::vector< std::string >& g );
 
     private:
-        void init_( const comma::name_value::impl::options& options );
-        const std::string m_line;
-        map_type m_map;
+        void init_( const comma::name_value::impl::options& options, bool unique, const std::string& allowed_names );
+        const std::string _line;
+        map_type _map;
 };
 
-inline map::map( const std::string& line, char delimiter, char value_delimiter ): m_line( line ) { init_( impl::options( delimiter, value_delimiter ) ); }
-
-inline map::map( const std::string& line, const std::string& fields, char delimiter, char value_delimiter ): m_line( line ) { init_( impl::options( fields, delimiter, value_delimiter ) ); }
-
-inline map::map( const std::string& line, const comma::name_value::impl::options& options ): m_line( line ) { init_( options ); }
-
-inline static std::vector< std::string > get_named_values( const std::string& line, const comma::name_value::impl::options& options )
-{
-    std::vector< std::string > named_values = split_escaped( line, options.m_delimiter, &(options.m_quotes[0]), options.m_escape );
-    for( std::size_t i = 0; i < options.m_names.size() && i < named_values.size(); ++i )
-    {
-        if( options.m_names[i].empty() ) { continue; }
-        if( split( named_values[i], options.m_value_delimiter ).size() != 1U ) { COMMA_THROW_STREAM( comma::exception, "expected unnamed value for " << options.m_names[i] << ", got: " << named_values[i] ); }
-        named_values[i] = options.m_names[i] + options.m_value_delimiter + named_values[i];
-    }
-    return named_values;
-}
-
-inline void map::init_( const comma::name_value::impl::options& options )
-{
-    const std::vector< std::string >& named_values = get_named_values( m_line, options );
-    for( std::size_t i = 0; i < named_values.size(); ++i )
-    {
-        std::vector< std::string > pair = split_escaped( named_values[i], options.m_value_delimiter, &(options.m_quotes[0]), options.m_escape );
-        switch( pair.size() )
-        {
-            case 1: m_map.insert( std::make_pair( pair[0], std::string() ) ); break; // quick and dirty
-            case 2: m_map.insert( std::make_pair( pair[0], pair[1] ) ); break;
-            default: { COMMA_THROW_STREAM( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
-        }
-    }
-}
-
-inline std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( delimiter, value_delimiter ) ); } 
-
-inline std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, const std::string& fields, char delimiter, char value_delimiter ) { return as_vector( line, impl::options( fields, delimiter, value_delimiter ) ); }
-
-inline std::vector< std::pair< std::string, std::string > > map::as_vector( const std::string& line, const impl::options& options )
-{
-    std::vector< std::pair< std::string, std::string > > v;
-    const std::vector< std::string >& named_values = get_named_values( line, options );
-    for( std::size_t i = 0; i < named_values.size(); ++i )
-    {
-        std::vector< std::string > pair = split_escaped( named_values[i], options.m_value_delimiter, &(options.m_quotes[0]), options.m_escape );
-        switch( pair.size() )
-        {
-            case 1: v.push_back( std::make_pair( pair[0], std::string() ) ); break; // quick and dirty
-            case 2: v.push_back( std::make_pair( pair[0], pair[1] ) ); break;
-            default: { COMMA_THROW_STREAM( comma::exception, "expected name-value pair, got: " << join( pair, options.m_value_delimiter ) ); }
-        }
-    }
-    return v;
-}
-
-inline bool map::exists( const std::string& name ) const { return m_map.find( name ) != m_map.end(); }
-
 namespace detail {
 
-template < typename T >
-inline T lexical_cast( const std::string& s ) { return boost::lexical_cast< T >( s ); }
+template < typename T > inline T lexical_cast( const std::string& s ) { return boost::lexical_cast< T >( s ); }
 
-template <>
-inline bool lexical_cast< bool >( const std::string& s )
+template <> inline bool lexical_cast< bool >( const std::string& s )
 {
     if( s == "" || s == "true" ) { return true; }
     if( s == "false" ) { return false; }
     return boost::lexical_cast< bool >( s );
 }
 
-template <>
-inline boost::posix_time::ptime lexical_cast< boost::posix_time::ptime >( const std::string& s )
+template <> inline boost::posix_time::ptime lexical_cast< boost::posix_time::ptime >( const std::string& s )
 {
     if ( s == "not-a-date-time" ) { return boost::posix_time::not_a_date_time; }
     else if ( s == "+infinity" || s == "+inf" || s == "inf" ) { return boost::posix_time::pos_infin; }
@@ -172,34 +93,30 @@ inline boost::posix_time::ptime lexical_cast< boost::posix_time::ptime >( const
 
 } // namespace detail {
 
-template < typename T >
-inline std::vector< T > map::values( const std::string& name ) const
+template < typename T > inline std::vector< T > map::values( const std::string& name ) const
 {
     std::vector< T > v;
-    for( typename map_type::const_iterator it = m_map.begin(); it != m_map.end(); ++it )
+    for( typename map_type::const_iterator it = _map.begin(); it != _map.end(); ++it )
     {
         if( it->first == name ) { v.push_back( detail::lexical_cast< T >( it->second ) ); }
     }
     return v;
 }
 
-template < typename T >
-inline T map::value( const std::string& name, const T& default_value ) const
+template < typename T > inline T map::value( const std::string& name, const T& default_value ) const
 {
     const std::vector< T >& v = values< T >( name );
     return v.empty() ? default_value : v[0];
 }
 
-template < typename T >
-inline T map::value( const std::string& name ) const
+template < typename T > inline T map::value( const std::string& name ) const
 {
     const std::vector< T >& v = values< T >( name );
-    if( v.empty() ) { COMMA_THROW_STREAM( comma::exception, "'" << name << "' not found in \"" << m_line << "\"" ); }
+    if( v.empty() ) { COMMA_THROW_STREAM( comma::exception, "'" << name << "' not found in \"" << _line << "\"" ); }
     return v[0];
 }
 
-template < typename T >
-inline boost::optional< T > map::optional( const std::string& name ) const
+template < typename T > inline boost::optional< T > map::optional( const std::string& name ) const
 {
     const std::vector< T >& v = values< T >( name );
     return v.empty() ? boost::optional< T >() : boost::optional< T >( v[0] );
diff --git a/name_value/parser.cpp b/name_value/parser.cpp
new file mode 100644
index 000000000..da6138e3a
--- /dev/null
+++ b/name_value/parser.cpp
@@ -0,0 +1,18 @@
+// Copyright (c) 2011 The University of Sydney
+
+#include "parser.h"
+
+namespace comma { namespace name_value {
+
+std::string parser::mangled( const std::string& line, const std::string& prefix, char delimiter )
+{
+    const auto& s = comma::split( line, delimiter, true );
+    if( s.empty() ) { return line; }
+    std::string p = prefix.empty() ? s[0] : prefix;
+    std::string r;
+    std::string d;
+    for( unsigned int i = prefix.empty() ? 1 : 0; i < s.size(); ++i ) { r += d + p + '/' + s[i]; d = delimiter; }
+    return r;
+}
+
+} } // namespace comma { namespace name_value {
diff --git a/name_value/parser.h b/name_value/parser.h
index 4143ff2f0..23f112c28 100644
--- a/name_value/parser.h
+++ b/name_value/parser.h
@@ -1,51 +1,16 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author cedric wohlleber
 
-#ifndef COMMA_APPLICATION_NAME_VALUE_PARSER_H
-#define COMMA_APPLICATION_NAME_VALUE_PARSER_H
-
-#include <map>
+#pragma once
 
-#include "../base/exception.h"
 #include "../visiting/apply.h"
 #include "../name_value/map.h"
 #include "../name_value/impl/options.h"
 #include "../name_value/impl/from_name_value.h"
 #include "../name_value/impl/to_name_value.h"
 
-namespace comma
-{
-namespace name_value
-{
+namespace comma { namespace name_value {
     
 /// parser for semicolon-separated name-value string
 class parser
@@ -77,26 +42,33 @@ class parser
     template < typename S >
     void put( std::string& line, const S& s ) const;
 
+    /// mangle string as in following examples
+    ///     - prefix: "abc"; line: "x=1;y/z=2"; mangled: "abc/x=1;abc/y/z=2"
+    ///     - self-mangled (prefix: ""); line: "my-operation;x=1;y/z=2"; mangled: "my-operation/x=1;my-operation/y/z=2"
+    /// usage example
+    ///     struct naming { static std::array< std::string, 2 > names() { return { "some-operation", "another-operation" }; } };
+    ///     struct some_operation { int a; float b; };
+    ///     struct another_operation { double c; std::string d; };
+    ///     typedef comma::named_variant< naming, some_operation, another_operation > operation_t;
+    ///     operation_t operation = parser().get< operation_t >( parser::mangled( operation_options ) );
+    ///     if( operation.is< some_operation >() ) { /* handle */ }
+    ///     else if( operation.is< another_operation >() ) { /* handle */ }
+    ///     etc
+    static std::string mangled( const std::string& line, const std::string& prefix = "", char delimiter = ';' );
+
 private:
-    impl::options m_options;
+    impl::options _options;
 };
 
+inline parser::parser( char delimiter, char value_delimiter, bool full_path_as_name ): _options( delimiter, value_delimiter, full_path_as_name ) {}
 
-inline parser::parser( char delimiter, char value_delimiter, bool full_path_as_name ):
-    m_options( delimiter, value_delimiter, full_path_as_name )
-{
-}
-
-inline parser::parser( const std::string& fields, char delimiter, char value_delimiter, bool full_path_as_name ):
-    m_options( fields, delimiter, value_delimiter, full_path_as_name )
-{
-}
+inline parser::parser( const std::string& fields, char delimiter, char value_delimiter, bool full_path_as_name ): _options( fields, delimiter, value_delimiter, full_path_as_name ) {}
 
 template < typename S >
 inline S parser::get( const std::string& line, const S& default_s ) const
 {
-    map::map_type m = map( line, m_options ).get();
-    name_value::impl::from_name_value from_name_value( m, m_options.m_full_path_as_name );
+    map::map_type m = map( line, _options ).get();
+    name_value::impl::from_name_value from_name_value( m, _options.m_full_path_as_name );
     S s = default_s;
     visiting::apply( from_name_value ).to( s );
     return s;
@@ -105,11 +77,9 @@ inline S parser::get( const std::string& line, const S& default_s ) const
 template < typename S >
 inline std::string parser::put( const S& s ) const
 {
-    name_value::impl::to_name_value toname_value( m_options.m_value_delimiter, m_options.m_full_path_as_name );
+    name_value::impl::to_name_value toname_value( _options.m_value_delimiter, _options.m_full_path_as_name );
     visiting::apply( toname_value ).to( s );
-    return join( toname_value.strings(), m_options.m_delimiter );
+    return join( toname_value.strings(), _options.m_delimiter );
 }
 
-} }
-
-#endif // COMMA_APPLICATION_NAME_VALUE_PARSER_H
+} } // namespace comma { namespace name_value {
diff --git a/name_value/ptree.cpp b/name_value/ptree.cpp
index d7184952f..fb678791f 100644
--- a/name_value/ptree.cpp
+++ b/name_value/ptree.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author cedric wohlleber
 /// @author vsevolod vlaskine
@@ -40,6 +12,7 @@
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
+#include <boost/regex.hpp>
 #include <boost/unordered_set.hpp>
 #include "../base/exception.h"
 #include "../base/types.h"
@@ -47,11 +20,11 @@
 #include "../xpath/xpath.h"
 #include "../visiting/visit.h"
 #include "../visiting/while.h"
-
+#include "impl/yaml.h"
 #include "ptree.h"
 
 namespace comma {
-    
+
 void property_tree::put( boost::property_tree::ptree& ptree, const xpath& path, const std::string& value, bool use_index )
 {
     boost::property_tree::ptree* t = &ptree;
@@ -133,32 +106,43 @@ boost::optional< std::string > property_tree::get( const boost::property_tree::p
     if( !t ) { return boost::none; }
     return t->get_value_optional< std::string >();
 }
-    
+
 } // namespace comma {
 
 namespace comma { namespace impl {
 
-static void ptree_output_value_( std::ostream& os, const std::string& value, bool is_begin, const xpath& path, char equal_sign, char delimiter, const std::string& root, bool const unquote_numbers )
+static void ptree_output_value_( std::ostream& os, const std::string& value, bool is_begin, const xpath& path, char equal_sign, char delimiter, const std::string& root, bool unquote_numbers )
 {
+    static boost::regex number_like_string( "^0[0-9][0-9]*$" );
     if( !is_begin ) { os << delimiter; }
     if( root != "" ) { os << root << "/"; }
     os << path.to_string() << equal_sign;
-
     bool quoted = true;
     if( unquote_numbers )
-    { 
+    {
         if( "true" == value || "false" == value ) { quoted = false; }
-        else { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} }
+        else if( !boost::regex_match( value, number_like_string ) ) { try { boost::lexical_cast< double >( value ); quoted = false; } catch ( ... ) {} }
     }
     if( quoted ) { os << '"' << value << '"'; } else { os << value; }
 }
 
-static void ptree_to_path_value_string_impl( std::ostream& os, boost::property_tree::ptree::const_iterator i, bool is_begin, xpath& path, xpath& display_path, 
-                                                    property_tree::path_mode mode, char equal_sign, char delimiter, const std::string& root, bool const unquote_numbers )
+static void ptree_to_path_value_string_impl( std::ostream* os
+                                           , std::vector< std::pair< xpath, std::string > >& pv // todo! refactor! super-quick and dirty for now
+                                           , boost::property_tree::ptree::const_iterator i
+                                           , bool is_begin
+                                           , xpath& path
+                                           , xpath& display_path
+                                           , property_tree::path_mode mode
+                                           , char equal_sign
+                                           , char delimiter
+                                           , const std::string& root
+                                           , bool const unquote_numbers
+                                           , const std::string& prefix )
 {
     if( i->second.begin() == i->second.end() )
     {
-        ptree_output_value_( os, i->second.get_value< std::string >(), is_begin, display_path / i->first, equal_sign, delimiter, root, unquote_numbers );
+        if( os ) { ptree_output_value_( *os, i->second.get_value< std::string >(), is_begin, display_path / i->first, equal_sign, delimiter, root, unquote_numbers ); }
+        else { pv.push_back( std::make_pair( display_path / i->first, i->second.get_value< std::string >() ) ); }
     }
     else
     {
@@ -168,16 +152,19 @@ static void ptree_to_path_value_string_impl( std::ostream& os, boost::property_t
         if( v ) // quick and dirty
         {
             const std::string& stripped = comma::strip( *v );
-            if( !stripped.empty() )  { ptree_output_value_( os, stripped, is_begin, display_path, equal_sign, delimiter, root, unquote_numbers );  }
+            if( !stripped.empty() )
+            { 
+                if( os ) { ptree_output_value_( *os, stripped, is_begin, display_path, equal_sign, delimiter, root, unquote_numbers ); }
+                else { pv.push_back( std::make_pair( display_path, stripped ) ); }
+            }
         }
-        
         comma::uint32 index=0;
         for( boost::property_tree::ptree::const_iterator j = i->second.begin(); j != i->second.end(); ++j )
         {
             // Test if it is json array data, if so all keys are empty. If so display indices in path if requested
             if( mode == property_tree::without_brackets && j->first.empty()  ) { display_path /= boost::lexical_cast< std::string >( index++ ); }
             else if( mode == property_tree::with_brackets && j->first.empty() ) { display_path.elements.back().index = index++; }
-            ptree_to_path_value_string_impl( os, j, is_begin, path, display_path, mode, equal_sign, delimiter, root, unquote_numbers );
+            ptree_to_path_value_string_impl( os, pv, j, is_begin, path, display_path, mode, equal_sign, delimiter, root, unquote_numbers, prefix );
             if( mode == property_tree::without_brackets && j->first.empty() ) { display_path = display_path.head(); }
             is_begin = false;
         }
@@ -190,19 +177,37 @@ static void ptree_to_path_value_string_impl( std::ostream& os, boost::property_t
 
 namespace comma {
 
-void property_tree::to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode mode, char equal_sign, char delimiter, const xpath& root, bool const unquote_numbers )
+void property_tree::to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode mode, char equal_sign, char delimiter, const xpath& root, bool unquote_numbers, const std::string& prefix )
+{
+    std::vector< std::pair< xpath, std::string > > dummy; // quick and dirty
+    for( boost::property_tree::ptree::const_iterator i = ptree.begin(); i != ptree.end(); ++i )
+    {
+        // display_path is the modified key path showing array indices, if array exists within e.g abc[0]/xyz[0]
+        // But the actual path to the value is many empty keys under abc and abc/xyz
+        // Boost: "JSON arrays are mapped to nodes. Each element is a child node with an empty name.
+        //         If a node has both named and unnamed child nodes, it cannot be mapped to a JSON representation."
+        // http://www.boost.org/doc/libs/1_41_0/doc/html/boost_propertytree/parsers.html#boost_propertytree.parsers.json_parser
+        xpath path;
+        xpath display_path( prefix );
+        impl::ptree_to_path_value_string_impl( &os, dummy, i, i == ptree.begin(), path, display_path, mode, equal_sign, delimiter, root.to_string(), unquote_numbers, prefix ); // quick and dirty
+    }
+}
+
+std::vector< std::pair< xpath, std::string > > property_tree::to_path_value( const boost::property_tree::ptree& ptree, const xpath& root, path_mode mode, const std::string& prefix )
 {
+    std::vector< std::pair< xpath, std::string > > pv; // quick and dirty
     for( boost::property_tree::ptree::const_iterator i = ptree.begin(); i != ptree.end(); ++i )
     {
         // display_path is the modified key path showing array indices, if array exists within e.g abc[0]/xyz[0]
         // But the actual path to the value is many empty keys under abc and abc/xyz
-        // Boost: "JSON arrays are mapped to nodes. Each element is a child node with an empty name. 
+        // Boost: "JSON arrays are mapped to nodes. Each element is a child node with an empty name.
         //         If a node has both named and unnamed child nodes, it cannot be mapped to a JSON representation."
         // http://www.boost.org/doc/libs/1_41_0/doc/html/boost_propertytree/parsers.html#boost_propertytree.parsers.json_parser
         xpath path;
-        xpath display_path;
-        impl::ptree_to_path_value_string_impl( os, i, i == ptree.begin(), path, display_path, mode, equal_sign, delimiter, root.to_string(), unquote_numbers ); // quick and dirty
+        xpath display_path( prefix );
+        impl::ptree_to_path_value_string_impl( nullptr, pv, i, i == ptree.begin(), path, display_path, mode, '=', ',', root.to_string(), true, prefix ); // quick and dirty
     }
+    return pv;
 }
 
 void property_tree::from_path_value( std::istream& is, boost::property_tree::ptree& ptree, property_tree::path_value::check_repeated_paths check_type, char equal_sign, char delimiter, bool use_index )
@@ -219,10 +224,10 @@ void property_tree::from_path_value( std::istream& is, boost::property_tree::ptr
     ptree = comma::property_tree::from_path_value_string( s, equal_sign, delimiter, check_type, use_index );
 }
 
-std::string property_tree::to_path_value_string( const boost::property_tree::ptree& ptree, property_tree::path_mode mode, char equal_sign, char delimiter, bool const unquote_numbers )
+std::string property_tree::to_path_value_string( const boost::property_tree::ptree& ptree, property_tree::path_mode mode, char equal_sign, char delimiter, bool unquote_numbers, const std::string& prefix )
 {
     std::ostringstream oss;
-    to_path_value( oss, ptree, mode, equal_sign, delimiter, xpath(), unquote_numbers );
+    to_path_value( oss, ptree, mode, equal_sign, delimiter, xpath(), unquote_numbers, prefix );
     return oss.str();
 }
 
@@ -242,7 +247,7 @@ template <> struct path_filter< property_tree::path_value::no_overwrite >
     bool put_allowed( const std::string& p, bool use_index ) const
     {
         if( use_index )
-        { 
+        {
             if( property_tree::get( ptree_, p, use_index ) ) { COMMA_THROW( comma::exception, "input path '" << p << "' already in the tree" ); }
         }
         else
@@ -329,11 +334,11 @@ bool is_seekable( std::istream& stream ) { return static_cast< bool >( stream.se
 
 void property_tree::from_unknown( std::istream& stream, boost::property_tree::ptree& ptree, property_tree::path_value::check_repeated_paths check_type, char equal_sign, char delimiter, bool use_index )
 {
-    if( is_seekable( stream ) ) 
+    if( is_seekable( stream ) )
     {
-        from_unknown_seekable( stream, ptree, check_type, equal_sign, delimiter, use_index ); 
+        from_unknown_seekable( stream, ptree, check_type, equal_sign, delimiter, use_index );
     }
-    else 
+    else
     {
         std::stringstream buffer;
         buffer << stream.rdbuf();
@@ -397,7 +402,7 @@ static boost::property_tree::ptree xml_to_ptree_( boost::property_tree::ptree& p
 
 void property_tree::read_xml( std::istream& is, boost::property_tree::ptree& ptree )
 {
-        boost::property_tree::read_xml( is, ptree ); 
+        boost::property_tree::read_xml( is, ptree );
         ptree=xml_to_ptree_(ptree);
 }
 
@@ -417,7 +422,7 @@ void property_tree::from_unknown_seekable( std::istream& stream, boost::property
         return;
     }
     catch( const boost::property_tree::ptree_error&  ex ) {}
-    catch(...) { throw; }
+    catch( ... ) { throw; }
     try
     {
         stream.clear();
@@ -426,7 +431,7 @@ void property_tree::from_unknown_seekable( std::istream& stream, boost::property
         return;
     }
     catch( const boost::property_tree::ptree_error&  ex ) {}
-    catch(...) { throw; }
+    catch( ... ) { throw; }
     try
     {
         stream.clear();
@@ -435,10 +440,60 @@ void property_tree::from_unknown_seekable( std::istream& stream, boost::property
         return;
     }
     catch( const boost::property_tree::ptree_error&  ex ) {}
-    catch( const comma::exception&  ex ) {}
-    catch(...) { throw; }
+    catch( const comma::exception& ex ) {}
+    catch( ... ) { throw; }
+    try
+    {
+        stream.clear();
+        stream.seekg( 0, std::ios::beg );
+        comma::property_tree::read_yaml( stream, ptree );
+        return;
+    }
+    catch( const boost::property_tree::ptree_error&  ex ) {}
+    catch( const comma::exception& ex ) {}
+    catch( ... ) { throw; }
     // TODO: add try for ini format (currently the problem is that path-value treats ini sections and comments as valid entries; possible solution: make path-value parser stricter)
     COMMA_THROW( comma::exception, "failed to guess format" );
 }
 
+void property_tree::write_yaml( std::ostream& os, const boost::property_tree::ptree& t ) { os << to_yaml( t ) << std::endl; }
+
+std::string property_tree::to_yaml( const boost::property_tree::ptree& t ) // todo: not implemented; always throws, the message gives a python one-liner as a workaround
+{
+    COMMA_THROW( comma::exception, R"(conversion to yaml: todo; in the meantime, do it in python:
+
+cat your.json | python3 -c 'import json, yaml, sys; yaml.dump( json.load( sys.stdin ), sys.stdout )'
+)" );
+}
+
+boost::property_tree::ptree property_tree::from_yaml( const std::string& s )
+{
+    boost::property_tree::ptree t;
+    from_yaml( s, t );
+    return t;
+}
+
+void property_tree::read_yaml( std::istream& is, boost::property_tree::ptree& t )
+{
+    std::ostringstream oss;
+    while( is.good() && !is.eof() ) // quick and dirty, watch performance
+    {
+        std::string line;
+        std::getline( is, line );
+        if( line.empty() ) { continue; }
+        oss << line << std::endl;
+    }
+    from_yaml( oss.str(), t );
+}
+
+#if defined comma_BUILD_NAME_VALUE_YAML
+
+boost::property_tree::ptree& property_tree::from_yaml( const std::string& s, boost::property_tree::ptree& t ) { return comma::name_value::impl::yaml::to_ptree( s, t ); }
+
+#else // #if defined comma_BUILD_NAME_VALUE_YAML
+
+boost::property_tree::ptree& property_tree::from_yaml( const std::string&, boost::property_tree::ptree& ) { COMMA_THROW( comma::exception, "built without yaml support; run cmake with comma_BUILD_NAME_VALUE_YAML defined and rebuild" ); }
+
+#endif // #if defined comma_BUILD_NAME_VALUE_YAML
+
 } // namespace comma {
diff --git a/name_value/ptree.h b/name_value/ptree.h
index aacb5a83e..7ab9d69b8 100644
--- a/name_value/ptree.h
+++ b/name_value/ptree.h
@@ -1,54 +1,32 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-
-/// @author cedric wohlleber
-/// @author vsevolod vlaskine
-
-#ifndef COMMA_NAME_VALUE_PTREE_H_
-#define COMMA_NAME_VALUE_PTREE_H_
+// Copyright (c) 2022 Vsevolod Vlaskine
 
+/// @authors cedric wohlleber, vsevolod vlaskine
+
+#pragma once
+
+#include <array>
 #include <iostream>
+#if __cplusplus >= 201703L
+#include <optional>
+#endif
 #include <sstream>
-#include <boost/version.hpp>
-#include <boost/lexical_cast.hpp>
+#include <boost/array.hpp>
 #include <boost/date_time/posix_time/posix_time.hpp>
+#include <boost/lexical_cast.hpp>
 #include <boost/property_tree/ptree.hpp>
 #include <boost/property_tree/info_parser.hpp>
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
+#include <boost/type_traits.hpp>
 #include <boost/unordered_set.hpp>
+#include <boost/version.hpp>
 #include "../base/exception.h"
 #include "../base/types.h"
 #include "../string/string.h"
 #include "../xpath/xpath.h"
+#include "../visiting/apply.h"
 #include "../visiting/visit.h"
 #include "../visiting/while.h"
 
@@ -67,16 +45,24 @@ struct property_tree // quick and dirty
     enum path_mode { disabled, with_brackets, without_brackets  };
 
     /// write as path-value to output stream
-    static void to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode indices_mode = disabled, char equal_sign = '=', char delimiter = ',', const xpath& root = xpath(), bool const unquote_numbers = false );
+    static void to_path_value( std::ostream& os, const boost::property_tree::ptree& ptree, path_mode indices_mode = disabled, char equal_sign = '=', char delimiter = ',', const xpath& root = xpath(), bool unquote_numbers = false, const std::string& prefix = "" );
+
+    /// return path-value pairs
+    static std::vector< std::pair< xpath, std::string > > to_path_value( const boost::property_tree::ptree& ptree, const xpath& root = xpath(), path_mode indices_mode = with_brackets, const std::string& prefix = "" );
 
     /// convert boost parameter tree into path=value-style string (equal sign and delimiter have to be escaped)
-    static std::string to_path_value_string( const boost::property_tree::ptree& ptree, path_mode mode=disabled, char equal_sign = '=', char delimiter = ',', bool const unquote_numbers = false );
+    static std::string to_path_value_string( const boost::property_tree::ptree& ptree, path_mode mode=disabled, char equal_sign = '=', char delimiter = ',', bool unquote_numbers = false, const std::string& prefix = "" );
     
     /// put an xpath like a/b[5]/c/d[3]=4 into ptree
     static void put( boost::property_tree::ptree& ptree, const xpath& path, const std::string& value, bool use_index = true );
     
     /// get value as string from an xpath like a/b[5]/c/d[3]=4 on ptree
     static boost::optional< std::string > get( const boost::property_tree::ptree& ptree, const xpath& path, bool use_index = true );
+
+    /// return value of a given type
+    /// todo! support non-class types and time
+    template < typename T >
+    static boost::optional< T > as( const boost::property_tree::ptree& ptree, const xpath& path, bool use_index = true, bool permissive = true );
     
     /// get subtree
     static boost::optional< boost::property_tree::ptree& > get_tree( boost::property_tree::ptree& ptree, const xpath& path, bool use_index = true );
@@ -103,9 +89,11 @@ struct property_tree // quick and dirty
 
     /// convert path-value-style string into boost parameter tree
     static boost::property_tree::ptree from_path_value_string( const std::string& s, char equal_sign = '=', char delimiter = ',', path_value::check_repeated_paths check_type = path_value::no_check, bool use_index = true );
+
     static boost::property_tree::ptree& from_path_value_string( boost::property_tree::ptree& ptree, const std::string& s, char equal_sign, char delimiter, path_value::check_repeated_paths check_type = path_value::no_check, bool use_index = true );
 
     static void read_xml( std::istream& is, boost::property_tree::ptree& ptree );
+
     static void write_xml( std::ostream& os, const boost::property_tree::ptree& ptree, const xml_writer_settings_t& xml_writer_settings  = xml_writer_settings_t()  );
     
     /// read as path-value from input stream
@@ -114,6 +102,16 @@ struct property_tree // quick and dirty
     /// guess format and read boost property tree from stream (a wrapper for from_unknown_seekable that buffers input from a non-seekable stream)
     static void from_unknown( std::istream& stream, boost::property_tree::ptree& ptree, path_value::check_repeated_paths check_type = path_value::no_check, char equal_sign = '=', char delimiter = ',', bool use_index = true );
 
+    static boost::property_tree::ptree from_yaml( const std::string& s );
+
+    static boost::property_tree::ptree& from_yaml( const std::string& s, boost::property_tree::ptree& t );
+
+    static void read_yaml( std::istream& is, boost::property_tree::ptree& t );
+
+    static std::string to_yaml( const boost::property_tree::ptree& t );
+
+    static void write_yaml( std::ostream& os, const boost::property_tree::ptree& t );
+
     /// guess format and read boost property tree from a seekable stream (pipe or terminal input is not accepted)
     static void from_unknown_seekable( std::istream& stream, boost::property_tree::ptree& ptree, path_value::check_repeated_paths check_type = path_value::no_check, char equal_sign = '=', char delimiter = ',', bool use_index = false  );
 
@@ -125,78 +123,44 @@ struct property_tree // quick and dirty
             /// @param ptree: property tree for the structure to fill
             /// @param root: path to the root of the subtree to visit
             /// @param branch: path to the subtree to visit (i.e. other branches will be pruned)
-            from( const boost::property_tree::ptree& ptree )
-                : ptree_( ptree )
-                , cur_( ptree )
-                , permissive_( false )
-            {
-            }
-            from( const boost::property_tree::ptree& ptree, bool permissive )
-                : ptree_( ptree )
-                , cur_( ptree )
-                , permissive_( permissive )
-            {
-            }
-            from( const boost::property_tree::ptree& ptree, const char* root, bool permissive = false )
-                : ptree_( ptree )
-                , cur_( get_tree( ptree_, xpath( root ) ) )
-                , permissive_( permissive )
-            {
-            }
-            from( const boost::property_tree::ptree& ptree, const xpath& root, bool permissive = false )
-                : ptree_( ptree )
-                , cur_( get_tree( ptree_, root ) )
-                , permissive_( permissive )
-            {
-            }
+            from( const boost::property_tree::ptree& ptree ): ptree_( ptree ), cur_( ptree ), permissive_( false ) {}
+
+            from( const boost::property_tree::ptree& ptree, bool permissive ): ptree_( ptree ), cur_( ptree ), permissive_( permissive ) {}
+
+            from( const boost::property_tree::ptree& ptree, const char* root, bool permissive = false ): ptree_( ptree ), cur_( get_tree( ptree_, xpath( root ) ) ), permissive_( permissive ) {}
+
+            from( const boost::property_tree::ptree& ptree, const xpath& root, bool permissive = false ): ptree_( ptree ), cur_( get_tree( ptree_, root ) ), permissive_( permissive ) {}
 
             //ptree_visitor( const boost::property_tree::ptree& ptree, const xpath& root, const xpath& branch, bool permissive = false ) : ptree_( ptree ), cur_( &ptree ), path_( root ), branch_( branch ), permissive_( permissive ) {}
 
-            /// apply
-            template < typename K, typename T >
-            void apply( const K& key, T& value )
+            template < typename K, typename T > void apply( const K& key, T& value )
             {
                 visiting::do_while<    !boost::is_fundamental< T >::value
                                     && !boost::is_same< T, boost::posix_time::ptime >::value
                                     && !boost::is_same< T, std::string >::value >::visit( key, value, *this );
             }
 
-            /// apply on boost optional
-            template < typename K, typename T >
-            void apply_next( const K& name, boost::optional< T >& value )
+            template < typename K, typename T > void apply_next( const K& name, boost::optional< T >& value )
             {
                 if( !cur_ || cur_->find( name ) == cur_->not_found() ) { return; }
                 if( !value ) { value = T(); }
                 apply( name, *value );
             }
 
-            /// apply to vector
-            template < typename K, typename T, typename A >
-            void apply_next( const K& key, std::vector< T, A >& value )
+            #if __cplusplus >= 201703L
+            template < typename K, typename T > void apply_next( const K& name, std::optional< T >& value )
             {
-                std::string name = boost::lexical_cast< std::string >( key );
-                boost::optional< const boost::property_tree::ptree& > t = cur_ && !name.empty() ? cur_->get_child_optional( name ) : cur_;
-                if( t )
-                {
-                    const boost::property_tree::ptree& parent = *cur_;
-                    value.resize( t->size() );
-                    std::size_t i = 0;
-                    for( boost::property_tree::ptree::const_assoc_iterator j = t->ordered_begin(); j != t->not_found(); ++j, ++i )
-                    {
-                        cur_ = j->second;
-                        //std::size_t index = j->first == "" ? i : boost::lexical_cast< std::size_t >( j->first ); // way quick and dirty
-                        //if( index >= t->size() ) { COMMA_THROW( comma::exception, "expected index less than " << t->size() << "; got: " << index ); }
-                        visiting::do_while<    !boost::is_fundamental< T >::value
-                                            && !boost::is_same< T, boost::posix_time::ptime >::value
-                                            && !boost::is_same< T, std::string >::value >::visit( "", value[i], *this );
-                    }
-                    cur_ = parent;
-                }
-                else if( !permissive_ )
-                {
-                    COMMA_THROW( comma::exception, "key " << key << " not found" );
-                }
+                if( !cur_ || cur_->find( name ) == cur_->not_found() ) { return; }
+                if( !value ) { value = T(); }
+                apply( name, *value );
             }
+            #endif
+
+            template < typename K, typename T, typename A > void apply_next( const K& key, std::vector< T, A >& value ) { _apply_to_arraylike( key, value ); } // vector: forwarded to the shared array-like reader
+
+            template < typename K, typename T, std::size_t Size > void apply_next( const K& key, boost::array< T, Size >& value ) { _apply_to_arraylike( key, value ); } // boost::array: same reader as vector
+
+            template < typename K, typename T, std::size_t Size > void apply_next( const K& key, std::array< T, Size >& value ) { _apply_to_arraylike( key, value ); } // std::array: same reader as vector
 
             /// apply to map
             template < typename K, typename L, typename T, typename A >
@@ -252,6 +216,7 @@ struct property_tree // quick and dirty
             const boost::property_tree::ptree& ptree_;
             boost::optional< const boost::property_tree::ptree& > cur_;
             const bool permissive_;
+
             void value_( const std::string& name, boost::optional< boost::posix_time::ptime >& v ) // quick and dirty, imlement traits instead
             {
                 if( !cur_ ) { return; }
@@ -259,12 +224,49 @@ struct property_tree // quick and dirty
                 if( !s ) { s = cur_->get_optional< std::string >( "<xmlattr>." + name ); }
                 if( s ) { v = boost::posix_time::from_iso_string( *s ); }
             }
+
             template < typename T > void value_( const std::string& name, boost::optional< T >& v )
             {
                 if( !cur_ ) { return; }
                 v = name.empty() ? cur_->get_value_optional< T >() : cur_->get_optional< T >( name );
                 if( !v ) { v = cur_->get_optional< T >( "<xmlattr>." + name ); }
             }
+
+            template < typename T, typename A > void resize_( std::vector< T, A >& a, unsigned int size ) { a.resize( size ); } // vectors are resized to the requested size
+
+            template < typename A > void resize_( A& a, unsigned int size ) {} // any other container type: deliberately a no-op, size is left as is
+
+            /// fill an array-like container (std::vector, boost::array, std::array) from the children of the subtree at key
+            /// the container is passed through resize_() with the number of children before its elements are visited
+            /// @throws comma::exception if key is not found (unless permissive) or if a child index does not fit the container
+            template < typename K, typename A > void _apply_to_arraylike( const K& key, A& value )
+            {
+                std::string name = boost::lexical_cast< std::string >( key );
+                boost::optional< const boost::property_tree::ptree& > t = cur_ && !name.empty() ? cur_->get_child_optional( name ) : cur_;
+                if( t )
+                {
+                    const boost::property_tree::ptree& parent = *cur_;
+                    resize_( value, t->size() );
+                    std::size_t i = 0;
+                    for( boost::property_tree::ptree::const_assoc_iterator j = t->ordered_begin(); j != t->not_found(); ++j, ++i )
+                    {
+                        cur_ = j->second;
+                        std::size_t index = i; // default: iteration position; a numeric child key, if present, overrides it
+                        if( j->first != "" )
+                        {
+                            try { index = boost::lexical_cast< std::size_t >( j->first ); }
+                            catch( ... ) { index = i; }
+                        }
+                        // value[index] is unchecked: reject an index outside of the container instead of writing out of bounds
+                        if( index >= value.size() ) { cur_ = parent; COMMA_THROW( comma::exception, "expected index less than " << value.size() << "; got: " << index ); }
+                        visiting::do_while<    !boost::is_fundamental< typename A::value_type >::value
+                                            && !boost::is_same< typename A::value_type, boost::posix_time::ptime >::value
+                                            && !boost::is_same< typename A::value_type, std::string >::value >::visit( "", value[index], *this );
+                    }
+                    cur_ = parent;
+                }
+                else if( !permissive_ ) { COMMA_THROW( comma::exception, "key " << key << " not found" ); }
+            }
     };
 };
 
@@ -280,24 +282,27 @@ class to_ptree
         /// @param branch: path to the subtree to visit (i.e. other branches will be pruned)
         to_ptree( boost::property_tree::ptree& ptree, const xpath& root = xpath(), const xpath& branch = xpath() ) : ptree_( ptree ), path_( root ), branch_( branch ) {}
 
-        /// constructor
         to_ptree( boost::property_tree::ptree& ptree, const char* root ) : ptree_( ptree ), path_( root ) {}
 
-        /// apply_next on boost optional
-        template < typename K, typename T >
-        void apply_next( const K& name, const boost::optional< T >& value )
+        template < typename K, typename T > void apply_next( const K& name, const boost::optional< T >& value )
         {
-            if( value )
-            {
-                visiting::do_while<    !boost::is_fundamental< T >::value
-                                    && !boost::is_same< T, boost::posix_time::ptime >::value
-                                    && !boost::is_same< T, std::string >::value >::visit( name, *value, *this );
-            }
+            if( !value ) { return; }
+            visiting::do_while<    !boost::is_fundamental< T >::value
+                                && !boost::is_same< T, boost::posix_time::ptime >::value
+                                && !boost::is_same< T, std::string >::value >::visit( name, *value, *this );
         }
 
-        /// apply
-        template < typename K, typename T, typename A >
-        void apply( const K& name, const std::vector< T, A >& value )
+        #if __cplusplus >= 201703L
+        template < typename K, typename T > void apply_next( const K& name, const std::optional< T >& value )
+        {
+            if( !value.has_value() ) { return; } // empty optional: nothing is written
+            visiting::do_while< !(    boost::is_fundamental< T >::value
+                                   || boost::is_same< T, boost::posix_time::ptime >::value
+                                   || boost::is_same< T, std::string >::value ) >::visit( name, *value, *this );
+        }
+        #endif
+
+        template < typename K, typename T, typename A > void apply( const K& name, const std::vector< T, A >& value ) // do we even need it?
         {
             if( !( path_ <= branch_ ) ) { return; } // visit, only if on the branch
             append_( name );
@@ -313,8 +318,7 @@ class to_ptree
         }
 
         /// apply
-        template < typename K, typename T >
-        void apply( const K& name, const T& value )
+        template < typename K, typename T > void apply( const K& name, const T& value )
         {
             if( !( path_ <= branch_ ) ) { return; } // visit, only if on the branch
             const std::string& s = boost::lexical_cast< std::string >( name );
@@ -326,15 +330,10 @@ class to_ptree
         }
 
         /// apply to non-leaf elements
-        template < typename K, typename T >
-        void apply_next( const K& name, const T& value )
-        {
-            comma::visiting::visit( name, value, *this );
-        }
+        template < typename K, typename T > void apply_next( const K& name, const T& value ) { comma::visiting::visit( name, value, *this ); }
 
         /// apply to leaf elements
-        template < typename K, typename T >
-        void apply_final( const K&, const T& value ) { ptree_.put( path_.to_string( '.' ), value_( value ) ); }
+        template < typename K, typename T > void apply_final( const K&, const T& value ) { ptree_.put( path_.to_string( '.' ), value_( value ) ); }
 
     private:
         boost::property_tree::ptree& ptree_;
@@ -352,6 +351,15 @@ class to_ptree
         template < typename T > static T value_( T v ) { return v; }
 };
 
-} // namespace comma
+template < typename T >
+boost::optional< T > property_tree::as( const boost::property_tree::ptree& ptree, const xpath& path, bool use_index, bool permissive )
+{
+    auto subtree = property_tree::get_tree( ptree, path, use_index ); // no subtree at path: there is nothing to convert
+    if( !subtree ) { return boost::none; }
+    comma::from_ptree visitor( *subtree, xpath(), permissive ); // visit the found subtree starting from its own root
+    T result;
+    comma::visiting::apply( visitor ).to( result );
+    return result;
+}
 
-#endif /*COMMA_NAME_VALUE_PTREE_H_*/
+} // namespace comma
diff --git a/name_value/serialize.h b/name_value/serialize.h
index 270ee46d2..4a88dd46c 100644
--- a/name_value/serialize.h
+++ b/name_value/serialize.h
@@ -1,5 +1,6 @@
 // This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2023 Vsevolod Vlaskine
 // All rights reserved.
 //
 // Redistribution and use in source and binary forms, with or without
@@ -29,20 +30,20 @@
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_NAME_VALUE_SERIALIZE_H_
-#define COMMA_NAME_VALUE_SERIALIZE_H_
+#pragma once
 
 #include <fstream>
 #include <iostream>
+#include <sstream>
 #include <string>
 #include <boost/property_tree/json_parser.hpp>
 #include <boost/property_tree/xml_parser.hpp>
 #include <boost/property_tree/ini_parser.hpp>
 #include "../base/exception.h"
-#include "../xpath/xpath.h"
+#include "../string/split.h"
 #include "../visiting/apply.h"
+#include "../xpath/xpath.h"
 #include "impl/json_writer.h"
-
 #include "ptree.h"
 
 namespace comma {
@@ -53,12 +54,14 @@ template < typename T > T read( const std::string& filename, const xpath& root,
 template < typename T > T read( const std::string& filename, const char* root, bool permissive );
 template < typename T > T read( const std::string& filename, const xpath& root );
 template < typename T > T read( const std::string& filename, const char* root );
+template < typename T > T read( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read( const std::string& filename, bool permissive );
 template < typename T > T read( const std::string& filename );
 template < typename T > void read( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read( T& t, const std::string& filename, const char* root );
+template < typename T > void read( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read( T& t, const std::string& filename, bool permissive );
 template < typename T > void read( T& t, const std::string& filename );
 template < typename T > T read( std::istream& stream, const xpath& root, bool permissive );
@@ -81,12 +84,14 @@ template < typename T > T read_json( const std::string& filename, const char* ro
 template < typename T > T read_json( const std::string& filename, const xpath& root );
 template < typename T > T read_json( const std::string& filename, const char* root );
 template < typename T > T read_json( const std::string& filename, bool permissive );
+template < typename T > T read_json( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read_json( const std::string& filename );
 template < typename T > void read_json( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read_json( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read_json( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read_json( T& t, const std::string& filename, const char* root );
 template < typename T > void read_json( T& t, const std::string& filename, bool permissive );
+template < typename T > void read_json( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read_json( T& t, const std::string& filename );
 template < typename T > T read_json( std::istream& stream, const xpath& root, bool permissive );
 template < typename T > T read_json( std::istream& stream, const char* root, bool permissive );
@@ -107,12 +112,14 @@ template < typename T > T read_xml( const std::string& filename, const xpath& ro
 template < typename T > T read_xml( const std::string& filename, const char* root, bool permissive );
 template < typename T > T read_xml( const std::string& filename, const xpath& root );
 template < typename T > T read_xml( const std::string& filename, const char* root );
+template < typename T > T read_xml( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read_xml( const std::string& filename, bool permissive );
 template < typename T > T read_xml( const std::string& filename );
 template < typename T > void read_xml( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read_xml( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read_xml( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read_xml( T& t, const std::string& filename, const char* root );
+template < typename T > void read_xml( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read_xml( T& t, const std::string& filename, bool permissive );
 template < typename T > void read_xml( T& t, const std::string& filename );
 template < typename T > T read_xml( std::istream& stream, const xpath& root, bool permissive );
@@ -128,6 +135,35 @@ template < typename T > void read_xml( T& t, std::istream& stream, const char* r
 template < typename T > void read_xml( T& t, std::istream& stream, bool permissive );
 template < typename T > void read_xml( T& t, std::istream& stream );
 
+/// read object from yaml file or stream
+/// convenience wrappers for comma::property_tree boiler-plate code
+template < typename T > T read_yaml( const std::string& filename, const xpath& root, bool permissive );
+template < typename T > T read_yaml( const std::string& filename, const char* root, bool permissive );
+template < typename T > T read_yaml( const std::string& filename, const xpath& root );
+template < typename T > T read_yaml( const std::string& filename, const char* root );
+template < typename T > T read_yaml( const std::string& filename, bool permissive, bool split_filename );
+template < typename T > T read_yaml( const std::string& filename, bool permissive );
+template < typename T > T read_yaml( const std::string& filename );
+template < typename T > void read_yaml( T& t, const std::string& filename, const xpath& root, bool permissive );
+template < typename T > void read_yaml( T& t, const std::string& filename, const char* root, bool permissive );
+template < typename T > void read_yaml( T& t, const std::string& filename, const xpath& root );
+template < typename T > void read_yaml( T& t, const std::string& filename, const char* root );
+template < typename T > void read_yaml( T& t, const std::string& filename, bool permissive, bool split_filename );
+template < typename T > void read_yaml( T& t, const std::string& filename, bool permissive );
+template < typename T > void read_yaml( T& t, const std::string& filename );
+template < typename T > T read_yaml( std::istream& stream, const xpath& root, bool permissive );
+template < typename T > T read_yaml( std::istream& stream, const char* root, bool permissive );
+template < typename T > T read_yaml( std::istream& stream, const xpath& root );
+template < typename T > T read_yaml( std::istream& stream, const char* root );
+template < typename T > T read_yaml( std::istream& stream, bool permissive );
+template < typename T > T read_yaml( std::istream& stream );
+template < typename T > void read_yaml( T& t, std::istream& stream, const xpath& root, bool permissive );
+template < typename T > void read_yaml( T& t, std::istream& stream, const char* root, bool permissive );
+template < typename T > void read_yaml( T& t, std::istream& stream, const xpath& root );
+template < typename T > void read_yaml( T& t, std::istream& stream, const char* root );
+template < typename T > void read_yaml( T& t, std::istream& stream, bool permissive );
+template < typename T > void read_yaml( T& t, std::istream& stream );
+
 /// read object from path-value file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
 template < typename T > T read_path_value( const std::string& filename, const xpath& root, bool permissive );
@@ -135,11 +171,13 @@ template < typename T > T read_path_value( const std::string& filename, const ch
 template < typename T > T read_path_value( const std::string& filename, const xpath& root );
 template < typename T > T read_path_value( const std::string& filename, const char* root );
 template < typename T > T read_path_value( const std::string& filename, bool permissive );
+template < typename T > T read_path_value( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read_path_value( const std::string& filename );
 template < typename T > void read_path_value( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read_path_value( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read_path_value( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read_path_value( T& t, const std::string& filename, const char* root );
+template < typename T > void read_path_value( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read_path_value( T& t, const std::string& filename, bool permissive );
 template < typename T > void read_path_value( T& t, const std::string& filename );
 template < typename T > T read_path_value( std::istream& stream, const xpath& root, bool permissive );
@@ -161,12 +199,14 @@ template < typename T > T read_ini( const std::string& filename, const xpath& ro
 template < typename T > T read_ini( const std::string& filename, const char* root, bool permissive );
 template < typename T > T read_ini( const std::string& filename, const xpath& root );
 template < typename T > T read_ini( const std::string& filename, const char* root );
+template < typename T > T read_ini( const std::string& filename, bool permissive, bool split_filename );
 template < typename T > T read_ini( const std::string& filename, bool permissive );
 template < typename T > T read_ini( const std::string& filename );
 template < typename T > void read_ini( T& t, const std::string& filename, const xpath& root, bool permissive );
 template < typename T > void read_ini( T& t, const std::string& filename, const char* root, bool permissive );
 template < typename T > void read_ini( T& t, const std::string& filename, const xpath& root );
 template < typename T > void read_ini( T& t, const std::string& filename, const char* root );
+template < typename T > void read_ini( T& t, const std::string& filename, bool permissive, bool split_filename );
 template < typename T > void read_ini( T& t, const std::string& filename, bool permissive );
 template < typename T > void read_ini( T& t, const std::string& filename );
 template < typename T > T read_ini( std::istream& stream, const xpath& root, bool permissive );
@@ -184,41 +224,62 @@ template < typename T > void read_ini( T& t, std::istream& stream );
 
 /// write json object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
-template < typename T > void write_json( const T& t, const std::string& filename, const xpath& root );
-template < typename T > void write_json( const T& t, const std::string& filename, const char* root );
-template < typename T > void write_json( const T& t, const std::string& filename );
-template < typename T > void write_json( const T& t, std::ostream& stream, const xpath& root );
-template < typename T > void write_json( const T& t, std::ostream& stream, const char* root );
-template < typename T > void write_json( const T& t, std::ostream& stream );
+template < typename T > void write_json( const T& t, const std::string& filename, const xpath& root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > void write_json( const T& t, const std::string& filename, const char* root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > void write_json( const T& t, const std::string& filename, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::ostream& write_json( const T& t, std::ostream& stream, const xpath& root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::ostream& write_json( const T& t, std::ostream& stream, const char* root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::ostream& write_json( const T& t, std::ostream& stream, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::string json_to_string( const T& t, const xpath& root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::string json_to_string( const T& t, const char* root, bool pretty = true, bool unquote_numbers = true );
+template < typename T > std::string json_to_string( const T& t, bool pretty = true, bool unquote_numbers = true );
 
 /// write xml object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
 template < typename T > void write_xml( const T& t, const std::string& filename, const xpath& root );
 template < typename T > void write_xml( const T& t, const std::string& filename, const char* root );
 template < typename T > void write_xml( const T& t, const std::string& filename );
-template < typename T > void write_xml( const T& t, std::ostream& stream, const xpath& root );
-template < typename T > void write_xml( const T& t, std::ostream& stream, const char* root );
-template < typename T > void write_xml( const T& t, std::ostream& stream );
+template < typename T > std::ostream& write_xml( const T& t, std::ostream& stream, const xpath& root );
+template < typename T > std::ostream& write_xml( const T& t, std::ostream& stream, const char* root );
+template < typename T > std::ostream& write_xml( const T& t, std::ostream& stream );
+
+/// write yaml object to file or stream
+/// convenience wrappers for comma::property_tree boiler-plate code
+template < typename T > void write_yaml( const T& t, const std::string& filename, const xpath& root );
+template < typename T > void write_yaml( const T& t, const std::string& filename, const char* root );
+template < typename T > void write_yaml( const T& t, const std::string& filename );
+template < typename T > std::ostream& write_yaml( const T& t, std::ostream& stream, const xpath& root );
+template < typename T > std::ostream& write_yaml( const T& t, std::ostream& stream, const char* root );
+template < typename T > std::ostream& write_yaml( const T& t, std::ostream& stream );
 
 /// write path-value object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
 /// @todo parametrize on equality sign and delimiter?
-template < typename T > void write_path_value( const T& t, const std::string& filename, const xpath& root );
+template < typename T > void write_path_value( const T& t, const std::string& filename, const xpath& root, const std::string& prefix = "" );
 template < typename T > void write_path_value( const T& t, const std::string& filename, const char* root );
 template < typename T > void write_path_value( const T& t, const std::string& filename );
-template < typename T > void write_path_value( const T& t, std::ostream& stream, const xpath& root, bool const unquote_numbers = false );
-template < typename T > void write_path_value( const T& t, std::ostream& stream, const char* root );
-template < typename T > void write_path_value( const T& t, std::ostream& stream );
+template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream, const xpath& root, bool unquote_numbers = false, const std::string& prefix = "" );
+template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream, const char* root );
+template < typename T > std::ostream& write_path_value( const T& t, std::ostream& stream );
 
 /// write ini object to file or stream
 /// convenience wrappers for comma::property_tree boiler-plate code
 template < typename T > void write_ini( const T& t, const std::string& filename, const xpath& root );
 template < typename T > void write_ini( const T& t, const std::string& filename, const char* root );
 template < typename T > void write_ini( const T& t, const std::string& filename );
-template < typename T > void write_ini( const T& t, std::ostream& stream, const xpath& root );
-template < typename T > void write_ini( const T& t, std::ostream& stream, const char* root );
-template < typename T > void write_ini( const T& t, std::ostream& stream );
+template < typename T > std::ostream& write_ini( const T& t, std::ostream& stream, const xpath& root );
+template < typename T > std::ostream& write_ini( const T& t, std::ostream& stream, const char* root );
+template < typename T > std::ostream& write_ini( const T& t, std::ostream& stream );
+
+namespace impl {
 
+inline std::pair< std::string, xpath > _split( const std::string& filename ) // returns { file name, root xpath } taken from the ':'-separated parts of filename
+{
+    const auto& s = comma::split_tail( filename, 2, ':' );
+    return s.size() < 2 ? std::pair< std::string, xpath >{ filename, xpath() } : std::pair< std::string, xpath >{ s[0], xpath( s[1] ) }; // '< 2' (rather than '== 1') keeps s[0] and s[1] from being indexed when fewer than two parts come back
+}
+
+} // namespace impl {
 
 template < typename T > inline void read_json( T& t, const std::string& filename, const xpath& root, bool permissive )
 {
@@ -240,6 +301,7 @@ template < typename T > inline T read_json( const std::string& filename, const x
 template < typename T > inline T read_json( const std::string& filename, const char* root, bool permissive ) { return root ? read_json< T >( filename, xpath( root ), permissive ) : read_json< T >( filename, permissive ); }
 template < typename T > inline T read_json( const std::string& filename, const xpath& root ) { return read_json< T >( filename, root, true ); }
 template < typename T > inline T read_json( const std::string& filename, const char* root ) { return root ? read_json< T >( filename, xpath( root ), true ) : read_json< T >( filename, true ); }
+template < typename T > inline T read_json( const std::string& filename, bool permissive, bool split_filename ) { T t; read_json< T >( t, filename, permissive, split_filename ); return t; }
 template < typename T > inline T read_json( const std::string& filename, bool permissive ) { return read_json< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read_json( const std::string& filename ) { return read_json< T >( filename, xpath(), true ); }
 template < typename T > inline T read_json( std::istream& stream, const xpath& root, bool permissive ) { T t; read_json< T >( t, stream, root, permissive ); return t; }
@@ -251,6 +313,11 @@ template < typename T > inline T read_json( std::istream& stream ) { return read
 template < typename T > inline void read_json( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_json< T >( t, filename, xpath( root ), permissive ); } else { read_json< T >( t, filename, permissive ); } }
 template < typename T > inline void read_json( T& t, const std::string& filename, const xpath& root ) { read_json< T >( t, filename, root, true ); }
 template < typename T > inline void read_json( T& t, const std::string& filename, const char* root ) { if( root ) { read_json< T >( t, filename, xpath( root ), true ); } else { read_json< T >( t, filename, true ); } }
+template < typename T > inline void read_json( T& t, const std::string& filename, bool permissive, bool split_filename )
+{ // when split_filename is set, impl::_split() extracts the file name and the root xpath from filename; otherwise the root xpath is empty
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_json< T >( t, p.first, p.second, permissive ); // no 'return': the function is void, same as the xml/yaml/path-value/ini counterparts
+}
 template < typename T > inline void read_json( T& t, const std::string& filename, bool permissive ) { read_json< T >( t, filename, xpath(), permissive ); }
 template < typename T > inline void read_json( T& t, const std::string& filename ) { return read_json< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read_json( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_json< T >( t, stream, xpath( root ), permissive ); } else { read_json< T >( t, stream, permissive ); } }
@@ -279,6 +346,7 @@ template < typename T > inline T read_xml( const std::string& filename, const xp
 template < typename T > inline T read_xml( const std::string& filename, const char* root, bool permissive ) { return root ? read_xml< T >( filename, xpath( root ), permissive ) : read_xml< T >( filename, permissive ); }
 template < typename T > inline T read_xml( const std::string& filename, const xpath& root ) { return read_xml< T >( filename, root, true ); }
 template < typename T > inline T read_xml( const std::string& filename, const char* root ) { return root ? read_xml< T >( filename, xpath( root ), true ) : read_xml< T >( filename, true ); }
+template < typename T > inline T read_xml( const std::string& filename, bool permissive, bool split_filename ) { T t; read_xml< T >( t, filename, permissive, split_filename ); return t; }
 template < typename T > inline T read_xml( const std::string& filename, bool permissive ) { return read_xml< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read_xml( const std::string& filename ) { return read_xml< T >( filename, xpath(), true ); }
 template < typename T > inline T read_xml( std::istream& stream, const xpath& root, bool permissive ) { T t; read_xml< T >( t, stream, root, permissive ); return t; }
@@ -290,14 +358,64 @@ template < typename T > inline T read_xml( std::istream& stream ) { return read_
 template < typename T > inline void read_xml( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_xml< T >( t, filename, xpath( root ), permissive ); } else { read_xml< T >( t, filename, permissive ); } }
 template < typename T > inline void read_xml( T& t, const std::string& filename, const xpath& root ) { read_xml< T >( t, filename, root, true ); }
 template < typename T > inline void read_xml( T& t, const std::string& filename, const char* root ) { if( root ) { read_xml< T >( t, filename, xpath( root ), true ); } else { read_xml< T >( t, filename, true ); } }
+template < typename T > inline void read_xml( T& t, const std::string& filename, bool permissive, bool split_filename )
+{
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_xml< T >( t, p.first, p.second, permissive );
+}
 template < typename T > inline void read_xml( T& t, const std::string& filename, bool permissive ) { read_xml< T >( t, filename, xpath(), permissive ); }
-template < typename T > inline void read_xml( T& t, const std::string& filename ) { return read_xml< T >( t, filename, xpath(), true ); }
+template < typename T > inline void read_xml( T& t, const std::string& filename ) { read_xml< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read_xml( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_xml< T >( t, stream, xpath( root ), permissive ); } else { read_xml< T >( t, stream, permissive ); } }
 template < typename T > inline void read_xml( T& t, std::istream& stream, const xpath& root ) { read_xml< T >( t, stream, root, true ); }
 template < typename T > inline void read_xml( T& t, std::istream& stream, const char* root ) { if( root ) { read_xml< T >( t, stream, xpath( root ), true ); } else { read_xml< T >( t, stream, true ); } }
 template < typename T > inline void read_xml( T& t, std::istream& stream, bool permissive ) { read_xml< T >( t, stream, xpath(), permissive ); }
 template < typename T > inline void read_xml( T& t, std::istream& stream ) { read_xml< T >( t, stream, xpath(), true ); }
 
+template < typename T > inline void read_yaml( T& t, const std::string& filename, const xpath& root, bool permissive )
+{
+    std::ifstream ifs( &filename[0] );
+    if( !ifs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << filename << "\"" ); }
+    read_yaml< T >( t, ifs, root, permissive );
+    ifs.close();
+}
+
+template < typename T > inline void read_yaml( T& t, std::istream& stream, const xpath& root, bool permissive )
+{
+    boost::property_tree::ptree p;
+    comma::property_tree::read_yaml( stream, p );
+    comma::from_ptree from_ptree( p, root, permissive );
+    comma::visiting::apply( from_ptree ).to( t );
+}
+
+template < typename T > inline T read_yaml( const std::string& filename, const xpath& root, bool permissive ) { T t; read_yaml< T >( t, filename, root, permissive ); return t; }
+template < typename T > inline T read_yaml( const std::string& filename, const char* root, bool permissive ) { return root ? read_yaml< T >( filename, xpath( root ), permissive ) : read_yaml< T >( filename, permissive ); }
+template < typename T > inline T read_yaml( const std::string& filename, const xpath& root ) { return read_yaml< T >( filename, root, true ); }
+template < typename T > inline T read_yaml( const std::string& filename, const char* root ) { return root ? read_yaml< T >( filename, xpath( root ), true ) : read_yaml< T >( filename, true ); }
+template < typename T > inline T read_yaml( const std::string& filename, bool permissive, bool split_filename ) { T t; read_yaml< T >( t, filename, permissive, split_filename ); return t; }
+template < typename T > inline T read_yaml( const std::string& filename, bool permissive ) { return read_yaml< T >( filename, xpath(), permissive ); }
+template < typename T > inline T read_yaml( const std::string& filename ) { return read_yaml< T >( filename, xpath(), true ); }
+template < typename T > inline T read_yaml( std::istream& stream, const xpath& root, bool permissive ) { T t; read_yaml< T >( t, stream, root, permissive ); return t; }
+template < typename T > inline T read_yaml( std::istream& stream, const char* root, bool permissive ) { return root ? read_yaml< T >( stream, xpath( root ), permissive ) : read_yaml< T >( stream, permissive ); }
+template < typename T > inline T read_yaml( std::istream& stream, const xpath& root ) { return read_yaml< T >( stream, root, true ); }
+template < typename T > inline T read_yaml( std::istream& stream, const char* root ) { return root ? read_yaml< T >( stream, xpath( root ), true ) : read_yaml< T >( stream, true ); }
+template < typename T > inline T read_yaml( std::istream& stream, bool permissive ) { return read_yaml< T >( stream, xpath(), permissive ); }
+template < typename T > inline T read_yaml( std::istream& stream ) { return read_yaml< T >( stream, xpath(), true ); }
+template < typename T > inline void read_yaml( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_yaml< T >( t, filename, xpath( root ), permissive ); } else { read_yaml< T >( t, filename, permissive ); } }
+template < typename T > inline void read_yaml( T& t, const std::string& filename, const xpath& root ) { read_yaml< T >( t, filename, root, true ); }
+template < typename T > inline void read_yaml( T& t, const std::string& filename, const char* root ) { if( root ) { read_yaml< T >( t, filename, xpath( root ), true ); } else { read_yaml< T >( t, filename, true ); } }
+template < typename T > inline void read_yaml( T& t, const std::string& filename, bool permissive, bool split_filename )
+{
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_yaml< T >( t, p.first, p.second, permissive );
+}
+template < typename T > inline void read_yaml( T& t, const std::string& filename, bool permissive ) { read_yaml< T >( t, filename, xpath(), permissive ); }
+template < typename T > inline void read_yaml( T& t, const std::string& filename ) { read_yaml< T >( t, filename, xpath(), true ); }
+template < typename T > inline void read_yaml( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_yaml< T >( t, stream, xpath( root ), permissive ); } else { read_yaml< T >( t, stream, permissive ); } }
+template < typename T > inline void read_yaml( T& t, std::istream& stream, const xpath& root ) { read_yaml< T >( t, stream, root, true ); }
+template < typename T > inline void read_yaml( T& t, std::istream& stream, const char* root ) { if( root ) { read_yaml< T >( t, stream, xpath( root ), true ); } else { read_yaml< T >( t, stream, true ); } }
+template < typename T > inline void read_yaml( T& t, std::istream& stream, bool permissive ) { read_yaml< T >( t, stream, xpath(), permissive ); }
+template < typename T > inline void read_yaml( T& t, std::istream& stream ) { read_yaml< T >( t, stream, xpath(), true ); }
+
 template < typename T > inline void read_path_value( T& t, std::istream& stream, const xpath& root, bool permissive )
 {
     boost::property_tree::ptree p;
@@ -318,6 +436,7 @@ template < typename T > inline T read_path_value( const std::string& filename, c
 template < typename T > inline T read_path_value( const std::string& filename, const char* root, bool permissive ) { return root ? read_path_value< T >( filename, xpath( root ), permissive ) : read_path_value< T >( filename, permissive ); }
 template < typename T > inline T read_path_value( const std::string& filename, const xpath& root ) { return read_path_value< T >( filename, root, true ); }
 template < typename T > inline T read_path_value( const std::string& filename, const char* root ) { return root ? read_path_value< T >( filename, xpath( root ), true ) : read_path_value< T >( filename, true ); }
+template < typename T > inline T read_path_value( const std::string& filename, bool permissive, bool split_filename ) { T t; read_path_value< T >( t, filename, permissive, split_filename ); return t; }
 template < typename T > inline T read_path_value( const std::string& filename, bool permissive ) { return read_path_value< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read_path_value( const std::string& filename ) { return read_path_value< T >( filename, xpath(), true ); }
 template < typename T > inline T read_path_value( std::istream& stream, const xpath& root, bool permissive ) { T t; read_path_value< T >( t, stream, root, permissive ); return t; }
@@ -329,6 +448,11 @@ template < typename T > inline T read_path_value( std::istream& stream ) { retur
 template < typename T > inline void read_path_value( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_path_value< T >( t, filename, xpath( root ), permissive ); } else { read_path_value< T >( t, filename, permissive ); } }
 template < typename T > inline void read_path_value( T& t, const std::string& filename, const xpath& root ) { read_path_value< T >( t, filename, root, true ); }
 template < typename T > inline void read_path_value( T& t, const std::string& filename, const char* root ) { if( root ) { read_path_value< T >( t, filename, xpath( root ), true ); } else { read_path_value< T >( t, filename, true ); } }
+template < typename T > inline void read_path_value( T& t, const std::string& filename, bool permissive, bool split_filename )
+{
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_path_value< T >( t, p.first, p.second, permissive );
+}
 template < typename T > inline void read_path_value( T& t, const std::string& filename, bool permissive ) { read_path_value< T >( t, filename, xpath(), permissive ); }
 template < typename T > inline void read_path_value( T& t, const std::string& filename ) { return read_path_value< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read_path_value( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_path_value< T >( t, stream, xpath( root ), permissive ); } else { read_path_value< T >( t, stream, permissive ); } }
@@ -357,6 +481,7 @@ template < typename T > inline T read_ini( const std::string& filename, const xp
 template < typename T > inline T read_ini( const std::string& filename, const char* root, bool permissive ) { return root ? read_ini< T >( filename, xpath( root ), permissive ) : read_ini< T >( filename, permissive ); }
 template < typename T > inline T read_ini( const std::string& filename, const xpath& root ) { return read_ini< T >( filename, root, true ); }
 template < typename T > inline T read_ini( const std::string& filename, const char* root ) { return root ? read_ini< T >( filename, xpath( root ), true ) : read_ini< T >( filename, true ); }
+template < typename T > inline T read_ini( const std::string& filename, bool permissive, bool split_filename ) { T t; read_ini< T >( t, filename, permissive, split_filename ); return t; }
 template < typename T > inline T read_ini( const std::string& filename, bool permissive ) { return read_ini< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read_ini( const std::string& filename ) { return read_ini< T >( filename, xpath(), true ); }
 template < typename T > inline T read_ini( std::istream& stream, const xpath& root, bool permissive ) { T t; read_ini< T >( t, stream, root, permissive ); return t; }
@@ -368,6 +493,11 @@ template < typename T > inline T read_ini( std::istream& stream ) { return read_
 template < typename T > inline void read_ini( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read_ini< T >( t, filename, xpath( root ), permissive ); } else { read_ini< T >( t, filename, permissive ); } }
 template < typename T > inline void read_ini( T& t, const std::string& filename, const xpath& root ) { read_ini< T >( t, filename, root, true ); }
 template < typename T > inline void read_ini( T& t, const std::string& filename, const char* root ) { if( root ) { read_ini< T >( t, filename, xpath( root ), true ); } else { read_ini< T >( t, filename, true ); } }
+template < typename T > inline void read_ini( T& t, const std::string& filename, bool permissive, bool split_filename )
+{
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read_ini< T >( t, p.first, p.second, permissive );
+}
 template < typename T > inline void read_ini( T& t, const std::string& filename, bool permissive ) { read_ini< T >( t, filename, xpath(), permissive ); }
 template < typename T > inline void read_ini( T& t, const std::string& filename ) { return read_ini< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read_ini( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read_ini< T >( t, stream, xpath( root ), permissive ); } else { read_ini< T >( t, stream, permissive ); } }
@@ -376,27 +506,38 @@ template < typename T > inline void read_ini( T& t, std::istream& stream, const
 template < typename T > inline void read_ini( T& t, std::istream& stream, bool permissive ) { read_ini< T >( t, stream, xpath(), permissive ); }
 template < typename T > inline void read_ini( T& t, std::istream& stream ) { read_ini< T >( t, stream, xpath(), true ); }
 
-template < typename T > inline void write_json( const T& t, const std::string& filename, const xpath& root )
+template < typename T > inline void write_json( const T& t, const std::string& filename, const xpath& root, bool pretty, bool unquote_numbers )
 {
     std::ofstream ofs( &filename[0] );
     if( !ofs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << filename << "\"" ); }
-    write_json< T >( t, ofs, root );
+    write_json< T >( t, ofs, root, pretty, unquote_numbers );
     ofs.close();
 }
 
-template < typename T > inline void write_json( const T& t, std::ostream& stream, const xpath& root )
+template < typename T > inline std::ostream& write_json( const T& t, std::ostream& stream, const xpath& root, bool pretty, bool unquote_numbers )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
-    comma::name_value::impl::write_json( stream, p );
+    comma::name_value::impl::write_json( stream, p, pretty, unquote_numbers );
+    return stream;
 }
 
-template < typename T > inline void write_json( const T& t, const std::string& filename, const char* root ) { write_json( t, filename, xpath( root ) ); }
-template < typename T > inline void write_json( const T& t, const std::string& filename ) { write_json( t, filename, xpath() ); }
-template < typename T > inline void write_json( const T& t, std::ostream& stream, const char* root ) { write_json( t, stream, xpath( root ) ); }
-template < typename T > inline void write_json( const T& t, std::ostream& stream ) { write_json( t, stream, xpath() ); }
+template < typename T > inline void write_json( const T& t, const std::string& filename, const char* root, bool pretty, bool unquote_numbers ) { write_json( t, filename, xpath( root ), pretty, unquote_numbers ); }
+template < typename T > inline void write_json( const T& t, const std::string& filename, bool pretty, bool unquote_numbers ) { write_json( t, filename, xpath(), pretty, unquote_numbers ); }
+template < typename T > inline std::ostream& write_json( const T& t, std::ostream& stream, const char* root, bool pretty, bool unquote_numbers ) { return write_json( t, stream, xpath( root ), pretty, unquote_numbers ); }
+template < typename T > inline std::ostream& write_json( const T& t, std::ostream& stream, bool pretty, bool unquote_numbers ) { return write_json( t, stream, xpath(), pretty, unquote_numbers ); }
+
+template < typename T > inline std::string json_to_string( const T& t, const char* root, bool pretty, bool unquote_numbers ) { return json_to_string( t, xpath( root ), pretty, unquote_numbers ); }
+template < typename T > inline std::string json_to_string( const T& t, bool pretty, bool unquote_numbers ) { return json_to_string( t, xpath(), pretty, unquote_numbers ); }
+
+template < typename T > inline std::string json_to_string( const T& t, const xpath& root, bool pretty, bool unquote_numbers )
+{
+    std::ostringstream os;
+    write_json( t, os, root, pretty, unquote_numbers );
+    return os.str();
+}
 
 template < typename T > inline void write_xml( const T& t, const std::string& filename, const xpath& root )
 {
@@ -406,49 +547,75 @@ template < typename T > inline void write_xml( const T& t, const std::string& fi
     ofs.close();
 }
 
-template < typename T > inline void write_xml( const T& t, std::ostream& stream, const xpath& root )
+template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream, const xpath& root )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
     boost::property_tree::write_xml( stream, p );
+    return stream;
 }
 
 template < typename T > inline void write_xml( const T& t, const std::string& filename, const char* root ) { write_xml( t, filename, xpath( root ) ); }
 template < typename T > inline void write_xml( const T& t, const std::string& filename ) { write_xml( t, filename, xpath() ); }
-template < typename T > inline void write_xml( const T& t, std::ostream& stream, const char* root ) { write_xml( t, stream, xpath( root ) ); }
-template < typename T > inline void write_xml( const T& t, std::ostream& stream ) { write_xml( t, stream, xpath() ); }
+template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream, const char* root ) { return write_xml( t, stream, xpath( root ) ); }
+template < typename T > inline std::ostream& write_xml( const T& t, std::ostream& stream ) { return write_xml( t, stream, xpath() ); }
+
+template < typename T > inline void write_yaml( const T& t, const std::string& filename, const xpath& root )
+{
+    std::ofstream ofs( &filename[0] );
+    if( !ofs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << filename << "\"" ); }
+    write_yaml< T >( t, ofs, root );
+    ofs.close();
+}
+
+template < typename T > inline std::ostream& write_yaml( const T& t, std::ostream& stream, const xpath& root )
+{
+    boost::property_tree::ptree p;
+    comma::to_ptree to_ptree( p, root );
+    comma::visiting::apply( to_ptree ).to( t );
+    stream.precision( 16 ); // quick and dirty
+    comma::property_tree::write_yaml( stream, p );
+    return stream;
+}
+
+template < typename T > inline void write_yaml( const T& t, const std::string& filename, const char* root ) { write_yaml( t, filename, xpath( root ) ); }
+template < typename T > inline void write_yaml( const T& t, const std::string& filename ) { write_yaml( t, filename, xpath() ); }
+template < typename T > inline std::ostream& write_yaml( const T& t, std::ostream& stream, const char* root ) { return write_yaml( t, stream, xpath( root ) ); }
+template < typename T > inline std::ostream& write_yaml( const T& t, std::ostream& stream ) { return write_yaml( t, stream, xpath() ); }
 
-template < typename T > inline void write_path_value( const T& t, std::ostream& stream, const xpath& root, bool const unquote_numbers )
+template < typename T > inline std::ostream& write_path_value( const T& t, std::ostream& stream, const xpath& root, bool unquote_numbers, const std::string& prefix )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
-    comma::property_tree::to_path_value( stream, p, comma::property_tree::disabled, '=', '\n', xpath(), unquote_numbers );
+    comma::property_tree::to_path_value( stream, p, comma::property_tree::disabled, '=', '\n', xpath(), unquote_numbers, prefix );
+    return stream;
 }
 
-template < typename T > inline void write_path_value( const T& t, const std::string& filename, const xpath& root )
+template < typename T > inline void write_path_value( const T& t, const std::string& filename, const xpath& root, const std::string& prefix )
 {
     std::ofstream ofs( &filename[0] );
     if( !ofs.is_open() ) { COMMA_THROW( comma::exception, "failed to open \"" << filename << "\"" ); }
-    write_path_value< T >( t, ofs, root );
+    write_path_value< T >( t, ofs, root, false, prefix ); // stream overload takes ( t, stream, root, unquote_numbers, prefix ): pass unquote_numbers = false (its default) so that prefix lands in the 5th parameter
     ofs.close();
 }
 
 template < typename T > inline void write_path_value( const T& t, const std::string& filename, const char* root ) { write_path_value( t, filename, xpath( root ) ); }
 template < typename T > inline void write_path_value( const T& t, const std::string& filename ) { write_path_value( t, filename, xpath() ); }
-template < typename T > inline void write_path_value( const T& t, std::ostream& stream, const char* root ) { write_path_value( t, stream, xpath( root ) ); }
-template < typename T > inline void write_path_value( const T& t, std::ostream& stream ) { write_path_value( t, stream, xpath() ); }
+template < typename T > inline std::ostream& write_path_value( const T& t, std::ostream& stream, const char* root ) { return write_path_value( t, stream, xpath( root ) ); }
+template < typename T > inline std::ostream& write_path_value( const T& t, std::ostream& stream ) { return write_path_value( t, stream, xpath() ); }
 
-template < typename T > inline void write_ini( const T& t, std::ostream& stream, const xpath& root )
+template < typename T > inline std::ostream& write_ini( const T& t, std::ostream& stream, const xpath& root )
 {
     boost::property_tree::ptree p;
     comma::to_ptree to_ptree( p, root );
     comma::visiting::apply( to_ptree ).to( t );
     stream.precision( 16 ); // quick and dirty
     boost::property_tree::write_ini( stream, p );
+    return stream;
 }
 
 template < typename T > inline void write_ini( const T& t, const std::string& filename, const xpath& root )
@@ -461,9 +628,8 @@ template < typename T > inline void write_ini( const T& t, const std::string& fi
 
 template < typename T > inline void write_ini( const T& t, const std::string& filename, const char* root ) { write_ini( t, filename, xpath( root ) ); }
 template < typename T > inline void write_ini( const T& t, const std::string& filename ) { write_ini( t, filename, xpath() ); }
-template < typename T > inline void write_ini( const T& t, std::ostream& stream, const char* root ) { write_ini( t, stream, xpath( root ) ); }
-template < typename T > inline void write_ini( const T& t, std::ostream& stream ) { write_ini( t, stream, xpath() ); }
-
+template < typename T > inline std::ostream& write_ini( const T& t, std::ostream& stream, const char* root ) { return write_ini( t, stream, xpath( root ) ); }
+template < typename T > inline std::ostream& write_ini( const T& t, std::ostream& stream ) { return write_ini( t, stream, xpath() ); }
 
 template < typename T > inline void read( T& t, std::istream& stream, const xpath& root, bool permissive )
 {
@@ -485,6 +651,7 @@ template < typename T > inline T read( const std::string& filename, const xpath&
 template < typename T > inline T read( const std::string& filename, const char* root, bool permissive ) { return root ? read_json< T >( filename, xpath( root ), permissive ) : read< T >( filename, permissive ); }
 template < typename T > inline T read( const std::string& filename, const xpath& root ) { return read< T >( filename, root, true ); }
 template < typename T > inline T read( const std::string& filename, const char* root ) { return root ? read< T >( filename, xpath( root ), true ) : read< T >( filename, true ); }
+template < typename T > inline T read( const std::string& filename, bool permissive, bool split_filename ) { T t; read< T >( t, filename, permissive, split_filename ); return t; } // by-value convenience wrapper around read( t, filename, permissive, split_filename )
 template < typename T > inline T read( const std::string& filename, bool permissive ) { return read< T >( filename, xpath(), permissive ); }
 template < typename T > inline T read( const std::string& filename ) { return read< T >( filename, xpath(), true ); }
 template < typename T > inline T read( std::istream& stream, const xpath& root, bool permissive ) { T t; read< T >( t, stream, root, permissive ); return t; }
@@ -496,6 +663,11 @@ template < typename T > inline T read( std::istream& stream ) { return read< T >
 template < typename T > inline void read( T& t, const std::string& filename, const char* root, bool permissive ) { if( root ) { read< T >( t, filename, xpath( root ), permissive ); } else { read< T >( t, filename, permissive ); } }
 template < typename T > inline void read( T& t, const std::string& filename, const xpath& root ) { read< T >( t, filename, root, true ); }
 template < typename T > inline void read( T& t, const std::string& filename, const char* root ) { if( root ) { read< T >( t, filename, xpath( root ), true ); } else { read< T >( t, filename, true ); } }
+template < typename T > inline void read( T& t, const std::string& filename, bool permissive, bool split_filename )
+{ // if split_filename is set, impl::_split() supplies the file name and the root xpath (presumably from a <file>:<path> argument; todo: confirm against impl::_split); otherwise filename is used as is with an empty root
+    std::pair< std::string, xpath > p = split_filename ? impl::_split( filename ) : std::pair< std::string, xpath >{ filename, xpath() };
+    read< T >( t, p.first, p.second, permissive );
+}
 template < typename T > inline void read( T& t, const std::string& filename, bool permissive ) { read< T >( t, filename, xpath(), permissive ); }
 template < typename T > inline void read( T& t, const std::string& filename ) { return read< T >( t, filename, xpath(), true ); }
 template < typename T > inline void read( T& t, std::istream& stream, const char* root, bool permissive ) { if( root ) { read< T >( t, stream, xpath( root ), permissive ); } else { read< T >( t, stream, permissive ); } }
@@ -505,5 +677,3 @@ template < typename T > inline void read( T& t, std::istream& stream, bool permi
 template < typename T > inline void read( T& t, std::istream& stream ) { read< T >( t, stream, xpath(), true ); }
 
 } // namespace comma {
-
-#endif // COMMA_NAME_VALUE_SERIALIZE_H_
diff --git a/name_value/test/CMakeLists.txt b/name_value/test/CMakeLists.txt
index 000281672..e95a9deb3 100644
--- a/name_value/test/CMakeLists.txt
+++ b/name_value/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET( KIT name_value )
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*_test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_xpath comma_string comma_name_value ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# unit tests for the name_value kit: a single gtest executable built from the *test.cpp files globbed below
+set( KIT name_value )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_xpath comma_string comma_name_value ${GTEST_BOTH_LIBRARIES} pthread )
+# refer to the test executable by its target name, i.e. by the same variable that was used to create it above
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    # install as a target rather than as a file copied from ${PROJECT_BINARY_DIR}/bin (the previous approach),
+    # so that the install rule follows the target instead of a hard-coded path to the binary
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif( INSTALL_TESTS )
diff --git a/name_value/test/eval/data/input_3 b/name_value/test/eval/data/input_3
index 936c66d69..e3bd4042d 100644
--- a/name_value/test/eval/data/input_3
+++ b/name_value/test/eval/data/input_3
@@ -7,4 +7,4 @@ x != 3
 x != "some string"
 
 # integer division
-x = 11 / 5
+x = 11 // 5
diff --git a/name_value/test/eval/data/stderr_13 b/name_value/test/eval/data/stderr_13
index 49a434b97..ec96e98a6 100644
--- a/name_value/test/eval/data/stderr_13
+++ b/name_value/test/eval/data/stderr_13
@@ -1 +1,2 @@
-name-value-eval: line 1: AttributeError: OBJ instance has no attribute 'whatever'
+python2:name-value-eval: line 1: AttributeError: OBJ instance has no attribute 'whatever'
+python3:name-value-eval: line 1: AttributeError: 'OBJ' object has no attribute 'whatever'
\ No newline at end of file
diff --git a/name_value/test/eval/data/stderr_14 b/name_value/test/eval/data/stderr_14
index 224f578e7..cfa22eede 100644
--- a/name_value/test/eval/data/stderr_14
+++ b/name_value/test/eval/data/stderr_14
@@ -1 +1,2 @@
-name-value-eval: line 2: AttributeError: OBJ instance has no attribute '__getitem__'
+python2:name-value-eval: line 2: AttributeError: OBJ instance has no attribute '__getitem__'
+python3:name-value-eval: line 2: TypeError: 'OBJ' object does not support indexing
\ No newline at end of file
diff --git a/name_value/test/eval/data/stderr_27 b/name_value/test/eval/data/stderr_27
index 811dc83b2..e2105bdbe 100644
--- a/name_value/test/eval/data/stderr_27
+++ b/name_value/test/eval/data/stderr_27
@@ -1 +1,2 @@
-name-value-eval: TypeError: variable "route" is used in an expression but is an object (example: "a/b = 3; a < 0")
+python2:name-value-eval: TypeError: variable "route" is used in an expression but is an object (example: "a/b = 3; a < 0")
+python3:name-value-eval: line 1: TypeError: unorderable types: OBJ() > int()
\ No newline at end of file
diff --git a/name_value/test/eval/data/stderr_8 b/name_value/test/eval/data/stderr_8
index 790deb67b..0570fd918 100644
--- a/name_value/test/eval/data/stderr_8
+++ b/name_value/test/eval/data/stderr_8
@@ -1 +1,2 @@
-name-value-eval: line 1: TypeError: cannot concatenate 'str' and 'int' objects
+python2:name-value-eval: line 1: TypeError: cannot concatenate 'str' and 'int' objects
+python3:name-value-eval: line 1: TypeError: Can't convert 'int' object to str implicitly
\ No newline at end of file
diff --git a/name_value/test/eval/test b/name_value/test/eval/test
index b6f7de6e9..7edada245 100755
--- a/name_value/test/eval/test
+++ b/name_value/test/eval/test
@@ -11,7 +11,8 @@ if [[ ! -d "$data_dir" ]]; then
 fi
 
 tmpdir="output/tmp"
-mkdir $tmpdir
+rm -rf "$tmpdir" # start every run from an empty scratch directory
+mkdir -p "$tmpdir" # options go before operands: 'mkdir dir -p' relies on GNU argument permutation
 verbose=0
 
 while [[ $# -gt 0 ]]; do
@@ -27,20 +28,38 @@ done
 variables="$data_dir/variable_vals"
 pass_count=0
 total_count=0
+#python_version="$( python -c "from __future__ import print_function; import sys; print( sys.version_info.major )" )" # sigh...
+#python_prefix="python${python_version}:"
+python_prefix="python3:"
 
-for input in $data_dir/input*; do
+for input in $data_dir/input_*; do # for input in $data_dir/input*; do
     (( ++total_count ))
     suffix=${input#*input_}
     if (( verbose )); then echo "$name: running test $suffix" >&2; fi
     stdout="$tmpdir/stdout.$suffix"
     stderr="$tmpdir/stderr.$suffix"
+    if grep -q "^$python_prefix" < "$data_dir/stderr_$suffix"; then # anchored like the extraction below, so that a prefix mentioned mid-line does not count
+        expected_stderr="$( grep "^$python_prefix" < "$data_dir/stderr_$suffix" | sed "s#^$python_prefix##" )" # keep only the lines for this python version, with the prefix stripped
+    else
+        expected_stderr="$( cat "$data_dir/stderr_$suffix" )" # no version-specific lines: the whole file is the expected stderr
+    fi
     cat $input | name-value-eval --variables=$variables --test > $stdout 2> $stderr
+    actual_stderr=$( cat $stderr )
     if ! cmp --quiet $stdout $data_dir/stdout_$suffix; then
         echo "$name: test failed for input_$suffix (stdout is different):" >&2
         diff $stdout $data_dir/stdout_$suffix >&2
-    elif ! cmp --quiet $stderr $data_dir/stderr_$suffix; then
-        echo "$name: test failed for input_$suffix (stderr is different):" >&2
-        diff $stderr $data_dir/stderr_$suffix >&2
+    elif [[ "$actual_stderr" != "$expected_stderr" ]]; then
+        # error messages keep changing from one python version to the next: unless the python2 expectations are selected, only the third colon-separated field of stderr has to match (e.g. the exception type in "name-value-eval: line 1: TypeError: ...")
+        if [[ "$python_prefix" == "python2:" ]] || [[ "$( cut -d: -f3 <<< "$actual_stderr" )" != "$( cut -d: -f3 <<< "$expected_stderr" )" ]]; then
+            echo "$name: test failed for input_$suffix (stderr is different); expected error message:" >&2
+            echo "$expected_stderr" | sed 's#^#    #' >&2
+            echo "actual error message:" >&2
+            echo "$actual_stderr" | sed 's#^#    #' >&2
+        else
+            (( ++pass_count ))
+            if (( verbose )); then echo "$name: test $suffix passed" >&2; fi
+            echo $(basename "$input" )"=\"pass\""
+        fi
     else
         (( ++pass_count ))
         if (( verbose )); then echo "$name: test $suffix passed" >&2; fi
diff --git a/name_value/test/name-value-convert/expected b/name_value/test/name-value-convert/expected
new file mode 100644
index 000000000..ba8ce1e95
--- /dev/null
+++ b/name_value/test/name-value-convert/expected
@@ -0,0 +1,34 @@
+quoting[0]/output='{"a":"01"}'
+quoting[1]/output='a="01"'
+quoting[2]/output='a="01"'
+quoting[3]/output='{"a":1}'
+quoting[5]/output='a="1"'
+quoting[6]/output='a=1'
+quoting[4]/output='{"a":"1"}'
+quoting[5]/output='a="1"'
+quoting[6]/output='a=1'
+quoting[7]/output='{"a":"inf","b":"iNf","c":"nan","d":"NaN"}'
+quoting[8]/output='{"a":"inf","b":"iNf","c":"nan","d":"NaN"}'
+
+paths[0]/output='a/b="1";a/c="2";x/y="3";x/z="4"'
+paths[1]/output='b="1";c="2"'
+paths[2]/output='b=1;c=2'
+paths[3]/output='y="3";z="4";b="1";c="2"'
+paths[4]/output='y="3"'
+paths[5]/output='y=3'
+paths[6]/output='z="4";y="3"'
+paths[7]/output='y=3;z=4'
+paths[8]/output='z="4";y="3";b="1";c="2"'
+paths[9]/output=''
+paths[9]/status=0
+paths[10]/status=1
+paths[11]/output='b="1";c="2";'
+paths[12]/output='y="3";z="4";b="1";c="2";'
+paths[13]/output='y="3";'
+paths[14]/output='z="4";y="3";'
+paths[15]/output='z="4";y="3";b="1";c="2";'
+
+file[0]/output/line[0]="a=3"
+file[0]/output/line[1]="b=4"
+file[1]/output="a=3"
+file[2]/output=""
diff --git a/name_value/test/name-value-convert/input b/name_value/test/name-value-convert/input
new file mode 100644
index 000000000..bc009d1f6
--- /dev/null
+++ b/name_value/test/name-value-convert/input
@@ -0,0 +1,32 @@
+quoting[0]="echo a=01 | name-value-convert --to json --minify"
+quoting[1]="echo a=01 | name-value-convert --to json --minify | name-value-convert"
+quoting[2]="echo a=01 | name-value-convert --to json --minify | name-value-convert --unquote-numbers"
+quoting[3]="echo a=1 | name-value-convert --to json --minify"
+quoting[5]="echo a=1 | name-value-convert --to json --minify | name-value-convert"
+quoting[6]="echo a=1 | name-value-convert --to json --minify | name-value-convert --unquote-numbers"
+quoting[4]="echo a=1 | name-value-convert --to json --quote-numbers --minify"
+quoting[5]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert"
+quoting[6]="echo a=1 | name-value-convert --to json --quote-numbers --minify | name-value-convert --unquote-numbers"
+quoting[7]="( echo a=inf; echo b=iNf; echo c=nan; echo d=NaN ) | name-value-convert --to json --minify"
+quoting[8]="( echo a=inf; echo b=iNf; echo c=nan; echo d=NaN ) | name-value-convert --to json --minify --unquote-numbers"
+
+paths[0]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --delimiter=';'"
+paths[1]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path a --delimiter=';'"
+paths[2]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path a --delimiter=';' --unquote-numbers"
+paths[3]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x --path a --delimiter=';'"
+paths[4]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/y --delimiter=';'"
+paths[5]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/y --delimiter=';' --unquote-numbers"
+paths[6]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y --delimiter=';'"
+paths[7]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/y --path x/z --delimiter=';' --unquote-numbers"
+paths[8]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y --path a --delimiter=';'"
+paths[9]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path s/t --delimiter=';'"
+paths[10]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path s/t --strict --delimiter=';'"
+paths[11]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path a | tr '\\n' ';'"
+paths[12]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x --path a | tr '\\n' ';'"
+paths[13]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/y | tr '\\n' ';'"
+paths[14]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y | tr '\\n' ';'"
+paths[15]="( echo a/b=1; echo a/c=2; echo x/y=3; echo x/z=4 ) | name-value-convert --path x/z --path x/y --path a | tr '\\n' ';'"
+
+file[0]="name-value-convert --path <( echo x/y/a=3; echo x/y/b=4 )':x/y' --unquote"
+file[1]="name-value-convert --path <( echo x/y/a=3; echo x/y/b=4 )':x/y/a' --unquote"
+file[2]="name-value-convert --path <( echo x/y/a=3; echo x/y/b=4 )':x/y/c' --unquote"
diff --git a/name_value/test/name-value-get/expected b/name_value/test/name-value-get/expected
index bdc7f1975..e0640a9a9 100644
--- a/name_value/test/name-value-get/expected
+++ b/name_value/test/name-value-get/expected
@@ -11,14 +11,14 @@ empty_input[0]/output=''
 non_existant[0]/output=''
 non_existant[1]/output=''
 
-multiple_results[0]/output='c="0";c="1"'
-multiple_results[1]/output='c="0";d="1";e="2"'
+multiple_results[0]/output='c="0";c="1";'
+multiple_results[1]/output='c="0";d="1";e="2";'
 
 indexed_path[0]/output='1'
 indexed_path[1]/output='1'
-indexed_path[2]/output='c="0"'
+indexed_path[2]/output='c="0";'
 indexed_path[3]/output='1'
-indexed_path[4]/output='b[0]/c="0";b[1]/c="1"'
+indexed_path[4]/output='b[0]/c="0";b[1]/c="1";'
 
 regex[0]/output='1'
 regex[1]/output='0;1;'
@@ -26,3 +26,9 @@ regex[2]/output='0;2;'
 
 whitespace[0]/output='2'
 whitespace[1]/output='2'
+
+file[0]/output/line[0]="c=111"
+file[0]/output/line[1]="d=222"
+file[1]/output="111"
+file[2]/output=""
+
diff --git a/name_value/test/name-value-get/input b/name_value/test/name-value-get/input
index e17167dda..9afbc617d 100644
--- a/name_value/test/name-value-get/input
+++ b/name_value/test/name-value-get/input
@@ -1,28 +1,32 @@
-basics[0]=echo a=1 | name-value-get a
-basics[1]=echo '{ "a": 1, "b": 2, "c": 3}' | name-value-get b
+basics[0]="echo a=1 | name-value-get a"
+basics[1]="echo '{ \"a\": 1, \"b\": 2, \"c\": 3}' | name-value-get b"
 
-path[0]=echo '{ "a": 1, "b": 2, "c": { "d": 3 }}' | name-value-get c/d
-path[1]=( echo a/b/c=0; echo a/b/d=-1; ) | name-value-get a/b/d
+path[0]="echo '{ \"a\": 1, \"b\": 2, \"c\": { \"d\": 3 }}' | name-value-get c/d"
+path[1]="( echo a/b/c=0; echo a/b/d=-1; ) | name-value-get a/b/d"
 
-xml[0]=echo '{ "a": 1, "b": 2, "c": { "d": "omega" }}' | name-value-convert --to xml | name-value-get c/d
+xml[0]="echo '{ \"a\": 1, \"b\": 2, \"c\": { \"d\": \"omega\" }}' | name-value-convert --to xml | name-value-get c/d"
 
-non_existant[0]=echo '{ "a": 1, "b": 2, "c": { "d": 3 }}' | name-value-get d
-non_existant[1]=echo '{ "a": 1, "b": 2, "c": { "d": 3 }}' | name-value-get x/b
+non_existant[0]="echo '{ \"a\": 1, \"b\": 2, \"c\": { \"d\": 3 }}' | name-value-get d"
+non_existant[1]="echo '{ \"a\": 1, \"b\": 2, \"c\": { \"d\": 3 }}' | name-value-get x/b"
 
-empty_input[0]=name-value-get x < /dev/null
+empty_input[0]="name-value-get x < /dev/null"
 
-multiple_results[0]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-convert --to json | name-value-get a/b | tr \'\\\n\' \';\'"
-multiple_results[1]="( echo a/b/c=0; echo a/b/d=1; echo a/b/e=2; ) | name-value-get a/b | tr \'\\\n\' \';\'"
+multiple_results[0]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-convert --to json | name-value-get a/b | tr '\\n' ';'"
+multiple_results[1]="( echo a/b/c=0; echo a/b/d=1; echo a/b/e=2; ) | name-value-get a/b | tr '\\n' ';'"
 
 indexed_path[0]="echo a[0]=1 | name-value-get a[0]"
 indexed_path[1]="echo a[0]=1 | name-value-convert --to json | name-value-get a[0]"
-indexed_path[2]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a/b[0] | tr \'\\\n\' \';\'"
+indexed_path[2]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a/b[0] | tr '\\n' ';'"
 indexed_path[3]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a/b[1]/c"
-indexed_path[4]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a | tr \'\\\n\' \';\'"
+indexed_path[4]="( echo a/b[0]/c=0 ; echo a/b[1]/c=1 ) | name-value-get a | tr '\\n' ';'"
 
 regex[0]="( echo a/alpha=0 ; echo a/aleph=1 ) | name-value-get 'a/ale.*' "
-regex[1]="( echo a/alpha=0 ; echo a/aleph=1; echo a/chi=2; ) | name-value-get 'a/al.*' | tr \'\\\n\' \';\'"
-regex[2]="( echo a/phi=0 ; echo a/psi=1; echo a/rho=2; ) | name-value-get --regex 'a/[pr]h[io]' | tr \'\\\n\' \';\'"
+regex[1]="( echo a/alpha=0 ; echo a/aleph=1; echo a/chi=2; ) | name-value-get 'a/al.*' | tr '\\n' ';'"
+regex[2]="( echo a/phi=0 ; echo a/psi=1; echo a/rho=2; ) | name-value-get --regex 'a/[pr]h[io]' | tr '\\n' ';'"
 
 whitespace[0]="( echo a/b/c=0; echo; echo a/b/d=1; echo; echo a/b/e=2; ) | name-value-get a/b/e"
 whitespace[1]="( echo a/b/c=0; echo a/b/d=1; echo a/b/ e =2; ) | name-value-get 'a/b/ e '"
+
+file[0]="name-value-get <( echo a/b/c=111; echo a/b/d=222 )':a/b' --unquote"
+file[1]="name-value-get <( echo a/b/c=111; echo a/b/d=222 )':a/b/c' --unquote"
+file[2]="name-value-get <( echo a/b/c=111; echo a/b/d=222 )':a/b/c/d' --unquote"
diff --git a/name_value/test/name-value-to-csv/basic/expected b/name_value/test/name-value-to-csv/basic/expected
index 335e6a7c6..0f2b23313 100644
--- a/name_value/test/name-value-to-csv/basic/expected
+++ b/name_value/test/name-value-to-csv/basic/expected
@@ -1,3 +1,18 @@
-line[0]="a,1"
-line[1]="b,2"
-status=0
+basics[0]/output/line[0]="a,1"
+basics[0]/output/line[1]="b,2"
+basics[0]/status=0
+unquote[0]/output/line[0]="\"a\",1"
+unquote[0]/output/line[1]="\"b\",2"
+unquote[0]/status=0
+unquote[1]/output/line[0]="a,1"
+unquote[1]/output/line[1]="b,2"
+unquote[1]/status=0
+unquote[2]/output/line[0]="\"a\",1"
+unquote[2]/output/line[1]="\"b\",2"
+unquote[2]/status=0
+unquote[3]/output/line[0]="\"a\",1,3,z"
+unquote[3]/output/line[1]="\"b\",2,3,z"
+unquote[3]/status=0
+unquote[4]/output/line[0]="a,1,3,z"
+unquote[4]/output/line[1]="b,2,3,z"
+unquote[4]/status=0
diff --git a/name_value/test/name-value-to-csv/basic/input b/name_value/test/name-value-to-csv/basic/input
index 7e2e2a24d..6a89da8fb 100644
--- a/name_value/test/name-value-to-csv/basic/input
+++ b/name_value/test/name-value-to-csv/basic/input
@@ -1,5 +1,6 @@
-[0]/name=a
-[0]/value=1
-[1]/name=b
-[1]/value=2
-
+basics[0]="( echo [0]/name=a; echo [0]/value=1; echo [1]/name=b; echo [1]/value=2 ) | name-value-to-csv --fields name,value"
+unquote[0]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2 ) | name-value-to-csv --fields name,value"
+unquote[1]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2 ) | name-value-to-csv --fields name,value --unquote"
+unquote[2]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2; echo c=3 ) | name-value-to-csv --fields name,value"
+unquote[3]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2; echo c=3; echo d="z" ) | name-value-to-csv --fields name,value --unindexed-fields c,d"
+unquote[4]="( echo [0]/name=\\\"a\\\"; echo [0]/value=1; echo [1]/name=\\\"b\\\"; echo [1]/value=2; echo c=3; echo d="z" ) | name-value-to-csv --fields name,value --unindexed-fields c,d --unquote"
diff --git a/name_value/test/name-value-to-csv/basic/options b/name_value/test/name-value-to-csv/basic/options
deleted file mode 100644
index 5241b8824..000000000
--- a/name_value/test/name-value-to-csv/basic/options
+++ /dev/null
@@ -1 +0,0 @@
---fields=name,value
diff --git a/name_value/test/name-value-to-csv/basic/test b/name_value/test/name-value-to-csv/basic/test
new file mode 100755
index 000000000..988ba14ee
--- /dev/null
+++ b/name_value/test/name-value-to-csv/basic/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+comma_test_commands
diff --git a/name_value/test/name-value-to-csv/map/expected b/name_value/test/name-value-to-csv/map/expected
new file mode 100644
index 000000000..494667105
--- /dev/null
+++ b/name_value/test/name-value-to-csv/map/expected
@@ -0,0 +1,5 @@
+map/basics[0]/output/line[0]="x,0,1"
+map/basics[0]/output/line[1]="y,2,"
+map/basics[0]/status=0
+map/basics[1]/output="x,0,1"
+map/basics[1]/status=0
diff --git a/name_value/test/name-value-to-csv/map/input b/name_value/test/name-value-to-csv/map/input
new file mode 100644
index 000000000..247604259
--- /dev/null
+++ b/name_value/test/name-value-to-csv/map/input
@@ -0,0 +1,2 @@
+map/basics[0]="( echo p/x/a/b=0; echo p/x/c=1; echo p/y/a/b=2 ) | name-value-to-csv --map --prefix=p --fields a/b,c"
+map/basics[1]="( echo p/x/a/b=0; echo p/x/c=1 ) | name-value-to-csv --map --prefix=p --fields a/b,c"
diff --git a/name_value/test/name-value-to-csv/map/test b/name_value/test/name-value-to-csv/map/test
new file mode 100755
index 000000000..988ba14ee
--- /dev/null
+++ b/name_value/test/name-value-to-csv/map/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+comma_test_commands
diff --git a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected
new file mode 100644
index 000000000..2d3b5bd94
--- /dev/null
+++ b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/expected
@@ -0,0 +1,11 @@
+unindexed_stream/basics[0]/output/line[0]="1,"
+unindexed_stream/basics[0]/output/line[1]=",3"
+unindexed_stream/basics[0]/output/line[2]="2,"
+unindexed_stream/basics[0]/output/line[3]=",4"
+unindexed_stream/basics[0]/status=0
+
+unindexed_stream/basics[1]/output/line[0]="1,"
+unindexed_stream/basics[1]/output/line[1]="1,3"
+unindexed_stream/basics[1]/output/line[2]="2,3"
+unindexed_stream/basics[1]/output/line[3]="2,4"
+unindexed_stream/basics[1]/status=0
diff --git a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input
new file mode 100644
index 000000000..20cea67ab
--- /dev/null
+++ b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/input
@@ -0,0 +1,2 @@
+unindexed_stream/basics[0]="( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream"
+unindexed_stream/basics[1]="( echo a=1; echo c=3; echo b=3; echo a=2; echo b=4 ) | name-value-to-csv --unindexed-fields a,b --unindexed-stream-update"
\ No newline at end of file
diff --git a/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/test b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/test
new file mode 100755
index 000000000..988ba14ee
--- /dev/null
+++ b/name_value/test/name-value-to-csv/unindexed_fields/unindexed_stream/test
@@ -0,0 +1,3 @@
+#!/bin/bash
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+comma_test_commands
diff --git a/name_value/test/name_value_test.cpp b/name_value/test/name_value_test.cpp
index d166e1390..f4c8b98cb 100644
--- a/name_value/test/name_value_test.cpp
+++ b/name_value/test/name_value_test.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 #include <gtest/gtest.h>
 #include "../../name_value/parser.h"
@@ -110,12 +82,12 @@ template <> struct traits< nested_with_optional >
         v.apply( "c", t.c );
         v.apply( "d", t.d );
     }
-    
+
     template < typename Key, class Visitor > static void visit( Key, nested_with_optional& t, Visitor& v )
     {
         v.apply( "c", t.c );
         v.apply( "d", t.d );
-    }    
+    }
 };
 
 template <> struct traits< struct_with_optional >
@@ -126,13 +98,13 @@ template <> struct traits< struct_with_optional >
         v.apply( "b", t.b );
         v.apply( "nested", t.nested );
     }
-    
+
     template < typename Key, class Visitor > static void visit( Key, struct_with_optional& t, Visitor& v )
     {
         v.apply( "a", t.a );
         v.apply( "b", t.b );
         v.apply( "nested", t.nested );
-    }    
+    }
 };
 
 } } // namespace comma { namespace visiting {
@@ -174,7 +146,7 @@ template <> struct traits< config >
 
 } } // namespace comma { namespace visiting {
 
-    
+
 namespace comma { namespace name_value { namespace test {
 
 TEST( name_value, get )
@@ -299,10 +271,13 @@ TEST( name_value, exists )
 
 TEST( name_value, serialize_json )
 {
+    EXPECT_EQ( "{ \"a\": \"a\", \"b\": \"b\\\\\" }", json_remove_quotes_wrapper( "{ \"a\": \"a\", \"b\": \"b\\\\\" }" ) );
     EXPECT_EQ( "{ \"a\": \"a\", \"b\": \"b\\\"b\" }", json_remove_quotes_wrapper( "{ \"a\": \"a\", \"b\": \"b\\\"b\" }" ) );
+    EXPECT_EQ( "{ \"a\": \"a\", \"b\": \"b\\\\c\" }", json_remove_quotes_wrapper( "{ \"a\": \"a\", \"b\": \"b\\\\c\" }" ) );
+    EXPECT_EQ( "{ \"a\": \"a\", \"b\": \"b\\\\\\\"b\" }", json_remove_quotes_wrapper( "{ \"a\": \"a\", \"b\": \"b\\\\\\\"b\" }" ) );
     EXPECT_EQ( "{ \"a\": 1, \"b\": \"val\" }", json_remove_quotes_wrapper( "{ \"a\": \"1\", \"b\": \"val\" }" ) );
     EXPECT_EQ( "{ \"a\": [ 4.44, true, \"e\" ] }", json_remove_quotes_wrapper( "{ \"a\": [ \"4.44\", \"true\", \"e\" ] }" ) );
-    
+
     EXPECT_EQ( "{ \"a\": [ { \"b\": { \"c\": [ { \"d\": 1, \"e\": false }, { \"d\":2, \"e\": true } ] } } ], \"p\": { \"q\": { \"r\": 3.9e8, \"s\": \"t\"} }, \"x\": { \"y\": [ \"z\", 0.1e-3 ] } }", json_remove_quotes_wrapper( "{ \"a\": [ { \"b\": { \"c\": [ { \"d\": \"1\", \"e\": \"false\" }, { \"d\":2, \"e\": \"true\" } ] } } ], \"p\": { \"q\": { \"r\": \"3.9e8\", \"s\": \"t\"} }, \"x\": { \"y\": [ \"z\", \"0.1e-3\" ] } }" ) );
 
     //minify
@@ -362,6 +337,20 @@ TEST( name_value, as_vector )
     }
 }
 
+TEST( name_value, unique )
+{
+    void( name_value::map( "a=1;b;c=2", ';', '=', true ) );
+    EXPECT_THROW( name_value::map( "a=1;b;a=2;c=2", ';', '=', true ), comma::exception );
+    EXPECT_THROW( name_value::map( "a=1;b;b;c=2", ';', '=', true ), comma::exception );
+}
+
+TEST( name_value, allowed_names )
+{
+    void( name_value::map( "a=1;b;c=2", ';', '=', false, "a,b,c" ) );
+    EXPECT_THROW( name_value::map( "a=1;b;x;a=2;c=2", ';', '=', false, "a,b,c" ), comma::exception );
+    EXPECT_THROW( name_value::map( "a=1;b;x=5;b;c=2", ';', '=', false, "a,b,c" ), comma::exception );
+}
+
 } } }
 
 int main( int argc, char* argv[] )
diff --git a/name_value/test/ptree_test.cpp b/name_value/test/ptree_test.cpp
index b59941bf4..d4335a2e1 100644
--- a/name_value/test/ptree_test.cpp
+++ b/name_value/test/ptree_test.cpp
@@ -1,34 +1,10 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
+#include <array>
+#include <vector>
+#include <boost/array.hpp>
 #include <boost/function.hpp>
 #include <boost/optional.hpp>
 #include <boost/property_tree/json_parser.hpp>
@@ -176,6 +152,12 @@ TEST( ptree, basics )
         EXPECT_TRUE( !t.world );
         EXPECT_TRUE( !t1.world );
         EXPECT_EQ( t.nested->moon, t1.nested->moon );
+
+        comma::name_value::impl::write_json( std::cerr, tree1 );
+        auto a = property_tree::as< nested_type >( tree1, "test_type/nested" );
+        EXPECT_TRUE( a );
+        EXPECT_EQ( a->moon, t.nested->moon );
+        // todo: add many more tests for property_tree::as
     }
     {
         boost::property_tree::ptree ptree;
@@ -272,7 +254,6 @@ TEST( ptree, from_path_value )
         EXPECT_EQ( 2, m[6].nested->moon );
         EXPECT_EQ( "world",  *m[6].nested->value );
     }
-
 }
 
 TEST( ptree, permissive_visiting )
@@ -384,8 +365,11 @@ TEST( ptree, array )
         std::istringstream iss( s );
         property_tree::from_path_value( iss, ptree );
         from_ptree from_ptree( ptree );
-        boost::array< std::string, 3 > array;
-        try { visiting::apply( from_ptree, array ); EXPECT_TRUE( false ); } catch( ... ) {}
+        boost::array< std::string, 3 > array{ "bye", "moon", "stars" };
+        visiting::apply( from_ptree, array );
+        EXPECT_EQ( array[0], "hello" );
+        EXPECT_EQ( array[1], "world" );
+        EXPECT_EQ( array[2], "stars" );
     }
     {
         boost::property_tree::ptree ptree;
diff --git a/name_value/test/regex/expected b/name_value/test/regex/expected
index bd52695f3..624277f58 100644
--- a/name_value/test/regex/expected
+++ b/name_value/test/regex/expected
@@ -10,13 +10,13 @@ test[4]/output='b'
 test[4]/status=0
 #test[5]/output='a;b;'
 #test[5]/status=0
-test[6]/output='y[0]="a";y[1]="b"'
+test[6]/output='y[0]="a";y[1]="b";'
 test[6]/status=0
-test[7]/output='y[0]="4";y[0]="5"'
+test[7]/output='y[0]="4";y[0]="5";'
 test[7]/status=0
 test[8]/output='4'
 test[8]/status=0
 test[9]/output='5'
 test[9]/status=0
 test[10]/output='6;7;'
-test[10]/status=0
\ No newline at end of file
+test[10]/status=0
diff --git a/name_value/test/serialise_guess_test.cpp b/name_value/test/serialise_guess_test.cpp
index c8a40bf60..f6f8f67a5 100644
--- a/name_value/test/serialise_guess_test.cpp
+++ b/name_value/test/serialise_guess_test.cpp
@@ -233,7 +233,7 @@ TEST( serialise, guess_path_value_root ) { std::istringstream iss( path_value_ro
 
 TEST( serialise, guess_corrupted_json )
 {
-    std::istringstream iss( "{ \"name\": \"dummy\", }" );
+    std::istringstream iss( "{ \"name\": \"dummy\"," );
     config c; 
     ASSERT_THROW( comma::read< config >( c, iss ), comma::exception );
 }
diff --git a/name_value/test/serialise_test.cpp b/name_value/test/serialise_test.cpp
index 706cc9910..7ae8f8e79 100644
--- a/name_value/test/serialise_test.cpp
+++ b/name_value/test/serialise_test.cpp
@@ -29,6 +29,7 @@
 
 
 #include <gtest/gtest.h>
+#include "../../base/variant.h"
 #include "../../name_value/serialize.h"
 #include "../../visiting/traits.h"
 #include "../../xpath/xpath.h"
@@ -356,6 +357,146 @@ TEST( serialise, path_value )
         comma::read_path_value< config >( c, ss, comma::xpath( "root/item" ), true );
         test_config( c );
     }
+    {
+        std::stringstream ss;
+        comma::write_path_value< config >( d, ss, "root/item", true, "hello/world" );
+        config c;
+        comma::read_path_value< config >( c, ss, "hello/world/root/item", true );
+        test_config( c );
+    }
 }
 
 } } } // namespace comma { namespace test { namespace serialise {
+
+struct forest
+{
+    struct sounds
+    {
+        struct chirp { int a{1}; int b{2}; };
+        struct whistle { int a{3}; int b{4}; };
+        struct warble { int x{5}; int y{6}; };
+        struct silence {};
+    };
+
+    struct naming { static std::array< std::string, 3 > names() { return { "chirp", "whistle", "warble" }; } };
+
+    typedef comma::named_variant< naming, sounds::chirp, sounds::whistle, sounds::warble > variant_t;
+    comma::make_named_variant< naming >::variant< sounds::chirp, sounds::whistle, sounds::warble >::type madeup; // todo
+    std::array< variant_t, 3 > choir; // todo
+    comma::named_variant< naming, sounds::chirp, sounds::whistle, sounds::warble, sounds::silence > maybesound; // todo
+    comma::named_variant< naming, sounds::chirp, sounds::whistle, sounds::warble > sound;
+    
+};
+
+namespace comma { namespace visiting {
+
+template <> struct traits< forest::sounds::chirp >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest::sounds::chirp& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+    template < typename Key, class Visitor > static void visit( Key, const forest::sounds::chirp& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+};
+
+template <> struct traits< forest::sounds::whistle >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest::sounds::whistle& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+    template < typename Key, class Visitor > static void visit( Key, const forest::sounds::whistle& t, Visitor& v ) { v.apply( "a", t.a ); v.apply( "b", t.b ); }
+};
+
+template <> struct traits< forest::sounds::warble >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest::sounds::warble& t, Visitor& v ) { v.apply( "x", t.x ); v.apply( "y", t.y ); }
+    template < typename Key, class Visitor > static void visit( Key, const forest::sounds::warble& t, Visitor& v ) { v.apply( "x", t.x ); v.apply( "y", t.y ); }
+};
+
+template <> struct traits< forest::sounds::silence >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest::sounds::silence& t, Visitor& v ) {}
+    template < typename Key, class Visitor > static void visit( Key, const forest::sounds::silence& t, Visitor& v ) {}
+};
+
+template <> struct traits< forest >
+{
+    template < typename Key, class Visitor > static void visit( Key, forest& t, Visitor& v )
+    {
+        v.apply( "madeup", t.madeup ); // todo
+        v.apply( "choir", t.choir ); // todo
+        v.apply( "maybesound", t.maybesound ); // todo
+        v.apply( "sound", t.sound );
+    }
+    template < typename Key, class Visitor > static void visit( Key, const forest& t, Visitor& v )
+    {
+        v.apply( "madeup", t.madeup ); // todo
+        v.apply( "choir", t.choir ); // todo
+        v.apply( "maybesound", t.maybesound ); // todo
+        v.apply( "sound", t.sound );
+    }
+};
+
+} } // namespace comma { namespace visiting {
+
+TEST( serialise, variant )
+{
+    {
+        forest f;
+        {
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{}" );
+        }
+        {
+            f.sound.set( forest::sounds::chirp{11, 22} );
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{\"sound\":{\"chirp\":{\"a\":11,\"b\":22}}}" );
+        }
+        {
+            f.sound.set( forest::sounds::whistle{33, 44} );
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{\"sound\":{\"whistle\":{\"a\":33,\"b\":44}}}" );
+        }
+        {
+            f.sound.set( forest::sounds::warble{55, 66} );
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{\"sound\":{\"warble\":{\"x\":55,\"y\":66}}}" );
+        }
+        {
+            f.sound.reset();
+            std::ostringstream oss;
+            comma::write_json( f, oss, false );
+            EXPECT_EQ( oss.str(), "{}" );
+        }
+    }
+    // { // todo?
+    //     forest f;
+    //     std::ostringstream oss;
+    //     comma::write_json( f, oss, false );
+    //     EXPECT_EQ( oss.str(), "{}" );
+    //     f.maybesound.set( forest::sounds::silence() );
+    //     comma::write_json( f, oss, false );
+    //     //EXPECT_EQ( oss.str(), "{\"sound\":{\"silence\":\"\"}}" );
+    // }
+}
+
+TEST( deserialise, variant )
+{
+    {
+        forest g;
+        {
+            std::istringstream iss( "{\"sound\":{\"warble\":{\"x\":55,\"y\":66}}}" );
+            comma::read_json( g, iss );
+            EXPECT_TRUE( g.sound.is< forest::sounds::warble >() );
+            EXPECT_EQ( g.sound.get< forest::sounds::warble >().x, 55 );
+            EXPECT_EQ( g.sound.get< forest::sounds::warble >().y, 66 );
+            
+        }
+        {
+            std::istringstream iss( "{\"sound\":{\"chirp\":{\"a\":77,\"b\":88}}}" );
+            comma::read_json( g, iss );
+            EXPECT_TRUE( g.sound.is< forest::sounds::chirp >() );
+            EXPECT_EQ( g.sound.get< forest::sounds::chirp >().a, 77 );
+            EXPECT_EQ( g.sound.get< forest::sounds::chirp >().b, 88 );
+        }
+    }
+}
diff --git a/name_value/test/test b/name_value/test/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/name_value/test/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+source $( type -p comma-application-util ) || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source $( type -p comma-test-util ) || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+
+comma_test_commands
diff --git a/packed/CMakeLists.txt b/packed/CMakeLists.txt
index 4475ab364..648c65102 100644
--- a/packed/CMakeLists.txt
+++ b/packed/CMakeLists.txt
@@ -3,11 +3,13 @@ SET( TARGET_NAME comma_${PROJECT} )
 
 FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp )
 FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h )
-SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
-ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} )
+FILE( GLOB detail_includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/detail/*.h )
+SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} ${detail_includes} )
+ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} ${detail_includes} )
 # target_link_libraries( ${TARGET_NAME} comma_string )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+INSTALL( FILES ${detail_includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/detail )
 
 IF( comma_BUILD_TESTS )
     ADD_SUBDIRECTORY( test )
diff --git a/packed/big_endian.h b/packed/big_endian.h
index 017a6f215..b837587d1 100644
--- a/packed/big_endian.h
+++ b/packed/big_endian.h
@@ -1,167 +1,55 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_BIG_ENDIAN_H_
-#define COMMA_PACKED_BIG_ENDIAN_H_
+#pragma once
 
-#include <algorithm>
-#include <boost/static_assert.hpp>
-#include "../base/exception.h"
-#include "../base/types.h"
-#include "../packed/field.h"
+#include "detail/endian.h"
 
 namespace comma { namespace packed {
 
-namespace detail {
-
-template < typename T > struct net_traits {};
-
-template <> struct net_traits< comma::uint16 >
-{
-    static comma::uint16 hton( comma::uint16 v ) { return htons( v ); }
-    static comma::uint16 ntoh( comma::uint16 v ) { return ntohs( v ); }
-};
-
-template <> struct net_traits< comma::int16 >
-{
-    static comma::int16 hton( comma::int16 v ) { return htons( v ); }
-    static comma::int16 ntoh( comma::int16 v ) { return ntohs( v ); }
-};
-
-template <> struct net_traits< comma::uint32 >
-{
-    static comma::uint32 hton( comma::uint32 v ) { return htonl( v ); }
-    static comma::uint32 ntoh( comma::uint32 v ) { return ntohl( v ); }
-};
-
-template <> struct net_traits< comma::int32 >
-{
-    static comma::int32 hton( comma::int32 v ) { return htonl( v ); }
-    static comma::int32 ntoh( comma::int32 v ) { return ntohl( v ); }
-};
-
-BOOST_STATIC_ASSERT( sizeof( float ) == 4 );
-BOOST_STATIC_ASSERT( sizeof( double ) == 8 );
-
-template < typename type, typename uint_of_same_size >
-inline type pack_float( type value )
-{
-    char storage[sizeof(type)];
-    uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
-    for( unsigned int i = 0; i < sizeof( type ); ++i, *p >>= 8 ) { storage[sizeof(type)-i-1] = *p & 0xff; } 
-    const type* result = reinterpret_cast< const type* >( &storage );
-    return *result;
-}
-
-template< typename type, typename uint_of_same_size >
-inline type unpack_float( type value ) 
-{
-    const char* storage = reinterpret_cast< const char* >( &value ); 
-    uint_of_same_size v = 0;
-    unsigned int shift = 0;
-    for( unsigned int i = 0; i < sizeof( type ); ++i, shift += 8 ) { v += static_cast< uint_of_same_size >( ( unsigned char )( storage[sizeof(type)-i-1] ) ) << shift; }
-    const type* result = reinterpret_cast< const type* >( &v );
-    return *result;
-}
-
-template <> struct net_traits< float >
-{
-    typedef comma::uint32 uint_of_same_size;
-    static float hton( float value ) { return pack_float< float, uint_of_same_size >( value ); }
-    static float ntoh( float value ) { return unpack_float< float, uint_of_same_size >( value ); }
-};
-
-template <> struct net_traits< double >
-{
-    typedef comma::uint64 uint_of_same_size;
-    static double hton( double value ) { return pack_float< double, uint_of_same_size >( value ); }
-    static double ntoh( double value ) { return unpack_float< double, uint_of_same_size >( value ); }
-};
-
-template < typename T >
-class big_endian : public packed::field< big_endian< T >, T, sizeof( T ) >
-{
-    public:
-        enum { size = sizeof( T ) };
-
-        typedef T type;
-
-        typedef packed::field< big_endian< T >, T, size > base_type;
-
-        static type default_value() { return 0; }
-
-        static void pack( char* storage, type value )
-        {
-            type v( net_traits< type >::hton( value ) );
-            ::memcpy( storage, ( void* )&v, size );
-        }
-
-        static type unpack( const char* storage )
-        {
-            type value;
-            ::memcpy( ( void* )&value, storage, size );
-            return net_traits< type >::ntoh( value );
-        }
-
-        const big_endian& operator=( const big_endian& rhs ) { return base_type::operator=( rhs ); }
-
-        const big_endian& operator=( type rhs ) { return base_type::operator=( rhs ); }
-};
-
-} // namespace detail {
-
-/// big endian 16-bit integers
-typedef detail::big_endian< comma::uint16 > big_endian_uint16;
-typedef detail::big_endian< comma::int16 > big_endian_int16;
-/// aliases for big endian 16-bit integers
+typedef detail::endian< detail::big, 2, false > big_endian_uint16;
+typedef detail::endian< detail::big, 2, true > big_endian_int16;
 typedef big_endian_uint16 net_uint16;
 typedef big_endian_int16 net_int16;
-/// big endian 32-bit integers
-typedef detail::big_endian< comma::uint32 > big_endian_uint32;
-typedef detail::big_endian< comma::int32 > big_endian_int32;
-/// aliases for big endian 32-bit integers
+typedef detail::endian< detail::big, 3, false > big_endian_uint24;
+typedef detail::endian< detail::big, 3, true > big_endian_int24;
+typedef big_endian_uint24 net_uint24;
+typedef big_endian_int24 net_int24;
+typedef detail::endian< detail::big, 4, false > big_endian_uint32;
+typedef detail::endian< detail::big, 4, true > big_endian_int32;
 typedef big_endian_uint32 net_uint32;
 typedef big_endian_int32 net_int32;
-/// big endian float and double
-typedef detail::big_endian< float > big_endian_float32;
-typedef detail::big_endian< double > big_endian_float64;
+typedef detail::endian< detail::big, 6, false > big_endian_uint48;
+typedef detail::endian< detail::big, 6, true > big_endian_int48;
+typedef big_endian_uint48 net_uint48;
+typedef big_endian_int48 net_int48;
+typedef detail::endian< detail::big, 4, true, true > big_endian_float32;
+typedef detail::endian< detail::big, 8, true, true > big_endian_float64;
+typedef big_endian_float32 big_endian_float;
 typedef big_endian_float64 big_endian_double;
-/// aliases for big endian float and double
 typedef big_endian_float32 net_float32;
 typedef big_endian_float64 net_float64;
+typedef net_float32 net_float;
 typedef net_float64 net_double;
 
+// all typedefs above are deprecated; use the types in namespace big_endian below
+namespace big_endian { // i love namespacing
 
-} } // namespace comma { namespace packed {
+typedef detail::endian< detail::big, 2, false > uint16;
+typedef detail::endian< detail::big, 2, true > int16;
+typedef detail::endian< detail::big, 3, false > uint24;
+typedef detail::endian< detail::big, 3, true > int24;
+typedef detail::endian< detail::big, 4, false > uint32;
+typedef detail::endian< detail::big, 4, true > int32;
+typedef detail::endian< detail::big, 6, false > uint48; // go figure... there are actual people in the world using it in their protocol packets...
+typedef detail::endian< detail::big, 6, true > int48;
+typedef detail::endian< detail::big, 8, false > uint64;
+typedef detail::endian< detail::big, 8, true > int64;
+typedef detail::endian< detail::big, 4, true, true > float32;
+typedef detail::endian< detail::big, 8, true, true > float64;
+
+} // namespace big_endian {
 
-#endif // #ifndef COMMA_PACKED_BIG_ENDIAN_H_
+} } // namespace comma { namespace packed {
diff --git a/packed/bits.h b/packed/bits.h
index cab9bfaad..5de90bb1b 100644
--- a/packed/bits.h
+++ b/packed/bits.h
@@ -1,45 +1,16 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_BITS_HEADER_H_
-#define COMMA_PACKED_BITS_HEADER_H_
+#pragma once
 
+#include <cstring>
 #include <limits>
-#include <string.h>
-#include <boost/static_assert.hpp>
+#include <type_traits>
+#include <boost/type_traits.hpp>
 #include "../packed/field.h"
 #include "../base/types.h"
-#include <boost/type_traits.hpp>
 
 namespace comma { namespace packed {
 
@@ -60,17 +31,17 @@ struct bits : public packed::field< bits< B, Default >, B, sizeof( typename comm
     bits( integer_type v ) { operator=( v ); }
     bits( type t ) : base_type( t ) {}
 
-    static type default_value() { static const integer_type d = Default; type t; ::memcpy( &t, &d, size ); return t; }
+    static type default_value() { static const integer_type d = Default; type t; std::memcpy( ( char* )( &t ), ( const char* )( &d ), size ); return t; }
 
-    static void pack( char* storage, type value ) { ::memcpy( storage, &value, size ); }
+    static void pack( char* storage, type value ) { std::memcpy( storage, ( const char* )( &value ), size ); }
 
-    static type unpack( const char* storage ) { type t; ::memcpy( &t, storage, size ); return t; }
+    static type unpack( const char* storage ) { type t; std::memcpy( ( char* )( &t ), storage, size ); return t; }
 
     const bits& operator=( const bits& rhs ) { return base_type::operator=( rhs ); }
 
     const bits& operator=( type rhs ) { return base_type::operator=( rhs ); }
 
-    const bits& operator=( integer_type rhs ) { type t; ::memcpy( &t, &rhs, size ); return base_type::operator=( t ); }
+    const bits& operator=( integer_type rhs ) { type t; std::memcpy( ( char* )( &t ), &rhs, size ); return base_type::operator=( t ); }
 
     type& fields() { return *( reinterpret_cast< type* >( this ) ); }
 
@@ -81,7 +52,7 @@ struct bits : public packed::field< bits< B, Default >, B, sizeof( typename comm
 
 template< typename T > inline void reverse_bits( T& v )
 {
-    BOOST_STATIC_ASSERT( boost::is_unsigned< T >::value );
+    static_assert( boost::is_unsigned< T >::value, "expected unsigned value" );
     unsigned int s = std::numeric_limits< T >::digits - 1;
     T r = v;
     for( v >>= 1; v; v >>= 1 )
@@ -112,20 +83,17 @@ struct reversed_bits : public packed::field< reversed_bits< B, Default >, B, siz
     reversed_bits( integer_type v ) { operator=( v ); }
     reversed_bits( type t ) : base_type( t ) {}
 
-    static type default_value() { static const integer_type d = Default; type t; ::memcpy( &t, &d, size ); return t; }
+    static type default_value() { static const integer_type d = Default; type t; std::memcpy( ( char* )( &t ), ( const char* )( &d ), size ); return t; }
 
-    static void pack( char* storage, type t ) { integer_type v; ::memcpy( &v, &t, size ); reverse_bits( v ); ::memcpy( storage, &v, size ); }
+    static void pack( char* storage, type t ) { integer_type v; std::memcpy( &v, &t, size ); reverse_bits( v ); std::memcpy( storage, ( const char* )( &v ), size ); }
 
-    static type unpack( const char* storage ) { integer_type v; ::memcpy( &v, storage, size ); reverse_bits( v ); type t; ::memcpy( &t, &v, size ); return t; }
+    static type unpack( const char* storage ) { integer_type v; std::memcpy( &v, storage, size ); reverse_bits( v ); type t; std::memcpy( ( char* )( &t ), ( const char* )( &v ), size ); return t; }
 
     const reversed_bits& operator=( const reversed_bits& rhs ) { return base_type::operator=( rhs ); }
 
     const reversed_bits& operator=( type rhs ) { return base_type::operator=( rhs ); }
 
-    const reversed_bits& operator=( integer_type rhs ) { type t; ::memcpy( &t, &rhs, size ); return base_type::operator=( t ); }
-
+    const reversed_bits& operator=( integer_type rhs ) { type t; std::memcpy( ( char* )( &t ), ( const char* )( &rhs ), size ); return base_type::operator=( t ); }
 };
 
 } } // namespace comma { namespace packed {
-
-#endif // COMMA_PACKED_BITS_HEADER_H_
diff --git a/packed/byte.h b/packed/byte.h
index 24ef1864e..0ef66af3a 100644
--- a/packed/byte.h
+++ b/packed/byte.h
@@ -1,37 +1,8 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_BYTE_HEADER_H_
-#define COMMA_PACKED_BYTE_HEADER_H_
+#pragma once
 
 #if defined(__linux__) || defined(__APPLE__) || defined(__QNXNTO__)
 #include <arpa/inet.h>
@@ -43,7 +14,7 @@
 #endif
 #endif
 
-#include <boost/static_assert.hpp>
+#include <type_traits>
 #include "field.h"
 
 namespace comma { namespace packed {
@@ -53,7 +24,7 @@ struct byte : public packed::field< byte, unsigned char, sizeof( unsigned char )
 {
     enum { size = sizeof( unsigned char ) };
 
-    BOOST_STATIC_ASSERT( size == 1 );
+    static_assert( size == 1, "expected size 1" );
 
     typedef unsigned char type;
 
@@ -76,7 +47,7 @@ struct const_byte : public packed::field< const_byte< C >, unsigned char, sizeof
 {
     enum { size = sizeof( unsigned char ) };
 
-    BOOST_STATIC_ASSERT( size == 1 );
+    static_assert( size == 1, "expected size 1" );
 
     typedef unsigned char type;
 
@@ -98,5 +69,3 @@ struct const_byte : public packed::field< const_byte< C >, unsigned char, sizeof
 typedef byte uint8;
 
 } } // namespace comma { namespace packed {
-
-#endif // #ifndef COMMA_PACKED_BYTE_HEADER_H_
diff --git a/packed/detail/endian.h b/packed/detail/endian.h
new file mode 100644
index 000000000..9b4d81cea
--- /dev/null
+++ b/packed/detail/endian.h
@@ -0,0 +1,112 @@
+
+// Copyright (c) 2011 The University of Sydney
+// Copyright (c) 2018 Vsevolod Vlaskine
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <endian.h>
+#include <algorithm>
+#include <type_traits>
+#include "../../base/exception.h"
+#include "../../base/types.h"
+#include "../field.h"
+
+namespace comma { namespace packed { namespace detail {
+
+static_assert( sizeof( float ) == 4, "expected float of 4 bytes" );
+static_assert( sizeof( double ) == 8, "expected double of 8 bytes" );
+
+enum endiannes { little = 0, big = 1 };
+
+template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating = false > struct endian_traits { typedef typename comma::integer< Size, Signed >::type type; typedef typename comma::integer< Size, false >::type uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 6, true > { typedef comma::int64 type; typedef comma::uint64 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 6, false > { typedef comma::uint64 type; typedef comma::uint64 uint_of_same_size; };
+template < endiannes Endianness > struct endian_traits< Endianness, 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
+
+template < typename T > struct net_traits;
+
+template <> struct net_traits< comma::uint16 > // 16-bit byte-order conversions; each member forwards to the matching 16-bit call
+{
+    static comma::uint16 htobe( comma::uint16 v ) { return htobe16( v ); } // host order -> big endian
+    static comma::uint16 betoh( comma::uint16 v ) { return be16toh( v ); } // big endian -> host order
+    static comma::uint16 htole( comma::uint16 v ) { return htole16( v ); } // host order -> little endian
+    static comma::uint16 letoh( comma::uint16 v ) { return le16toh( v ); } // little endian -> host order
+};
+
+template <> struct net_traits< comma::uint32 > // 32-bit byte-order conversions; each member forwards to the matching 32-bit call
+{
+    static comma::uint32 htobe( comma::uint32 v ) { return htobe32( v ); } // host order -> big endian
+    static comma::uint32 betoh( comma::uint32 v ) { return be32toh( v ); } // big endian -> host order
+    static comma::uint32 htole( comma::uint32 v ) { return htole32( v ); } // host order -> little endian
+    static comma::uint32 letoh( comma::uint32 v ) { return le32toh( v ); } // little endian -> host order
+};
+
+template <> struct net_traits< comma::uint64 > // 64-bit byte-order conversions; each member forwards to the matching 64-bit call
+{
+    static comma::uint64 htobe( comma::uint64 v ) { return htobe64( v ); } // host order -> big endian
+    static comma::uint64 betoh( comma::uint64 v ) { return be64toh( v ); } // big endian -> host order
+    static comma::uint64 htole( comma::uint64 v ) { return htole64( v ); } // host order -> little endian
+    static comma::uint64 letoh( comma::uint64 v ) { return le64toh( v ); } // little endian -> host order
+};
+
+template < endiannes Endianness > struct convert;
+
+template <> struct convert< packed::detail::little > // little-endian flavour: dispatches to the htole/letoh members of net_traits< T >
+{
+    template < typename T > static T from_host( T t ) { return net_traits< T >::htole( t ); } // T must have a net_traits specialisation
+    template < typename T > static T to_host( T t ) { return net_traits< T >::letoh( t ); }
+};
+
+template <> struct convert< packed::detail::big > // big-endian flavour: dispatches to the htobe/betoh members of net_traits< T >
+{
+    template < typename T > static T from_host( T t ) { return net_traits< T >::htobe( t ); } // T must have a net_traits specialisation
+    template < typename T > static T to_host( T t ) { return net_traits< T >::betoh( t ); }
+};
+
+template < unsigned int Size > struct ff { enum { value = ( static_cast< unsigned long long >( ff< Size - 1 >::value ) << 8 ) | 0xff }; }; // all-ones mask of Size bytes: shift the (Size-1)-byte mask up one byte, then fill the low byte; parentheses are required since + and | bind differently from << and the shift must happen first; widened so masks up to 8 bytes fit
+template <> struct ff< 1 > { enum { value = 0xff }; }; // recursion base: a single byte of ones
+
+template < endiannes Endianness, unsigned int Size, bool Signed, bool Floating = false >
+struct endian : public packed::field< endian< Endianness, Size, Signed, Floating >, typename endian_traits< Endianness, Size, Signed, Floating >::type, Size >
+{
+    static const unsigned int size = Size;
+
+    typedef typename endian_traits< Endianness, Size, Signed, Floating >::type type;
+
+    static_assert( size <= sizeof( type ), "expected size less than size of type" );
+
+    static_assert( Signed || !Floating, "expected signed or non-floating point type" ); // unsigned floats don't make sense
+
+    typedef packed::field< endian< Endianness, Size, Signed, Floating >, typename endian_traits< Endianness, Size, Signed, Floating >::type, Size > base_type;
+
+    static type default_value() { return 0; }
+
+    typedef typename endian_traits< Endianness, size, Signed, Floating >::uint_of_same_size uint_of_same_size;
+
+    static void pack( char* storage, type value ) // writes the Size bytes of value to storage in Endianness byte order
+    {
+        uint_of_same_size bits; ::memcpy( &bits, &value, sizeof( bits ) ); // bit-copy instead of a pointer cast: reading a float/double through an integer pointer breaks strict aliasing
+        bits = convert< Endianness >::from_host( bits );
+        ::memcpy( storage, reinterpret_cast< const char * >( &bits ) + ( Endianness == little ? 0 : sizeof( uint_of_same_size ) - size ), size ); // the Size low-order bytes come first in little-endian layout and last in big-endian layout
+    }
+
+    static type unpack( const char* storage ) // for floats it is a real hack, since there is no standard
+    {
+        uint_of_same_size bits = ( !Floating && Signed && ( storage[ Endianness == little ? size - 1 : 0 ] & 0x80 ) ) ? -1 : 0; // pre-fill with ones when the most significant stored byte has its top bit set, so signed values narrower than the integer sign-extend
+        ::memcpy( reinterpret_cast< char * >( &bits ) + ( Endianness == little ? 0 : sizeof( uint_of_same_size ) - size ), storage, size );
+        bits = convert< Endianness >::to_host( bits );
+        type value; ::memcpy( &value, &bits, sizeof( value ) ); // bit-copy instead of a pointer cast: reading an integer through a float/double pointer breaks strict aliasing
+        return value;
+    }
+
+    const endian& operator=( const endian& rhs ) { return base_type::operator=( rhs ); }
+
+    const endian& operator=( const type& rhs ) { return base_type::operator=( rhs ); }
+};
+
+} } } // namespace comma { namespace packed { namespace detail {
diff --git a/packed/field.h b/packed/field.h
index c532d7786..ac888832d 100644
--- a/packed/field.h
+++ b/packed/field.h
@@ -1,41 +1,12 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_FIELD_H_
-#define COMMA_PACKED_FIELD_H_
+#pragma once
 
 #include <string.h>
-#include <boost/static_assert.hpp>
+#include <type_traits> // #include <boost/static_assert.hpp>
 
 namespace comma { namespace packed {
 
@@ -44,27 +15,27 @@ template < typename Derived, typename T, size_t S >
 class field
 {
     public:
-        enum { size = S };
+        static constexpr unsigned int size = S;
 
-        BOOST_STATIC_ASSERT( size > 0 );
+        static_assert( size > 0, "expected positive size" );
 
         typedef T type;
 
         field()
         {
-            BOOST_STATIC_ASSERT( sizeof( field ) == size );
+            static_assert( sizeof( field ) == size, "field size does not match stated size" );
             Derived::pack( storage_, Derived::default_value() );
         }
 
         field( const type& t )
         {
-            BOOST_STATIC_ASSERT( sizeof( field ) == size );
+            static_assert( sizeof( field ) == size, "field size does not match stated size" );
             Derived::pack( storage_, t );
         }
 
         field( const field& rhs )
         {
-            BOOST_STATIC_ASSERT( sizeof( field ) == size );
+            static_assert( sizeof( field ) == size, "field size does not match stated size" );
             operator=( rhs );
         }
 
@@ -97,5 +68,3 @@ class field
 };
 
 } } // namespace comma { namespace packed {
-
-#endif // COMMA_PACKED_FIELD_H_
diff --git a/packed/little_endian.h b/packed/little_endian.h
index 5d419f095..a85fbcc2d 100644
--- a/packed/little_endian.h
+++ b/packed/little_endian.h
@@ -1,128 +1,55 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Matthew Herrmann 2007
-/// @author Vsevolod Vlaskine 2010-2011
+/// @author vsevolod vlaskine
 
-#ifndef COMMA_PACKED_LITTLEENDIAN_H_
-#define COMMA_PACKED_LITTLEENDIAN_H_
+#pragma once
 
-#include <boost/static_assert.hpp>
-#include "../base/exception.h"
-#include "../base/types.h"
-#include "field.h"
+#include "detail/endian.h"
 
 namespace comma { namespace packed {
 
-namespace detail {
-
-BOOST_STATIC_ASSERT( sizeof( float ) == 4 );
-BOOST_STATIC_ASSERT( sizeof( double ) == 8 );
-    
-template < unsigned int Size, bool Signed, bool Floating = false > struct little_endian_traits { typedef typename comma::integer< Size, Signed >::type type; typedef typename comma::integer< Size, false >::type uint_of_same_size; };
-template <> struct little_endian_traits< 3, true > { typedef comma::int32 type; typedef comma::uint32 uint_of_same_size; };
-template <> struct little_endian_traits< 3, false > { typedef comma::uint32 type; typedef comma::uint32 uint_of_same_size; };
-template <> struct little_endian_traits< 4, true, true > { typedef float type; typedef comma::uint32 uint_of_same_size; };
-template <> struct little_endian_traits< 8, true, true > { typedef double type; typedef comma::uint64 uint_of_same_size; };
-
-template < unsigned int Size, bool Signed, bool Floating = false >
-struct little_endian : public packed::field< little_endian< Size, Signed, Floating >, typename little_endian_traits< Size, Signed, Floating >::type, Size >
-{
-    static const unsigned int size = Size;
-
-    typedef typename little_endian_traits< Size, Signed, Floating >::type type;
-    
-    BOOST_STATIC_ASSERT( size <= sizeof( type ) );
-
-    typedef packed::field< little_endian< Size, Signed, Floating >, typename little_endian_traits< Size, Signed, Floating >::type, Size > base_type;
-
-    static type default_value() { return 0; }
-
-    typedef typename little_endian_traits< size, Signed, Floating >::uint_of_same_size uint_of_same_size;
-    
-    static void pack( char* storage, type value )
-    {
-        uint_of_same_size* p = reinterpret_cast< uint_of_same_size* >( &value );
-        for( unsigned int i = 0; i < size; ++i, *p >>= 8 ) { storage[i] = *p & 0xff; }
-    }
-
-    static type unpack( const char* storage ) // for floats it is a real hack, since there is no standard
-    {
-        uint_of_same_size v = 0;
-        unsigned int shift = 0;
-        unsigned int i = 0;
-        for( ; i < size; ++i, shift += 8 )
-        {
-            v += static_cast< uint_of_same_size >( ( unsigned char )( storage[i] ) ) << shift;
-        }
-        if( !Floating && Signed && ( storage[ size - 1 ] & 0x80 ) )
-        {            
-            for( ; i < sizeof( type ); ++i, shift += 8 ) { v +=  static_cast< uint_of_same_size >( 0xff ) << shift; } 
-        }
-        const type* result = reinterpret_cast< const type* >( &v );
-        return *result;
-    }
-
-    const little_endian& operator=( const little_endian& rhs ) { return base_type::operator=( rhs ); }
-
-    const little_endian& operator=( const type& rhs ) { return base_type::operator=( rhs ); }
-};
-
-} // namespace detail {
-
-/// packed little endian 16-bit integers
-typedef detail::little_endian< 2, true > little_endian16;
-typedef detail::little_endian< 2, false > little_endian_uint16;
+typedef detail::endian< detail::little, 2, true > little_endian16;
+typedef detail::endian< detail::little, 2, false > little_endian_uint16;
 typedef little_endian16 int16;
 typedef little_endian_uint16 uint16;
-/// packed little endian 24-bit integers (strangely, there are protocols using it)
-typedef detail::little_endian< 3, true > little_endian24;
-typedef detail::little_endian< 3, false > little_endian_uint24;
+typedef detail::endian< detail::little, 3, true > little_endian24;
+typedef detail::endian< detail::little, 3, false > little_endian_uint24;
 typedef little_endian24 int24;
 typedef little_endian_uint24 uint24;
-/// packed little endian 32-bit integers
-typedef detail::little_endian< 4, true > little_endian32;
-typedef detail::little_endian< 4, false > little_endian_uint32;
+typedef detail::endian< detail::little, 4, true > little_endian32;
+typedef detail::endian< detail::little, 4, false > little_endian_uint32;
 typedef little_endian32 int32;
 typedef little_endian_uint32 uint32;
-/// packed little endian 32-bit integers
-typedef detail::little_endian< 8, true > little_endian64;
-typedef detail::little_endian< 8, false > little_endian_uint64;
+typedef detail::endian< detail::little, 6, true > little_endian48;
+typedef detail::endian< detail::little, 6, false > little_endian_uint48;
+typedef little_endian48 int48;
+typedef little_endian_uint48 uint48;
+typedef detail::endian< detail::little, 8, true > little_endian64;
+typedef detail::endian< detail::little, 8, false > little_endian_uint64;
 typedef little_endian64 int64;
 typedef little_endian_uint64 uint64;
-/// packed floating point number (does it even make sense?)
-typedef detail::little_endian< 4, true, true > little_endian_float32;
-typedef detail::little_endian< 8, true, true > little_endian_float64;
+typedef detail::endian< detail::little, 4, true, true > little_endian_float32;
+typedef detail::endian< detail::little, 8, true, true > little_endian_float64;
 typedef little_endian_float32 float32;
 typedef little_endian_float64 float64;
 
-} } // namespace comma { namespace packed {
+// all types above deprecated; use namespacing below
+namespace little_endian { // i love namespacing
+
+typedef detail::endian< detail::little, 2, false > uint16;
+typedef detail::endian< detail::little, 2, true > int16;
+typedef detail::endian< detail::little, 3, false > uint24;
+typedef detail::endian< detail::little, 3, true > int24;
+typedef detail::endian< detail::little, 4, false > uint32;
+typedef detail::endian< detail::little, 4, true > int32;
+typedef detail::endian< detail::little, 6, false > uint48;
+typedef detail::endian< detail::little, 6, true > int48;
+typedef detail::endian< detail::little, 8, false > uint64;
+typedef detail::endian< detail::little, 8, true > int64;
+typedef detail::endian< detail::little, 4, true, true > float32;
+typedef detail::endian< detail::little, 8, true, true > float64;
 
-#endif // #ifndef COMMA_PACKED_LITTLEENDIAN_H_
+} // namespace little_endian {
+
+} } // namespace comma { namespace packed {
diff --git a/packed/packed.h b/packed/packed.h
index cb6775ed2..8616828a6 100644
--- a/packed/packed.h
+++ b/packed/packed.h
@@ -1,31 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #pragma once
 
diff --git a/packed/string.h b/packed/string.h
index 155200c65..9da7e56b5 100644
--- a/packed/string.h
+++ b/packed/string.h
@@ -1,42 +1,15 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
-/// @author Dewey Nguyen 2014-2014
+/// @author Dewey Nguyen 2014
 
-#ifndef COMMA_PACKED_STRING_H_
-#define COMMA_PACKED_STRING_H_
+#pragma once
 
 #include <cmath>
 #include <iomanip>
 #include <string>
+#include <type_traits>
 #include <boost/lexical_cast.hpp>
 #include "../base/exception.h"
 #include "../string/string.h"
@@ -55,11 +28,13 @@ class string : public packed::field< string< S, Padding >, std::string, S >
 
         typedef packed::field< string< S, Padding >, std::string, S > base_type;
 
-        static const std::string& default_value()
-        {
-            static const std::string s;// static const std::string s( S, Padding );
-            return s;
-        }
+        string() = default;
+
+        string( const std::string& rhs ) { pack( this->data(), rhs ); }
+
+        string( const char* rhs ) { operator=( rhs ); }
+
+        static const std::string& default_value() { static const std::string s; return s; } // static const std::string s( S, Padding );
 
         static void pack( char* storage, const std::string& value )
         {
@@ -68,16 +43,12 @@ class string : public packed::field< string< S, Padding >, std::string, S >
             ::memcpy( storage, &value[0], value.size() );
         }
 
-        static std::string unpack( const char* storage )
-        {
-            return comma::strip( std::string( storage, size ), Padding );
-        }
+        static std::string unpack( const char* storage ) { return comma::strip( std::string( storage, size ), Padding ); }
 
         const string& operator=( const std::string& rhs ) { return base_type::operator=( rhs ); }
 
         const string& operator=( const char* rhs ) { return base_type::operator=( std::string( rhs, size ) ); }
 
-        /// a convenience method, if string represents numeric values
         template < typename T > T as() const { return boost::lexical_cast< T >( this->operator()() ); }
 };
 
@@ -150,7 +121,7 @@ template < typename T, std::size_t S, char Padding = ' ' >
 class ascii_hex : public packed::field< ascii_hex< T, S, Padding >, T, S >
 {
 public:
-    BOOST_STATIC_ASSERT( boost::is_unsigned< T >::value );
+    static_assert( boost::is_unsigned< T >::value, "expected unsigned type" );
     enum { size = S };
     
     typedef T Type;
@@ -173,5 +144,3 @@ class ascii_hex : public packed::field< ascii_hex< T, S, Padding >, T, S >
 };
 
 } } // namespace comma { namespace packed {
-
-#endif // #ifndef COMMA_PACKED_STRING_H_
diff --git a/packed/struct.h b/packed/struct.h
index f5bc8c5f6..4fe5718be 100644
--- a/packed/struct.h
+++ b/packed/struct.h
@@ -1,62 +1,32 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author Matthew Herrmann 2007
 /// @author Vsevolod Vlaskine 2010-2011
 
-#ifndef COMMA_PACKED_STRUCT_HPP_
-#define COMMA_PACKED_STRUCT_HPP_
+#pragma once
 
 #include <cstring>
-#include <boost/static_assert.hpp>
+#include <type_traits>
 
 namespace comma { namespace packed {
 
 /// packed structure
 template < class Derived, size_t S >
-class packed_struct
+struct packed_struct
 {
-    public:
-        enum { size = S };
+    static constexpr unsigned int size = S;
+
+    packed_struct() noexcept { static_assert( sizeof( Derived ) == size, "expected derived of provided size" ); } // compile-time check that Derived occupies exactly S bytes; noexcept replaces the deprecated throw() specification
 
-        packed_struct() throw() { BOOST_STATIC_ASSERT( sizeof( Derived ) == size ); }
+    const char* data() const noexcept { return reinterpret_cast< const char* >( this ); } // read-only view of this object's own bytes; noexcept replaces the deprecated throw() specification
 
-        const char* data() const throw() { return reinterpret_cast< const char* >( this ); }
+    char* data() noexcept { return reinterpret_cast< char* >( this ); } // writable view of this object's own bytes; noexcept replaces the deprecated throw() specification
 
-        char* data() throw() { return reinterpret_cast< char* >( this ); }
+    bool operator==( const packed_struct& rhs ) const { return std::memcmp( this, &rhs, size ) == 0; }
 
-        bool operator==( const packed_struct& rhs ) const { return ::memcmp( this, &rhs, size ) == 0; }
+    bool operator!=( const packed_struct& rhs ) const { return !operator==( rhs ); }
 
-        bool operator!=( const packed_struct& rhs ) const { return !operator==( rhs ); }
+    void clear() { std::memset( ( char* )( this ), 0, size ); }
 };
 
 } } // namespace comma { namespace packed {
-
-#endif // #ifndef COMMA_PACKED_STRUCT_HPP_
diff --git a/packed/test/CMakeLists.txt b/packed/test/CMakeLists.txt
index 940b46fd3..c503d81e2 100644
--- a/packed/test/CMakeLists.txt
+++ b/packed/test/CMakeLists.txt
@@ -1,15 +1,13 @@
-SET( KIT packed )
-SET( DIR ${SOURCE_CODE_BASE_DIR}/${KIT}/test )
-FILE( GLOB source ${DIR}/*_test.cpp )
-FILE( GLOB extras ${DIR}/*.cpp ${DIR}/*.h )
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base comma_string ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# unit tests for the packed kit: one gtest executable built from ${KIT}/test/*test.cpp
+set( KIT packed )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+add_executable( ${test_name} ${source} )
+# PRIVATE: nothing links against a test executable, so its dependencies need not propagate
+target_link_libraries( ${test_name} PRIVATE comma_application comma_base comma_string ${GTEST_BOTH_LIBRARIES} pthread )
+# COMMAND names the target itself, so ctest runs whatever binary that target produces
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# installing the test binary is opt-in via INSTALL_TESTS
+if( INSTALL_TESTS )
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/packed/test/packed_test.cpp b/packed/test/packed_test.cpp
index e7b891b9d..8c7eb8ea1 100644
--- a/packed/test/packed_test.cpp
+++ b/packed/test/packed_test.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 #ifndef WIN32
 #include <stdlib.h>
@@ -36,6 +8,7 @@
 #include <gtest/gtest.h>
 #include <boost/array.hpp>
 #include "../../packed/packed.h"
+#include "../../packed/traits.h"
 #include "../../math/compare.h"
 #include "../../packed/bits.h"
 #include "../../base/types.h"
@@ -47,8 +20,8 @@ struct test_packed_struct_t : public comma::packed::packed_struct< test_packed_s
 {
     comma::packed::string< 4 > hello;
     comma::packed::string< 5 > world;
-    comma::packed::net_uint16 int16;
-    comma::packed::net_uint32 int32;
+    comma::packed::big_endian::uint16 int16;
+    comma::packed::big_endian::uint32 int32;
     comma::packed::byte byte;
 };
 
@@ -75,62 +48,84 @@ TEST( packed_struct, test_packed_struct )
     EXPECT_EQ( s.byte(), 3 );
 }
 
-template < typename T >
-void test_packed_int( comma::int64 value )
+template < typename T > static void test_packed_int( comma::int64 value )
 {
     T t;
     EXPECT_EQ( true, t == 0 );
     t = value;
     EXPECT_EQ( true, t == value );
+    std::cerr << "-------------------------------------------------" << std::endl;
+    std::cerr << "--> a: value: " << value << " t: " << t() << std::endl;
     EXPECT_EQ( value, t() );
+    std::cerr << "-------------------------------------------------" << std::endl;
 }
 
-template < typename T >
-void test_packed_uint( comma::uint64 value )
+template < typename T > static void test_packed_uint( comma::uint64 value )
 {
     T t;
     EXPECT_EQ( true, t == 0 );
     t = value;
     EXPECT_EQ( true, t == value );
+    std::cerr << "-------------------------------------------------" << std::endl;
+    std::cerr << "--> b: value: " << value << " t: " << t() << std::endl;
     EXPECT_EQ( value, t() );
+    std::cerr << "-------------------------------------------------" << std::endl;
 }
 
-
 TEST( test_packed_struct_test, test_little_endian )
 {
-    test_packed_uint< comma::packed::uint16 >( 1231 );
-    test_packed_uint< comma::packed::uint16 >( 65535 );
-    test_packed_uint< comma::packed::uint24 >( 1232 );
-    test_packed_uint< comma::packed::uint24 >( 16777215 );
-    test_packed_uint< comma::packed::uint32 >( 1233 );
-    test_packed_uint< comma::packed::uint32 >( 4294967295 );
-    test_packed_uint< comma::packed::uint64 >( 4321 );
-    test_packed_uint< comma::packed::uint64 >( comma::uint64( std::numeric_limits< comma::uint64 >::max() ) );
-    test_packed_uint< comma::packed::uint64 >( comma::uint64( 0x1BCDEF1213141500ULL ) );
-
-    test_packed_int< comma::packed::int16 >( 1234 );
-    test_packed_int< comma::packed::int24 >( 1235 );
-    test_packed_int< comma::packed::int24 >( 8388607 );
-    test_packed_int< comma::packed::int32 >( 8388607 );
-    test_packed_int< comma::packed::int32 >( 1236 );
-    test_packed_int< comma::packed::int16 >( -1231 );
-    test_packed_int< comma::packed::int24 >( -1232 );
-    test_packed_int< comma::packed::int24 >( -8388608 );
-    test_packed_int< comma::packed::int32 >( -1233 );
-    test_packed_int< comma::packed::int64 >( -4321 );
-    test_packed_int< comma::packed::int64 >( comma::int64( std::numeric_limits< comma::int64 >::min() ) );
+    test_packed_uint< comma::packed::little_endian::uint16 >( 1231 );
+    test_packed_uint< comma::packed::little_endian::uint16 >( 65535 );
+    test_packed_uint< comma::packed::little_endian::uint24 >( 1232 );
+    test_packed_uint< comma::packed::little_endian::uint24 >( 16777215 );
+    test_packed_uint< comma::packed::little_endian::uint32 >( 1233 );
+    test_packed_uint< comma::packed::little_endian::uint32 >( 4294967295 );
+    test_packed_uint< comma::packed::little_endian::uint64 >( 4321 );
+    test_packed_uint< comma::packed::little_endian::uint64 >( comma::uint64( std::numeric_limits< comma::uint64 >::max() ) );
+    test_packed_uint< comma::packed::little_endian::uint64 >( comma::uint64( 0x1BCDEF1213141500ULL ) );
+
+    test_packed_int< comma::packed::little_endian::int16 >( 1234 );
+    test_packed_int< comma::packed::little_endian::int16 >( 256 * 128 - 1 );
+    test_packed_int< comma::packed::little_endian::int16 >( 0 );
+    test_packed_int< comma::packed::little_endian::int16 >( -1 );
+    test_packed_int< comma::packed::little_endian::int16 >( -2 );
+    test_packed_int< comma::packed::little_endian::int16 >( -256 * 128 + 1 );
+    //for( comma::int16 i = 256 * 128 - 1; i > 0; --i ) { test_packed_uint< comma::packed::little_endian::int16 >( i ); }
+    //for( comma::int16 i = 256 * 128 - 1; i > 0; --i ) { test_packed_int< comma::packed::little_endian::int16 >( -i ); }
+    test_packed_int< comma::packed::little_endian::int24 >( 1235 );
+    test_packed_int< comma::packed::little_endian::int24 >( 8388607 );
+    test_packed_int< comma::packed::little_endian::int32 >( 8388607 );
+    test_packed_int< comma::packed::little_endian::int32 >( 1236 );
+    test_packed_int< comma::packed::little_endian::int16 >( -1231 );
+    test_packed_int< comma::packed::little_endian::int24 >( -1 );
+    test_packed_int< comma::packed::little_endian::int24 >( -2 );
+    test_packed_int< comma::packed::little_endian::int24 >( -256 );
+    test_packed_int< comma::packed::little_endian::int24 >( -1232 );
+    //for( unsigned int i = 0; i < 8388608; ++i ) { test_packed_int< comma::packed::little_endian::int24 >( -i ); }
+    test_packed_int< comma::packed::little_endian::int24 >( -1000000 );
+    test_packed_int< comma::packed::little_endian::int24 >( -8388608 );
+    test_packed_int< comma::packed::little_endian::int32 >( -1233 );
+    test_packed_int< comma::packed::little_endian::int64 >( -4321 );
+    test_packed_int< comma::packed::little_endian::int64 >( comma::int64( std::numeric_limits< comma::int64 >::min() ) );
 }
 
 TEST( test_packed_struct_test, test_big_endian )
 {
-    test_packed_int< comma::packed::net_uint16 >( 1234 );
-    test_packed_int< comma::packed::net_uint16 >( 65535 );
-    test_packed_int< comma::packed::net_uint32 >( 1234 );
-    test_packed_int< comma::packed::net_uint32 >( 4294967295 );
-    test_packed_int< comma::packed::net_int16 >( 1234 );
-    test_packed_int< comma::packed::net_int32 >( 1234 );
-    test_packed_int< comma::packed::net_int16 >( -1234 );
-    test_packed_int< comma::packed::net_int32 >( -1234 );
+    test_packed_int< comma::packed::big_endian::uint16 >( 1234 );
+    test_packed_int< comma::packed::big_endian::uint16 >( 65535 );
+    test_packed_uint< comma::packed::big_endian::uint24 >( 1232 );
+    test_packed_uint< comma::packed::big_endian::uint24 >( 16777215 );
+    test_packed_int< comma::packed::big_endian::uint32 >( 1234 );
+    test_packed_int< comma::packed::big_endian::uint32 >( 4294967295 );
+    test_packed_int< comma::packed::big_endian::int16 >( 1234 );
+    test_packed_int< comma::packed::big_endian::int32 >( 1234 );
+    test_packed_int< comma::packed::big_endian::int16 >( -1234 );
+    test_packed_int< comma::packed::big_endian::int32 >( -1234 );
+    test_packed_int< comma::packed::big_endian::int24 >( -1 );
+    test_packed_int< comma::packed::big_endian::int24 >( -2 );
+    test_packed_int< comma::packed::big_endian::int24 >( -1232 );
+    test_packed_int< comma::packed::big_endian::int24 >( -8388607 );
+    test_packed_int< comma::packed::big_endian::int24 >( -8388608 );
 }
 
 template< typename T >
@@ -151,7 +146,7 @@ static void test_int64_byte_order( comma::int64 value, char byte0, char byte1, c
 TEST( test_packed_struct_test, test_int64_byte_order )
 {
     comma::int64 i = 0xFBCDEF1213141500LL;
-    test_int64_byte_order< comma::packed::uint64 >( i, 0x00, 0x15, 0x14, 0x13, 0x12, 0xEF, 0xCD, 0xFB );
+    test_int64_byte_order< comma::packed::little_endian::uint64 >( i, 0x00, 0x15, 0x14, 0x13, 0x12, 0xEF, 0xCD, 0xFB );
 }
 
 template< typename T >
@@ -172,12 +167,12 @@ static void test_uint64_byte_order( comma::uint64 value, char byte0, char byte1,
 TEST( test_packed_struct_test, test_uint64_byte_order )
 {
     comma::uint64 i = 0xABCDEF1213141500ULL;
-    test_uint64_byte_order< comma::packed::uint64 >( i, 0x00, 0x15, 0x14, 0x13, 0x12, 0xEF, 0xCD, 0xAB );
+    test_uint64_byte_order< comma::packed::little_endian::uint64 >( i, 0x00, 0x15, 0x14, 0x13, 0x12, 0xEF, 0xCD, 0xAB );
 }
 
 static void test_int24_byte_order( int value, char byte0, char byte1, char byte2 )
 {
-    comma::packed::int24 a;
+    comma::packed::little_endian::int24 a;
     a = value;
     EXPECT_EQ( ( 0xff & a.data()[0] ), ( 0xff & byte0 ) );
     EXPECT_EQ( ( 0xff & a.data()[1] ), ( 0xff & byte1 ) );
@@ -201,10 +196,10 @@ TEST( test_packed_struct_test, test_int24_byte_order )
 
 struct test_packed_struct_floats_t : public comma::packed::packed_struct< test_packed_struct_floats_t, 24 >
 {
-    comma::packed::float32 f32;
-    comma::packed::float64 f64;
-    comma::packed::net_float32 nf32;
-    comma::packed::net_float64 nf64;
+    comma::packed::little_endian::float32 f32;
+    comma::packed::little_endian::float64 f64;
+    comma::packed::big_endian::float32 nf32;
+    comma::packed::big_endian::float64 nf64;
 };
 
 TEST( packed_struct, test_packed_struct_floats )
@@ -218,7 +213,7 @@ TEST( packed_struct, test_packed_struct_floats )
     EXPECT_DOUBLE_EQ( 1.23456789, s.f64() );
 }
 
-TEST( packed_struct, test_packed_struct_net_floats )
+TEST( packed_struct, test_packed_struct_big_endian_floats )
 {
     test_packed_struct_floats_t s;
     EXPECT_FLOAT_EQ( true, s.nf32 == 0 );
@@ -231,25 +226,25 @@ TEST( packed_struct, test_packed_struct_net_floats )
 
 TEST( test_packed_struct_test, test_little_endian_floats )
 {
-    comma::packed::float32 a;
+    comma::packed::little_endian::float32 a;
     EXPECT_FLOAT_EQ( 0, a() );
     a = 1.2345;
     EXPECT_FLOAT_EQ( 1.2345, a() );
 
-    comma::packed::float64 b;
+    comma::packed::little_endian::float64 b;
     EXPECT_DOUBLE_EQ( 0, b() );
     b = 1.23456789;
     EXPECT_DOUBLE_EQ( 1.23456789, b() );
 }
 
-TEST( test_packed_struct_test, test_net_floats )
+TEST( test_packed_struct_test, test_big_endian_floats )
 {
-    comma::packed::net_float32 a;
+    comma::packed::big_endian::float32 a;
     EXPECT_FLOAT_EQ( 0, a() );
     a = 1.2345;
     EXPECT_FLOAT_EQ( 1.2345, a() );
 
-    comma::packed::net_float64 b;
+    comma::packed::big_endian::float64 b;
     EXPECT_DOUBLE_EQ( 0, b() );
     b = 1.23456789;
     EXPECT_DOUBLE_EQ( 1.23456789, b() );
@@ -268,14 +263,14 @@ static void test_float32_byte_order( float value, char byte0, char byte1, char b
 
 TEST( test_packed_struct_test, test_float32_byte_order )
 {
-    test_float32_byte_order< comma::packed::float32 >( 5.2, 0x66, 0x66, 0xA6, 0x40 );
-    test_float32_byte_order< comma::packed::float32 >( -5.2, 0x66, 0x66, 0xA6, 0xC0 );
+    test_float32_byte_order< comma::packed::little_endian::float32 >( 5.2, 0x66, 0x66, 0xA6, 0x40 );
+    test_float32_byte_order< comma::packed::little_endian::float32 >( -5.2, 0x66, 0x66, 0xA6, 0xC0 );
 }
 
-TEST( test_packed_struct_test, test_net_float32_byte_order )
+TEST( test_packed_struct_test, test_big_endian_float32_byte_order )
 {
-    test_float32_byte_order< comma::packed::net_float32 >( 5.2, 0x40, 0xA6, 0x66, 0x66 );
-    test_float32_byte_order< comma::packed::net_float32 >( -5.2, 0xC0, 0xA6, 0x66, 0x66 );
+    test_float32_byte_order< comma::packed::big_endian::float32 >( 5.2, 0x40, 0xA6, 0x66, 0x66 );
+    test_float32_byte_order< comma::packed::big_endian::float32 >( -5.2, 0xC0, 0xA6, 0x66, 0x66 );
 }
 
 template< typename T >
@@ -295,18 +290,18 @@ static void test_float64_byte_order( double value, char byte0, char byte1, char
 
 TEST( test_packed_struct_test, test_float64_byte_order )
 {
-    test_float64_byte_order< comma::packed::float64 >( 5.2, 0xCD, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0x14, 0x40 );
-    test_float64_byte_order< comma::packed::float64 >( -5.2, 0xCD, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0x14, 0xC0 );
-    test_float64_byte_order< comma::packed::float64 >( -1.2e-123, 0x4E, 0x57, 0x04, 0xD1, 0x71, 0x62, 0x69, 0xA6 );
-    test_float64_byte_order< comma::packed::float64 >( -1.2e+123, 0x21, 0xBD, 0xC3, 0x60, 0x60, 0x0B, 0x7D, 0xD9 );
+    test_float64_byte_order< comma::packed::little_endian::float64 >( 5.2, 0xCD, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0x14, 0x40 );
+    test_float64_byte_order< comma::packed::little_endian::float64 >( -5.2, 0xCD, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0x14, 0xC0 );
+    test_float64_byte_order< comma::packed::little_endian::float64 >( -1.2e-123, 0x4E, 0x57, 0x04, 0xD1, 0x71, 0x62, 0x69, 0xA6 );
+    test_float64_byte_order< comma::packed::little_endian::float64 >( -1.2e+123, 0x21, 0xBD, 0xC3, 0x60, 0x60, 0x0B, 0x7D, 0xD9 );
 }
 
-TEST( test_packed_struct_test, test_net_float64_byte_order )
+TEST( test_packed_struct_test, test_big_endian_float64_byte_order )
 {
-    test_float64_byte_order< comma::packed::net_float64 >( 5.2, 0x40, 0x14, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0xCD );
-    test_float64_byte_order< comma::packed::net_float64 >( -5.2, 0xC0, 0x14, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0xCD );
-    test_float64_byte_order< comma::packed::net_float64 >( -1.2e-123, 0xA6, 0x69, 0x62, 0x71, 0xD1, 0x04, 0x57, 0x4E );
-    test_float64_byte_order< comma::packed::net_float64 >( -1.2e+123, 0xD9, 0x7D, 0x0B, 0x60, 0x60, 0xC3, 0xBD, 0x21 );
+    test_float64_byte_order< comma::packed::big_endian::float64 >( 5.2, 0x40, 0x14, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0xCD );
+    test_float64_byte_order< comma::packed::big_endian::float64 >( -5.2, 0xC0, 0x14, 0xCC, 0xCC, 0xCC, 0xCC, 0xCC, 0xCD );
+    test_float64_byte_order< comma::packed::big_endian::float64 >( -1.2e-123, 0xA6, 0x69, 0x62, 0x71, 0xD1, 0x04, 0x57, 0x4E );
+    test_float64_byte_order< comma::packed::big_endian::float64 >( -1.2e+123, 0xD9, 0x7D, 0x0B, 0x60, 0x60, 0xC3, 0xBD, 0x21 );
 }
 
 static boost::array< std::string, 16 > hex_digits_u = { { "0", "1", "2", "3", "4", "5", "6", "7", "8", "9", "A", "B", "C", "D", "E", "F" } };
diff --git a/packed/traits.h b/packed/traits.h
index e16a5e22e..b8dd0cf0e 100644
--- a/packed/traits.h
+++ b/packed/traits.h
@@ -1,49 +1,37 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author Vsevolod Vlaskine
 
 #pragma once
 
-#include "big_endian.h"
-#include <boost/array.hpp>
+#include <memory>
+#include <string>
 #include "../visiting/traits.h"
+#include "string.h"
 
 namespace comma { namespace visiting {
 
-template < typename T, std::size_t N > struct traits< boost::array<comma::packed::detail::big_endian<T>, N> >
+// todo: add traits for other types
+
+template < std::size_t Size, char Padding > struct traits< comma::packed::string< Size, Padding > >
 {
-    template< typename K, typename V > static void visit( const K& k, const boost::array<comma::packed::detail::big_endian<T>, N>& t, V& v )
+    template < typename Key, class Visitor > static void visit( const Key& k, comma::packed::string< Size, Padding >& p, Visitor& v )
     {
-        for( std::size_t i = 0; i < t.size(); i++ ) { v.apply( i, t[i]() ); }
+        // todo? quick and dirty for now; should we support naked pointers in visitors?
+        // todo? should we replace Padding with 0?
+        std::string s( p.data(), Size );
+        v.apply( k, s );
+        std::memset( p.data(), Padding, Size );
+        std::memcpy( p.data(), &s[0], std::min( s.size(), Size ) );
     }
-};
-
-
-} } //namespace comma { namespace visiting {
 
+    template < typename Key, class Visitor > static void visit( const Key& k, const comma::packed::string< Size, Padding >& p, Visitor& v )
+    {
+        // todo? quick and dirty for now; should we support naked pointers in visitors?
+        // todo? should we replace Padding with 0?
+        std::string s( p.data(), Size );
+        v.apply( k, s );
+    }
+};
 
+} } // namespace comma { namespace visiting {
diff --git a/python/CMakeLists.txt b/python/CMakeLists.txt
index b8a695df2..4ec896d52 100644
--- a/python/CMakeLists.txt
+++ b/python/CMakeLists.txt
@@ -40,16 +40,15 @@ MACRO( set_python_build_lib_directory )
     ENDIF( MODULE_EXIT_CODE MATCHES 0 )
 ENDMACRO( set_python_build_lib_directory )
 
-
 IF( NOT BUILD_PYTHON_PACKAGES )
     disable_python_testing()
     RETURN()
 ENDIF( NOT BUILD_PYTHON_PACKAGES )
 
-FIND_PROGRAM( PYTHON "python" )
+FIND_PROGRAM( PYTHON "python3" )
 
 IF( NOT PYTHON )
-    MESSAGE( WARNING "python not found" )
+    MESSAGE( WARNING "python3 not found" )
     MESSAGE( STATUS "comma/python modules and scripts will not be installed" )
     disable_python_testing()
     RETURN()
@@ -68,7 +67,7 @@ IF( PYTHON_PACKAGE_INSTALL_PREFIX )
     ENDIF( NOT WIN32 )
 ENDIF( PYTHON_PACKAGE_INSTALL_PREFIX )
 
-SET( SETUP_PY "${CMAKE_CURRENT_SOURCE_DIR}/setup.py" )
+SET( SETUP_PY "${CMAKE_CURRENT_SOURCE_DIR}/setup.py" ) # todo: use pip instead
 
 SET( BUILD_BASE "${CMAKE_CURRENT_BINARY_DIR}/build" )
 
@@ -76,16 +75,29 @@ SET( comma_PYTHON_SOURCE_ROOT_DIR ${CMAKE_CURRENT_SOURCE_DIR} )
 
 set_python_build_lib_directory()
 
-ADD_SUBDIRECTORY( comma )
+add_subdirectory( comma )
+add_subdirectory( bindings )
 
 ADD_CUSTOM_TARGET( python_build ALL
-                ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE}
-                WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )
+                   ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE}
+                   WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )
 
 INSTALL( CODE "EXECUTE_PROCESS(
                     COMMAND ${PYTHON} ${SETUP_PY} build --build-base ${BUILD_BASE} install ${INSTALL_PREFIX_OPTION} --force
                     WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
 
+# setup.py creates a couple of working directories in the current directory: comma_py.egg-info and dist.
+# Because it is run at the install stage, and therefore typically as root, these
+# directories end up owned by root, which is a bit annoying as they are in the
+# source tree. So hand their ownership to the user named by the USER environment variable.
+INSTALL( CODE "EXECUTE_PROCESS(
+                    COMMAND chown -R $ENV{USER} comma_py.egg-info dist
+                    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
+
+#install( CODE "EXECUTE_PROCESS(
+#                    COMMAND ${PYTHON} -m pip install ${CMAKE_CURRENT_SOURCE_DIR} --ignore-installed
+#                    WORKING_DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR} )" )
+
 SET_DIRECTORY_PROPERTIES( PROPERTIES ADDITIONAL_MAKE_CLEAN_FILES build )
 
 IF( ADD_PYTHON_PACKAGES_TO_RPM )
diff --git a/python/README.md b/python/README.md
new file mode 100644
index 000000000..57478d578
--- /dev/null
+++ b/python/README.md
@@ -0,0 +1,16 @@
+**comma** is a generic library, mostly written in C++, for efficient
+processing of fixed-width (comma-separated or binary) data.
+
+**comma-py** is the part of **comma** written in Python; its main part
+is the **csv-eval** command-line utility for efficient **numpy**-style
+conversions on an input stream of comma-separated or fixed-width binary
+data.
+
+**comma-py** also has useful modules for dictionary and signal manipulations.
+
+For more details, run:
+```
+csv-eval --help --verbose
+```
+
+**documentation**: [https://gitlab.com/orthographic/comma/-/wikis/home](https://gitlab.com/orthographic/comma/-/wikis/home)
diff --git a/python/bindings/CMakeLists.txt b/python/bindings/CMakeLists.txt
new file mode 100644
index 000000000..005b21bc7
--- /dev/null
+++ b/python/bindings/CMakeLists.txt
@@ -0,0 +1,20 @@
+set( PROJECT "python_bindings" )
+set( TARGET_NAME comma_${PROJECT} )
+set( dir ${SOURCE_CODE_BASE_DIR}/python/bindings )
+
+file( GLOB_RECURSE source ${dir}/*.cpp )
+file( GLOB_RECURSE includes ${dir}/*.h )
+
+source_group( ${TARGET_NAME} FILES ${source} ${includes} )
+
+add_library( ${TARGET_NAME} ${source} ${includes} )
+set_target_properties( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
+target_link_libraries( ${TARGET_NAME} comma_base ${comma_ALL_EXTERNAL_LIBRARIES} )
+
+# INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/ )
+install(
+    TARGETS ${TARGET_NAME}
+    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
+    LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
+    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
+)
diff --git a/python/bindings/containers/multidimensional/map.cpp b/python/bindings/containers/multidimensional/map.cpp
new file mode 100644
index 000000000..991043d27
--- /dev/null
+++ b/python/bindings/containers/multidimensional/map.cpp
@@ -0,0 +1,185 @@
+#include <iostream>
+
+#include <cstdint>
+#include <limits>
+#include <vector>
+#include "../../../../base/exception.h"
+#include "../../../../containers/multidimensional/map.h"
+#include "map.h"
+
+namespace comma { namespace python { namespace bindings { namespace containers { namespace multidimensional { namespace map { namespace impl {
+
+class base
+{
+    public:
+        base( void* m ): _m( m ) {}
+        virtual ~base() = default;
+        virtual void insert( const void* p, int v ) = 0;
+        virtual const int* at( const void* p, unsigned int* size ) const = 0;
+        virtual const int* nearest( const void* k, unsigned int neighbourhood ) const = 0;
+        virtual unsigned int count() const = 0;
+        virtual unsigned int size() const = 0;
+    protected:
+        void* _m{nullptr};
+};
+
+template < unsigned int D > struct _traits
+{ 
+    static unsigned int power( unsigned int b ) { return _traits< D - 1 >::power( b ) * b; }
+    static std::array< int, D > index( unsigned int v, int b, unsigned int i = D )
+    {
+        std::array< int, D > a;
+        for( int i = D - 1; i >= 0; a[i--] = v % b - b / 2, v /= b );
+        return a;
+    } 
+};
+
+template <> struct _traits< 0 > { static unsigned int power( unsigned int ) { return 1; } };
+
+template < typename K, unsigned int Dim >
+struct proxy: public base
+{
+    typedef std::array< K, Dim > key_t;
+    
+    typedef comma::containers::multidimensional::map< K, std::pair< std::vector< int >, std::vector< key_t > >, Dim > map_t;
+
+    proxy( const void* o, const void* r, const void* p, int size )
+        : base( new map_t( *reinterpret_cast< const key_t* >( o ), *reinterpret_cast< const key_t* >( r ) ) )
+    {
+        if( !p || size == 0 ) { return; }
+        const K* q = reinterpret_cast< const K* >( p );
+        for( int i = 0; i < size; ++i, q += Dim ) { insert( q, i ); }
+    }
+
+    ~proxy() { if( _m ) { delete reinterpret_cast< map_t* >( _m ); } }
+
+    void insert( const void* k, int v )
+    {
+        auto i = map().touch_at( key( k ) );
+        i->second.first.push_back( v );
+        i->second.second.push_back( key( k ) );
+    }
+
+    const int* at( const void* k, unsigned int* size ) const
+    {
+        auto i = map().at( key( k ) );
+        *size = i == map().end() ? 0 : int( i->second.first.size() );
+        return *size == 0 ? nullptr : &i->second.first[0];
+    }
+
+    // todo: up to a given number of nearest points
+    // todo: all points in radius
+    // todo: multiple input points
+    const int* nearest( const void* k, unsigned int neighbourhood ) const
+    {
+        auto i = map().index_of( key( k ) );
+        int b = neighbourhood * 2 + 1;
+        double s = std::numeric_limits< double >::max();
+        const int* si{nullptr};
+        for( unsigned int p = 0; p < _traits< Dim >::power( b ); ++p )
+        {
+            typename map_t::index_type j = _traits< Dim >::index( p, b );
+            for( unsigned int m = 0; m < Dim; ++m ) { j[m] += i[m]; }
+            auto n = map().find( j );
+            if( n == map().end() ) { continue; }
+            for( unsigned int q = 0; q < n->second.first.size(); ++q )
+            {
+                double t = 0;
+                for( unsigned int m = 0; m < Dim; ++m )
+                { 
+                    double d = key( k )[m] - n->second.second[q][m]; 
+                    t += d * d;
+                }
+                if( t < s ) { s = t; si = &n->second.first[q]; }
+            }
+        }
+        return si;
+    }
+    
+    unsigned int size() const { return map().size(); }
+
+    unsigned int count() const { unsigned int c{0}; for( auto i: map() ) { c += i.second.first.size(); } return c; }
+
+    map_t& map() { return *reinterpret_cast< map_t* >( _m ); }
+
+    const map_t& map() const { return *reinterpret_cast< const map_t* >( _m ); }
+
+    const key_t& key( const void* p ) const { return *reinterpret_cast< const key_t* >( p ); }
+};
+
+void* make( int key_type, unsigned int dim, const void* o, const void* r, const void* v, unsigned int s )
+{
+    switch( key_type )
+    {
+        case _comma_int32:
+            switch( dim )
+            {
+                case 2: return new proxy< std::int32_t, 2 >( o, r, v, s );
+                case 3: return new proxy< std::int32_t, 3 >( o, r, v, s );
+                case 4: return new proxy< std::int32_t, 4 >( o, r, v, s );
+                case 5: return new proxy< std::int32_t, 5 >( o, r, v, s );
+                case 6: return new proxy< std::int32_t, 6 >( o, r, v, s );
+                default: COMMA_THROW_BRIEF( comma::exception, "multidimensional map with int32 keys supports 2 to 6 dimensions; got: " << dim << "; just ask for more" );
+            }
+            break;
+        case _comma_int64:
+            switch( dim )
+            {
+                case 2: return new proxy< std::int64_t, 2 >( o, r, v, s );
+                case 3: return new proxy< std::int64_t, 3 >( o, r, v, s );
+                case 4: return new proxy< std::int64_t, 4 >( o, r, v, s );
+                case 5: return new proxy< std::int64_t, 5 >( o, r, v, s );
+                case 6: return new proxy< std::int64_t, 6 >( o, r, v, s );
+                default: COMMA_THROW_BRIEF( comma::exception, "multidimensional map with int64 keys supports 2 to 6 dimensions; got: " << dim << "; just ask for more" );
+            }
+            break;
+        case _comma_float32:
+            static_assert( sizeof( float ) == 4 );
+            switch( dim )
+            {
+                case 2: return new proxy< float, 2 >( o, r, v, s );
+                case 3: return new proxy< float, 3 >( o, r, v, s );
+                case 4: return new proxy< float, 4 >( o, r, v, s );
+                case 5: return new proxy< float, 5 >( o, r, v, s );
+                case 6: return new proxy< float, 6 >( o, r, v, s );
+                default: COMMA_THROW_BRIEF( comma::exception, "multidimensional map with float32 keys supports 2 to 6 dimensions; got: " << dim << "; just ask for more" );
+            }
+            break;
+        case _comma_float64:
+            static_assert( sizeof( double ) == 8 );
+            switch( dim )
+            {
+                case 2: return new proxy< double, 2 >( o, r, v, s );
+                case 3: return new proxy< double, 3 >( o, r, v, s );
+                case 4: return new proxy< double, 4 >( o, r, v, s );
+                case 5: return new proxy< double, 5 >( o, r, v, s );
+                case 6: return new proxy< double, 6 >( o, r, v, s );
+                default: COMMA_THROW_BRIEF( comma::exception, "multidimensional map with double keys supports 2 to 6 dimensions; got: " << dim << "; just ask for more" );
+            }
+            break;
+        default:
+            COMMA_THROW_BRIEF( comma::exception, "multidimensional map supports types int32 (0), int64 (1), float32 (2), and float64 (3); got: " << key_type );
+    }
+    return nullptr;
+}
+
+} } } } } } } // namespace comma { namespace python { namespace bindings { namespace containers { namespace multidimensional { namespace map { namespace impl {
+
+static auto as_base( void* p ) { return reinterpret_cast< comma::python::bindings::containers::multidimensional::map::impl::base* >( p ); }
+
+static auto as_base( const void* p ) { return reinterpret_cast< const comma::python::bindings::containers::multidimensional::map::impl::base* >( p ); }
+
+DLL_EXPORT void* comma_containers_multidimensional_map_create( int key_type, unsigned int dim, const void* origin, const void* resolution, const void* values, unsigned int size )
+{
+    return comma::python::bindings::containers::multidimensional::map::impl::make( key_type, dim, origin, resolution, values, size );
+}
+
+DLL_EXPORT void comma_containers_multidimensional_map_destroy( void* p ) { delete as_base( p ); }
+
+DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, const void* k, void* size ) { return as_base( p )->at( k, reinterpret_cast< unsigned int* >( size ) ); }
+
+DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p ) { return as_base( p )->size(); }
+
+DLL_EXPORT unsigned int comma_containers_multidimensional_map_count( const void* p ) { return as_base( p )->count(); }
+
+DLL_EXPORT const void* comma_containers_multidimensional_map_nearest( const void* p, const void* k, unsigned int n ) { return as_base( p )->nearest( k, n ); }
\ No newline at end of file
diff --git a/python/bindings/containers/multidimensional/map.h b/python/bindings/containers/multidimensional/map.h
new file mode 100644
index 000000000..c11b4b481
--- /dev/null
+++ b/python/bindings/containers/multidimensional/map.h
@@ -0,0 +1,22 @@
+#pragma once
+
+#include "../../definitions.h"
+#include "../../memory.h"
+
+extern "C" {
+
+enum types { _comma_int32 = 0, _comma_int64 = 1, _comma_float32 = 2, _comma_float64 = 3 };
+
+DLL_EXPORT void* comma_containers_multidimensional_map_create( int key_type, unsigned int dim, const void* origin, const void* resolution, const void* values, unsigned int size );
+
+DLL_EXPORT void comma_containers_multidimensional_map_destroy( void* p );
+
+DLL_EXPORT unsigned int comma_containers_multidimensional_map_size( const void* p );
+
+DLL_EXPORT unsigned int comma_containers_multidimensional_map_count( const void* p );
+
+DLL_EXPORT const void* comma_containers_multidimensional_map_at( const void* p, const void* k, void* size );
+
+DLL_EXPORT const void* comma_containers_multidimensional_map_nearest( const void* p, const void* k, unsigned int n );
+
+}
\ No newline at end of file
diff --git a/python/bindings/definitions.h b/python/bindings/definitions.h
new file mode 100644
index 000000000..f68b7134b
--- /dev/null
+++ b/python/bindings/definitions.h
@@ -0,0 +1,7 @@
+#pragma once
+
+#ifdef _WIN32
+#define DLL_EXPORT __declspec( dllexport )
+#else
+#define DLL_EXPORT
+#endif
diff --git a/python/bindings/memory.cpp b/python/bindings/memory.cpp
new file mode 100644
index 000000000..5f971db25
--- /dev/null
+++ b/python/bindings/memory.cpp
@@ -0,0 +1,4 @@
+#include <stdlib.h>
+#include "memory.h"
+
+DLL_EXPORT void comma_free( void* p ) { ::free( p ); }
diff --git a/python/bindings/memory.h b/python/bindings/memory.h
new file mode 100644
index 000000000..aa43287b4
--- /dev/null
+++ b/python/bindings/memory.h
@@ -0,0 +1,9 @@
+#pragma once
+
+#include "definitions.h" // provides DLL_EXPORT, so it is not redefined in this header
+
+extern "C" {
+
+DLL_EXPORT void comma_free( void* p ); // defined in memory.cpp as a call to ::free( p )
+
+}
diff --git a/python/comma-rpm-post-install.sh b/python/comma-rpm-post-install.sh
index c123837af..1f82ccfe7 100644
--- a/python/comma-rpm-post-install.sh
+++ b/python/comma-rpm-post-install.sh
@@ -1,3 +1,3 @@
 #!/bin/sh
 
-cd /tmp/comma/python_modules_for_rpm_install && python setup.py install
+cd /tmp/comma/python_modules_for_rpm_install && python3 setup.py install
diff --git a/python/comma/CMakeLists.txt b/python/comma/CMakeLists.txt
index 22a8a1305..5df8ec9cc 100644
--- a/python/comma/CMakeLists.txt
+++ b/python/comma/CMakeLists.txt
@@ -1,8 +1,3 @@
-ADD_SUBDIRECTORY( application )
-ADD_SUBDIRECTORY( csv )
-ADD_SUBDIRECTORY( io )
-ADD_SUBDIRECTORY( util )
-
-IF( BUILD_CPP_PYTHON_BINDINGS )
-    ADD_SUBDIRECTORY( cpp_bindings )
-ENDIF( BUILD_CPP_PYTHON_BINDINGS )
+if( BUILD_CPP_PYTHON_BINDINGS ) # the cpp_bindings subdirectory is added only when this variable evaluates to true
+    add_subdirectory( cpp_bindings )
+endif( BUILD_CPP_PYTHON_BINDINGS )
diff --git a/python/comma/__init__.py b/python/comma/__init__.py
index 2fd92eed7..878ab83d3 100644
--- a/python/comma/__init__.py
+++ b/python/comma/__init__.py
@@ -1,33 +1,10 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+# Copyright (c) 2013 Vsevolod Vlaskine
 
+from . import containers
 from . import csv
+from . import dictionary
+from . import filesystem
 from . import io
 from . import numpy
 from . import signal
diff --git a/python/comma/application/CMakeLists.txt b/python/comma/application/CMakeLists.txt
deleted file mode 100644
index e69de29bb..000000000
diff --git a/python/comma/application/__init__.py b/python/comma/application/__init__.py
index 3ba012175..d7233de96 100644
--- a/python/comma/application/__init__.py
+++ b/python/comma/application/__init__.py
@@ -27,4 +27,5 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .command_line import *
+from ._command_line import set_dictionary_action, remove_argparse_options
+
diff --git a/python/comma/application/command_line.py b/python/comma/application/_command_line.py
similarity index 99%
rename from python/comma/application/command_line.py
rename to python/comma/application/_command_line.py
index 6f5fbc0b9..e11a2f712 100644
--- a/python/comma/application/command_line.py
+++ b/python/comma/application/_command_line.py
@@ -1,5 +1,3 @@
-#!/usr/bin/python
-
 import argparse
 
 class set_dictionary_action( argparse.Action ):
diff --git a/python/comma/application/test/dict/test b/python/comma/application/test/dict/test
index 70625e611..bf8440ccc 100755
--- a/python/comma/application/test/dict/test
+++ b/python/comma/application/test/dict/test
@@ -10,20 +10,20 @@ function main()
 {
     local value_type
     value_type=${input_value_type:+"value_type=$input_value_type, "}
-    python -c "
+    python3 -c "
 import comma.application
 import argparse
 
 parser = argparse.ArgumentParser( )
 parser.add_argument( '--dict', metavar='DICT', help='populate a dictionary of given type', type=str, action=comma.application.set_dictionary_action, $value_type delimiter=';', default={} )
 args = parser.parse_args()
-for k, v in args.dict.iteritems():
+for k, v in args.dict.items():
     def quote_if_string( v ):
         if type( v ) == str:
             return '\"%s\"' % v
         else:
             return v
-    print '%s=%s' % ( k, quote_if_string( v ) )
+    print( '%s=%s' % ( k, quote_if_string( v ) ) )
 " $input_args
 }
 
diff --git a/python/comma/application/test/remove/test b/python/comma/application/test/remove/test
index 9eb261bb5..de0be364a 100755
--- a/python/comma/application/test/remove/test
+++ b/python/comma/application/test/remove/test
@@ -7,7 +7,7 @@ mkdir -p "$output_dir" || exit 1
 
 function main()
 {
-    python -c "
+    python3 -c "
 import comma.application
 import argparse
 
diff --git a/python/comma/containers/__init__.py b/python/comma/containers/__init__.py
new file mode 100644
index 000000000..602e6d3b6
--- /dev/null
+++ b/python/comma/containers/__init__.py
@@ -0,0 +1 @@
+from . import multidimensional
diff --git a/python/comma/containers/multidimensional/__init__.py b/python/comma/containers/multidimensional/__init__.py
new file mode 100644
index 000000000..ca579ad56
--- /dev/null
+++ b/python/comma/containers/multidimensional/__init__.py
@@ -0,0 +1 @@
+from ._map import Map
diff --git a/python/comma/containers/multidimensional/_map.py b/python/comma/containers/multidimensional/_map.py
new file mode 100644
index 000000000..448551a09
--- /dev/null
+++ b/python/comma/containers/multidimensional/_map.py
@@ -0,0 +1,53 @@
+import ctypes, ctypes.util, numpy, sys
+
+class Map: # thin ctypes wrapper around the comma_containers_multidimensional_map_* functions of the comma_python_bindings library
+    def __init__( self, resolution, origin=None, values=None ): # resolution: numpy array whose dtype becomes the key type; origin: defaults to zeros; values: optional points handed to the C constructor
+        self._dtype = resolution.dtype
+        # todo: if resolution is not numpy array, try origin; if origin is not numpy array, try values
+        self._bindings = ctypes.CDLL( ctypes.util.find_library( 'comma_python_bindings' ) )
+        self._create = self._bindings.comma_containers_multidimensional_map_create
+        self._create.argtypes = [ ctypes.c_int, ctypes.c_uint, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_void_p, ctypes.c_uint ]
+        self._create.restype = ctypes.c_void_p
+        self._destroy = self._bindings.comma_containers_multidimensional_map_destroy
+        self._destroy.argtypes = [ ctypes.c_void_p ] # without argtypes ctypes passes a python int as a C int, which truncates a 64-bit handle
+        self._destroy.restype = None # the C function returns void
+        self._count = self._bindings.comma_containers_multidimensional_map_count
+        self._count.argtypes = [ ctypes.c_void_p ]
+        self._count.restype = ctypes.c_uint
+        self._size = self._bindings.comma_containers_multidimensional_map_size
+        self._size.argtypes = [ ctypes.c_void_p ]
+        self._size.restype = ctypes.c_uint
+        self._at = self._bindings.comma_containers_multidimensional_map_at
+        self._at.argtypes = [ ctypes.c_void_p, ctypes.c_void_p, ctypes.c_void_p ] # map handle, key, output size; matches the three-parameter C prototype
+        self._at.restype = ctypes.c_void_p
+        self._nearest = self._bindings.comma_containers_multidimensional_map_nearest
+        self._nearest.argtypes = [ ctypes.c_void_p, ctypes.c_void_p, ctypes.c_uint ]
+        self._nearest.restype = ctypes.c_void_p
+        key_types = { numpy.dtype( 'int32' ): 0, numpy.dtype( 'int64' ): 1, numpy.dtype( 'float32' ): 2, numpy.dtype( 'float64' ): 3 }
+        if origin is None: origin = numpy.zeros( resolution.shape[0] )
+        assert self._dtype in key_types, TypeError( f'expected key type in {list(key_types.keys())}; got: {self._dtype}' )
+        self._map = self._create( key_types[self._dtype]
+                        , resolution.shape[0]
+                        , numpy.array( origin, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p )
+                        , numpy.array( resolution, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p )
+                        , numpy.array( [] if values is None else values, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p )
+                        , 0 if values is None else len( values ) )
+        
+    def __enter__( self ): return self
+
+    def __exit__( self, type, value, traceback ): self._destroy( self._map ) # the C-side map is destroyed only when Map is used as a context manager
+
+    def at( self, value, radius=None ): # returns an int32 numpy array read from the C result (tests treat it as indices into values), or None when the C side returns NULL
+        if radius is None:
+            s = numpy.zeros( 1, dtype=numpy.int32 ) # todo: quick and dirty, figure out the right way
+            p = self._at( self._map, numpy.array( value, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p ), s.ctypes.data_as( ctypes.c_void_p ) )
+            return None if p is None else numpy.frombuffer( ctypes.string_at( p, s[0] * 4 ), dtype=numpy.int32, count=s[0] )
+        raise NotImplementedError( 'Map.at(...,radius=...): implementing...' )
+
+    def nearest( self, value ): # returns the unsigned int the C result points to (tests use it as an index into values), or None when the C side returns NULL
+        n = self._nearest( self._map, numpy.array( value, dtype=self._dtype ).ctypes.data_as( ctypes.c_void_p ), 1 ) # todo? radius?
+        return None if n is None else ctypes.cast( n, ctypes.POINTER( ctypes.c_uint ) )[0]
+
+    def count( self ): return self._count( self._map )
+    
+    def size( self ): return self._size( self._map )
diff --git a/python/comma/containers/multidimensional/test/test b/python/comma/containers/multidimensional/test/test
new file mode 100755
index 000000000..805e29f9b
--- /dev/null
+++ b/python/comma/containers/multidimensional/test/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+# todo! consolidate pytests
+name=$( basename "$0" ) # quoted so that a script path containing spaces is not word-split
+type -p pytest >/dev/null || { echo "$0: pytest not found; to install run: sudo apt install python3-pytest" >&2; exit 1; }
+pytest 1>&2 && echo "$name: succeeded" >&2 || { echo "$name: failed" >&2; exit 1; }
diff --git a/python/comma/containers/multidimensional/test/test_multidimensional_map.py b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
new file mode 100644
index 000000000..8f3c39306
--- /dev/null
+++ b/python/comma/containers/multidimensional/test/test_multidimensional_map.py
@@ -0,0 +1,34 @@
+import numpy, pytest, sys
+from comma.containers import multidimensional
+
+def test_multidimensional_map_size(): # in these cases count() equals the number of values passed in, while size() is 1 for values that share a grid cell (presumably the number of occupied cells -- TODO confirm)
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).size() == 0
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).count() == 0
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]), values=[[0.5, 0.5, 0.5], [0.5, 0.5, 0.5], [0.5, 0.5, 0.5]] ).size() == 1 # resolution is an integer array here, and Map converts values to the dtype of resolution
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]), values=[[0.5, 0.5, 0.5], [0.5, 0.5, 0.5], [0.5, 0.5, 0.5]] ).count() == 3
+    assert multidimensional.Map( resolution=numpy.array([10, 10, 10], dtype=numpy.float32), values=[[1, 2, 3], [4, 5, 6], [7, 8, 9]] ).size() == 1
+    assert multidimensional.Map( resolution=numpy.array([10, 10, 10], dtype=numpy.float32), values=[[1, 2, 3], [4, 5, 6], [7, 8, 9]] ).count() == 3
+
+def test_multidimensional_map_at(): # at() is expected to return the indices (into values) of the points sharing the queried point's grid cell, or None when there are none
+    assert multidimensional.Map( resolution=numpy.array([1, 1, 1]) ).at([0, 0, 0]) is None
+    m = multidimensional.Map( resolution=numpy.array([2, 2, 2], dtype=float), values=[[0, 0, 0], [0.5, 0.5, 0.5], [1, 1, 1], [2, 2, 2], [3, 3, 3]] )
+    assert m.size() == 2
+    assert m.count() == 5
+    assert m.at( [-1, -1, -1] ) is None
+    assert ( m.at( [0, 0, 0] ) == [0, 1, 2] ).all() # values 0, 1, 2 lie within [0, 2) on every axis
+    assert ( m.at( [2, 2, 2] ) == [3, 4] ).all() # values 3, 4 lie within [2, 4) on every axis
+    assert m.at( [5, 5, 5] ) is None
+    # todo
+    # - single point method? or pass multiple points and decide on shape?
+    # - return list of sizes and list of indices
+    # ? profile performance 
+    # print( m.at( [5, 5, 5], radius=3 ), file=sys.stderr )
+
+def test_multidimensional_map_nearest(): # exercises Map.nearest(); needs its own name, since reusing test_multidimensional_map_at would shadow the at() test so pytest never runs it
+    values=[[0, 0, 0], [0.5, 0.5, 0.5], [1, 1, 1], [2, 2, 2], [3, 3, 3]]
+    m = multidimensional.Map( resolution=numpy.array([2, 2, 2], dtype=float), values=values )
+    assert values[ m.nearest( [0, 0, 0] ) ] == [0, 0, 0] # nearest() returns an index into values
+    assert values[ m.nearest( [0.4, 0.4, 0.4] ) ] == [0.5, 0.5, 0.5]
+    assert values[ m.nearest( [1.4, 1.4, 1.4] ) ] == [1, 1, 1]
+    assert values[ m.nearest( [5, 5, 5] ) ] == [3, 3, 3]
+    assert m.nearest( [7, 7, 7] ) is None # no point is found for this query
diff --git a/python/comma/csv/CMakeLists.txt b/python/comma/csv/CMakeLists.txt
deleted file mode 100644
index de33d8faa..000000000
--- a/python/comma/csv/CMakeLists.txt
+++ /dev/null
@@ -1 +0,0 @@
-ADD_SUBDIRECTORY( applications )
diff --git a/python/comma/csv/__init__.py b/python/comma/csv/__init__.py
index 53598c0bc..b21d6aceb 100644
--- a/python/comma/csv/__init__.py
+++ b/python/comma/csv/__init__.py
@@ -29,6 +29,6 @@
 
 from . import format
 from . import time
-from .struct import struct
-from .stream import stream, numpy_scalar_to_string
-from .options import add as add_options
+from ._struct import struct
+from ._stream import stream, numpy_scalar_to_string
+from ._options import add as add_options
diff --git a/python/comma/csv/options.py b/python/comma/csv/_options.py
similarity index 100%
rename from python/comma/csv/options.py
rename to python/comma/csv/_options.py
diff --git a/python/comma/csv/stream.py b/python/comma/csv/_stream.py
similarity index 75%
rename from python/comma/csv/stream.py
rename to python/comma/csv/_stream.py
index a950b86e1..8e5064a59 100644
--- a/python/comma/csv/stream.py
+++ b/python/comma/csv/_stream.py
@@ -1,44 +1,23 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+from __future__ import print_function
+import copy
+import functools
+import itertools
 import numpy as np
+import os
 import sys
-import itertools
-import functools
 import warnings
+if sys.version_info.major < 3: from itertools import izip
+else: izip = zip # todo! watch performance! it's reported python3 zip is some 30% slower than izip
 from ..util import warning
 from ..io import readlines_unbuffered
 from ..numpy import merge_arrays, types_of_dtype, structured_dtype
 from . import time as csv_time
-from .struct import struct
+from ._struct import struct
 
 DEFAULT_PRECISION = 12
+NUMPY_VERSION_MAJOR_, NUMPY_VERSION_MINOR_, NUMPY_VERSION_PATCH_ = ( int( ''.join( itertools.takewhile( str.isdigit, _ ) ) or 0 ) for _ in ( np.__version__.split( '.' ) + [ '0', '0' ] )[:3] ) # only the leading digits of the first three components are used, so versions like '1.20.0rc1' or '1.17.0.dev0+abc' do not break the import
 
 def custom_formatwarning(msg, *args): return __name__ + " warning: " + str(msg) + '\n'
 
@@ -68,6 +47,7 @@ def __init__(self,
         self.flush = flush
         self.source = source
         self.target = target
+        #if np.__version__ >= '1.16.0' and target == sys.stdout: self.stdout = os.fdopen( sys.stdout.fileno(), "wb" )
         self.tied = tied
         self.full_xpath = full_xpath
         self.verbose = verbose
@@ -91,12 +71,11 @@ def __init__(self,
         self.default_values = self._default_values(default_values)
         self.missing_values = self._missing_values()
         self.data_extraction_fields = self._data_extraction_fields()
-        self.struct_and_extraction_fields = zip(self.struct.flat_dtype.names,
-                                                self.data_extraction_fields)
+        self.struct_and_extraction_fields = list( zip( self.struct.flat_dtype.names, self.data_extraction_fields ) )
         #self.write_dtype = self._write_dtype()
         #self.unrolled_write_dtype = structured_dtype( ','.join( types_of_dtype( self.write_dtype, unroll=True ) ) )
-        #print >>sys.stderr, "self.write_dtype.descr = %s" % str(self.write_dtype.descr)
-        #print >>sys.stderr, "self.unrolled_write_dtype = %s" % str(self.unrolled_write_dtype)
+        #print( "self.write_dtype.descr = %s" % str(self.write_dtype.descr), file = sys.stderr )
+        #print( "self.unrolled_write_dtype = %s" % str(self.unrolled_write_dtype), file = sys.stderr )
         self._input_array = None
         self._ascii_buffer = None
         self._strings = functools.partial(map, self.numpy_scalar_to_string)
@@ -124,12 +103,12 @@ def read(self, size=None):
         if no records have been read, return None
         """
         if size is None: size = self.size
-        self._input_array = self._read(size)
+        self._input_array = copy.deepcopy( self._read( size ) ) if sys.version_info.major > 2 else self._read( size ) # todo! watch performance in python3!
         if self._input_array.size == 0: return
         return self._struct_array(self._input_array, self.missing_values)
 
     def _genfromtxt( self ): # quick and dirty due to the ugliness of the change in numpy 1.14; see doc of encoding parameter in https://docs.scipy.org/doc/numpy-1.14.0/reference/generated/numpy.genfromtxt.html
-        if np.__version__ >= '1.14.0':
+        if NUMPY_VERSION_MAJOR_ > 1 or NUMPY_VERSION_MINOR_ >= 14: # quick and dirty, since ubuntu 18.04 python3-numpy still install numpy 1.13; remove once move on with the version since it's waste of cpu cycles
             return np.genfromtxt( self._ascii_buffer
                                 , dtype = self.input_dtype
                                 , delimiter = self.delimiter
@@ -139,7 +118,9 @@ def _genfromtxt( self ): # quick and dirty due to the ugliness of the change in
                                 , comments = None
                                 , encoding = None )
         else:
-            return np.genfromtxt( self._ascii_buffer
+            # https://github.com/numpy/numpy/issues/10511 genfromtxt issue in numpy 1.13.x
+            from io import BytesIO
+            return np.genfromtxt( BytesIO( bytes( '\n'.join( self._ascii_buffer ).encode( 'utf-8' ) ) ) if NUMPY_VERSION_MAJOR_ == 1 and NUMPY_VERSION_MINOR_ == 13 else self._ascii_buffer
                                 , dtype = self.input_dtype
                                 , delimiter = self.delimiter
                                 , converters = self.ascii_converters
@@ -155,11 +136,20 @@ def read_from_line(self, line):
 
     def _read(self, size):
         if self.binary:
-            if size < 0 and self.source == sys.stdin:
-                return np.fromstring(self.source.read(), dtype=self.input_dtype)
+            if sys.version_info.major > 2: #if np.__version__ >= '1.16.0': # sigh...
+                if self.source == sys.stdin:
+                    b = sys.stdin.buffer.read( ( size * self.input_dtype.itemsize ) if size >= 0 else -1 ) # b = sys.stdin.buffer.read( self.input_dtype.itemsize * ( size if size >= 0 else self.size ) )
+                    # todo! test on streams where bytes come with irregular delays!
+                    if len(b) % self.input_dtype.itemsize != 0: raise ValueError( "expected records of size {}, got {} bytes, which is not divisible by record size".format( self.input_dtype.itemsize, len( b ) ) )
+                    return np.frombuffer( b, dtype = self.input_dtype, count = len( b ) // self.input_dtype.itemsize )
+                else:
+                    return np.fromfile( self.source, dtype = self.input_dtype, count = -1 if size < 0 else size ) # this line may not be covered by regression test
             else:
-                count = -1 if size < 0 else size
-                return np.fromfile(self.source, dtype=self.input_dtype, count=count)
+                if size < 0 and self.source == sys.stdin:
+                    return np.fromstring(self.source.read(), dtype=self.input_dtype)
+                else:
+                    count = -1 if size < 0 else size
+                    return np.fromfile(self.source, dtype=self.input_dtype, count=count)
         else:
             with warnings.catch_warnings():
                 warnings.simplefilter('ignore')
@@ -183,7 +173,7 @@ def _missing_values(self):
         missing = np.zeros(1, dtype=self.missing_dtype)
         if self.default_values:
             dtype_name_of = dict(zip(self.missing_fields, self.missing_dtype.names))
-            for field, value in self.default_values.iteritems():
+            for field, value in self.default_values.items():
                 name = dtype_name_of[field]
                 if self.missing_dtype[name] == csv_time.DTYPE:
                     try: missing[name] = csv_time.to_numpy(value)
@@ -210,20 +200,28 @@ def write(self, s):
             msg = "size {} not equal to tied size {}".format(s.size, tied_size)
             raise ValueError(msg)
         if self.binary:
-            if self.tied: self._tie_binary(self.tied._input_array, s).tofile(self.target)
-            else: s.tofile(self.target)
+            if sys.version_info.major > 2 and self.target == sys.stdout: # sigh...
+                #self.stdout.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
+                sys.stdout.buffer.write( self._tie_binary(self.tied._input_array, s).tobytes() if self.tied else s.tobytes() )
+            else:
+                if self.tied: self._tie_binary(self.tied._input_array, s).tofile(self.target)
+                else: s.tofile(self.target)
         else:
             unrolled_array = s.view(self.struct.unrolled_flat_dtype)
             #unrolled_array = s.view( self.unrolled_write_dtype )
             if self.tied: lines = self._tie_ascii(self.tied._ascii_buffer, unrolled_array)
             else: lines = (self._toline(scalars) for scalars in unrolled_array)
-            for line in lines: print >> self.target, line
+            for line in lines: print( line, file = self.target )
         self.target.flush()
 
     def _tie_binary(self, tied_array, array): return merge_arrays(tied_array, array)
 
-    def _tie_ascii(self, tied_buffer, unrolled_array):
-        for tied_line, scalars in itertools.izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + self._strings(scalars))
+    if sys.version_info.major < 3: # python3, sigh... don't ask
+        def _tie_ascii(self, tied_buffer, unrolled_array):
+            for tied_line, scalars in izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + self._strings(scalars))
+    else:
+        def _tie_ascii(self, tied_buffer, unrolled_array):
+            for tied_line, scalars in izip(tied_buffer, unrolled_array): yield self.delimiter.join([tied_line] + list(self._strings(scalars)))
 
     def _toline(self, scalars): return self.delimiter.join(self._strings(scalars))
 
@@ -236,9 +234,12 @@ def dump(self, mask=None):
 
     def _dump(self):
         if self.binary:
-            self._input_array.tofile(self.target)
+            if sys.version_info.major > 2 and self.target == sys.stdout: # sigh...
+                sys.stdout.buffer.write( self._input_array.tobytes() )
+            else:
+                self._input_array.tofile( self.target )
         else:
-            for line in self._ascii_buffer: print >> self.target, line
+            for line in self._ascii_buffer: print( line, file = self.target )
         self.target.flush()
 
     def _dump_with_mask(self, mask):
@@ -254,16 +255,21 @@ def _dump_with_mask(self, mask):
             msg = "mask size {} not equal to data size {}".format(mask.size, data_size)
             raise ValueError(msg)
         if self.binary:
-            self._input_array[mask].tofile(self.target)
+            if sys.version_info.major > 2 and self.target == sys.stdout: # sigh...
+                sys.stdout.buffer.write( self._input_array[mask].tobytes() )
+            else:
+                self._input_array[mask].tofile(self.target)
         else:
-            for line, allowed in itertools.izip(self._ascii_buffer, mask):
-                if allowed: print >> self.target, line
+            for line, allowed in izip(self._ascii_buffer, mask):
+                if allowed: print( line, file = self.target )
         self.target.flush()
 
     def _warn(self, msg, verbose=True):
         if verbose:
-            with warning(custom_formatwarning) as warn:
-                warn(msg)
+            if sys.version_info.major < 3: # sigh, something is broken at least in python3.7; dumb it down for now
+                with warning(custom_formatwarning) as warn: warn(msg)
+            else:
+                print( 'stream.py: warning:', msg, file=sys.stderr )
 
     def _struct(self, s):
         if not isinstance(s, struct):
@@ -288,7 +294,7 @@ def _fields(self, fields):
         return tuple(xpath(name) or name for name in fields.split(','))
 
     def _format(self, binary, format):
-        if isinstance(binary, basestring):
+        if isinstance(binary, str): # if isinstance(binary, basestring):
             if self.verbose and binary and format and binary != format:
                 msg = "ignoring '{}' and using '{}' since binary keyword has priority" \
                     .format(format, binary)
@@ -347,7 +353,7 @@ def _input_dtype(self):
     def _default_buffer_size(self):
         if self.tied: return self.tied.size
         elif self.flush: return 1
-        return max( 1, stream.buffer_size_in_bytes / self.input_dtype.itemsize ) # todo? too arbitrary for ascii?
+        return max( 1, stream.buffer_size_in_bytes // self.input_dtype.itemsize ) # todo? too arbitrary for ascii?
 
     def _missing_fields(self):
         missing_fields = [field for field in self.struct.fields if field not in self.fields]
@@ -360,10 +366,10 @@ def _missing_fields(self):
     def _missing_dtype(self):
         if not self.missing_fields: return
         n = len(self.input_dtype.names)
-        missing_names = ['f{}'.format(n + i) for i in xrange(len(self.missing_fields))]
+        missing_names = ['f{}'.format(n + i) for i in range(len(self.missing_fields))] # missing_names = ['f{}'.format(n + i) for i in xrange(len(self.missing_fields))]
         type_of = self.struct.type_of_field.get
         missing_types = [type_of(name) for name in self.missing_fields]
-        return np.dtype(zip(missing_names, missing_types))
+        return np.dtype(list(zip(missing_names, missing_types)))
 
     def _complete_dtype(self):
         if self.missing_dtype: return np.dtype(self.input_dtype.descr + self.missing_dtype.descr)
@@ -437,12 +443,12 @@ def numpy_scalar_to_string(scalar, precision=DEFAULT_PRECISION):
     '20150102T123456.123456'
     >>> numpy_scalar_to_string(np.timedelta64(-123, 's'))
     '-123'
-    """
-    
+    """    
     if scalar.dtype.char in np.typecodes['AllInteger']: return str(scalar)
     elif scalar.dtype.char in np.typecodes['Float']: return "{scalar:.{precision}g}".format(scalar=scalar, precision=precision)
     elif scalar.dtype.char in np.typecodes['Datetime']: return csv_time.from_numpy(scalar)
-    elif scalar.dtype.char in 'S': return scalar
+    elif scalar.dtype.char in 'Sa': return scalar.decode('UTF-8') # quick and dirty, python3, sigh...
+    elif scalar.dtype.char in 'U': return str(scalar) # quick and dirty, python3, sigh...
     elif scalar.dtype.char in '?': return str( int( scalar ) ) #elif scalar.dtype.char in '?': return str( map( int, scalar ) )
     msg = "converting {} to string is not implemented".format(repr(scalar.dtype))
     raise NotImplementedError(msg)
diff --git a/python/comma/csv/struct.py b/python/comma/csv/_struct.py
similarity index 94%
rename from python/comma/csv/struct.py
rename to python/comma/csv/_struct.py
index cb8eae907..f4fe66887 100644
--- a/python/comma/csv/struct.py
+++ b/python/comma/csv/_struct.py
@@ -40,13 +40,13 @@ def __init__(self, concise_fields, *concise_types):
         self.concise_types = concise_types
         self.concise_fields = self._fill_blanks(concise_fields)
         self._check_fields_conciseness()
-        self.dtype = np.dtype(zip(self.concise_fields, self.concise_types))
+        self.dtype = np.dtype(list(zip(self.concise_fields, self.concise_types)))
         self.fields = self._full_xpath_fields()
         self.nondefault_fields = self._nondefault_fields()
         self.types = self._basic_types()
         self.shorthand = self._shorthand()
         self.format = ','.join(self.types)
-        self.flat_dtype = np.dtype(zip(self.fields, self.types))
+        self.flat_dtype = np.dtype(list(zip(self.fields, self.types)))
         unrolled_types = types_of_dtype(self.flat_dtype, unroll=True)
         self.unrolled_flat_dtype = structured_dtype(','.join(unrolled_types))
         self.type_of_field = dict(zip(self.fields, self.types))
@@ -87,7 +87,7 @@ def expand_shorthand(self, compressed_fields):
         >>> outer.expand_shorthand('in')
         ('in/i', 'in/j')
         """
-        if isinstance(compressed_fields, basestring):
+        if isinstance(compressed_fields, str): #if isinstance(compressed_fields, basestring):
             compressed_fields = compressed_fields.split(',')
         expand = self.shorthand.get
         field_tuples = map(lambda name: expand(name) or (name,), compressed_fields)
@@ -107,7 +107,7 @@ def _make_fields_map( m, fields ):
 
     def _assign( self, data, fields_map, convert ):
         functors = {}
-        for k, v in fields_map.iteritems():
+        for k, v in fields_map.items():
             if len( v ) > 0:
                 functors[k] = self._assign( getattr( data, k ), v, convert )
             else:
@@ -115,7 +115,7 @@ def functor( value, key = k ):
                     setattr( data, key, value if convert is None else convert( value ) )
                 functors[k] = functor
         def apply_functors( record ):
-            for k, f in functors.iteritems(): f( record[k] )
+            for k, f in functors.items(): f( record[k] )
         return apply_functors
     
     def _nondefault_fields(self):
@@ -123,7 +123,7 @@ def _nondefault_fields(self):
         return tuple(map(lambda f: '' if f.startswith(default_name) else f, self.fields))
 
     def _fill_blanks(self, fields):
-        if isinstance(fields, basestring):
+        if isinstance(fields, str): # if isinstance(fields, basestring):
             fields = fields.split(',')
         ntypes = len(self.concise_types)
         if len(fields) > ntypes:
@@ -172,7 +172,7 @@ def _shorthand(self):
                 continue
             fields_of_type = [name + '/' + field for field in type.fields]
             shorthand[name] = tuple(fields_of_type)
-            for subname, subfields in type.shorthand.iteritems():
+            for subname, subfields in type.shorthand.items():
                 xpath = name + '/' + subname
                 shorthand[xpath] = tuple(name + '/' + field for field in subfields)
         return shorthand
diff --git a/python/comma/csv/applications/CMakeLists.txt b/python/comma/csv/applications/CMakeLists.txt
deleted file mode 100644
index ef8b8b8e9..000000000
--- a/python/comma/csv/applications/CMakeLists.txt
+++ /dev/null
@@ -1 +0,0 @@
-install( PROGRAMS csv-eval DESTINATION ${comma_INSTALL_BIN_DIR} )
diff --git a/python/comma/csv/applications/__init__.py b/python/comma/csv/applications/__init__.py
index 0cff88821..6cf509948 100644
--- a/python/comma/csv/applications/__init__.py
+++ b/python/comma/csv/applications/__init__.py
@@ -26,3 +26,5 @@
 # WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+
+from . import csv_eval
\ No newline at end of file
diff --git a/python/comma/csv/applications/csv-eval b/python/comma/csv/applications/csv-eval
deleted file mode 100644
index 506d1e7d4..000000000
--- a/python/comma/csv/applications/csv-eval
+++ /dev/null
@@ -1,37 +0,0 @@
-#!/usr/bin/python
-
-# This file is part of comma, a generic and flexible library
-# Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-from comma.csv.applications import csv_eval
-import sys, signal
-try:
-    csv_eval.main()
-except KeyboardInterrupt:
-    sys.exit( 128 + signal.SIGINT )
diff --git a/python/comma/csv/applications/csv_eval.py b/python/comma/csv/applications/csv_eval.py
index efd3ceb88..06f8f7d6d 100644
--- a/python/comma/csv/applications/csv_eval.py
+++ b/python/comma/csv/applications/csv_eval.py
@@ -1,56 +1,25 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# Copyright (c) 2018 Vsevolod Vlaskine
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
-import sys
-import os
-import argparse
-import numpy as np
-import re
-import itertools
-import ast
-import comma
+
+from __future__ import print_function
+import argparse, ast, itertools, numpy as np, os, re, signal, sys
+if sys.version_info.major < 3: from itertools import izip
+else: izip = zip # todo! watch performance! it's reported python3 zip is some 30% slower than izip
+import comma # should not it be a relative path?
 
 description = """
 evaluate numerical expressions and append computed values to csv stream
-"""
 
+using numpy version """ + np.__version__ + "\n"
 
 notes_and_examples = """
 input fields:
-    1) slashes are replaced by underscores if --full-xpath is given, otherwise basenames are used
-    2) for ascii streams, input fields are treated as floating point numbers, unless --format is given
+    - slashes are replaced by underscores if --full-xpath is given, otherwise basenames are used
+    - for ascii streams, input fields are treated as floating point numbers, unless --format is given
 
 output fields:
-    1) inferred from expressions (by default) or specified by --output-fields
-    2) appended to possibly modified input
-    3) treated as floating point numbers, unless --output-format is given
+    - inferred from the names assigned in expression unless specified by --output-fields
+    - appended to input record (input field values can be modified by expression, too)
+    - treated as 64-bit floating point numbers, unless --output-format is given
 
 examples:
     # basic
@@ -78,18 +47,18 @@
     # update input stream values in place
     ( echo 1,2 ; echo 3,4 ) | %(prog)s --fields=x,y "x=x+y; y=y-1"
 
-    # using full xpaths
+    # full xpaths
     ( echo 1,2 ; echo 3,4 ) | %(prog)s --fields=one/x,two/y "x+=1; y-=1"
     ( echo 1,2 ; echo 3,4 ) | %(prog)s --fields=one/x,two/y "one_x+=1; two_y-=1" --full-xpath
 
-    # using default values
+    # default values
     ( echo 1,2 ; echo 3,4 ) | %(prog)s --fields=,y "a=x+y" --default-values="x=0;y=0"
     
-    # using init values: calculate triangular numbers
-    seq 0 10 | %(prog)s --fields=v "sum=sum+v" --init-values="sum=0"
+    # init values: calculate triangular numbers
+    seq 0 10 | csv-eval --fields=v "sum=sum+v" --init-values="sum=0"
     
-    # using init values: calculate fibonacci numbers
-    seq 0 10 | %(prog)s --fields=v "c=b;b=a+b;a=c" --output-fields a,b --init-values="a=0;b=1"
+    # init values: calculate fibonacci numbers
+    seq 0 10 | csv-eval --fields v "a,b=b,a+b" --init-values "a=0;b=1" --output-fields a
 
     # operating on time (internally represented in microseconds)
     echo 20171112T224515.5 | %(prog)s --format=t --fields=t1 "t2=t1+1000000" --output-format t
@@ -140,9 +109,18 @@
 
 string functions:
     http://docs.scipy.org/doc/numpy/reference/routines.char.html
-
+    
     ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'n=char.count(path,"/")' --output-format=ui
     ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'r=char.replace(path,"/","_")' --output-format=s[36]
+    
+    LIMITATION: in python3, csv-eval represents strings as np.bytes_ (for consistent binary support)
+        python2: you could write: ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'n=char.count(path,"/")' --output-format=ui
+        python3: you should write: ( echo 'a'; echo 'a/b' ) | %(prog)s --fields=path --format=s[36] 'n=char.count(char.decode(path),"/")' --output-format=ui
+                 for backward compatibility, use the latter variant
+        it may lead to ugly constructs for python3:
+            python2: csv-eval --fields=name --format s[36] 'u=char.upper(name)' --output-format=s[36]
+            python3: csv-eval --fields=name --format s[36] 'u=char.encode(char.upper(char.decode(name)))' --output-format=s[36]
+        but unfortunately, this limitation is unlikely to go away
 
 time arithmetic:
     http://docs.scipy.org/doc/numpy/reference/arrays.datetime.html#datetime-and-timedelta-arithmetic
@@ -152,14 +130,9 @@
     echo 20151231T000000,20160515T120000 | %(prog)s --fields=t1,t2 --format=2t "dt = (t2-t1)/timedelta64(1,'D')"
 """
 
+class csv_eval_error(Exception): pass
 
-class csv_eval_error(Exception):
-    pass
-
-
-def custom_formatwarning(msg, *args):
-    return __name__ + " warning: " + str(msg) + '\n'
-
+def custom_formatwarning(msg, *args): return __name__ + " warning: " + str(msg) + '\n'
 
 def add_csv_options(parser):
     comma.csv.add_options(parser) # comma.csv.add_options(parser, defaults={'fields': 'x,y,z'})
@@ -173,17 +146,14 @@ def add_csv_options(parser):
         '-o',
         default=None,
         metavar='<names>',
-        help="do not infer output fields from expressions; use specified fields instead")
+        help="do not infer output fields from expressions; output specified fields appended to input instead")
     parser.add_argument(
         '--output-format',
         default='',
         metavar='<format>',
         help="format of output fields (default: 'd' for each)")
-    # the options defined below are left for compatibility
-    # use --output-fields and --output-format instead
-    parser.add_argument('--append-fields', '-F', help=argparse.SUPPRESS)
-    parser.add_argument('--append-binary', '-B', help=argparse.SUPPRESS)
-
+    parser.add_argument('--append-fields', '-F', help=argparse.SUPPRESS) # backward compatibility; use --output-fields instead
+    parser.add_argument('--append-binary', '-B', help=argparse.SUPPRESS) # backward compatibility; use --output-format instead
 
 def get_args():
     parser = argparse.ArgumentParser(
@@ -219,13 +189,18 @@ def get_args():
         '--default',
         default='',
         metavar='<assignments>',
-        help='default values for variables in expressions but not in input stream')
+        help='default values for variables in expressions but not in input stream, applied to every input record')
     parser.add_argument(
         '--init-values',
         '--init',
         default='',
         metavar='<assignments>',
-        help='init values, applied only once')
+        help='init values, applied only once on csv-eval start')
+    parser.add_argument(
+        '--init-format',
+        default='',
+        metavar='<format>',
+        help='format of init non-output variables in the order of appearance in expression (default: "d" for each)')
     parser.add_argument(
         '--with-error',
         default='',
@@ -247,14 +222,11 @@ def get_args():
         help='select and output records of input stream that satisfy the condition')
     args = parser.parse_args()
     if args.help:
-        if args.verbose:
-            parser.epilog += numpy_functions
-        else:
-            parser.epilog += "\nfor more help run '%(prog)s -h -v'"
+        parser.epilog += numpy_functions if args.verbose else "\nfor more help run '%(prog)s -h -v'"
         parser.print_help()
         parser.exit(0)
     if args.fields is None or args.fields == "": sys.exit( "csv-eval: please specify --fields" )
-    if args.init_values == '' and args.verbose: print >>sys.stderr, "csv-eval: --init currently reads one record at a time, which may be slow"
+    if args.init_values != '' and args.verbose: print( "csv-eval: --init currently reads one record at a time, which may be slow", file = sys.stderr ) # notify only when --init is given: that is the mode in which evaluate() reads one record at a time
     return args
 
 def ingest_deprecated_options(args):
@@ -262,34 +234,22 @@ def ingest_deprecated_options(args):
         args.output_format = args.append_binary
         del args.append_binary
         if args.verbose:
-            with comma.util.warning(custom_formatwarning) as warn:
-                msg = "--append-binary is deprecated, consider using --output-format"
-                warn(msg)
+            with comma.util.warning(custom_formatwarning) as warn: warn( "--append-binary is deprecated, consider using --output-format" )
     if args.append_fields:
         args.output_fields = args.append_fields
         del args.append_fields
         if args.verbose:
-            with comma.util.warning(custom_formatwarning) as warn:
-                msg = "--append-fields is deprecated, consider using --output-fields"
-                warn(msg)
+            with comma.util.warning(custom_formatwarning) as warn: warn( "--append-fields is deprecated, consider using --output-fields" )
 
 def check_options(args):
-    if not (args.expressions or args.select or args.exit_if):
-        raise csv_eval_error("no expressions are given")
-    if args.binary and args.format:
-        raise csv_eval_error("--binary and --format are mutually exclusive")
+    if not (args.expressions or args.select or args.exit_if): raise csv_eval_error( "please specify expression" )
+    if args.binary and args.format: raise csv_eval_error("--binary and --format are mutually exclusive")
     if args.select or args.exit_if:
-        if args.expressions:
-            msg = "--select <condition> and --exit-if <condition> cannot be used with expressions"
-            raise csv_eval_error(msg)
-        if args.output_fields or args.output_format:
-            msg = "--select and --exit-if cannot be used with --output-fields or --output-format"
-            raise csv_eval_error(msg)
+        if args.expressions: raise csv_eval_error( "--select <condition> and --exit-if <condition> cannot be used with expressions" )
+        if args.output_fields: raise csv_eval_error( "--select and --exit-if cannot be used with --output-fields" )
+        if args.output_format: raise csv_eval_error( "--select and --exit-if cannot be used with --output-format" )
     if args.with_error:
-        if not args.exit_if:
-            msg = "--with-error is only used with --exit-if"
-            raise csv_eval_error(msg)
-
+        if not args.exit_if: raise csv_eval_error( "--with-error can only be used with --exit-if" )
 
 def format_without_blanks(format, fields=[], unnamed_fields=True):
     """
@@ -321,24 +281,17 @@ def format_without_blanks(format, fields=[], unnamed_fields=True):
      ...
     ValueError: format 'ui,t,d' is longer than fields 'a,b'
     """
-    def comma_type(maybe_type, field, default_type='d', type_of_unnamed_field='s[0]'):
-        return type_of_unnamed_field if not field else maybe_type or default_type
+    def comma_type(maybe_type, field, default_type='d', type_of_unnamed_field='s[0]'): return type_of_unnamed_field if not field else maybe_type or default_type
 
-    if not format and not fields:
-        return ''
+    if not format and not fields: return ''
     maybe_types = comma.csv.format.expand(format).split(',')
     if not unnamed_fields:
-        if '' in fields:
-            msg = "expected all fields to be named, got '{}'".format(','.join(fields))
-            raise ValueError(msg)
-        if len(maybe_types) > len(fields):
-            msg = "format '{}' is longer than fields '{}'".format(format, ','.join(fields))
-            raise ValueError(msg)
-    maybe_typed_fields = itertools.izip_longest(maybe_types, fields)
+        if '' in fields: raise ValueError( "expected all fields to be named, got '{}'".format(','.join(fields)) )
+        if len(maybe_types) > len(fields): raise ValueError( "format '{}' is longer than fields '{}'".format(format, ','.join(fields)) )
+    maybe_typed_fields = itertools.zip_longest(maybe_types, fields) if sys.version_info.major > 2 else itertools.izip_longest(maybe_types, fields) # uber quick and dirty
     types = [comma_type(maybe_type, field) for maybe_type, field in maybe_typed_fields]
     return ','.join(types)
 
-
 def assignment_variable_names(expressions):
     """
     >>> from comma.csv.applications.csv_eval import assignment_variable_names
@@ -355,6 +308,7 @@ def assignment_variable_names(expressions):
     >>> assignment_variable_names("x=1; x=2; y+=1; y+=2; z=1; z+=2")
     ['x', 'y', 'z']
     """
+    if expressions is None: return []
     tree = ast.parse(expressions, '<string>', mode='exec')
     fields = []
     for child in ast.iter_child_nodes(tree):
@@ -396,9 +350,7 @@ def normalise_full_xpath(fields, full_xpath=True):
     ['', 'b', '', 'c', 'e', '']
     """
     full_xpath_fields = split_fields(fields)
-    if full_xpath:
-        return [f.replace('/', '_') for f in full_xpath_fields]
-    return [f.split('/')[-1] for f in full_xpath_fields]
+    return [f.replace('/', '_') for f in full_xpath_fields] if full_xpath else [f.split('/')[-1] for f in full_xpath_fields]
 
 def prepare_options(args):
     ingest_deprecated_options(args)
@@ -415,24 +367,21 @@ def prepare_options(args):
         args.binary = False
     else:
         args.first_line = comma.io.readlines_unbuffered(1, sys.stdin)
-        if not args.first_line:
-            raise csv_eval_error("first record is empty - could not guess format")
+        if not args.first_line: return False
         args.format = comma.csv.format.guess_format(args.first_line)
         args.binary = False
-        if args.verbose:
-            print >> sys.stderr, "{}: guessed format: {}".format(__name__, args.format)
-    if args.select or args.exit_if:
-        return
+        if args.verbose: print( "{}: guessed format: {}".format(__name__, args.format), file = sys.stderr )
+    if args.select or args.exit_if: return True
     var_names = assignment_variable_names(args.expressions)
     args.update_fields = [f for f in var_names if f in args.fields]
-    if args.output_fields is None:
-        args.output_fields = [f for f in var_names if f not in args.fields]
-    else:
-        args.output_fields = split_fields(args.output_fields)
-    args.output_format = format_without_blanks(args.output_format,
-                                               args.output_fields,
-                                               unnamed_fields=False)
-
+    args.output_fields = [f for f in var_names if f not in args.fields] if args.output_fields is None else split_fields(args.output_fields)
+    init_var_names = assignment_variable_names(args.init_values)
+    args.init_fields = [f for f in init_var_names if f not in args.output_fields]
+    if args.init_fields:
+        init_types = format_without_blanks( args.init_format, args.init_fields, unnamed_fields = False )
+        args.init_t = comma.csv.struct( ','.join( args.init_fields ), *comma.csv.format.to_numpy( init_types ) )
+    args.output_format = format_without_blanks( args.output_format, args.output_fields, unnamed_fields = False )
+    return True
 
 def restricted_numpy_env():
     d = np.__dict__.copy()
@@ -440,23 +389,20 @@ def restricted_numpy_env():
     d.pop('sys', None)
     return d
 
-
 def update_buffer(stream, update_array):
     index = stream.fields.index
     if stream.binary:
         fields = stream._input_array.dtype.names
-        for f in update_array.dtype.names:
-            stream._input_array[fields[index(f)]] = update_array[f]
+        for f in update_array.dtype.names: stream._input_array[fields[index(f)]] = update_array[f]
     else:
         def updated_lines():
-            for line, scalars in itertools.izip(stream._ascii_buffer, update_array):
+            for line, scalars in izip(stream._ascii_buffer, update_array):
                 values = line.split(stream.delimiter)
                 for f, s in zip(update_array.dtype.names, stream._strings(scalars)):
                     values[index(f)] = s
                 yield stream.delimiter.join(values)
         stream._ascii_buffer = list(updated_lines())
 
-
 class stream(object):
     def __init__(self, args):
         self.args = args
@@ -472,7 +418,7 @@ def __init__(self, args):
         if self.args.verbose: self.print_info()
 
     def initialize_input(self):
-        self.nonblank_input_fields = filter(None, self.args.fields)
+        self.nonblank_input_fields = list( filter( None, self.args.fields ) )
         if not self.nonblank_input_fields: raise csv_eval_error("please specify input stream fields, e.g. --fields=x,y")
         check_fields(self.nonblank_input_fields)
         types = comma.csv.format.to_numpy(self.args.format)
@@ -497,72 +443,88 @@ def initialize_update_and_output(self):
     def print_info(self, file=sys.stderr):
         fields = ','.join(self.input_t.nondefault_fields)
         format = self.input_t.format
-        print >> file, "expressions: '{}'".format(self.args.expressions)
-        print >> file, "select: '{}'".format(self.args.select)
-        print >> file, "exit_if: '{}'".format(self.args.exit_if)
-        print >> file, "default values: '{}'".format(self.args.default_values)
-        print >> file, "input fields: '{}'".format(fields)
-        print >> file, "input format: '{}'".format(format)
-        if self.args.select or self.args.exit_if:
-            return
+        print( "expressions: '{}'".format(self.args.expressions), file = file )
+        print( "select: '{}'".format(self.args.select), file = file )
+        print( "exit_if: '{}'".format(self.args.exit_if), file = file )
+        print( "default values: '{}'".format(self.args.default_values), file = file )
+        print( "input fields: '{}'".format(fields), file = file )
+        print( "input format: '{}'".format(format), file = file )
+        if self.args.select or self.args.exit_if: return
         update_fields = ','.join(self.update_t.fields) if self.args.update_fields else ''
         output_fields = ','.join(self.output_t.fields) if self.args.output_fields else ''
         output_format = self.output_t.format if self.args.output_fields else ''
-        print >> file, "update fields: '{}'".format(update_fields)
-        print >> file, "output fields: '{}'".format(output_fields)
-        print >> file, "output format: '{}'".format(output_format)
-
+        print( "update fields: '{}'".format(update_fields), file = file )
+        print( "output fields: '{}'".format(output_fields), file = file )
+        print( "output format: '{}'".format(output_format), file = file )
 
 def check_fields(fields, allow_numpy_names=True):
     for field in fields:
         if not re.match(r'^[a-z_]\w*$', field, re.I): raise csv_eval_error("'{}' is not a valid field name".format(field))
-        if field in ['_input', '_update', '_output']: raise csv_eval_error("'{}' is a reserved name".format(field))
+        if field in ['_init', '_input', '_update', '_output']: raise csv_eval_error("'{}' is a reserved name".format(field))
         if not allow_numpy_names and field in np.__dict__: raise csv_eval_error("'{}' is a reserved numpy name".format(field))
 
 def check_output_fields(fields, input_fields):
     check_fields(fields)
     invalid_output_fields = set(fields).intersection(input_fields)
-    if invalid_output_fields:
-        msg = "output fields '{}' are present in input fields '{}'" \
-            .format(','.join(invalid_output_fields), ','.join(input_fields))
-        raise csv_eval_error(msg)
+    if invalid_output_fields: raise csv_eval_error( "output field(s) '{}' should not contain input fields '{}'".format(','.join(invalid_output_fields), ','.join(input_fields)) )
+
+def _numbered( s, line ):
+    t = s.split( '\n' )
+    return '\n'.join( [ '          {} {}\t{}'.format( '*' if i + 1 == line else ' ', i + 1, t[i] ) for i in range( len( t ) ) ] )
+
+def _code_error( what, c, e ): # print to stderr what failed in user-supplied code 'c', with the failing line of 'c' marked; does not re-raise, the caller does
+    t = getattr( e, '__traceback__', None ) or sys.exc_info()[2]; line = 0 # python2 exceptions have no __traceback__ attribute; line stays 0 if no traceback is available
+    while t is not None: line = t.tb_lineno; t = t.tb_next # walk to the innermost frame; todo: quick and dirty, is there a better way?
+    print( "csv-eval: {}: line {}: {}: {}\n{}".format( what, line, type( e ).__name__, str( e ), _numbered( c, line ) ), file = sys.stderr )
 
 def evaluate(stream):
-    def disperse(var, fields): return '\n'.join("{f} = {v}['{f}']".format(v=var, f=f) for f in fields)
-    def collect(var, fields): return '\n'.join("{v}['{f}'] = {f}".format(v=var, f=f) for f in fields)
+    def disperse( var, fields, do_copy = False ):
+        if do_copy: return '\n'.join( "{f} = copy( {v}['{f}'] )".format( v = var, f = f ) for f in fields )
+        else: return '\n'.join( "{f} = {v}['{f}']".format( v = var, f = f ) for f in fields )
+    def collect( var, fields ): return '\n'.join("{v}['{f}'] = {f}".format( v = var, f = f ) for f in fields )
     if stream.args.init_values == '':
         read_size = None
         init_code_string = ''
     else:
         read_size = 1
-        init_code_string = '\n'.join([stream.args.default_values,
-                                stream.args.init_values,
-                                disperse('_input', stream.nonblank_input_fields),
-                                collect('_update', stream.args.update_fields),
-                                collect('_output', stream.args.output_fields)])
-    code_string = '\n'.join([stream.args.default_values,
-                             disperse('_input', stream.nonblank_input_fields),
-                             disperse('_output', stream.args.output_fields),
-                             stream.args.expressions,
-                             collect('_update', stream.args.update_fields),
-                             collect('_output', stream.args.output_fields)])
-    init_code = compile(init_code_string, '<string>', 'exec')
-    code = compile(code_string, '<string>', 'exec')
-    env = np.__dict__ if stream.args.permissive else restricted_numpy_env()
+        init_code_string = '\n'.join( [ disperse( '_input', stream.nonblank_input_fields, stream.args.init_values ),
+                                        disperse( '_output', stream.args.output_fields, stream.args.init_values ),
+                                        stream.args.default_values,
+                                        stream.args.init_values,
+                                        collect( '_init', stream.args.init_fields ),
+                                        collect( '_update', stream.args.update_fields ),
+                                        collect( '_output', stream.args.output_fields ) ] )
+    code_string = '\n'.join( [ stream.args.default_values,
+                               disperse( '_init', stream.args.init_fields, stream.args.init_values ),
+                               disperse( '_input', stream.nonblank_input_fields ),
+                               disperse( '_output', stream.args.output_fields, stream.args.init_values ),
+                               stream.args.expressions,
+                               collect( '_init', stream.args.init_fields ),
+                               collect( '_update', stream.args.update_fields ),
+                               collect( '_output', stream.args.output_fields ) ] )
+    #print( "-------- init_code_string --------\n" + init_code_string + "\n--------\n", file=sys.stderr )
+    #print( "-------- code_string --------\n" + code_string + "\n--------\n", file=sys.stderr )
+    init_code = compile( init_code_string, '<string>', 'exec' )
+    code = compile( code_string, '<string>', 'exec' )
+    env = np.__dict__ if stream.args.permissive else restricted_numpy_env()    
     size = None
+    init = None
+    input = None
     update = None
     output = None
-    input = None
-    is_shutdown = comma.signal.is_shutdown()
-    if stream.args.first_line: input = stream.input.read_from_line(stream.args.first_line)
+    is_shutdown = comma.signal.is_shutdown( verbose = stream.args.verbose )
+    if stream.args.first_line: input = stream.input.read_from_line( stream.args.first_line )
     while not is_shutdown:
         if input is not None:
             if size != input.size:
                 size = input.size
+                if stream.args.init_fields: init = stream.args.init_t(size)
                 if stream.args.update_fields: update = stream.update_t(size)
                 if stream.args.output_fields: output = stream.output_t(size)
-                exec init_code in env, {'_input': input, '_update': update, '_output': output}
-            exec code in env, {'_input': input, '_update': update, '_output': output}
+                try: exec( init_code, env, { '_init': init, '_input': input, '_update': update, '_output': output } )
+                except Exception as e: _code_error( "init expressions", init_code_string, e ); raise
+            try: exec( code, env, { '_init': init, '_input': input, '_update': update, '_output': output } )
+            except Exception as e: _code_error( "expressions", code_string, e ); raise
             if stream.args.update_fields: update_buffer(stream.input, update)
             if stream.args.output_fields: stream.output.write(output)
             else: stream.input.dump()
@@ -572,15 +534,15 @@ def collect(var, fields): return '\n'.join("{v}['{f}'] = {f}".format(v=var, f=f)
 def select(stream):
     input = None
     env = restricted_numpy_env()
-    exec stream.args.default_values in env
+    exec( stream.args.default_values, env )
     fields = stream.input.fields
     code = compile(stream.args.select, '<string>', 'eval')
     is_shutdown = comma.signal.is_shutdown()
-    if stream.args.first_line:
-        input = stream.input.read_from_line(stream.args.first_line)
+    if stream.args.first_line: input = stream.input.read_from_line(stream.args.first_line)
     while not is_shutdown:
-        if input is not None: 
-            mask = eval(code, env, {f: input[f] for f in fields})
+        if input is not None:
+            try: mask = eval(code, env, {f: input[f] for f in fields})
+            except Exception as e: _code_error( "select expression", stream.args.select, e ); raise
             stream.input.dump(mask=mask)
         input = stream.input.read()
         if input is None: break
@@ -588,43 +550,42 @@ def select(stream):
 def exit_if(stream):
     input = None
     env = restricted_numpy_env()
-    exec stream.args.default_values in env
+    exec( stream.args.default_values, env )
     fields = stream.input.fields
     code = compile(stream.args.exit_if, '<string>', 'eval')
     is_shutdown = comma.signal.is_shutdown()
     if stream.args.first_line: input = stream.input.read_from_line(stream.args.first_line)
     while not is_shutdown:
         if input is not None:
-            mask = eval(code, env, {f: input[f] for f in fields})
+            try: mask = eval( code, env, { f: input[f] for f in fields } )
+            except Exception as e: _code_error( "exit-if expression", stream.args.select, e ); raise
             if mask:
                 if not stream.args.with_error: sys.exit()
                 name = os.path.basename(sys.argv[0])
-                print >> sys.stderr, "{} error: {}".format(name, stream.args.with_error)
+                print( "{} error: {}".format(name, stream.args.with_error), file = sys.stderr )
                 sys.exit(1)
             stream.input.dump()
         input = stream.input.read()
-        if input is None:
-            break
+        if input is None: break
 
 def main():
     try:
+        signal.signal( signal.SIGPIPE, signal.SIG_DFL )
         comma.csv.time.zone('UTC')
         args = get_args()
-        prepare_options(args)
-        if args.select:
-            select(stream(args))
-        elif args.exit_if:
-            exit_if(stream(args))
-        else:
-            evaluate(stream(args))
+        if not prepare_options( args ): sys.exit( 0 ) # no data on stdin
+        if args.select: select(stream(args))
+        elif args.exit_if: exit_if(stream(args))
+        else: evaluate(stream(args))
     except csv_eval_error as e:
         name = os.path.basename(sys.argv[0])
-        print >> sys.stderr, "{} error: {}".format(name, e)
+        print( "{} error: {}".format(name, e), file = sys.stderr )
         sys.exit(1)
-    except StandardError as e:
+    except KeyboardInterrupt:
+        sys.exit(128 + signal.SIGINT)
+    except Exception as e: #except StandardError as e:
         import traceback
         traceback.print_exc(file=sys.stderr)
         sys.exit(1)
 
-if __name__ == '__main__':
-    main()
+if __name__ == '__main__': main()
diff --git a/python/comma/csv/applications/test/csv-eval/default_format/ascii/test b/python/comma/csv/applications/test/csv-eval/default_format/ascii/test
index 4c5bc4761..33e23bfaa 100755
--- a/python/comma/csv/applications/test/csv-eval/default_format/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/default_format/ascii/test
@@ -1,3 +1,3 @@
 #!/bin/bash
 
-csv-eval --fields=,path,x,name --format ,s[36],,s[4] 'n=char.count(path,"/");y=x+1;uname=char.upper(name)' --output-format=s[36],,s[4] | name-value-from-csv blank,path,x,name,n,y,uname --line-number --prefix output | tr -d '"'
+csv-eval --fields=,path,x,name --format ,s[36],,s[4] 'n=char.count(char.decode(path),"/");y=x+1;uname=char.encode(char.upper(char.decode(name)))' --output-format=s[36],,s[4] | name-value-from-csv blank,path,x,name,n,y,uname --line-number --prefix output | tr -d '"'
diff --git a/python/comma/csv/applications/test/csv-eval/init_values/expected b/python/comma/csv/applications/test/csv-eval/init_values/expected
index d0dcb868b..44bb4bfd9 100644
--- a/python/comma/csv/applications/test/csv-eval/init_values/expected
+++ b/python/comma/csv/applications/test/csv-eval/init_values/expected
@@ -1,7 +1,39 @@
-fibonacci/output/line[0]="0,1,1"
-fibonacci/output/line[1]="1,1,2"
-fibonacci/output/line[2]="2,2,3"
-fibonacci/output/line[3]="3,3,5"
-fibonacci/output/line[4]="4,5,8"
-fibonacci/output/line[5]="5,8,13"
-fibonacci/status=0
+fibonacci[0]/output/line[0]="0,1,1"
+fibonacci[0]/output/line[1]="1,1,2"
+fibonacci[0]/output/line[2]="2,2,3"
+fibonacci[0]/output/line[3]="3,3,5"
+fibonacci[0]/output/line[4]="4,5,8"
+fibonacci[0]/output/line[5]="5,8,13"
+fibonacci[0]/status=0
+
+fibonacci[1]/output/line[0]="0,1,1"
+fibonacci[1]/output/line[1]="1,1,2"
+fibonacci[1]/output/line[2]="2,2,3"
+fibonacci[1]/output/line[3]="3,3,5"
+fibonacci[1]/output/line[4]="4,5,8"
+fibonacci[1]/output/line[5]="5,8,13"
+fibonacci[1]/status=0
+
+fibonacci[2]/output/line[0]="0,1,1"
+fibonacci[2]/output/line[1]="1,2,1"
+fibonacci[2]/output/line[2]="2,3,2"
+fibonacci[2]/output/line[3]="3,5,3"
+fibonacci[2]/output/line[4]="4,8,5"
+fibonacci[2]/output/line[5]="5,13,8"
+fibonacci[2]/status=0
+
+fibonacci[3]/output/line[0]="0,1"
+fibonacci[3]/output/line[1]="1,1"
+fibonacci[3]/output/line[2]="2,2"
+fibonacci[3]/output/line[3]="3,3"
+fibonacci[3]/output/line[4]="4,5"
+fibonacci[3]/output/line[5]="5,8"
+fibonacci[3]/status=0
+
+fibonacci[4]/output/line[0]="0,1"
+fibonacci[4]/output/line[1]="1,2"
+fibonacci[4]/output/line[2]="2,3"
+fibonacci[4]/output/line[3]="3,5"
+fibonacci[4]/output/line[4]="4,8"
+fibonacci[4]/output/line[5]="5,13"
+fibonacci[4]/status=0
diff --git a/python/comma/csv/applications/test/csv-eval/init_values/input b/python/comma/csv/applications/test/csv-eval/init_values/input
index 5448c0ca9..501984b70 100644
--- a/python/comma/csv/applications/test/csv-eval/init_values/input
+++ b/python/comma/csv/applications/test/csv-eval/init_values/input
@@ -1 +1,5 @@
-fibonacci="seq 0 5 | csv-eval --fields=v 'c=b;b=a+b;a=c' --output-fields a,b --init-values='a=0;b=1'"
+fibonacci[0]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --init-values='a=0;b=1'"
+fibonacci[1]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --output-fields a,b --init-values='a=0;b=1'"
+fibonacci[2]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --output-fields b,a --init-values='a=0;b=1'"
+fibonacci[3]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --output-fields a --init-values='a=0;b=1'"
+fibonacci[4]="seq 0 5 | csv-eval --fields=v 'a,b=b,a+b' --output-fields b --init-values='a=0;b=1'"
diff --git a/python/comma/csv/applications/test/csv-eval/permissive/ascii/test b/python/comma/csv/applications/test/csv-eval/permissive/ascii/test
index 0f4f67398..8418fab95 100755
--- a/python/comma/csv/applications/test/csv-eval/permissive/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/permissive/ascii/test
@@ -5,13 +5,13 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function csv_eval()
 {
-    csv-eval "$@" --fields=x,y 'import sys; print >> sys.stderr, "Python builtins are present!"; a=x+y'
+    csv-eval "$@" --fields=x,y 'import sys; print( "python builtins are present!" ); a=x+y'
 }
 
 function reformat_output()
 {
     prefix=$1
-    name-value-from-csv x,y,a --line-number --prefix $prefix/output | sed 's/"//g'
+    grep -v "python" | name-value-from-csv x,y,a --line-number --prefix $prefix/output | sed 's/"//g'
 }
 
 input=$( cat )
diff --git a/python/comma/csv/applications/test/csv-eval/permissive/binary/test b/python/comma/csv/applications/test/csv-eval/permissive/binary/test
index b068816d6..51bd6937d 100755
--- a/python/comma/csv/applications/test/csv-eval/permissive/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/permissive/binary/test
@@ -5,7 +5,7 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function csv_eval()
 {
-    csv-eval "$@" --fields=x,y --binary=2d 'import sys; print >> sys.stderr, "Python builtins are present!"; a=x+y'
+    csv-eval "$@" --fields=x,y --binary=2d 'import sys; sys.stderr.write( "python builtins are present!\n" ); a=x+y'
 }
 
 function reformat_output()
diff --git a/python/comma/csv/applications/test/csv-eval/select/basic/ascii/test b/python/comma/csv/applications/test/csv-eval/select/basic/ascii/test
index 714e7a66b..595d55549 100755
--- a/python/comma/csv/applications/test/csv-eval/select/basic/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/select/basic/ascii/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-eval -v --fields=a,b,name --format=2i,s[1] --select "(a < b - 1) & (name == 'y')" \
+csv-eval -v --fields=a,b,name --format=2i,s[1] --select "logical_and( a < b - 1, char.decode( name ) == 'y' )" \
     | name-value-from-csv a,b,allow --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/basic/binary/test b/python/comma/csv/applications/test/csv-eval/select/basic/binary/test
index 12baee557..cd3dafd9d 100755
--- a/python/comma/csv/applications/test/csv-eval/select/basic/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/select/basic/binary/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-to-bin 2i,s[1] | csv-eval --fields=a,b,name --binary=2i,s[1] --select "(a < b - 1) & (name == 'y')" | csv-from-bin 2i,s[1] \
+csv-to-bin 2i,s[1] | csv-eval --fields=a,b,name --binary=2i,s[1] --select "logical_and( a < b - 1, char.decode( name ) == 'y' )" | csv-from-bin 2i,s[1] \
     | name-value-from-csv a,b,allow --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/fields/ascii/test b/python/comma/csv/applications/test/csv-eval/select/fields/ascii/test
index 151033cd8..c6cc4ce90 100755
--- a/python/comma/csv/applications/test/csv-eval/select/fields/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/select/fields/ascii/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-eval -v --fields=a,b,,name --format=2i,,s[1] --select "(a < b - 1) & (name == 'y')" \
+csv-eval -v --fields=a,b,,name --format=2i,,s[1] --select "logical_and(a < b - 1, char.decode(name) == 'y')" \
     | name-value-from-csv a,b,dummy,allow,payload --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/fields/binary/test b/python/comma/csv/applications/test/csv-eval/select/fields/binary/test
index 53c017294..2bd0f5714 100755
--- a/python/comma/csv/applications/test/csv-eval/select/fields/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/select/fields/binary/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-to-bin 2i,2s[1],ui | csv-eval -v --fields=a,b,,name --binary=2i,2s[1],ui --select "(a < b - 1) & (name == 'y')" | csv-from-bin 2i,2s[1],ui \
+csv-to-bin 2i,2s[1],ui | csv-eval -v --fields=a,b,,name --binary=2i,2s[1],ui --select "logical_and(a < b - 1, char.decode(name) == 'y')" | csv-from-bin 2i,2s[1],ui \
     | name-value-from-csv a,b,dummy,allow,payload --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/select_all/ascii/test b/python/comma/csv/applications/test/csv-eval/select/select_all/ascii/test
index a7ba750aa..581b09f4f 100755
--- a/python/comma/csv/applications/test/csv-eval/select/select_all/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/select/select_all/ascii/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-eval --fields=a,b,name --format=2i,s[1] --select "(a < b) & ( name == 'y')" \
+csv-eval --fields=a,b,name --format=2i,s[1] --select "(a < b) & ( char.decode(name) == 'y')" \
     | name-value-from-csv a,b,allow --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/select/select_all/binary/test b/python/comma/csv/applications/test/csv-eval/select/select_all/binary/test
index 6f22710aa..5d339db17 100755
--- a/python/comma/csv/applications/test/csv-eval/select/select_all/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/select/select_all/binary/test
@@ -1,4 +1,4 @@
 #!/bin/bash
 
-csv-to-bin 2i,s[1] | csv-eval --fields=a,b,name --binary=2i,s[1] --select "(a < b) & ( name == 'y')" | csv-from-bin 2i,s[1] \
+csv-to-bin 2i,s[1] | csv-eval --fields=a,b,name --binary=2i,s[1] --select "(a < b) & ( char.decode(name) == 'y')" | csv-from-bin 2i,s[1] \
     | name-value-from-csv a,b,allow --line-number --prefix output | sed 's/"//g'
diff --git a/python/comma/csv/applications/test/csv-eval/strings/count/ascii/test b/python/comma/csv/applications/test/csv-eval/strings/count/ascii/test
index 95fb5eaca..8b3efe3b6 100755
--- a/python/comma/csv/applications/test/csv-eval/strings/count/ascii/test
+++ b/python/comma/csv/applications/test/csv-eval/strings/count/ascii/test
@@ -1,3 +1,3 @@
 #!/bin/bash
 
-csv-eval --fields=,path --format i,s[36],ui,s[4] 'n=char.count(path,"/")' --output-format=s[36] | name-value-from-csv x,path,num,string,n --line-number --prefix output | tr -d '"'
+csv-eval --fields=,path --format i,s[36],ui,s[4] 'n=char.count(char.decode(path),"/")' --output-format=s[36] | name-value-from-csv x,path,num,string,n --line-number --prefix output | tr -d '"'
diff --git a/python/comma/csv/applications/test/csv-eval/strings/count/binary/test b/python/comma/csv/applications/test/csv-eval/strings/count/binary/test
index 0cf2f3691..e44699078 100755
--- a/python/comma/csv/applications/test/csv-eval/strings/count/binary/test
+++ b/python/comma/csv/applications/test/csv-eval/strings/count/binary/test
@@ -1,3 +1,3 @@
 #!/bin/bash
 
-csv-to-bin i,s[36],ui,s[4] | csv-eval --fields=,path --binary i,s[36],ui,s[4] 'n=char.count(path,"/")' --output-format=s[36] | csv-from-bin i,s[36],ui,s[4],s[36] | name-value-from-csv x,path,num,string,n --line-number --prefix output | tr -d '"'
+csv-to-bin i,s[36],ui,s[4] | csv-eval --fields=,path --binary i,s[36],ui,s[4] 'n=char.count(char.decode(path),"/")' --output-format=s[36] | csv-from-bin i,s[36],ui,s[4],s[36] | name-value-from-csv x,path,num,string,n --line-number --prefix output | tr -d '"'
diff --git a/python/comma/csv/test/numpy_format/test b/python/comma/csv/test/numpy_format/test
index 54ff41831..339f99486 100755
--- a/python/comma/csv/test/numpy_format/test
+++ b/python/comma/csv/test/numpy_format/test
@@ -4,13 +4,14 @@ function comma_format_to_numpy
 {
     local compress=$2
     compress=${compress:+", $compress"}
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
+from __future__ import print_function
 import comma
 import numpy
 
 numpy_format = comma.csv.format.to_numpy( '$1' $compress )
 numpy.dtype( ','.join( numpy_format ) )
-print ','.join( numpy_format )
+print( ','.join( numpy_format ) )
 END
 )"
 }
diff --git a/python/comma/csv/test/numpy_guess_format/test b/python/comma/csv/test/numpy_guess_format/test
index 31df8eac3..ce53b3e1b 100755
--- a/python/comma/csv/test/numpy_guess_format/test
+++ b/python/comma/csv/test/numpy_guess_format/test
@@ -2,12 +2,13 @@
 
 function comma_guess_format
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
+from __future__ import print_function
 import comma
 import numpy
 
 guessed_format = comma.csv.format.guess_format( ['$1'] )
-print guessed_format
+print( guessed_format )
 END
 )"
 }
diff --git a/python/comma/csv/test/numpy_time/expected b/python/comma/csv/test/numpy_time/expected
index 4bb01817a..ef29ef5e3 100644
--- a/python/comma/csv/test/numpy_time/expected
+++ b/python/comma/csv/test/numpy_time/expected
@@ -6,6 +6,8 @@ incomplete/output="20150101T010203.123000"
 incomplete/status=0
 microseconds/output="20140101T010203.123456"
 microseconds/status=0
+nanoseconds/output="20140101T010203.123456"
+nanoseconds/status=0
 not_a_date_time/output="not-a-date-time"
 not_a_date_time/status=0
 invalid_month/output=""
diff --git a/python/comma/csv/test/numpy_time/input b/python/comma/csv/test/numpy_time/input
index 13c35aa3d..57b935473 100644
--- a/python/comma/csv/test/numpy_time/input
+++ b/python/comma/csv/test/numpy_time/input
@@ -2,6 +2,7 @@ basic 20150101T010203
 dot 20150101T010203.
 incomplete 20150101T010203.123
 microseconds 20140101T010203.123456
+nanoseconds 20140101T010203.123456789
 invalid_month 20150001T000000
 invalid_format 20150101T0000
 not_a_date_time not-a-date-time
diff --git a/python/comma/csv/test/numpy_time/test b/python/comma/csv/test/numpy_time/test
index d71e39510..c2de5abb6 100755
--- a/python/comma/csv/test/numpy_time/test
+++ b/python/comma/csv/test/numpy_time/test
@@ -1,14 +1,15 @@
 #!/bin/bash
 
 function comma_time_roundabout {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
+from __future__ import print_function
 import numpy
 import comma
 
 comma_time = '$@'
 numpy_time = comma.csv.time.to_numpy( comma_time )
 if isinstance( numpy_time, numpy.datetime64 ):
-  print comma.csv.time.from_numpy( numpy_time )
+  print( comma.csv.time.from_numpy( numpy_time ) )
 END
 )"
 }
diff --git a/python/comma/csv/test/stream/array/test b/python/comma/csv/test/stream/array/test
index 9284da636..5810ce637 100755
--- a/python/comma/csv/test/stream/array/test
+++ b/python/comma/csv/test/stream/array/test
@@ -8,7 +8,7 @@ function process_records
 {
     local binary
     if [[ "$1" == "binary" ]]; then binary=True; else binary=False; fi
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/ascii_only/blank_lines/size_1/test b/python/comma/csv/test/stream/ascii_only/blank_lines/size_1/test
index 178f33111..b457fba0e 100755
--- a/python/comma/csv/test/stream/ascii_only/blank_lines/size_1/test
+++ b/python/comma/csv/test/stream/ascii_only/blank_lines/size_1/test
@@ -5,7 +5,7 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 t = comma.csv.struct( 'x', 'u4' )
diff --git a/python/comma/csv/test/stream/ascii_only/blank_lines/size_all/test b/python/comma/csv/test/stream/ascii_only/blank_lines/size_all/test
index 6ad8c3658..93fc9562f 100755
--- a/python/comma/csv/test/stream/ascii_only/blank_lines/size_all/test
+++ b/python/comma/csv/test/stream/ascii_only/blank_lines/size_all/test
@@ -5,7 +5,7 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 t = comma.csv.struct( 'x', 'u4' )
diff --git a/python/comma/csv/test/stream/ascii_only/blank_lines/size_default/test b/python/comma/csv/test/stream/ascii_only/blank_lines/size_default/test
index d3176282f..8d9622e83 100755
--- a/python/comma/csv/test/stream/ascii_only/blank_lines/size_default/test
+++ b/python/comma/csv/test/stream/ascii_only/blank_lines/size_default/test
@@ -5,7 +5,7 @@ source $( which comma-application-util ) || { echo "$scriptname: failed to sourc
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 t = comma.csv.struct( 'x', 'u4' )
diff --git a/python/comma/csv/test/stream/ascii_only/blank_values/test b/python/comma/csv/test/stream/ascii_only/blank_values/test
index f9723eb9c..0ab8038d1 100755
--- a/python/comma/csv/test/stream/ascii_only/blank_values/test
+++ b/python/comma/csv/test/stream/ascii_only/blank_values/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 t = comma.csv.struct( 's1,x,y,t,array,s2,z', 'S2', 'i4', 'f8', 'datetime64[us]', '2u1', 'S4', 'f8' )
diff --git a/python/comma/csv/test/stream/ascii_only/default_values/time/test b/python/comma/csv/test/stream/ascii_only/default_values/time/test
index 4fb6effe3..977b47546 100755
--- a/python/comma/csv/test/stream/ascii_only/default_values/time/test
+++ b/python/comma/csv/test/stream/ascii_only/default_values/time/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function default_values
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy as np
 from datetime import datetime
diff --git a/python/comma/csv/test/stream/ascii_only/delimiter/test b/python/comma/csv/test/stream/ascii_only/delimiter/test
index 7f42025fd..01dc2c941 100755
--- a/python/comma/csv/test/stream/ascii_only/delimiter/test
+++ b/python/comma/csv/test/stream/ascii_only/delimiter/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/ascii_only/precision/test b/python/comma/csv/test/stream/ascii_only/precision/test
index bb09387bf..06f963b26 100755
--- a/python/comma/csv/test/stream/ascii_only/precision/test
+++ b/python/comma/csv/test/stream/ascii_only/precision/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/ascii_only/tied/wrong_delimiter/test b/python/comma/csv/test/stream/ascii_only/tied/wrong_delimiter/test
index cf1b4f506..3c6b5c7cc 100755
--- a/python/comma/csv/test/stream/ascii_only/tied/wrong_delimiter/test
+++ b/python/comma/csv/test/stream/ascii_only/tied/wrong_delimiter/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/ascii_only/time_converter/test b/python/comma/csv/test/stream/ascii_only/time_converter/test
index 018360c9a..2fbaee398 100755
--- a/python/comma/csv/test/stream/ascii_only/time_converter/test
+++ b/python/comma/csv/test/stream/ascii_only/time_converter/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/basic/test b/python/comma/csv/test/stream/basic/test
index 6391c34d9..d7200ba5d 100755
--- a/python/comma/csv/test/stream/basic/test
+++ b/python/comma/csv/test/stream/basic/test
@@ -8,13 +8,15 @@ function process_records
 {
     local binary
     if [[ "$1" == "binary" ]]; then binary=True; else binary=False; fi
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
 timestamped_point_t = comma.csv.struct( 'time,coordinates', 'datetime64[us]', point_t )
-record_t = comma.csv.struct( 'observer,event', 'S3', timestamped_point_t )
+#record_t = comma.csv.struct( 'observer,event', 'U3', timestamped_point_t )
+#record_t = comma.csv.struct( 'observer,event', 'S3', timestamped_point_t )
+record_t = comma.csv.struct( 'observer,event', 'S8', timestamped_point_t )
 record_stream = comma.csv.stream( record_t, binary=$binary )
 
 for i,r in enumerate( record_stream.iter(), start=1 ):
@@ -31,6 +33,6 @@ echo "$input" | process_records | output ascii
 comma_status_ok
 echo "ascii/status=$?"
 
-echo "$input" | csv-to-bin s[3],t,3d | process_records binary | csv-from-bin s[3],t,3d | output binary
+echo "$input" | csv-to-bin s[8],t,3d | process_records binary | csv-from-bin s[8],t,3d | output binary
 comma_status_ok
 echo "binary/status=$?"
diff --git a/python/comma/csv/test/stream/binary_keyword/false/test b/python/comma/csv/test/stream/binary_keyword/false/test
index 4f7fe1b12..ef93e4356 100755
--- a/python/comma/csv/test/stream/binary_keyword/false/test
+++ b/python/comma/csv/test/stream/binary_keyword/false/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_keyword/format_via_binary/test b/python/comma/csv/test/stream/binary_keyword/format_via_binary/test
index 9b4d49327..ada326a60 100755
--- a/python/comma/csv/test/stream/binary_keyword/format_via_binary/test
+++ b/python/comma/csv/test/stream/binary_keyword/format_via_binary/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_keyword/ignore/format/test b/python/comma/csv/test/stream/binary_keyword/ignore/format/test
index 415225f01..cff48145e 100755
--- a/python/comma/csv/test/stream/binary_keyword/ignore/format/test
+++ b/python/comma/csv/test/stream/binary_keyword/ignore/format/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_keyword/mismatched_with_tied/test b/python/comma/csv/test/stream/binary_keyword/mismatched_with_tied/test
index 54e592ef8..6247624b2 100755
--- a/python/comma/csv/test/stream/binary_keyword/mismatched_with_tied/test
+++ b/python/comma/csv/test/stream/binary_keyword/mismatched_with_tied/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function mismatched
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/binary_keyword/true/test b/python/comma/csv/test/stream/binary_keyword/true/test
index 756955a1f..03d0232a5 100755
--- a/python/comma/csv/test/stream/binary_keyword/true/test
+++ b/python/comma/csv/test/stream/binary_keyword/true/test
@@ -4,7 +4,7 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_only/fields/binary_is_true/known_fields/test b/python/comma/csv/test/stream/binary_only/fields/binary_is_true/known_fields/test
index 015830d23..c06dc2427 100755
--- a/python/comma/csv/test/stream/binary_only/fields/binary_is_true/known_fields/test
+++ b/python/comma/csv/test/stream/binary_only/fields/binary_is_true/known_fields/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/binary_only/fields/binary_is_true/unknown_fields/test b/python/comma/csv/test/stream/binary_only/fields/binary_is_true/unknown_fields/test
index a513332e2..5bf2ae78c 100755
--- a/python/comma/csv/test/stream/binary_only/fields/binary_is_true/unknown_fields/test
+++ b/python/comma/csv/test/stream/binary_only/fields/binary_is_true/unknown_fields/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function unknown_fields
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/binary_only/fields/comma_types/test b/python/comma/csv/test/stream/binary_only/fields/comma_types/test
index fdbad741f..d49d5f4f3 100755
--- a/python/comma/csv/test/stream/binary_only/fields/comma_types/test
+++ b/python/comma/csv/test/stream/binary_only/fields/comma_types/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_only/fields/inconsistent_format/test b/python/comma/csv/test/stream/binary_only/fields/inconsistent_format/test
index ced6d026e..c3532302f 100755
--- a/python/comma/csv/test/stream/binary_only/fields/inconsistent_format/test
+++ b/python/comma/csv/test/stream/binary_only/fields/inconsistent_format/test
@@ -5,7 +5,7 @@ function output { csv-paste value="line[" line-number value="]\=" --delimiter '@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/binary_only/not-a-date-time/test b/python/comma/csv/test/stream/binary_only/not-a-date-time/test
index 418466696..18fd42028 100755
--- a/python/comma/csv/test/stream/binary_only/not-a-date-time/test
+++ b/python/comma/csv/test/stream/binary_only/not-a-date-time/test
@@ -1,7 +1,7 @@
 #!/bin/bash
 
 numpy_int=$(
-python -c "
+python3 -c "
 from comma.csv import *
 t = struct( 'f', *format.to_numpy('t') )
 s = stream( t, binary=True )
diff --git a/python/comma/csv/test/stream/buffer_size/expected b/python/comma/csv/test/stream/buffer_size/expected
index 5f647e531..c0a29afba 100644
--- a/python/comma/csv/test/stream/buffer_size/expected
+++ b/python/comma/csv/test/stream/buffer_size/expected
@@ -1,5 +1,5 @@
 #python
 
 expect buffer_size_in_bytes = 65536
-expect size/uint8 = buffer_size_in_bytes / number_of_fields
-expect size/float64 = buffer_size_in_bytes / ( 8 * number_of_fields )
+expect size/uint8 = buffer_size_in_bytes // number_of_fields
+expect size/float64 = buffer_size_in_bytes // ( 8 * number_of_fields )
diff --git a/python/comma/csv/test/stream/buffer_size/test b/python/comma/csv/test/stream/buffer_size/test
index a71d36f9c..3a4ae9b61 100755
--- a/python/comma/csv/test/stream/buffer_size/test
+++ b/python/comma/csv/test/stream/buffer_size/test
@@ -1,16 +1,19 @@
 #!/bin/bash
 
-function get_buffer_size_in_bytes { python -c "import comma; print comma.csv.stream.buffer_size_in_bytes"; }
+function get_buffer_size_in_bytes { python3 -c "from __future__ import print_function; import comma; print( comma.csv.stream.buffer_size_in_bytes )"; }
 
 function get_default_size
 {
     local fields=$1
     local type=$2
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
+from __future__ import print_function
+import sys
 import comma
 fields='$fields'
 types = ('$type',) * len( fields.split(',') )
-print comma.csv.stream( comma.csv.struct( fields, *types ) ).size
+print( comma.csv.stream( comma.csv.struct( fields, *types ) ).size )
+sys.stdout.flush() # have to flush, since stdout gets highjacked by comma.csv.stream (which kind of make sense)
 END
 )"
 }
@@ -18,6 +21,6 @@ END
 echo "buffer_size_in_bytes=$( get_buffer_size_in_bytes )"
 
 fields="x,y"
-echo "number_of_fields=$( python -c "s = '$fields'; print len( s.split(',') )" )"
+echo "number_of_fields=$( python3 -c "from __future__ import print_function; s = '$fields'; print( len( s.split(',') ) )" )"
 echo "size/uint8=$( get_default_size $fields uint8 )"
 echo "size/float64=$( get_default_size $fields float64 )"
diff --git a/python/comma/csv/test/stream/default_values/basic/test b/python/comma/csv/test/stream/default_values/basic/test
index 7d41d9288..3c7220d5b 100755
--- a/python/comma/csv/test/stream/default_values/basic/test
+++ b/python/comma/csv/test/stream/default_values/basic/test
@@ -6,7 +6,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/full_xpath_is_false/test b/python/comma/csv/test/stream/default_values/full_xpath_is_false/test
index d036f408e..440db7021 100755
--- a/python/comma/csv/test/stream/default_values/full_xpath_is_false/test
+++ b/python/comma/csv/test/stream/default_values/full_xpath_is_false/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/ignore/field_in_stream/test b/python/comma/csv/test/stream/default_values/ignore/field_in_stream/test
index 01a2cc00d..da3e582b8 100755
--- a/python/comma/csv/test/stream/default_values/ignore/field_in_stream/test
+++ b/python/comma/csv/test/stream/default_values/ignore/field_in_stream/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/ignore/field_not_in_struct/test b/python/comma/csv/test/stream/default_values/ignore/field_not_in_struct/test
index bb7aea2de..5579a152b 100755
--- a/python/comma/csv/test/stream/default_values/ignore/field_not_in_struct/test
+++ b/python/comma/csv/test/stream/default_values/ignore/field_not_in_struct/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/no_missing_fields/test b/python/comma/csv/test/stream/default_values/no_missing_fields/test
index 1429b376a..501aaf4b7 100755
--- a/python/comma/csv/test/stream/default_values/no_missing_fields/test
+++ b/python/comma/csv/test/stream/default_values/no_missing_fields/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function default_values
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/default_values/size/test b/python/comma/csv/test/stream/default_values/size/test
index 0b5909c09..bf896ecc4 100755
--- a/python/comma/csv/test/stream/default_values/size/test
+++ b/python/comma/csv/test/stream/default_values/size/test
@@ -8,7 +8,7 @@ function default_values
 {
     local input_format=$1
     local size=$( cat size )
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 comma.csv.time.zone( 'UTC' )
 point_t = comma.csv.struct( 'id,signal,x,y,z', 'uint64', '(2,)float64', 'float64', 'float64', 'int64' )
diff --git a/python/comma/csv/test/stream/dump/no_mask/test b/python/comma/csv/test/stream/dump/no_mask/test
index f9536fe1b..f76a7fc62 100755
--- a/python/comma/csv/test/stream/dump/no_mask/test
+++ b/python/comma/csv/test/stream/dump/no_mask/test
@@ -6,7 +6,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,mask', 'float64', 'float64', 'uint32' )
diff --git a/python/comma/csv/test/stream/dump/with_mask/test b/python/comma/csv/test/stream/dump/with_mask/test
index 7d52d2188..a8e664ddc 100755
--- a/python/comma/csv/test/stream/dump/with_mask/test
+++ b/python/comma/csv/test/stream/dump/with_mask/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,mask', 'float64', 'float64', 'uint32' )
diff --git a/python/comma/csv/test/stream/duplicates/expected_fields/test b/python/comma/csv/test/stream/duplicates/expected_fields/test
index ad2836af7..dacc4a8f3 100755
--- a/python/comma/csv/test/stream/duplicates/expected_fields/test
+++ b/python/comma/csv/test/stream/duplicates/expected_fields/test
@@ -2,7 +2,7 @@
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/duplicates/other_fields/test b/python/comma/csv/test/stream/duplicates/other_fields/test
index 674b0e132..6c24d7eee 100755
--- a/python/comma/csv/test/stream/duplicates/other_fields/test
+++ b/python/comma/csv/test/stream/duplicates/other_fields/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/empty_input/test b/python/comma/csv/test/stream/empty_input/test
index bf4a2ec61..d950ca766 100755
--- a/python/comma/csv/test/stream/empty_input/test
+++ b/python/comma/csv/test/stream/empty_input/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/array/test_1d/test b/python/comma/csv/test/stream/fields/array/test_1d/test
index 5ebce3c24..c24fe2bb9 100755
--- a/python/comma/csv/test/stream/fields/array/test_1d/test
+++ b/python/comma/csv/test/stream/fields/array/test_1d/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/array/test_2d/test b/python/comma/csv/test/stream/fields/array/test_2d/test
index d0f3a4f52..7d4750fed 100755
--- a/python/comma/csv/test/stream/fields/array/test_2d/test
+++ b/python/comma/csv/test/stream/fields/array/test_2d/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/array/test_3d/test b/python/comma/csv/test/stream/fields/array/test_3d/test
index 06e22cda6..98f49489d 100755
--- a/python/comma/csv/test/stream/fields/array/test_3d/test
+++ b/python/comma/csv/test/stream/fields/array/test_3d/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/basic/test b/python/comma/csv/test/stream/fields/basic/test
index b8ff4b082..a36a4d226 100755
--- a/python/comma/csv/test/stream/fields/basic/test
+++ b/python/comma/csv/test/stream/fields/basic/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/extra_field_names/test b/python/comma/csv/test/stream/fields/extra_field_names/test
index d3df29eb5..4773393de 100755
--- a/python/comma/csv/test/stream/fields/extra_field_names/test
+++ b/python/comma/csv/test/stream/fields/extra_field_names/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
    local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/missing_fields/one/test b/python/comma/csv/test/stream/fields/missing_fields/one/test
index 41ea3e7eb..62368ce0d 100755
--- a/python/comma/csv/test/stream/fields/missing_fields/one/test
+++ b/python/comma/csv/test/stream/fields/missing_fields/one/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/fields/missing_fields/several/test b/python/comma/csv/test/stream/fields/missing_fields/several/test
index 12cbca8ba..cd486f230 100755
--- a/python/comma/csv/test/stream/fields/missing_fields/several/test
+++ b/python/comma/csv/test/stream/fields/missing_fields/several/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/csv/test/stream/fields/read/test b/python/comma/csv/test/stream/fields/read/test
index 008f6cd7e..0143734fc 100755
--- a/python/comma/csv/test/stream/fields/read/test
+++ b/python/comma/csv/test/stream/fields/read/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/shorthand/test b/python/comma/csv/test/stream/fields/shorthand/test
index 9d9f31868..2887bb9f9 100755
--- a/python/comma/csv/test/stream/fields/shorthand/test
+++ b/python/comma/csv/test/stream/fields/shorthand/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/fields/size/test b/python/comma/csv/test/stream/fields/size/test
index 97a65250c..a9e8d756e 100755
--- a/python/comma/csv/test/stream/fields/size/test
+++ b/python/comma/csv/test/stream/fields/size/test
@@ -8,7 +8,7 @@ function process_records
 {
     local size=$1
     local input_format=$2
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/files/test b/python/comma/csv/test/stream/files/test
index e379df890..9eed7373e 100755
--- a/python/comma/csv/test/stream/files/test
+++ b/python/comma/csv/test/stream/files/test
@@ -9,7 +9,7 @@ function process_records
     local input_format=$1
     local in=$2
     local out=$3
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/flush/test b/python/comma/csv/test/stream/flush/test
index 577f6ea49..8f626bf59 100755
--- a/python/comma/csv/test/stream/flush/test
+++ b/python/comma/csv/test/stream/flush/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/iter/test b/python/comma/csv/test/stream/iter/test
index 5e2534a6c..ba8e0c2e0 100755
--- a/python/comma/csv/test/stream/iter/test
+++ b/python/comma/csv/test/stream/iter/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/leaves/ambiguous/test b/python/comma/csv/test/stream/leaves/ambiguous/test
index 6a80007ee..71c44631e 100755
--- a/python/comma/csv/test/stream/leaves/ambiguous/test
+++ b/python/comma/csv/test/stream/leaves/ambiguous/test
@@ -2,7 +2,7 @@
 
 function ambiguous_fields
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/leaves/basic/test b/python/comma/csv/test/stream/leaves/basic/test
index 600a383c9..420d61ae9 100755
--- a/python/comma/csv/test/stream/leaves/basic/test
+++ b/python/comma/csv/test/stream/leaves/basic/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/leaves/slash/test b/python/comma/csv/test/stream/leaves/slash/test
index 2347fec04..869c9f64c 100755
--- a/python/comma/csv/test/stream/leaves/slash/test
+++ b/python/comma/csv/test/stream/leaves/slash/test
@@ -2,7 +2,7 @@
 
 function slash
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/one_field/test b/python/comma/csv/test/stream/one_field/test
index 9a90c9a34..76f9a4c5b 100755
--- a/python/comma/csv/test/stream/one_field/test
+++ b/python/comma/csv/test/stream/one_field/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x', 'float64' )
diff --git a/python/comma/csv/test/stream/recarray/test b/python/comma/csv/test/stream/recarray/test
index c4088d4a9..cc025d9cb 100755
--- a/python/comma/csv/test/stream/recarray/test
+++ b/python/comma/csv/test/stream/recarray/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/size/test b/python/comma/csv/test/stream/size/test
index aa61f9d4a..ee912c968 100755
--- a/python/comma/csv/test/stream/size/test
+++ b/python/comma/csv/test/stream/size/test
@@ -8,7 +8,7 @@ function process_records
 {
     local size=$1
     local input_format=$2
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/standard_field_names/test b/python/comma/csv/test/stream/standard_field_names/test
index c1f2a3d7a..bd49a23bb 100755
--- a/python/comma/csv/test/stream/standard_field_names/test
+++ b/python/comma/csv/test/stream/standard_field_names/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y', 'float64', 'float64' )
diff --git a/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test b/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test
index 7eba8e0ce..2ad7dfc7a 100755
--- a/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test
+++ b/python/comma/csv/test/stream/stdin/corrupt_input/ascii/test
@@ -4,7 +4,8 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
+from __future__ import print_function
 import comma
 import numpy
 
@@ -17,7 +18,7 @@ try:
     for r in record_stream.iter( size=-1 ):
         pass
 except ValueError:
-    print "exception=ValueError"
+    print( "exception=ValueError" )
 END
 )"
 }
diff --git a/python/comma/csv/test/stream/stdin/corrupt_input/binary/test b/python/comma/csv/test/stream/stdin/corrupt_input/binary/test
index d7ed00bbd..81f61352b 100755
--- a/python/comma/csv/test/stream/stdin/corrupt_input/binary/test
+++ b/python/comma/csv/test/stream/stdin/corrupt_input/binary/test
@@ -4,7 +4,8 @@ source $( which comma-application-util )
 
 function process_records
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
+from __future__ import print_function
 import comma
 import numpy
 
@@ -17,7 +18,7 @@ try:
     for r in record_stream.iter( size=-1 ):
         pass
 except ValueError:
-    print "exception=ValueError"
+    print( "exception=ValueError" )
 END
 )"
 }
diff --git a/python/comma/csv/test/stream/stdin/simple/test b/python/comma/csv/test/stream/stdin/simple/test
index 311cc7826..04da5b08c 100755
--- a/python/comma/csv/test/stream/stdin/simple/test
+++ b/python/comma/csv/test/stream/stdin/simple/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/tied/basic/test b/python/comma/csv/test/stream/tied/basic/test
index ed2b3f331..ca0f094d4 100755
--- a/python/comma/csv/test/stream/tied/basic/test
+++ b/python/comma/csv/test/stream/tied/basic/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/tied/mixedup/test b/python/comma/csv/test/stream/tied/mixedup/test
index d9a86908b..d3fb26177 100755
--- a/python/comma/csv/test/stream/tied/mixedup/test
+++ b/python/comma/csv/test/stream/tied/mixedup/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 
diff --git a/python/comma/csv/test/stream/timedelta/test b/python/comma/csv/test/stream/timedelta/test
index 4082f1666..151537abf 100755
--- a/python/comma/csv/test/stream/timedelta/test
+++ b/python/comma/csv/test/stream/timedelta/test
@@ -7,7 +7,7 @@ function output { local prefix=$1; gawk '{ print "'${prefix:+$prefix/}'output/li
 function process_records
 {
     local input_format=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
diff --git a/python/comma/csv/test/struct/test b/python/comma/csv/test/struct/test
index 5e9980a19..b2ebab968 100755
--- a/python/comma/csv/test/struct/test
+++ b/python/comma/csv/test/struct/test
@@ -1,14 +1,14 @@
 #!/bin/bash
 
-function types_incorrect_name { python -c "import comma; point_t = comma.csv.struct( 'x', 'invalid' )"; }
-function types_empty_name { python -c "import comma; point_t = comma.csv.struct( 'x', '' )"; }
-function types_insufficient_number { python -c "import comma; point_t = comma.csv.struct( 'x,y', 'float64' )"; }
-function duplicate_field { python -c "import comma; point_t = comma.csv.struct( 'x,x,z', 'float64', 'int32', 'float64' )"; }
-function field_with_slash { python -c "import comma; point_t = comma.csv.struct( 'x,x/y,z', 'float64', 'int32', 'float64' )"; }
+function types_incorrect_name { python3 -c "import comma; point_t = comma.csv.struct( 'x', 'invalid' )"; }
+function types_empty_name { python3 -c "import comma; point_t = comma.csv.struct( 'x', '' )"; }
+function types_insufficient_number { python3 -c "import comma; point_t = comma.csv.struct( 'x,y', 'float64' )"; }
+function duplicate_field { python3 -c "import comma; point_t = comma.csv.struct( 'x,x,z', 'float64', 'int32', 'float64' )"; }
+function field_with_slash { python3 -c "import comma; point_t = comma.csv.struct( 'x,x/y,z', 'float64', 'int32', 'float64' )"; }
 
 function excess_number_of_types
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 point_t = comma.csv.struct( 'x,y', 'float64','float64','uint64' )
@@ -23,7 +23,7 @@ END
 
 function blank_fields
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import comma
 import numpy
 point_t = comma.csv.struct( ',,z', 'float64', 'int32', 'float64' )
@@ -36,7 +36,7 @@ END
 
 function basic
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import numpy
 import comma
 
@@ -51,30 +51,32 @@ END
 
 function shorthand
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
+from __future__ import print_function
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
 timestamped_point_t = comma.csv.struct( 't,coordinates', 'datetime64[us]', point_t )
 record_t = comma.csv.struct( 'observer,event', 'S3', timestamped_point_t )
 for i,name in enumerate( [ 'event', 'event/coordinates' ] ):
-  print "shorthand[{}]/name={}".format( i, name )
-  print "shorthand[{}]/value={}".format( i, ','.join( record_t.shorthand[name] ) )
+  print( "shorthand[{}]/name={}".format( i, name ) )
+  print( "shorthand[{}]/value={}".format( i, ','.join( record_t.shorthand[name] ) ) )
 END
 )"
 }
 
 function leaves
 {
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
+from __future__ import print_function
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
 timestamped_point_t = comma.csv.struct( 't,coordinates', 'datetime64[us]', point_t )
 observer_t = comma.csv.struct( 'name,id', 'S3', 'uint32' )
 record_t = comma.csv.struct( 'observer,event,value', observer_t, timestamped_point_t, 'float64' )
-for leaf,xpath in record_t.xpath_of_leaf.iteritems():
-  print "leaves/{}={}".format( leaf, record_t.xpath_of_leaf.get( leaf ) )
+for leaf,xpath in record_t.xpath_of_leaf.items():
+  print( "leaves/{}={}".format( leaf, record_t.xpath_of_leaf.get( leaf ) ) )
 END
 )"
 }
@@ -82,13 +84,14 @@ END
 function record
 {
     local what=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
+from __future__ import print_function
 import comma
 
 point_t = comma.csv.struct( 'x,y,z', 'float64', 'float64', 'float64' )
 timestamped_point_t = comma.csv.struct( 't,coordinates', 'datetime64[us]', point_t )
 record_t = comma.csv.struct( 'observer,event', 'S3', timestamped_point_t )
-print ','.join( record_t.$what )
+print( ','.join( record_t.$what ) )
 END
 )"
 }
@@ -96,7 +99,8 @@ END
 function assign()
 {
     local what=$1
-    python -c "
+    python3 -c "
+from __future__ import print_function
 import sys
 import numpy as np
 import time
@@ -106,7 +110,7 @@ class test_class:
     class nested:
         def __init__( self ):
             self.a = int( 3 )
-            
+
     def __init__( self ):
         self.a = int( 1 )
         self.b = float( 2 )
@@ -118,7 +122,7 @@ class test_class:
 
 nested_struct = comma.csv.struct( 'a', 'uint32' )
 #test_struct = comma.csv.struct( 'a,b,c,d,e,f,g', 'uint32', 'float32', 'datetime64[us]', 'S4', nested_struct, 'uint32', ( nested_struct, ( 2, ) ) )
-test_struct = comma.csv.struct( 'a,b,c,d,e', 'uint32', 'float32', 'datetime64[us]', 'S4', nested_struct )
+test_struct = comma.csv.struct( 'a,b,c,d,e', 'uint32', 'float32', 'datetime64[us]', 'U4', nested_struct )
 t = test_struct()
 t['a'] = 10
 t['b'] = 20
@@ -131,23 +135,24 @@ t['e']['a'] = 40
 c = test_class()
 assign = test_struct.assign( c )
 assign( t[0] )
-print 'assign/basic/output/a=' + str( c.a )
-print 'assign/basic/output/b=' + str( c.b )
-print 'assign/basic/output/c=\"' + str( c.c ).split( '+' )[0] + '\"'
-print 'assign/basic/output/d=\"' + str( c.d ) + '\"'
-print 'assign/basic/output/e/a=' + str( c.e.a )
-#print 'assign/basic/output/f[0]=' + str( c.f[0] )
-#print 'assign/basic/output/f[1]=' + str( c.f[1] )
-#print 'assign/basic/output/g[0]/a=' + str( c.g[0].a )
-#print 'assign/basic/output/g[1]/a=' + str( c.g[1].a )
+
+print( 'assign/basic/output/a=' + str( c.a ) )
+print( 'assign/basic/output/b=' + str( c.b ) )
+print( 'assign/basic/output/c=\"' + str( c.c ).split( '+' )[0] + '\"' )
+print( 'assign/basic/output/d=\"' + str( c.d ) + '\"' )
+print( 'assign/basic/output/e/a=' + str( c.e.a ) )
+#print( 'assign/basic/output/f[0]=' + str( c.f[0] ) )
+#print( 'assign/basic/output/f[1]=' + str( c.f[1] ) )
+#print( 'assign/basic/output/g[0]/a=' + str( c.g[0].a ) )
+#print( 'assign/basic/output/g[1]/a=' + str( c.g[1].a ) )
 def convert( v ): return 'customized time: ' + str( v ).split( '+' )[0] if type( v ) == np.datetime64 else v
 assign = test_struct.assign( c, convert )
 assign( t[0] )
-print 'assign/convert/output/a=' + str( c.a )
-print 'assign/convert/output/b=' + str( c.b )
-print 'assign/convert/output/c=\"' + str( c.c ) + '\"'
-print 'assign/convert/output/d=\"' + str( c.d ) + '\"'
-print 'assign/convert/output/e/a=' + str( c.e.a )
+print( 'assign/convert/output/a=' + str( c.a ) )
+print( 'assign/convert/output/b=' + str( c.b ) )
+print( 'assign/convert/output/c=\"' + str( c.c ) + '\"' )
+print( 'assign/convert/output/d=\"' + str( c.d ) + '\"' )
+print( 'assign/convert/output/e/a=' + str( c.e.a ) )
 "
 }
 
diff --git a/python/comma/csv/test/unit/test b/python/comma/csv/test/unit/test
index e4997a032..6724cd089 100755
--- a/python/comma/csv/test/unit/test
+++ b/python/comma/csv/test/unit/test
@@ -3,5 +3,5 @@
 name=$( basename $0 )
 
 for t in test_*.py; do
-    python $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed" >&2; exit 1; }
+    python3 $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed" >&2; exit 1; }
 done
diff --git a/python/comma/csv/test/unit/test_stream.py b/python/comma/csv/test/unit/test_stream.py
index 191a1c58b..d17ef8b3c 100644
--- a/python/comma/csv/test/unit/test_stream.py
+++ b/python/comma/csv/test/unit/test_stream.py
@@ -1,3 +1,4 @@
+from __future__ import print_function
 import unittest
 import numpy as np
 import sys
@@ -16,7 +17,8 @@ def test_use_defaults(self):
         self.assertTrue(s.full_xpath)
 
     def test_override_defaults(self):
-        from cStringIO import StringIO
+        if sys.version_info.major < 3: from cStringIO import StringIO # quick and dirty, sigh...
+        else: from io import StringIO
         source = StringIO("")
         target = StringIO("")
         t = comma.csv.stream(comma.csv.struct('id', 'S4'), delimiter=';')
@@ -133,11 +135,11 @@ def test_size(self):
         s = comma.csv.struct('x,id', 'f8', 'u4')
         tied = comma.csv.stream(comma.csv.struct('i', 'u2'))
         t1 = comma.csv.stream(s)
-        self.assertEqual(t1.size, comma.csv.stream.buffer_size_in_bytes / 12)
+        self.assertEqual(t1.size, comma.csv.stream.buffer_size_in_bytes // 12)
         t2 = comma.csv.stream(s, flush=True)
         self.assertEqual(t2.size, 1)
         t3 = comma.csv.stream(s, tied=tied)
-        self.assertEqual(t3.size, comma.csv.stream.buffer_size_in_bytes / 2)
+        self.assertEqual(t3.size, comma.csv.stream.buffer_size_in_bytes // 2)
 
     def test_ascii_simple_single_field(self):
         s = comma.csv.struct('x', 'f8')
diff --git a/python/comma/csv/time.py b/python/comma/csv/time.py
index 611cf6183..65000e66b 100644
--- a/python/comma/csv/time.py
+++ b/python/comma/csv/time.py
@@ -1,36 +1,10 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import absolute_import
 import numpy as np
 import re
 import os
+import sys
 import time
 
 UNIT = 'us'
@@ -40,6 +14,8 @@
 NOT_A_DATE_TIME = np.datetime64('NaT')
 POSITIVE_INFINITY = np.datetime64('294247-01-09T04:00:54.775807')
 NEGATIVE_INFINITY = np.datetime64('-290308-12-22T19:59:05.224191')
+BASESTRING = basestring if sys.version_info.major < 3 else str # sigh...
+NUMPY_VERSION_MAJOR_, NUMPY_VERSION_MINOR_, NUMPY_VERSION_PATCH_ = ( int( re.match( r'\d+', _ ).group() ) for _ in np.__version__.split( '.' )[:3] ) # take only the leading digits of the first three components, so that versions like '2.0.0rc1' or '1.13.0.dev0+abc' do not break the import
 
 def is_undefined(numpy_time): return str(numpy_time) == str(NOT_A_DATE_TIME)
 
@@ -50,6 +26,7 @@ def is_negative_infinity(numpy_time): return numpy_time == NEGATIVE_INFINITY
 def to_numpy(t):
     """
     return numpy datetime64 scalar corresponding to the given comma time string
+    if t has nanoseconds, it will be truncated (rather than rounded) to microseconds
 
     >>> import numpy as np
     >>> from comma.csv.time import to_numpy
@@ -62,10 +39,11 @@ def to_numpy(t):
     >>> to_numpy('')
     numpy.datetime64('NaT')
     """
+    if isinstance( t, bytes ): t = t.decode( 'utf-8' ) # quick and dirty: some numpy builds, e.g. numpy 1.13 from ubuntu 18.04 python3-numpy, pass bytes here; the former guard compared NUMPY_VERSION_MAJOR_ (not the minor version) with 14, so it was effectively 'numpy 1.x and bytes'; decoding any bytes input keeps that behaviour and also covers other numpy versions
     if t in ['', 'not-a-date-time']: return NOT_A_DATE_TIME
     if t in ['+infinity', '+inf', 'infinity', 'inf']: return POSITIVE_INFINITY
     if t in ['-infinity', '-inf']: return NEGATIVE_INFINITY
-    if not (isinstance(t, basestring) and re.match(r'^(\d{8}T\d{6}(\.\d{0,6})?)$', t)):
+    if not (isinstance(t, BASESTRING) and re.match(r'^(\d{8}T\d{6}(\.\d{0,12})?)$', t)):
         msg = "expected comma time, got '{}'".format(repr(t))
         raise TypeError(msg)
     v = list(t)
@@ -100,7 +78,9 @@ def from_numpy(t):
     if is_undefined(t): return 'not-a-date-time'
     if is_negative_infinity(t): return '-infinity'
     if is_positive_infinity(t): return '+infinity'
-    return re.sub(r'(\.0{6})?([-+]\d{4}|Z)?$', '', str(t)).translate(None, ':-')
+    s = re.sub(r'(\.0{6})?([-+]\d{4}|Z)?$', '', str(t))
+    #return re.sub(r'(\.0{6})?([-+]\d{4}|Z)?$', '', str(t)).translate(None, ':-')
+    return s.translate(str.maketrans('', '', ':-')) if sys.version_info.major > 2 else s.translate(None, ':-') # sigh... cannot believe i am doing this... (python 3 str.translate() needs a maketrans() table; python 2 takes the characters to delete directly)
 
 def ascii_converters(types):
     converters = {}
diff --git a/python/comma/dictionary/__init__.py b/python/comma/dictionary/__init__.py
new file mode 100644
index 000000000..4705183ed
--- /dev/null
+++ b/python/comma/dictionary/__init__.py
@@ -0,0 +1,3 @@
+# Copyright (c) 2023 Vsevolod Vlaskine
+
+from ._util import at, has, leaves, parents, set, update
diff --git a/python/comma/dictionary/_util.py b/python/comma/dictionary/_util.py
new file mode 100644
index 000000000..9bc5a69a5
--- /dev/null
+++ b/python/comma/dictionary/_util.py
@@ -0,0 +1,177 @@
+'''
+operations on dict and dict-like objects with string keys
+made for convenience, not for performance
+'''
+
+import copy, functools, os, sys, typing
+
+def at( d, path, delimiter = '/', no_throw = False, full = False ): # todo: default=...
+    '''
+    return value at a given path in a dictionary
+
+    params
+    ------
+        d: dictionary (or list, see the last example)
+        path: path in dictionary, e.g 'a/b/c/d'; list indices and slices go in brackets, e.g. 'a/b[1]/c'
+        delimiter: path delimiter
+        no_throw: if path not found, return None instead of throwing exception
+        full: output dictionary, not just the key value, see example below; not supported for bracketed indices
+        note: bracketed indices are evaluated with eval(); do not pass paths from untrusted sources
+
+    examples
+    --------
+        >>> d = { "a": { "b": { "c": 5, "d": 6 } }, "e": [ 7, [ 8, 9, 10 ] ] }
+        >>> comma.dictionary.at( d, "a/b/c" )
+        5
+        >>> comma.dictionary.at( d, "a/b/c", full = True )
+        { "a": { "b": { "c": 5 } } }
+        >>> comma.dictionary.at( d, 'e[0]' )
+        7
+        >>> comma.dictionary.at( d, 'e[1]' )
+        [ 8, 9, 10 ]
+        >>> comma.dictionary.at( d, 'e[1][2]' )
+        10
+        >>> comma.dictionary.at( d, 'e[1][1:]' )
+        [ 9, 10 ]
+        >>> e = [1, 2, {'a': 3} ]
+        >>> comma.dictionary.at( e, '[2]/a' )
+        3
+    '''
+    s = path.split( delimiter )
+    def _value( d, k ):
+        if not k:
+            if no_throw: return None
+            raise ValueError( f'"{path}" has an empty element; remove initial, trailing, or duplicated delimiters' )
+        n = k.split( '[', 1 ) # n[0]: key (empty for a bare index), n[1]: rest of the bracketed index, e.g. '1][2:]'
+        if len( n ) == 1: return None if no_throw and ( not isinstance( d, dict ) or not k in d ) else d[k]
+        if full:
+            if no_throw: return None
+            raise KeyError( f'on path "{path}": full=True not supported for array indices, since it cannot be done consistently' )
+        if no_throw:
+            try: return eval( f'd[{n[1]}' if n[0] == '' else f'd[n[0]][{n[1]}', { 'd': d, 'n': n } )
+            except: return None # any failure of the index expression counts as 'not found'
+        return eval( f'd[{n[1]}' if n[0] == '' else f'd[n[0]][{n[1]}', {'d': d, 'n': n} )
+    r = functools.reduce( lambda d, k: _value( d, k ), s, d )
+    return None if r is None else functools.reduce( lambda d, k: { k: d }, [ r ] + s[::-1] ) if full else r # full: re-wrap the value in its path keys, innermost first
+
+def has( d, path, delimiter = '/' ):
+    '''
+    return true if element at a given dictionary path exists
+    path may be a delimiter-separated string or a list of keys; only nested dicts are traversed
+    todo: support list indices
+
+    examples
+    --------
+        >>> d = { "a": { "b": { "c": 1, "d": 2, "e": [ 3, 4, { "f": 5 } ] } } }
+        >>> comma.dictionary.has( d, "a/b/c" )
+        True
+        >>> comma.dictionary.has( d, [ "a", "b", "c" ] )
+        True
+        >>> comma.dictionary.has( d, [ "a", "b", "x" ] )
+        False
+    '''
+    p = path.split( delimiter ) if isinstance( path, str ) else path # list of keys
+    return functools.reduce( lambda d, k: ( d[k[1]] if k[0] + 1 < len( p ) else True ) if isinstance( d, dict ) and k[1] in d else False, enumerate( p ), d )
+
+def leaves( d, path=None ):
+    '''
+    generator of the leaf items of a nested dictionary or list, yields path-value pairs
+    path: prefix of the yielded paths, passed down by the recursion; empty dicts and lists yield nothing
+    example
+    -------
+        >>> list( comma.dictionary.leaves( { "x": { "y": [ { "z": 0 }, {"w": 2 } ], "v": "hello" } } ) )
+        [('x/y[0]/z', 0), ('x/y[1]/w', 2), ('x/v', 'hello')]
+    '''
+    if path is None: path = ''
+    if isinstance( d, dict ):
+        for key, value in d.items(): yield from leaves( value, f'{path}/{key}' )
+    elif isinstance( d, list ):
+        for i, value in enumerate(d): yield from leaves( value, f'{path}[{i}]' )
+    else:
+        yield path[1:] if path and path[0] == '/' else path, d # drop the leading '/' added by the dict branch
+
+def parents( d, path, parent=None ):
+    '''
+    generator of parents of a given path, nearest parent first; iteration stops at '' or '/'
+    if parent is None, yields os.path.dirname() of path repeatedly; otherwise parent is a key name: if d has a value q
+    at <p>/<parent>, the parent of p is q[1:] when q starts with '/', else <dirname of p>/q; if absent: dirname of p
+    '''
+    p = path
+    while p not in [ '', '/' ]:
+        if parent is None:
+            p = os.path.dirname( p )
+        else:
+            q = at( d, f'{p}/{parent}', no_throw=True )
+            if q in [ '', '/' ]: break
+            if q is None: p = os.path.dirname( p )
+            else: p = q[1:] if q[0] == '/' else f'{os.path.dirname( p )}/{q}'
+        if p not in [ '', '/' ]: yield p[1:] if p[0] == '/' else p # quick and dirty
+
+def set( d, path, value, delimiter = '/' ):
+    '''
+    assign value to a nested dictionary/list element; d is modified in place and returned
+    missing intermediate dictionaries are created; lists are never created: a missing indexed key raises KeyError
+    examples
+    --------
+        >>> d = { "a": { "b": 1, "c": [ 2, 3 ], "d": { "e": 4 } } }
+        >>> comma.dictionary.set( d, 'a/c[1]', 5 )
+        { "a": { "b": 1, "c": [ 2, 5 ], "d": { "e": 4 } } }
+    '''
+    def _set( d, p ):
+        s = p[0].split( '[', 1 ) # s[0]: key (empty for a bare index), s[1]: rest of the bracketed index, e.g. '1][2:]'
+        if len( p ) == 1:
+            if len( s ) == 1: d[p[0]] = value
+            else: exec( f'd[{s[1]} = value' if s[0] == '' else f'd[k][{s[1]} = value', { 'd': d, 'k': s[0], 'value': value } ) # key is passed by name, so quotes in keys are safe
+        else:
+            if len( s ) == 1:
+                if not p[0] in d: d[p[0]] = {}
+                _set( d[p[0]], p[ 1: ] )
+            else:
+                if s[0] != '' and not s[0] in d: raise KeyError( f'on path {path}: {s[0]} not found' )
+                _set( eval( f'd[{s[1]}' if s[0] == '' else f'd[k][{s[1]}', { 'd': d, 'k': s[0] } ), p[1:]) # NOTE: index text is evaluated as python code; do not pass untrusted paths
+    _set( d, path.split( delimiter ) )
+    return d
+
+def update( d0, d, verbose=False ):
+    '''
+    nested update of d0 by values in d
+    d0 is modified in place and returned; lists are updated element by index, extra elements of d are appended
+    examples
+    --------
+        >>> import comma.dictionary
+        >>> comma.dictionary.update( { 'a': 1, 'b': 2, 'c': [3, 4, 5]}, { 'a': 6, 'c': [7, 8, 9, 10] } )
+        { 'a': 6, 'b': 2, 'c': [7, 8, 9, 10]}
+    '''
+    def _update_path( path, k, bracketed=False ): # returns a copy of path extended by key k, or by index [k] if bracketed
+        p = copy.deepcopy( path )
+        if bracketed:
+            if len( p ) == 0: p = [ f'[{k}]' ]
+            else: p[-1] = f'{p[-1]}[{k}]'
+        else: p.append( k )
+        return p
+
+    def _update_path_none( path, k, bracketed=False ): return path # non-verbose: no path bookkeeping
+
+    def _assign( _d0, k, v, path, _p ): # recurse if the current value is a dict or list, otherwise overwrite it
+        t = _d0[k]
+        if isinstance( t, typing.Dict ) or isinstance( t, typing.List ): _update( t, v, path, _p )
+        else: _d0[k] = v
+
+    def _update( _d0, _d, path, _p ):
+        if isinstance( _d0, typing.Dict ):
+            assert isinstance( _d, typing.Dict ), f'expected dictionary in d at {"/".join( path )}; got: type(_d)={type(_d)}'
+            for k, v in _d.items():
+                if k in _d0: _assign( _d0, k, v, _p( path, k ), _p )
+                else: _d0[k] = copy.deepcopy( v )
+        elif isinstance( _d0, typing.List ):
+            assert isinstance( _d, typing.List ), f'expected list in d at {"/".join( path )}; got: type(_d)={type(_d)}'
+            for i, v in enumerate( _d ):
+                if i < len( _d0 ): _assign( _d0, i, v, _p( path, i, True ), _p )
+                else: _d0.append( copy.deepcopy( v ) )
+        else: # reached only for the top-level d0: _assign() recurses only into dicts and lists
+            raise NotImplementedError( f'expected list or dictionary in d0 at {"/".join( path )}; got: type(d0)={type(d0)}' )
+
+    _p = _update_path if verbose else _update_path_none # verbose: track the path so that assertion messages can report it
+    _update( d0, d, [], _p )
+    return d0
diff --git a/python/comma/dictionary/test/test b/python/comma/dictionary/test/test
new file mode 100755
index 000000000..805e29f9b
--- /dev/null
+++ b/python/comma/dictionary/test/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+
+# runs pytest in the current directory and reports the result on stderr; todo! consolidate pytests
+name=$( basename "$0" )
+type -p pytest >/dev/null || { echo "$0: pytest not found; to install run: sudo apt install python3-pytest" >&2; exit 1; }
+pytest 1>&2 && echo "$name: succeeded" >&2 || { echo "$name: failed" >&2; exit 1; }
diff --git a/python/comma/dictionary/test/test_dictionary.py b/python/comma/dictionary/test/test_dictionary.py
new file mode 100644
index 000000000..05f2f0790
--- /dev/null
+++ b/python/comma/dictionary/test/test_dictionary.py
@@ -0,0 +1,131 @@
+import pytest
+from comma import dictionary
+
+def test_dictionary_at(): # at(): plain paths, custom delimiter, full=True, missing paths with and without no_throw, list indices and slices
+    d = { 'a': { 'b': { 'c': { 'd': 1, 'f': 2 }, 'g': 3 } }, 'p': [ 4, 5, { 'q': 6 } ], 'r': { 's': [ [ 7, 8 ] ] } }
+    assert dictionary.at( d, 'a/b/c' ) == { 'd': 1, 'f': 2 }
+    assert dictionary.at( d, 'a.b.c', delimiter = '.' ) == { 'd': 1, 'f': 2 }
+    assert dictionary.at( d, 'a/b/c/d' ) == 1
+    assert dictionary.at( d, 'a/b/g' ) == 3
+    assert dictionary.at( d, 'a', full = True ) == { 'a': { 'b': { 'c': { 'd': 1, 'f': 2 }, 'g': 3 } } }
+    assert dictionary.at( d, 'a/b', full = True ) == { 'a': { 'b': { 'c': { 'd': 1, 'f': 2 }, 'g': 3 } } }
+    assert dictionary.at( d, 'a/b/c', full = True ) == { 'a': { 'b': { 'c': { 'd': 1, 'f': 2 } } } }
+    assert dictionary.at( d, 'a/b/c/d', full = True ) == { 'a': { 'b': { 'c': { 'd': 1 } } } }
+    assert dictionary.at( d, 'a/b/g', full = True ) == { 'a': { 'b': { 'g': 3 } } }
+    with pytest.raises( KeyError ): dictionary.at( d, 'x' )
+    with pytest.raises( KeyError ): dictionary.at( d, 'x/y' )
+    with pytest.raises( KeyError ): dictionary.at( d, 'a/z' )
+    with pytest.raises( KeyError ): dictionary.at( d, 'a/b/c/e' )
+    with pytest.raises( TypeError ): dictionary.at( d, 'a/b/c/d/x' )
+    assert dictionary.at( d, 'x', no_throw = True ) is None
+    assert dictionary.at( d, 'a/x', no_throw = True ) is None
+    assert dictionary.at( d, 'a/b/x', no_throw = True ) is None
+    assert dictionary.at( d, 'a/b/c/x', no_throw = True ) is None
+    assert dictionary.at( d, 'a/b/c/d/x', no_throw = True ) is None
+    assert dictionary.at( d, 'p' ) == [ 4, 5, { 'q': 6 } ]
+    assert dictionary.at( d, 'p[0]' ) == 4
+    assert dictionary.at( d, 'p[1]' ) == 5
+    assert dictionary.at( d, 'p[2]' ) == { 'q': 6 }
+    assert dictionary.at( d, 'p[2]/q' ) == 6
+    assert dictionary.at( d, 'r' ) == { 's': [ [ 7, 8 ] ] }
+    assert dictionary.at( d, 'r/s' ) == [ [ 7, 8 ] ]
+    assert dictionary.at( d, 'r/s[0][0]' ) == 7
+    assert dictionary.at( d, 'r/s[0][1]' ) == 8
+    with pytest.raises( IndexError ): dictionary.at( d, 'r/s[0][2]' )
+    with pytest.raises( KeyError ): dictionary.at( d, 'r/s[0][2]', full = True )
+    assert dictionary.at( d, 'r/s[0][2]', full = True, no_throw = True ) is None
+    assert dictionary.at( { 'a': [11,22,33,44] }, 'a[1:3]' ) == [22, 33]
+    assert dictionary.at( { 'a': [11,22,33,44] }, 'a[1:]' ) == [22, 33, 44]
+    assert dictionary.at([11, 22, 33, 44], '[1:]') == [22, 33, 44]
+    assert dictionary.at([11, {'a': 22}, 33, 44], '[1]/a') == 22
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[1]') == 4
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[2]') == {'g': 6}
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[2]/g') == 6
+    assert dictionary.at({'a': {}, 'e': [3, 4, {'g': 6}]}, 'e[2]/g') == 6
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[0]', no_throw=True) == 3
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[2]', no_throw=True) == {'g': 6}
+    assert dictionary.at({'e': [3, 4, {'g': 6}]}, 'e[2]/g', no_throw=True) == 6
+
+def test_dictionary_has(): # has(): existing and missing dict paths; list indices are not supported yet
+    d = { 'a': { 'b': { 'c': { 'd': 1 } }, 'e': [ 2, { 'f': 3 } ] } }
+    assert dictionary.has( d, 'a/b/c' )
+    assert dictionary.has( d, 'a.b.c', delimiter = '.' )
+    assert dictionary.has( d, 'a/b/c/d' )
+    # assert dictionary.has( d, 'a/e' ) # todo: support arrays; note: the list is at a/e in d, not at a/b/e
+    # assert dictionary.has( d, 'a/e[0]' ) # todo: support arrays
+    # assert dictionary.has( d, 'a/e[1]' ) # todo: support arrays
+    # assert dictionary.has( d, 'a/e[1]/f' ) # todo: support arrays
+    assert not dictionary.has( d, 'x' )
+    assert not dictionary.has( d, 'x/y' )
+    assert not dictionary.has( d, 'a/z' )
+    assert not dictionary.has( d, 'a/b/c/e' )
+    assert not dictionary.has( d, 'a/b/c/d/x' )
+    assert not dictionary.has( d, 'a/b/c/d/x/y' )
+
+def test_dictionary_leaves(): # leaves(): flat and nested dicts and lists, a scalar, empty containers
+    assert list( dictionary.leaves( { 'a': 1, 'b': 2, 'c': 3 } ) ) == [ ( 'a', 1 ), ( 'b', 2 ), ( 'c', 3 ) ]
+    assert list( dictionary.leaves( ['a', 'b', 'c', 'd'] ) ) == [ ('[0]', 'a'), ('[1]', 'b'), ('[2]', 'c'), ('[3]', 'd') ]
+    assert list( dictionary.leaves( {'a': {'b': [0, 1]}, 'c': 2} ) ) == [('a/b[0]', 0), ('a/b[1]', 1), ('c', 2)]
+    assert list( dictionary.leaves( [ {'a': 0}, {'b': {'c':1, 'd': 2}} ] ) ) == [('[0]/a', 0), ('[1]/b/c', 1), ('[1]/b/d', 2)]
+    assert list( dictionary.leaves( { 'a': [ {'b': 0}, {'c': 1} ] } ) ) == [('a[0]/b', 0), ('a[1]/c', 1)]
+    assert list( dictionary.leaves( { 'a': { 'b': { 'c': 0 } } } ) ) == [ ( 'a/b/c', 0 ) ]
+    assert list( dictionary.leaves( 'a' ) ) == [ ( '', 'a' ) ]
+    assert list( dictionary.leaves( {} ) ) == []
+    assert list( dictionary.leaves( [] ) ) == []
+
+def test_dictionary_parents(): # parents(): dirname-based parents, then parents redirected through a 'parent' key
+    assert list( dictionary.parents( { 'a': { 'b': { 'c': {} } } }, 'a/b/c' ) ) == ['a/b', 'a']
+    assert list( dictionary.parents( { 'a': { 'b': [ 5, { 'c': 6 } ] } }, 'a/b[1]/c' ) ) == ['a/b[1]', 'a']
+    assert list( dictionary.parents( { 'a': { 'b': [ 5, { 'c': 6 } ] } }, 'a/b[1]/c', parent='parent' ) ) == ['a/b[1]', 'a']
+    with pytest.raises( KeyError ): dictionary.at( {}, 'a/b/c' ) # NOTE(review): exercises at(), not parents()
+    assert list( dictionary.parents( { 'a': { 'parent': 'd', 'b': [ 5, { 'c': { 'parent': '/a/b[0]' } } ], 'd': 3 } }, 'a/b[1]/c', parent='parent' ) ) == ['a/b[0]', 'a', 'd']
+
+def test_dictionary_set(): # set(): creating and overwriting nested keys, custom delimiter, list indices and slices
+    d = {}
+    dictionary.set( d, 'a/b/c', 5 )
+    assert dictionary.at( d, 'a/b/c' ) == 5
+    dictionary.set( d, 'a/b/c', 10 )
+    assert dictionary.at( d, 'a/b/c' ) == 10
+    dictionary.set( d, 'a.b.c', 15, delimiter = '.' )
+    assert dictionary.at( d, 'a/b/c' ) == 15
+    assert dictionary.set( {}, 'a.b.c', 15, delimiter = '.' ) == { 'a': { 'b': { 'c': 15 } } }
+    d = dictionary.set( {}, 'a.x.y', 3, delimiter = '.' )
+    assert dictionary.set( d, 'a.b.c', 15, delimiter = '.' ) == { 'a': { 'b': { 'c': 15 }, 'x': { 'y': 3 } } }
+    assert d == { 'a': { 'b': { 'c': 15 }, 'x': { 'y': 3 } } }
+    e = { 'a': [0,[11,22,33],{'b': 4},5,6,7] }
+    dictionary.set(e, 'a[0]', 5)
+    dictionary.set(e, 'a[3]', 55)
+    assert e['a'][0] == 5
+    assert e['a'][3] == 55
+    dictionary.set(e, 'a[1][1]', 777)
+    assert e['a'][1][1] == 777
+    dictionary.set(e, 'a[2]/b', 8) # NOTE(review): the result of this assignment is not asserted
+    dictionary.set(e, 'a[3:5]', [88,99])
+    assert e['a'][3:5] == [88,99]
+    f = [0,1,2,3,{'a': 4}]
+    dictionary.set(f, '[2:4]', [22,33])
+    assert f[2:4] == [22,33]
+    dictionary.set(f, '[4]/a', 44)
+    dictionary.set(f, '[4]/b', 55)
+    assert f[4] == {'a': 44, 'b': 55 }
+
+def test_dictionary_update(): # update(): dict into dict, list into list, and nested mixes of both
+    assert dictionary.update( {}, {} ) == {}
+    assert dictionary.update( { 'a': 1, 'b': 2 }, {} ) == { 'a': 1, 'b': 2 }
+    assert dictionary.update( { 'a': 1, 'b': 2 }, { 'c': 3 } ) == { 'a': 1, 'b': 2, 'c': 3 }
+    assert dictionary.update( { 'a': 1, 'b': 2 }, { 'c': 3, 'd': { 'e': 4 } } ) == { 'a': 1, 'b': 2, 'c': 3, 'd': { 'e': 4 } }
+    assert dictionary.update( {}, { 'c': 3 } ) == { 'c': 3 }
+    assert dictionary.update( {}, { 'c': 3, 'd': { 'e': 4 } } ) == { 'c': 3, 'd': { 'e': 4 } }
+    assert dictionary.update( { 'a': 1, 'b': 2 }, { 'a': 4, 'c': 3 } ) == { 'a': 4, 'b': 2, 'c': 3 }
+    assert dictionary.update( { 'a': 1, 'b': 2, 'd': { 'e': { 'f': 3 }, 'g': { 'h': 4 } } }, { 'd': { 'e': { 'f': 5 }, 'g': { 'h': 4 } } } ) == { 'a': 1, 'b': 2, 'd': { 'e': { 'f': 5 }, 'g': { 'h': 4 } } }
+    assert dictionary.update( [], [] ) == []
+    assert dictionary.update( [1, 2], [] ) == [1, 2]
+    assert dictionary.update( [1, 2], [3, 4, 5] ) == [3, 4, 5]
+    assert dictionary.update( [1, { 'a': 1, 'b': { 'c': 2 } }], [1, {}, 5] ) == [1, { 'a': 1, 'b': { 'c': 2 } }, 5]
+    assert dictionary.update( [1, { 'a': 1, 'b': { 'c': 2 } }], [1, { 'a': 4 }, 5] ) == [1, { 'a': 4, 'b': { 'c': 2 } }, 5]
+    assert dictionary.update( [1, { 'a': 1, 'b': { 'c': 2 } }], [1, { 'a': 4, 'b': { 'c': 6, 'd': 7 } }, 5] ) == [1, { 'a': 4, 'b': { 'c': 6, 'd': 7 } }, 5]
+    assert dictionary.update( [1, 2, [3, 4, 5]], [] ) == [1, 2, [3, 4, 5]]
+    assert dictionary.update( [], [1, 2, [3, 4, 5]] ) == [1, 2, [3, 4, 5]]
+    assert dictionary.update( [1, 2, [3, 4, 5]], [1, 2, [3, 4, 6, 7]] ) == [1, 2, [3, 4, 6, 7]]
+    assert dictionary.update( { 'a': 1, 'b': 2, 'c': [3, 4, 5]}, { 'a': 6, 'c': [7, 8, 9, 10] } ) == { 'a': 6, 'b': 2, 'c': [7, 8, 9, 10]}
+    # todo: more tests on corner cases, negative cases, etc
diff --git a/python/comma/filesystem/__init__.py b/python/comma/filesystem/__init__.py
new file mode 100644
index 000000000..bd07fc5c1
--- /dev/null
+++ b/python/comma/filesystem/__init__.py
@@ -0,0 +1 @@
+from ._impl import find, walk
\ No newline at end of file
diff --git a/python/comma/filesystem/_impl.py b/python/comma/filesystem/_impl.py
new file mode 100644
index 000000000..cd731e23f
--- /dev/null
+++ b/python/comma/filesystem/_impl.py
@@ -0,0 +1,35 @@
+# Copyright (c) 2024 Vsevolod Vlaskine
+
+import os
+
+# same as os.walk, plus: excluded drops entries whose directory basename is listed (their subdirectories are still walked); followmounts=False drops entries on mounts below dir
+def walk( dir, followlinks=False, followmounts=False, excluded=None ):
+    if excluded is None: excluded = []
+    real_root = os.path.realpath( dir )
+    def _valid( i ): # quick and dirty, excessive and inefficient for now
+        p = i[0]
+        if os.path.basename( p ) in excluded: return False
+        if followmounts: return True
+        p = os.path.realpath( i[0] )
+        while True: # climb from the entry towards the walk root, looking for a mount point in between
+            if p in ( '/', real_root ): return True # stop at the walk root: dir itself may be a mount or sit under one
+            if os.path.ismount( p ): return False
+            if p == '': return True
+            p = os.path.dirname( p )
+    return filter( _valid, os.walk( dir, followlinks=followlinks ) )
+
+def find( what, dirs, find_children=False ): # filters dirs (entries whose first element is a directory path, e.g. from walk()): keeps directories containing any name in what
+    if not isinstance( what, list ): what = [ what ]
+    def _valid( i ): # quick and dirty, inefficient for now
+        p = i[0]
+        if find_children: # also keep directories that have an ancestor containing any name in what
+            while True:
+                for q in what: # NOTE(review): for a relative path the last probe is '/<q>', since p is '' by then
+                    if os.path.exists( f'{p}/{q}' ): return True # if os.path.isfile( f'{p}/{what}' ) or os.path.isfile( f'{p}/test' ): return True
+                if p in ['', '/']: return False
+                p = os.path.dirname( p )
+        for q in what:
+            if os.path.exists( f'{p}/{q}' ): return True
+        return False
+    return filter( _valid, dirs )
+
diff --git a/python/comma/io/CMakeLists.txt b/python/comma/io/CMakeLists.txt
deleted file mode 100644
index e69de29bb..000000000
diff --git a/python/comma/io/__init__.py b/python/comma/io/__init__.py
index 9acc4e680..477c16ed9 100644
--- a/python/comma/io/__init__.py
+++ b/python/comma/io/__init__.py
@@ -27,4 +27,4 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .readlines_unbuffered import readlines_unbuffered
+from ._readlines_unbuffered import readlines_unbuffered
diff --git a/python/comma/io/readlines_unbuffered.py b/python/comma/io/_readlines_unbuffered.py
similarity index 93%
rename from python/comma/io/readlines_unbuffered.py
rename to python/comma/io/_readlines_unbuffered.py
index 5d34e1561..b8c158524 100644
--- a/python/comma/io/readlines_unbuffered.py
+++ b/python/comma/io/_readlines_unbuffered.py
@@ -28,8 +28,8 @@
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 import sys
-import itertools
-
+if sys.version_info.major < 3: from itertools import ifilter
+else: ifilter = filter # quick and dirty, tired of googling...
 
 def readlines_unbuffered(size, source=sys.stdin, skip_blank_lines=True):
     """
@@ -54,7 +54,7 @@ def readlines_unbuffered(size, source=sys.stdin, skip_blank_lines=True):
             number_of_lines += 1
         return lines
     if skip_blank_lines:
-        source_ = itertools.ifilter(lambda line: line.strip(), source)
+        source_ = list( ifilter(lambda line: line.strip(), source) )
     else:
         source_ = source
     return [line.rstrip('\n') for line in source_]
diff --git a/python/comma/io/windows_binary.py b/python/comma/io/windows_binary.py
index 0c56b0883..3123fc897 100644
--- a/python/comma/io/windows_binary.py
+++ b/python/comma/io/windows_binary.py
@@ -1,33 +1,4 @@
-#!/bin/python
-
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 __author__ = 'j.underwood'
 '''
@@ -35,10 +6,8 @@
 '''
 import sys
 
-
 # todo check this still allows ascii
 # todo if not, provide a function instead
 if sys.platform == "win32":
-        import os
-        import msvcrt
-        msvcrt.setmode(sys.stdout.fileno(), os.O_BINARY)
+    import os, msvcrt
+    msvcrt.setmode(sys.stdout.fileno(), os.O_BINARY)
diff --git a/python/comma/numpy/__init__.py b/python/comma/numpy/__init__.py
index fca93ccd7..8cc2cc9dd 100644
--- a/python/comma/numpy/__init__.py
+++ b/python/comma/numpy/__init__.py
@@ -27,4 +27,4 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .functions import *
+from ._functions import merge_arrays, strip_byte_order_prefix, shape_to_string, types_of_dtype, structured_dtype, type_to_string
diff --git a/python/comma/numpy/functions.py b/python/comma/numpy/_functions.py
similarity index 87%
rename from python/comma/numpy/functions.py
rename to python/comma/numpy/_functions.py
index 277e9c8a3..b0214c298 100644
--- a/python/comma/numpy/functions.py
+++ b/python/comma/numpy/_functions.py
@@ -28,9 +28,11 @@
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import absolute_import
+from __future__ import print_function
 import numpy as np
 import operator
 import re
+from functools import reduce
 
 
 def merge_arrays(first, second):
@@ -114,14 +116,14 @@ def types_of_dtype(dtype, unroll=False):
         return tuple(types)
     except ValueError:
         import sys
-        print >>sys.stderr
-        print >>sys.stderr, "ATTENTION: types_of_dtype failed due to the version of numpy on this computer"
-        print >>sys.stderr, "           your applications using comma.csv will mostly work; sometimes they will fail"
-        print >>sys.stderr, "           early (meaning you will know straight away) until types_of_dtype is rewritten"
-        print >>sys.stderr, "           See todo comment in python/comma/numpy/functions.py"
-        print >>sys.stderr
-        for s in sys.exc_info(): print >>sys.stderr, "           " + str( s )
-        print >>sys.stderr
+        print( file = sys.stderr )
+        print( "ATTENTION: types_of_dtype failed due to the version of numpy on this computer", file = sys.stderr )
+        print( "           your applications using comma.csv will mostly work; sometimes they will fail", file = sys.stderr )
+        print( "           early (meaning you will know straight away) until types_of_dtype is rewritten", file = sys.stderr )
+        print( "           See todo comment in python/comma/numpy/functions.py", file = sys.stderr )
+        print( file = sys.stderr )
+        for s in sys.exc_info(): print( "           " + str( s ), file = sys.stderr )
+        print( file = sys.stderr )
         raise
 
 def structured_dtype(format_or_type):
@@ -140,8 +142,7 @@ def structured_dtype(format_or_type):
     >>> np.dtype('f8').names
     """
     dtype = np.dtype(format_or_type)
-    if len(dtype) != 0:
-        return dtype
+    if len(dtype) != 0: return dtype
     return np.dtype([('', format_or_type)])
 
 
diff --git a/python/comma/numpy/test/test b/python/comma/numpy/test/test
index e4997a032..4ee19ed9c 100755
--- a/python/comma/numpy/test/test
+++ b/python/comma/numpy/test/test
@@ -3,5 +3,5 @@
 name=$( basename $0 )
 
 for t in test_*.py; do
-    python $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed" >&2; exit 1; }
+    python3 $t && echo "$name: $t succeeded" >&2 || { echo "$name: $t failed; see $name/output/stdout.log for details" >&2; exit 1; }
 done
diff --git a/python/comma/numpy/test/test_functions.py b/python/comma/numpy/test/test_functions.py
index 6a7f184fd..636b61a0e 100644
--- a/python/comma/numpy/test/test_functions.py
+++ b/python/comma/numpy/test/test_functions.py
@@ -1,3 +1,4 @@
+from __future__ import print_function
 import unittest
 import numpy as np
 from comma.numpy import *
@@ -161,50 +162,50 @@ def test_structure_out_of_order(self):
             itemsize = 43
 
             ndtype1 = np.dtype( dict( names=names1, formats=formats1, offsets=offsets1, itemsize=itemsize ) )
-            sorted_fields1 = sorted( list( ndtype1.fields.iteritems() ), key = lambda t: t[1] )
+            sorted_fields1 = sorted( list( ndtype1.fields.items() ), key = lambda t: t[1] )
 
             names2 = ['a3', 'word', 'a2', 'byte' ]
             formats2 = [np.dtype(('<f8', (3,))), np.dtype('uint16'), np.dtype(('<f8', (2,))), np.dtype('uint8') ]
             offsets2 = [2, 0, 27, 26 ]
 
             ndtype2 = np.dtype( dict( names=names2, formats=formats2, offsets=offsets2, itemsize=itemsize ) )
-            sorted_fields2 = sorted( list( ndtype2.fields.iteritems() ), key = lambda t: t[1] )
+            sorted_fields2 = sorted( list( ndtype2.fields.items() ), key = lambda t: t[1] )
 
             self.assertEqual( sorted_fields1, sorted_fields2 )
             self.assertEqual( len( ndtype1.descr ), 4 )
             self.assertEqual( len( ndtype2.descr ), 5 )  # shall be 4
-            self.assertEqual( len( functions.types_of_dtype( ndtype1 ) ), 4 )
-            self.assertEqual( len( functions.types_of_dtype( ndtype2 ) ), 5 )  # shall be 4
+            self.assertEqual( len( types_of_dtype( ndtype1 ) ), 4 )
+            self.assertEqual( len( types_of_dtype( ndtype2 ) ), 5 )  # shall be 4
         except ValueError:
             import sys
-            print >>sys.stderr
-            print >>sys.stderr, "ATTENTION: test_structure_out_of_order failed due to the version of numpy on this computer"
-            print >>sys.stderr, "           your applications using comma.csv will mostly work; sometimes they will fail"
-            print >>sys.stderr, "           early (meaning you will know straight away) until types_of_dtype is rewritten"
-            print >>sys.stderr, "           See todo comment in python/comma/numpy/functions.py"
-            print >>sys.stderr
-            for s in sys.exc_info(): print >>sys.stderr, "           " + str( s )
-            print >>sys.stderr
+            print( file = sys.stderr )
+            print( "ATTENTION: test_structure_out_of_order failed due to the version of numpy on this computer", file = sys.stderr )
+            print( "           your applications using comma.csv will mostly work; sometimes they will fail", file = sys.stderr )
+            print( "           early (meaning you will know straight away) until types_of_dtype is rewritten", file = sys.stderr )
+            print( "           See todo comment in python/comma/numpy/functions.py", file = sys.stderr )
+            print( file = sys.stderr )
+            for s in sys.exc_info(): print( "           " + str( s ), file = sys.stderr )
+            print( file = sys.stderr )
 
         if False:
             import sys
             self.assertEqual( sorted( ndtype1.descr ), sorted( ndtype2.descr ) )
             self.assertEqual( sorted( functions.types_of_dtype( ndtype1 ) ), sorted( functions.types_of_dtype( ndtype2 ) ) )
 
-            print >>sys.stderr, "observe the differences:"
+            print( "observe the differences:", file = sys.stderr )
 
-            print >>sys.stderr, "ndtype1: ", ndtype1
-            print >>sys.stderr, "ndtype2: ", ndtype2
+            print( "ndtype1: " + str( ndtype1 ), file = sys.stderr )
+            print( "ndtype2: " + str( ndtype2 ), file = sys.stderr )
 
-            print >>sys.stderr, "ndtype1.fields: ", ndtype1.fields
-            print >>sys.stderr, "ndtype2.fields: ", ndtype2.fields
-            print >>sys.stderr, "fields identical: ", sorted_fields1 == sorted_fields2
+            print( "ndtype1.fields: " + str( ndtype1.fields ), file = sys.stderr )
+            print( "ndtype2.fields: " + str( ndtype2.fields ), file = sys.stderr )
+            print( "fields identical: " + str( sorted_fields1 == sorted_fields2 ), file = sys.stderr )
 
-            print >>sys.stderr, "ndtype1.descr: ", ndtype1.descr
-            print >>sys.stderr, "ndtype2.descr: ", ndtype2.descr
+            print( "ndtype1.descr: " + str( ndtype1.descr ), file = sys.stderr )
+            print( "ndtype2.descr: " + str( ndtype2.descr ), file = sys.stderr )
 
-            print >>sys.stderr, "types_of_dtype( ndtype1 ): ", comma.numpy.functions.types_of_dtype( ndtype1 )
-            print >>sys.stderr, "types_of_dtype( ndtype2 ): ", comma.numpy.functions.types_of_dtype( ndtype2 )
+            print( "types_of_dtype( ndtype1 ): " + str( comma.numpy.functions.types_of_dtype( ndtype1 ) ), file = sys.stderr )
+            print( "types_of_dtype( ndtype2 ): " + str( comma.numpy.functions.types_of_dtype( ndtype2 ) ), file = sys.stderr )
 
 
 if __name__ == '__main__':
diff --git a/python/comma/signal/__init__.py b/python/comma/signal/__init__.py
index c2a318e96..af8770deb 100644
--- a/python/comma/signal/__init__.py
+++ b/python/comma/signal/__init__.py
@@ -27,4 +27,4 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .signal import is_shutdown
+from ._signal import is_shutdown
diff --git a/python/comma/signal/signal.py b/python/comma/signal/_signal.py
similarity index 88%
rename from python/comma/signal/signal.py
rename to python/comma/signal/_signal.py
index 209ba511c..9612127e6 100644
--- a/python/comma/signal/signal.py
+++ b/python/comma/signal/_signal.py
@@ -28,6 +28,7 @@
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 from __future__ import absolute_import
+from __future__ import print_function
 import signal
 import sys
 import os
@@ -42,8 +43,10 @@ def __init__( self, verbose = False ):
 
     def switch_on( self, signum, frame ):
         self.state = True
-        if self.verbose: print >> sys.stderr, os.path.basename(sys.argv[0]), "caught signal:", signum
+        if self.verbose: print( os.path.basename( sys.argv[0] ), ": caught signal:", signum, file = sys.stderr )
 
-    def __nonzero__( self ): return self.state
+    def __bool__( self ): return self.state
 
-signal.signal( signal.SIGPIPE, signal.SIG_DFL )
+    __nonzero__ = __bool__
+
+# signal.signal( signal.SIGPIPE, signal.SIG_DFL )
diff --git a/python/comma/test/performance/csv/calc/max/data/max b/python/comma/test/performance/csv/calc/max/data/max
index 43b7f6ca1..d89e0dd60 100755
--- a/python/comma/test/performance/csv/calc/max/data/max
+++ b/python/comma/test/performance/csv/calc/max/data/max
@@ -1,4 +1,4 @@
-#!/usr/bin/python
+#!/usr/bin/env python3
 import numpy as np
 import comma
 t = comma.csv.struct( 'id,value', 'u4', 'f8' )
@@ -11,4 +11,3 @@ for data in s:
             continue
         max[id] = current_max
-s.write(np.array(max.items(), dtype=t))
-
+s.write(np.array(list(max.items()), dtype=t))
diff --git a/python/comma/test/performance/csv/calc/test b/python/comma/test/performance/csv/calc/test
index 0d1c6cebe..230e6d433 100755
--- a/python/comma/test/performance/csv/calc/test
+++ b/python/comma/test/performance/csv/calc/test
@@ -4,7 +4,7 @@ function generate_uniform_input
 {
     local size=$1
     local number_of_ids=100
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import numpy as np
 import comma
 t = comma.csv.struct('id,value', 'u4', 'f8')
@@ -23,7 +23,7 @@ END
 function generate_random_input
 {
     local size=$1
-    python -c "$( cat <<END
+    python3 -c "$( cat <<END
 import numpy as np
 import comma
 t = comma.csv.struct('id,value', 'u4', 'f8')
@@ -71,4 +71,3 @@ python_script=$( pwd )/$python_script
 
 ( mkdir -p output/random && cd output/random && process random )
 ( mkdir -p output/uniform && cd output/uniform && process uniform )
-
diff --git a/python/comma/test/performance/csv/stream/test b/python/comma/test/performance/csv/stream/test
index 36f0c29d3..36d9494a5 100755
--- a/python/comma/test/performance/csv/stream/test
+++ b/python/comma/test/performance/csv/stream/test
@@ -11,7 +11,7 @@ function output_code
         *) echo "$scriptname: expected --ascii or --binary, got '$1'"; exit 1 ;;
     esac
 cat <<END
-#!/usr/bin/python
+#!/usr/bin/env python3
 
 import comma
 comma.csv.time.zone( 'UTC' )
diff --git a/python/comma/util/CMakeLists.txt b/python/comma/util/CMakeLists.txt
deleted file mode 100644
index e69de29bb..000000000
diff --git a/python/comma/util/__init__.py b/python/comma/util/__init__.py
index 000e7ad61..3d4c43554 100644
--- a/python/comma/util/__init__.py
+++ b/python/comma/util/__init__.py
@@ -27,5 +27,5 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-from .help_formatter import argparse_fmt
-from .warning import warning
\ No newline at end of file
+from ._help_formatter import argparse_fmt
+from ._warning import warning
\ No newline at end of file
diff --git a/python/comma/util/help_formatter.py b/python/comma/util/_help_formatter.py
similarity index 100%
rename from python/comma/util/help_formatter.py
rename to python/comma/util/_help_formatter.py
diff --git a/python/comma/util/warning.py b/python/comma/util/_warning.py
similarity index 100%
rename from python/comma/util/warning.py
rename to python/comma/util/_warning.py
diff --git a/python/comma/version.py b/python/comma/version.py
index be136aaf5..3d27eb5f0 100644
--- a/python/comma/version.py
+++ b/python/comma/version.py
@@ -1,31 +1,4 @@
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 # if you change this file, check that it still works with ../setup.py, which gets the comma version by reading this file
-__version__ = "1.0"
+__version__ = "1.2.1"
diff --git a/python/requirements.txt b/python/requirements.txt
new file mode 100644
index 000000000..24ce15ab7
--- /dev/null
+++ b/python/requirements.txt
@@ -0,0 +1 @@
+numpy
diff --git a/python/setup.py b/python/setup.py
index eaf1d4e55..647559a2d 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -1,14 +1,43 @@
-#!/usr/bin/env python
+#!/usr/bin/env python3
 
-from distutils.core import setup
+import os
+import setuptools #from distutils.core import setup
+import comma.version
 
-setup(
-        name                = 'comma',
-        version             = open('comma/version.py').readlines()[-1].strip().split()[-1].strip('\"'),
-        description         = 'comma python utilties',
-        url                 = 'https://github.com/acfr/comma',
+# https://realpython.com/pypi-publish-python-package/
+
+# README.md sits next to this script; locate it through the absolute path of __file__, since __file__
+# may be a bare relative 'setup.py' (python < 3.9, direct invocation) and may not use '/' as separator
+with open( os.path.join( os.path.dirname( os.path.abspath( __file__ ) ), 'README.md' ), encoding = 'utf-8' ) as readme:
+    long_description = readme.read()
+
+setuptools.setup(
+        name                = 'comma-py', # quick and dirty to make python packaging work
+        version             = comma.version.__version__,
+        classifiers = [
+          'Environment :: Console',
+          'Intended Audience :: End Users/Desktop',
+          'Intended Audience :: Developers',
+          'License :: OSI Approved :: BSD License',
+          'Operating System :: MacOS :: MacOS X',
+          'Operating System :: Microsoft :: Windows',
+          'Operating System :: POSIX',
+          'Programming Language :: Python :: 3',
+          'Topic :: Utilities'
+        ],
+        description         = 'csv and fixed-width binary python utilities',
+        url                 = 'https://gitlab.com/orthographic/comma',
         license             = 'BSD 3-Clause',
-        packages            = [ 'comma', 'comma.csv', 'comma.csv.applications', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
-        package_dir         = { 'comma.cpp_bindings': 'comma/cpp_bindings' },
-        package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] }
+        long_description    = long_description,
+        long_description_content_type = "text/markdown",
+        author              = "vsevolod vlaskine",
+        author_email        = "vsevolod.vlaskine@gmail.com",
+        maintainer          = 'vsevolod vlaskine',
+        maintainer_email    = 'vsevolod.vlaskine@gmail.com',
+        python_requires     = '>=3.6',
+        #install_requires    = [ 'numpy' ], # todo? does it need to be uncommented for packaging
+        packages            = [ 'comma', 'comma.containers', 'comma.containers.multidimensional', 'comma.csv', 'comma.csv.applications', 'comma.dictionary', 'comma.filesystem', 'comma.io', 'comma.numpy', 'comma.signal', 'comma.util', 'comma.cpp_bindings', 'comma.application' ],
+        package_dir         = { 'comma': 'comma', 'comma.cpp_bindings': 'comma/cpp_bindings' },
+        package_data        = { 'comma.cpp_bindings': [ '*.so', '*.dll' ] },
+        entry_points        = { 'console_scripts': ['csv-eval=comma.csv.applications.csv_eval:main'] } #scripts             = [ "comma/csv/applications/csv-eval" ]
      )
diff --git a/string/choice.h b/string/choice.h
new file mode 100644
index 000000000..45f19e852
--- /dev/null
+++ b/string/choice.h
@@ -0,0 +1,81 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+#pragma once
+
+#include <string>
+#include <vector>
+#include "../base/exception.h"
+#include "string.h"
+
+namespace comma { namespace strings {
+
+/// string that is checked against a fixed list of values on assignment and converts to the matching enum value
+///
+/// Derived is expected to provide:
+///     - Derived::values: an enum type
+///     - static Derived::choices(): an indexable, iterable container of strings,
+///       in which the string at index i corresponds to the enum value i
+template < typename Derived, typename Base = std::string >
+struct choice: public Base
+{
+    typedef Base base_t;
+    /// construct from enum value, by default from enum value 0; rhs is used as index in Derived::choices() without range check
+    choice( typename Derived::values rhs = static_cast< typename Derived::values >( 0 ) ): Base( Derived::choices()[static_cast< unsigned int >( rhs )] ) {}
+    /// construct from string; rhs is checked with assert_valid()
+    choice( const std::string& rhs ) { operator=( rhs ); }
+    /// assign string; rhs is checked with assert_valid() before the assignment
+    choice& operator=( const std::string& rhs ) { assert_valid( rhs ); Base::operator=( rhs ); return *this; }
+    /// @return enum value corresponding to the current string
+    typename Derived::values to_enum() const;
+    /// @return true, if rhs equals one of Derived::choices()
+    static bool valid( const std::string& rhs );
+    /// fail on COMMA_ASSERT, if rhs is not one of Derived::choices()
+    static void assert_valid( const std::string& rhs );
+    bool valid() const { return valid( std::string( *this ) ); } // quick and dirty for now
+    void assert_valid() const { assert_valid( std::string( *this ) ); } // quick and dirty for now
+    operator typename Derived::values() const { return to_enum(); }
+};
+
+/// @return enum value whose integer value is the index of name in choices; COMMA_THROW, if name is not in choices
+template < typename Enum >
+Enum make_choice( const std::string& name, const std::vector< std::string >& choices ); // convenience function, quick and dirty for now
+
+namespace impl {
+
+/// linear search: index of the first element of choices equal to name, cast to Enum
+template < typename Enum, typename T, typename V >
+inline Enum make_choice( const T& name, const V& choices ) // quick and dirty for now
+{
+    unsigned int i = 0;
+    for( const auto& c: choices ) { if( name == c ) { return static_cast< Enum >( i ); } ++i; }
+    COMMA_THROW( comma::exception, "could not convert to enum value: '" << name << "'" ); // in theory never here
+}
+
+} // namespace impl {
+
+template < typename Enum >
+inline Enum make_choice( const std::string& name, const std::vector< std::string >& choices )
+{
+    return impl::make_choice< Enum >( name, choices );
+}
+
+template < typename Derived, typename Base >
+inline typename Derived::values choice< Derived, Base >::to_enum() const
+{
+    return impl::make_choice< typename Derived::values >( static_cast< const Base& >( *this ), Derived::choices() );
+}
+
+template < typename Derived, typename Base >
+inline bool choice< Derived, Base >::valid( const std::string& rhs )
+{
+    for( const auto& c: Derived::choices() ) { if( rhs == c ) { return true; } }
+    return false;
+}
+
+template < typename Derived, typename Base >
+inline void choice< Derived, Base >::assert_valid( const std::string& rhs )
+{
+    COMMA_ASSERT( valid( rhs ), "expected one of: " << comma::join( Derived::choices(), ',' ) << "; got: '" << rhs << "'" );
+}
+
+} } // namespace comma { namespace strings {
diff --git a/string/split.cpp b/string/split.cpp
index ed00ae1ee..71ca2d7af 100644
--- a/string/split.cpp
+++ b/string/split.cpp
@@ -1,39 +1,9 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 /// @author mathew hounsell
 
 #include <boost/optional.hpp>
-
-// Don't use <> foc comma as that requires the code to be installed first.
 #include "../base/exception.h"
 #include "split.h"
 
@@ -45,26 +15,73 @@ bool string::is_one_of( char c, const char * characters )
     return false;
 }
 
-std::vector< std::string > split( const std::string & s, const char * separators )
+static std::vector< std::string > split_impl( const std::string & s, const char * separators, bool empty_if_empty_input, unsigned int size, bool head ) // size: maximum number of tokens, 0 for no limit; head: which end of s is split when the limit applies
 {
     std::vector< std::string > v;
+    if( empty_if_empty_input && s.empty() ) { return v; } // otherwise empty input yields a single empty token
     const char* begin( &s[0] );
     const char* end( begin + s.length() );
     v.push_back( std::string() );
     for( const char* p = begin; p < end; ++p )
     {
         if( string::is_one_of( *p, separators ) )
+        {
             v.push_back( std::string() );
+        }
         else
+        {
             v.back() += *p;
+        }
     }
-    return v;
+    if( size == 0 || v.size() <= size ) { return v; } // no limit or limit not exceeded: return all the tokens
+    std::vector< std::string > r( size );
+    if( head ) // quick and dirty for now; keep the first tokens as they are, the last output token gets the unsplit remainder of s
+    {
+        unsigned int sum{0}; // offset in s right after the separator that follows token i
+        for( unsigned int i = 0; i < size; ++i ) { r[i] = v[i]; sum += v[i].size() + 1; }
+        r.back() += std::string( s.substr( sum - 1 ) ); // sum - 1: position of the separator after token size - 1; separators in the remainder are preserved
+    }
+    else // the first output token gets the unsplit beginning of s, followed by the last size - 1 tokens as they are
+    {
+        unsigned int sum{0}, k{0}; // sum: offset in s as above; k: number of leading tokens merged into r[0]
+        for( unsigned int i = 0; i < v.size() - size + 1; ++i ) { sum += v[i].size() + 1; ++k; }
+        r[0] = s.substr( 0, sum - 1 ); // up to, but excluding the separator after the last merged token
+        for( unsigned int i = 1; i < size; ++i ) { r[i] = v[k + i - 1]; }
+    }
+    return r;
+}
+
+std::vector< std::string > split( const std::string & s, const char * separators, bool empty_if_empty_input )
+{
+    return split_impl( s, separators, empty_if_empty_input, 0, true ); 
+}
+
+std::vector< std::string > split( const std::string & s, char separator, bool empty_if_empty_input )
+{
+    const char separators[] = { separator, 0 };
+    return split( s, separators, empty_if_empty_input );
+}
+
+std::vector< std::string > split_head( const std::string& s, unsigned int size, const char* separators, bool empty_if_empty_input )
+{
+    return split_impl( s, separators, empty_if_empty_input, size, true ); 
+}
+
+std::vector< std::string > split_head( const std::string& s, unsigned int size, char separator, bool empty_if_empty_input )
+{
+    const char separators[] = { separator, 0 };
+    return split_head( s, size, separators, empty_if_empty_input );
+}
+
+std::vector< std::string > split_tail( const std::string& s, unsigned int size, const char* separators, bool empty_if_empty_input )
+{
+    return split_impl( s, separators, empty_if_empty_input, size, false ); 
 }
 
-std::vector< std::string > split( const std::string & s, char separator )
+std::vector< std::string > split_tail( const std::string& s, unsigned int size, char separator, bool empty_if_empty_input )
 {
     const char separators[] = { separator, 0 };
-    return split( s, separators );
+    return split_tail( s, size, separators, empty_if_empty_input );
 }
 
 std::vector< std::string > split_escaped( const std::string & s, const char * separators, const char * quotes, char escape )
@@ -72,7 +89,7 @@ std::vector< std::string > split_escaped( const std::string & s, const char * se
     std::vector< std::string > v;
     const char* begin( &s[0] );
     const char* const end( begin + s.length() );
-    boost::optional<char> quoted;
+    boost::optional< char > quoted;
     v.push_back( std::string() );
     for( const char* p = begin; p < end; ++p )
     {
@@ -110,4 +127,56 @@ std::vector< std::string > split_escaped( const std::string & s, char separator,
     return split_escaped( s, separators, quotes, escape );
 }
 
+/// split s on separators, ignoring separators enclosed in lbracket/rbracket pairs (brackets may nest)
+///
+/// if strip_brackets is true, the outermost pair of brackets is removed from each token, while
+/// nested brackets are kept; an outermost opening bracket then has to be the first character of its token
+/// @throw comma::exception, if strip_brackets is true and an outermost opening bracket does not start a token
+/// @note unbalanced brackets are not reported: a closing bracket without a matching opening one
+///       leaves the nesting depth at zero, and an unclosed opening bracket protects the rest of s from splitting
+std::vector< std::string > split_bracketed( const std::string& s, const char* separators, char lbracket, char rbracket, bool strip_brackets )
+{
+    std::vector< std::string > v;
+    const char* begin( &s[0] );
+    const char* const end( begin + s.length() );
+    unsigned int depth = 0; // current bracket nesting depth
+    v.push_back( std::string() );
+    for( const char* p = begin; p < end; ++p )
+    {
+        if( lbracket == *p )
+        {
+            if( strip_brackets && depth == 0 )
+            {
+                if( !v.back().empty() ) { COMMA_THROW( comma::exception, "asked to strip brackets; expected opening bracket immediately following separator, got '" << s << "'" ); }
+            }
+            else
+            {
+                v.back() += *p;
+            }
+            ++depth;
+        }
+        else if( rbracket == *p )
+        {
+            if( !strip_brackets || depth > 1 ) { v.back() += *p; } // outermost closing bracket is dropped when stripping
+            if( depth > 0 ) { --depth; }
+        }
+        else if( depth == 0 && string::is_one_of( *p, separators ) )
+        {
+            v.push_back( std::string() );
+        }
+        else
+        {
+            v.back() += *p;
+        }
+    }
+    return v;
+}
+
+std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket, char rbracket, bool strip_brackets )
+{
+    const char separators[] = { separator, 0 };
+    return split_bracketed( s, separators, lbracket, rbracket, strip_brackets );
+}
+
+
 } // namespace comma {
diff --git a/string/split.h b/string/split.h
index bdfe94722..629e5645e 100644
--- a/string/split.h
+++ b/string/split.h
@@ -1,53 +1,45 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_STRING_SPLIT_H_
-#define COMMA_STRING_SPLIT_H_
+#pragma once
 
+#include <array>
 #include <string>
 #include <vector>
+#include <boost/array.hpp>
+#include <boost/lexical_cast.hpp>
+#include <boost/optional.hpp>
 
 namespace comma {
 
 namespace string {
-    // Used for escaping / unescaping to maybe find a character in a list of specials
-    bool is_one_of( char c, const char * characters );
-}
 
-/// split string into tokens (a quick implementation); always contains at least one element
-std::vector< std::string > split( const std::string& s, const char* separators = " " );
+bool is_one_of( char c, const char* characters );
+
+} // namespace string {
 
-/// split string into tokens (a quick implementation); always contains at least one element
-std::vector< std::string > split( const std::string& s, char separator );
+/// split string into tokens (a quick implementation); always contains at least one element unless empty_if_empty_input is true
+std::vector< std::string > split( const std::string& s, const char* separators = " ", bool empty_if_empty_input = false );
+std::vector< std::string > split( const std::string& s, char separator, bool empty_if_empty_input = false );
+/// split to up to <size> elements starting from the start of the string
+std::vector< std::string > split_head( const std::string& s, unsigned int size, const char* separators = " ", bool empty_if_empty_input = false );
+std::vector< std::string > split_head( const std::string& s, unsigned int size, char separator, bool empty_if_empty_input = false );
+/// split to up to <size> elements starting from the end of the string
+std::vector< std::string > split_tail( const std::string& s, unsigned int size, const char* separators = " ", bool empty_if_empty_input = false );
+std::vector< std::string > split_tail( const std::string& s, unsigned int size, char separator, bool empty_if_empty_input = false );
+
+/// split string into tokens and cast to a vector of given types
+template < typename T > std::vector< T > split_as( const std::string& s, const char* separators );
+template < typename T > std::vector< T > split_as( const std::string& s, const char* separators, const T& default_value );
+template < typename T > std::vector< T > split_as( const std::string& s, char separator );
+template < typename T > std::vector< T > split_as( const std::string& s, char separator, const T& default_value );
+template < typename T > std::vector< T > split_as( const std::string& s, const char* separators, const std::vector< T >& defaults ); // todo: re-implement using traits
+template < typename T > std::vector< T > split_as( const std::string& s, char separator, const std::vector< T >& defaults );
+template < typename T, std::size_t N > std::vector< T > split_as( const std::string& s, const char* separators, const std::array< T, N >& defaults );
+template < typename T, std::size_t N > std::vector< T > split_as( const std::string& s, char separator, const std::array< T, N >& defaults );
+template < typename T, std::size_t N > std::vector< T > split_as( const std::string& s, const char* separators, const boost::array< T, N >& defaults );
+template < typename T, std::size_t N > std::vector< T > split_as( const std::string& s, char separator, const boost::array< T, N >& defaults );
 
 /// Split string into tokens; always contains at least one element;
 /// skips backslash escaped separator, handle non-nested quotes;
@@ -58,17 +50,70 @@ std::vector< std::string > split( const std::string& s, char separator );
 /// An escape character will only escape a delimiter, quote or escape character;
 /// escaping any other character will result in both being kept;
 /// e.g. c:\windows\ will be kept as c:\windows\ with the trailing backslash
-/// e.g. fname;delimiter=\\;field=a,b will be kept as fname;delimiter=\;field=a,b 
+/// e.g. filename;delimiter=\\;fields=a,b will be kept as filename;delimiter=\;fields=a,b
 ///
 /// A quote may be anywhere in a string. Quotes must be closed; i.e Each start
 /// quote must be paired with an end quote, or an exception is thrown.
 /// Quotes don't nest and can not be mixed; e.g. a ' will not close a " quoted string.
 /// However "'" and '"' are perfectly legal strings of ' and "
-std::vector< std::string > split_escaped( const std::string & s, const char * separators = " ", const char * quotes = "\"\'", char escape = '\\' );
+std::vector< std::string > split_escaped( const std::string& s, const char * separators = " ", const char * quotes = "\"\'", char escape = '\\' );
 /// split string into tokens; always contains at least one element;
-/// skips backslash escaped seperator, handle boolean quotes 
-std::vector< std::string > split_escaped( const std::string & s, char separator, const char * quotes = "\"\'", char escape = '\\' );
+/// skips backslash escaped separator, handle boolean quotes
+std::vector< std::string > split_escaped( const std::string& s, char separator, const char * quotes = "\"\'", char escape = '\\' );
+/// split string into tokens; separators enclosed in lbracket/rbracket pairs do not split; if strip_brackets is true, the outermost brackets are removed from the tokens
+std::vector< std::string > split_bracketed( const std::string& s, const char * separators = " ", char lbracket = '(', char rbracket = ')', bool strip_brackets = true );
+/// same as split_bracketed() above, with a single separator character
+std::vector< std::string > split_bracketed( const std::string& s, char separator, char lbracket = '(', char rbracket = ')', bool strip_brackets = true );
 
-} // namespace comma {
+namespace impl {
+
+template < typename T >
+inline std::vector< T > split_with_scalar_default( const std::string& s, const char* separators, const boost::optional< T >& default_value )
+{
+    const auto& v = split( s, separators, true );
+    std::vector< T > t( v.size() );
+    for( unsigned int i = 0; i < v.size(); ++i ) { t[i] = v[i].empty() && default_value ? *default_value : boost::lexical_cast< T >( v[i] ); }
+    return t;
+}
+
+template < typename T, typename V > inline std::vector< T > split_as( const std::string& s, const char* separators, const V& defaults )
+{
+    const auto& v = split( s, separators, true );
+    std::vector< T > t( v.size() < defaults.size() ? defaults.size() : v.size() );
+    for( unsigned int i = 0; i < v.size(); ++i ) { t[i] = v[i].empty() && defaults.size() > i ? defaults[i] : boost::lexical_cast< T >( v[i] ); }
+    for( unsigned int i = v.size(); i < defaults.size(); ++i ) { t[i] = defaults[i]; }
+    return t;
+}
+
+template < typename T, typename V > inline std::vector< T > split_as( const std::string& s, char separator, const V& defaults )
+{
+    const char separators[] = { separator, 0 };
+    return split_as< T >( s, &separators[0], defaults );
+}
+
+} // namespace impl {
+
+template < typename T > inline std::vector< T > split_as( const std::string& s, const char* separators ) { return impl::split_with_scalar_default( s, separators, boost::optional< T >() ); }
+/// empty tokens are replaced with default_value; default_value is wrapped explicitly, since T cannot be deduced from T for a boost::optional< T > parameter
+template < typename T > inline std::vector< T > split_as( const std::string& s, const char* separators, const T& default_value ) { return impl::split_with_scalar_default( s, separators, boost::optional< T >( default_value ) ); }
+
+template < typename T > inline std::vector< T > split_as( const std::string& s, char separator )
+{
+    const char separators[] = { separator, 0 };
+    return impl::split_with_scalar_default( s, &separators[0], boost::optional< T >() );
+}
+
+template < typename T > inline std::vector< T > split_as( const std::string& s, char separator, const T& default_value )
+{
+    const char separators[] = { separator, 0 };
+    return impl::split_with_scalar_default( s, &separators[0], boost::optional< T >( default_value ) );
+}
 
-#endif // COMMA_STRING_SPLIT_H_
+template < typename T > inline std::vector< T > split_as( const std::string& s, const char* separators, const std::vector< T >& defaults ) { return impl::split_as< T >( s, separators, defaults ); }
+template < typename T > inline std::vector< T > split_as( const std::string& s, char separator, const std::vector< T >& defaults ) { return impl::split_as< T >( s, separator, defaults ); }
+template < typename T, std::size_t N > inline std::vector< T > split_as( const std::string& s, const char* separators, const std::array< T, N >& defaults ) { return impl::split_as< T >( s, separators, defaults ); }
+template < typename T, std::size_t N > inline std::vector< T > split_as( const std::string& s, char separator, const std::array< T, N >& defaults ) { return impl::split_as< T >( s, separator, defaults ); }
+template < typename T, std::size_t N > inline std::vector< T > split_as( const std::string& s, const char* separators, const boost::array< T, N >& defaults ) { return impl::split_as< T >( s, separators, defaults ); }
+template < typename T, std::size_t N > inline std::vector< T > split_as( const std::string& s, char separator, const boost::array< T, N >& defaults ) { return impl::split_as< T >( s, separator, defaults ); }
+
+} // namespace comma {
diff --git a/string/string.cpp b/string/string.cpp
index c8229b4e4..d75bb7ecc 100644
--- a/string/string.cpp
+++ b/string/string.cpp
@@ -1,39 +1,10 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 /// @author mathew hounsell
 
+#include <iostream>
 #include <boost/optional.hpp>
-
-// Don't use <> foc comma as that requires the code to be installed first.
 #include "../base/exception.h"
 #include "string.h"
 
@@ -139,4 +110,47 @@ std::string unescape_and_unquote( const std::string & s, char esc, const char* q
     return v;
 }
 
+std::string common_front( const std::string& s, const std::string& t ) // longest common leading substring of s and t
+{
+    std::string::size_type i = 0; // number of leading characters on which s and t agree
+    for( ; i < s.size() && i < t.size() && s[i] == t[i]; ++i ); // empty body: the loop only advances i
+    return s.substr( 0, i );
+}
+
+std::string common_front( const std::string& s, const std::string& t, char delimiter ) // common leading part of s and t, cut on a delimiter boundary
+{
+    bool s_abs = !s.empty() && s[0] == delimiter; // a path starting with the delimiter is treated as absolute
+    bool t_abs = !t.empty() && t[0] == delimiter;
+    if( s_abs != t_abs ) { COMMA_THROW( comma::exception, "expected both paths absolute or both relative; got '" << s << "' and '" << t << "'" ); } // mixing absolute and relative is rejected
+    std::string::size_type i = 0;
+    for( ; i < s.size() && i < t.size() && s[i] == t[i]; ++i ); // i: length of the character-wise common prefix
+    if( i < s.size() && s[i] != delimiter ) // the common prefix ends in the middle of an element of s
+    {
+        i = s.find_last_of( delimiter, i ); // back off to the last delimiter at or before i (npos if there is none)
+        if( i == 0 ) { i = 1; } // root only
+    }
+    else if( i < t.size() && t[i] != delimiter ) // same, but the cut falls in the middle of an element of t
+    {
+        i = t.find_last_of( delimiter, i ); // s and t agree on everything before i, so the index is valid for s as well
+        if( i == 0 ) { i = 1; } // root only
+    }
+    if( i == std::string::npos ) { i = 0; } // no delimiter found: nothing in common
+    else if( i == s.size() && s.size() > 1 && s.back() == delimiter ) { --i; } // all of s is common: drop its trailing delimiter, unless s is the delimiter alone
+    return s.substr( 0, i );
+}
+
+std::string replace( const std::string& s, const std::unordered_map< std::string, std::string >& aliases ) // substitute aliased entries of a comma-separated list
+{
+    if( aliases.empty() ) { return s; } // nothing to substitute: return the input as is
+    auto v = comma::split( s, ',', true ); // NOTE(review): the meaning of the third argument is defined in split.h, not visible here
+    std::string f, comma; // f: result being built; comma: separator, empty before the first entry
+    for( const auto& e: v )
+    {
+        auto i = aliases.find( e );
+        f += comma + ( i == aliases.end() ? e : i->second ); // entries without an alias are copied unchanged
+        comma = ",";
+    }
+    return f;
+}
+
 } // namespace comma {
diff --git a/string/string.h b/string/string.h
index 2d3e2efd1..0849c2d6c 100644
--- a/string/string.h
+++ b/string/string.h
@@ -1,41 +1,13 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_STRING_STRING_H_
-#define COMMA_STRING_STRING_H_
+#pragma once
 
 #include <stdlib.h>
 #include <sstream>
 #include <string>
+#include <unordered_map>
 #include <vector>
 #include "../string/split.h"
 
@@ -47,16 +19,24 @@ std::string strip( const std::string& s, const char* characters = " \t\r\n" );
 /// strip given character from the beginning and end
 std::string strip( const std::string& s, char character );
 
-// Escape given character and escape characters by preceding them with escape charcter.
+// escape given character and escape characters by preceding them with escape character.
 std::string escape( const std::string & s, char character = '\'', char esc = '\\' );
-// Escape any of the given characters and escape character by preceding them with escape character
+// escape any of the given characters and escape character by preceding them with escape character
 std::string escape( const std::string & s, const char* characters, char esc = '\\' );
 
-// Escape given character and escape characters by preceding them with escape charcter.
+// unescape given character and escape characters by removing the preceding escape character.
 std::string unescape( const std::string & s, char character = '\'', char esc = '\\' );
-// Escape any of the given characters and escape character by preceding them with escape character
+// unescape any of the given characters and escape character by removing the preceding escape character
 std::string unescape( const std::string & s, const char* characters, char esc = '\\' );
 
+/// return common initial part of two strings
+/// e.g. for abc and abd return ab; for abc and def return empty string
+std::string common_front( const std::string& s, const std::string& t );
+
+/// return common initial part of two strings as xpaths with a delimiter (probably should be in xpath)
+/// e.g. with delimiter '/': for a/b and a/c return a; for abc and abd return empty string
+std::string common_front( const std::string& s, const std::string& t, char delimiter ); 
+
 /// join array elements into a string with given delimiter
 template < typename A >
 std::string join( const A& a, std::size_t size, char delimiter );
@@ -65,6 +45,9 @@ std::string join( const A& a, std::size_t size, char delimiter );
 template < typename A >
 inline std::string join( const A& a, char delimiter ) { return join( a, a.size(), delimiter ); }
 
+/// convenience function, somewhat overfit: split, replace aliased entries, join
+std::string replace( const std::string& s, const std::unordered_map< std::string, std::string >& aliases );
+
 template < typename A >
 inline std::string join( const A& a, std::size_t size, char delimiter )
 {
@@ -86,5 +69,3 @@ inline std::string join( It begin, It end, char delimiter )
 }
 
 } // namespace comma {
-
-#endif // COMMA_STRING_STRING_H_
diff --git a/string/test/CMakeLists.txt b/string/test/CMakeLists.txt
index 383d8775d..6d1199d84 100644
--- a/string/test/CMakeLists.txt
+++ b/string/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET(KIT string)
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_${KIT} ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# unit tests for the string kit, built from ${SOURCE_CODE_BASE_DIR}/string/test/*test.cpp
+set( KIT string )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_base comma_string comma_name_value ${GTEST_BOTH_LIBRARIES} pthread )
+# ctest runs the test executable from the bin directory of the build tree
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# the test executable is installed only on request
+if( INSTALL_TESTS )
+    # install( TARGETS ... ) applies the default executable permissions, hence no explicit PERMISSIONS list
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/string/test/string_test.cpp b/string/test/string_test.cpp
index 4fb612134..264093db2 100644
--- a/string/test/string_test.cpp
+++ b/string/test/string_test.cpp
@@ -1,38 +1,14 @@
-// This file is part of comma, a generic and flexible library
-// Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+// Copyright (c) 2023 vsevolod vlaskine
 
-
-#include "../../base/exception.h"
-#include "../string.h"
-#include "../split.h"
 #include <list>
+#include <sstream>
 #include <gtest/gtest.h>
+#include "../../base/exception.h"
+#include "../../name_value/serialize.h"
+#include "../choice.h"
+#include "../split.h"
+#include "../string.h"
+#include "../traits.h"
 
 namespace comma {
 
@@ -82,6 +58,23 @@ TEST( string, join )
     }
 }
 
+static inline void make_vector_impl( std::vector< std::string >& v ) {} // end of recursion: no arguments left to append
+
+template < typename T, typename... Args >
+static inline void make_vector_impl( std::vector< std::string >& v, T arg, Args... args )
+{
+    v.push_back( arg ); // append the first argument...
+    make_vector_impl( v, args... ); // ...then recurse on the remaining ones
+}
+
+template < typename... Args >
+static inline std::vector< std::string > make_vector( Args... args ) // test helper: builds a vector of strings from its arguments, in order
+{
+    std::vector< std::string > v;
+    make_vector_impl( v, args... );
+    return v;
+}
+
 TEST( string, split )
 {
     {
@@ -123,6 +116,66 @@ TEST( string, split )
         EXPECT_TRUE( v.size() == 4 );
         for( unsigned int i = 0; i < 4; ++i ) { EXPECT_TRUE( v.at(i) == "" ); }
     }
+    {
+        EXPECT_EQ( split_head( "",              1, ',', true ), std::vector< std::string >() );
+        EXPECT_EQ( split_head( "",              5, ',', true ), std::vector< std::string >() );
+        EXPECT_EQ( split_head( "a",             1, ',', true ), make_vector( "a" ) );
+        EXPECT_EQ( split_head( "abc",           1, ',', true ), make_vector( "abc" ) );
+        EXPECT_EQ( split_head( "a,b",           1, ',', true ), make_vector( "a,b" ) );
+        EXPECT_EQ( split_head( "ab,cd",         1, ',', true ), make_vector( "ab,cd" ) );
+        EXPECT_EQ( split_head( "a,b",           2, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_head( "a,b",           2, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_head( "a,b",           3, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_head( "a,b,c,d,e,f,g", 5, ',', true ), make_vector( "a", "b", "c", "d", "e,f,g" ) );
+    }
+    {
+        EXPECT_EQ( split_tail( "",              1, ',', true ), std::vector< std::string >() );
+        EXPECT_EQ( split_tail( "",              5, ',', true ), std::vector< std::string >() );
+        EXPECT_EQ( split_tail( "a",             1, ',', true ), make_vector( "a" ) );
+        EXPECT_EQ( split_tail( "abc",           1, ',', true ), make_vector( "abc" ) );
+        EXPECT_EQ( split_tail( "a,b",           1, ',', true ), make_vector( "a,b" ) );
+        EXPECT_EQ( split_tail( "ab,cd",         1, ',', true ), make_vector( "ab,cd" ) );
+        EXPECT_EQ( split_tail( "a,b",           2, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_tail( "a,b",           2, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_tail( "a,b",           3, ',', true ), make_vector( "a", "b" ) );
+        EXPECT_EQ( split_tail( "a,b,c,d,e,f",   5, ',', true ), make_vector( "a,b", "c", "d", "e", "f" ) );
+        EXPECT_EQ( split_tail( "a,b,c,d,e,f,g", 5, ',', true ), make_vector( "a,b,c", "d", "e", "f", "g" ) );
+    }
+}
+
+TEST( string, split_as ) // split_as< T >: split a string and convert the fields to T
+{
+    { // single delimiter character and sets of delimiter characters
+        std::vector< int > expected{ 1, 2, 3 };
+        EXPECT_EQ( split_as< int >( "1,2,3", ',' ), expected );
+        EXPECT_EQ( split_as< int >( "1,2;3", ",;" ), expected );
+        EXPECT_EQ( split_as< int >( "1,2;3", ",;_" ), expected );
+    }
+    { // a single default value is expected in place of every empty field
+        std::vector< int > expected{ 5, 5, 3, 5 };
+        EXPECT_EQ( split_as< int >( ",,3,", ',', 5 ), expected );
+    }
+    { // per-field defaults given as a container with fewer elements than there are fields
+        std::vector< int > expected{ 1, 5, 3 };
+        std::vector< int > defaults_vector{ 1, 5 };
+        std::array< int, 2 > defaults_std_array{ 1, 5 };
+        boost::array< int, 2 > defaults_boost_array{ 1, 5 };
+        EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_vector ), expected );
+        EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_boost_array ), expected );
+        EXPECT_EQ( split_as< int >( ",,3", ',', defaults_std_array ), expected );
+    }
+    { // per-field defaults with more elements than fields: the result is expected to have as many elements as the defaults
+        std::vector< int > expected{ 1, 5, 3, 7 };
+        std::vector< int > defaults_vector{ 1, 5, 1, 7 };
+        std::array< int, 4 > defaults_std_array{ 1, 5, 1, 7 };
+        boost::array< int, 4 > defaults_boost_array{ 1, 5, 1, 7 };
+        EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_vector ), expected );
+        EXPECT_EQ( split_as< int >( std::string( ",,3," ), ',', defaults_vector ), expected );
+        EXPECT_EQ( split_as< int >( std::string( ",,3" ), ',', defaults_boost_array ), expected );
+        EXPECT_EQ( split_as< int >( std::string( ",,3," ), ',', defaults_boost_array ), expected );
+        EXPECT_EQ( split_as< int >( ",,3", ',', defaults_std_array ), expected );
+        EXPECT_EQ( split_as< int >( ",,3,", ',', defaults_std_array ), expected );
+    }
 }
 
 TEST( string, escape )
@@ -282,6 +335,62 @@ TEST( string, split_escaped_quoted )
     }
 }
 
+TEST( string, split_bracketed ) // split_bracketed: delimiters inside brackets are expected not to split
+{
+    { // empty input: a single empty element
+        std::vector< std::string > v( split_bracketed( "" ) );
+        EXPECT_EQ( 1u, v.size() );
+        EXPECT_EQ( "", v[0] );
+    }
+    { // empty brackets: a single empty element
+        std::vector< std::string > v( split_bracketed( "()", ',' ) );
+        EXPECT_EQ( 1u, v.size() );
+        EXPECT_EQ( "", v[0] );
+    }
+    { // several empty bracketed elements
+        std::vector< std::string > v( split_bracketed( "(),(),()", ',' ) );
+        EXPECT_EQ( 3u, v.size() );
+        EXPECT_EQ( "", v[0] );
+        EXPECT_EQ( "", v[1] );
+        EXPECT_EQ( "", v[2] );
+    }
+    { // stray closing bracket, last argument false: the input is expected back unchanged as one element
+        std::vector< std::string > v( split_bracketed( ")()", ',', '(', ')', false ) );
+        EXPECT_EQ( 1u, v.size() );
+        EXPECT_EQ( ")()", v[0] );
+    }
+    { // delimiters inside brackets are kept as element content
+        std::vector< std::string > v( split_bracketed( "(),(,),(,)", ',' ) );
+        EXPECT_EQ( 3u, v.size() );
+        EXPECT_EQ( "", v[0] );
+        EXPECT_EQ( ",", v[1] );
+        EXPECT_EQ( ",", v[2] );
+    }
+    { // custom bracket characters; only the outermost brackets are expected to be removed
+        std::vector< std::string > v( split_bracketed( "a,[,b,[c]],d", ',', '[', ']' ) );
+        EXPECT_EQ( 3u, v.size() );
+        EXPECT_EQ( "a", v[0] );
+        EXPECT_EQ( ",b,[c]", v[1] );
+        EXPECT_EQ( "d", v[2] );
+    }
+    { // whitespace is preserved; nested brackets stay intact
+        std::vector< std::string > v( split_bracketed( "a,( b, c, d ),( f ( g, h ) ), i", ',' ) );
+        EXPECT_EQ( 4u, v.size() );
+        EXPECT_EQ( "a", v[0] );
+        EXPECT_EQ( " b, c, d ", v[1] );
+        EXPECT_EQ( " f ( g, h ) ", v[2] );
+        EXPECT_EQ( " i", v[3] );
+    }
+    { // same input with the last argument false: the enclosing brackets are expected to be kept
+        std::vector< std::string > v( split_bracketed( "a,( b, c, d ),( f ( g, h ) ), i", ',', '(', ')', false ) );
+        EXPECT_EQ( 4u, v.size() );
+        EXPECT_EQ( "a", v[0] );
+        EXPECT_EQ( "( b, c, d )", v[1] );
+        EXPECT_EQ( "( f ( g, h ) )", v[2] );
+        EXPECT_EQ( " i", v[3] );
+    }
+}
+
 TEST( string, strip )
 {
     EXPECT_EQ( strip( "", ";" ), "" );
@@ -294,6 +403,131 @@ TEST( string, strip )
     EXPECT_EQ( strip( ";,;abc;;,", ";," ), "abc" );
 }
 
+TEST( string, common_head ) // common_front() without delimiter: plain character-wise common prefix
+{
+    EXPECT_EQ( "", common_front( "", "" ) ); // an empty string on either side: nothing in common
+    EXPECT_EQ( "", common_front( "", "a" ) );
+    EXPECT_EQ( "", common_front( "", "ab" ) );
+    EXPECT_EQ( "", common_front( "", "abc" ) );
+    EXPECT_EQ( "", common_front( "a", "" ) );
+    EXPECT_EQ( "", common_front( "ab", "" ) );
+    EXPECT_EQ( "", common_front( "abc", "" ) );
+    EXPECT_EQ( "", common_front( "a", "b" ) ); // strings differing in the first character
+    EXPECT_EQ( "", common_front( "abc", "def" ) );
+    EXPECT_EQ( "a", common_front( "ab", "ac" ) ); // non-empty common prefix
+    EXPECT_EQ( "ab", common_front( "abc", "abd" ) );
+}
+
+TEST( string, common_head_delimiter ) // common_front() with delimiter: the result is cut on element boundaries
+{
+    EXPECT_EQ( common_front( "", "", '/' ), "" ); // relative paths without a common first element
+    EXPECT_EQ( common_front( "a", "b", '/' ), "" );
+    EXPECT_EQ( common_front( "ab", "cd", '/' ), "" );
+    EXPECT_EQ( common_front( "ab", "abc", '/' ), "" ); // a partially matching element does not count
+    EXPECT_EQ( common_front( "/", "/", '/' ), "/" ); // absolute paths sharing only the root
+    EXPECT_EQ( common_front( "/a", "/b", '/' ), "/" );
+    EXPECT_EQ( common_front( "/ab", "/cd", '/' ), "/" );
+    EXPECT_EQ( common_front( "/ab", "/abc", '/' ), "/" );
+    EXPECT_EQ( common_front( "/ab/", "/abc", '/' ), "/" );
+    EXPECT_EQ( common_front( "/ab/", "/abc/", '/' ), "/" );
+    EXPECT_EQ( common_front( "a/b", "a/c", '/' ), "a" ); // common first element, with and without trailing delimiters
+    EXPECT_EQ( common_front( "a/b/", "a/c", '/' ), "a" );
+    EXPECT_EQ( common_front( "a/b", "a/c/", '/' ), "a" );
+    EXPECT_EQ( common_front( "a/b/", "a/c/", '/' ), "a" );
+    EXPECT_EQ( common_front( "/a/b", "/a/c", '/' ), "/a" );
+    EXPECT_EQ( common_front( "ab/cd", "ab/cd", '/' ), "ab/cd" ); // identical paths; a trailing delimiter is not part of the result
+    EXPECT_EQ( common_front( "ab/cd/", "ab/cd/", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef", "ab/cd/xy", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/", "ab/cd", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd", "ab/cd/", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef", "ab/cd", '/' ), "ab/cd" ); // one path is a parent of the other
+    EXPECT_EQ( common_front( "ab/cd", "ab/cd/ef", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef/", "ab/cd", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef/", "ab/cd/", '/' ), "ab/cd" );
+    EXPECT_EQ( common_front( "ab/cd/ef", "ab/cd/", '/' ), "ab/cd" );
+}
+
+struct fruit // test fixture for strings::choice: choice names paired with an unscoped enum
+{
+    static std::vector< std::string > choices() { return { "apple", "orange", "juicymambo" }; } // names listed in the same order as the enumerators below
+    enum values { apple, orange, juicymambo };
+};
+
+struct veg // test fixture for strings::choice: same as fruit, but with a scoped enum
+{
+    static std::vector< std::string > choices() { return { "cucumber", "pumpkin" }; } // names listed in the same order as the enumerators below
+    enum class values { cucumber, pumpkin };
+};
+
+struct groceries // test fixture: aggregate of two choice members, read from and written to json in TEST( strings, choice )
+{
+    strings::choice< comma::fruit > fruit; // qualified with comma:: since the member name hides the type name
+    strings::choice< comma::veg > veg;
+};
+
+namespace visiting {
+
+template <> struct traits< groceries > // visiting traits for the groceries test fixture
+{
+    template < typename Key, class Visitor > static void visit( const Key& k, groceries& p, Visitor& v ) // non-const overload: hands mutable members to the visitor
+    {
+        v.apply( "fruit", p.fruit );
+        v.apply( "veg", p.veg );
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key& k, const groceries& p, Visitor& v ) // const overload: same member names, read-only access
+    {
+        v.apply( "fruit", p.fruit );
+        v.apply( "veg", p.veg );
+    }
+};
+
+} // namespace visiting {
+
+TEST( strings, choice ) // strings::choice: construction, comparison, enum conversion, validation and json round trip
+{
+    EXPECT_EQ( strings::choice< fruit >(), "apple" ); // default-constructed choice is expected to equal the first entry of fruit::choices()
+    EXPECT_EQ( strings::choice< fruit >().to_enum(), fruit::apple );
+    EXPECT_EQ( strings::choice< fruit >( "orange" ), "orange" ); // construction from a name or from an enumerator
+    EXPECT_EQ( strings::choice< fruit >( fruit::orange ), "orange" );
+    EXPECT_EQ( strings::choice< fruit >( fruit::orange ).to_enum(), fruit::orange );
+    EXPECT_EQ( strings::choice< fruit >( fruit::orange ), fruit::orange );
+    EXPECT_TRUE( strings::choice< fruit >::valid( "juicymambo" ) ); // only names returned by fruit::choices() are valid
+    EXPECT_FALSE( strings::choice< fruit >::valid( "driedmambo" ) );
+    EXPECT_THROW( strings::choice< fruit >( "driedmambo" ), comma::exception );
+
+    EXPECT_EQ( strings::choice< veg >(), "cucumber" ); // same checks for a fixture with a scoped enum
+    EXPECT_EQ( strings::choice< veg >().to_enum(), veg::values::cucumber );
+    EXPECT_EQ( strings::choice< veg >( veg::values::pumpkin ), "pumpkin" );
+    EXPECT_EQ( strings::choice< veg >( veg::values::pumpkin ).to_enum(), veg::values::pumpkin );
+    EXPECT_EQ( strings::choice< veg >( veg::values::pumpkin ), veg::values::pumpkin );
+
+    { // empty json object: both members are expected to keep their default values
+        std::istringstream iss( R"({})" );
+        auto g = comma::read_json< groceries >( iss );
+        EXPECT_EQ( g.fruit, "apple" );
+        EXPECT_EQ( g.veg, "cucumber" );
+        EXPECT_EQ( comma::json_to_string( g, false ), R"({"fruit":"apple","veg":"cucumber"})" );
+    }
+    { // one member given: the other one is expected to keep its default value
+        std::istringstream iss( R"({ "fruit": "orange" })" );
+        auto g = comma::read_json< groceries >( iss );
+        EXPECT_EQ( g.fruit, "orange" );
+        EXPECT_EQ( g.veg, "cucumber" );
+        EXPECT_EQ( comma::json_to_string( g, false ), R"({"fruit":"orange","veg":"cucumber"})" );
+    }
+    { // both members given
+        std::istringstream iss( R"({ "fruit": "orange", "veg": "pumpkin" })" );
+        auto g = comma::read_json< groceries >( iss );
+        EXPECT_EQ( g.fruit, "orange" );
+        EXPECT_EQ( g.veg, "pumpkin" );
+        EXPECT_EQ( comma::json_to_string( g, false ), R"({"fruit":"orange","veg":"pumpkin"})" );
+    }
+
+    EXPECT_EQ( strings::make_choice< fruit::values >( "orange", { "apple", "orange" } ), fruit::orange ); // make_choice: a name looked up in an explicit list is expected to yield the matching enumerator
+    EXPECT_EQ( strings::make_choice< veg::values >( "pumpkin", { "cucumber", "pumpkin" } ), veg::values::pumpkin );
+}
+
 } // namespace comma {
 
 int main( int argc, char* argv[] )
diff --git a/string/traits.h b/string/traits.h
new file mode 100644
index 000000000..1363d9b31
--- /dev/null
+++ b/string/traits.h
@@ -0,0 +1,31 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+
+/// @author Vsevolod Vlaskine
+
+#pragma once
+
+#include <string>
+#include "../base/exception.h"
+#include "../visiting/apply.h"
+#include "../visiting/traits.h"
+#include "choice.h"
+
+namespace comma { namespace visiting {
+
+template < typename Derived, typename Base > struct traits< comma::strings::choice< Derived, Base > > // visiting traits: a choice is visited as its Base
+{
+    typedef comma::strings::choice< Derived, Base > choice_t;
+
+    template < typename Key, class Visitor > static void visit( const Key& k, choice_t& p, Visitor& v ) // non-const overload
+    {
+        comma::visiting::apply( v, static_cast< Base& >( p ) ); // the visitor gets a mutable reference to the Base part
+        choice_t::assert_valid( std::string( p ) ); // presumably rejects a value the visitor may have set that is not a valid choice; see choice.h
+    }
+
+    template < typename Key, class Visitor > static void visit( const Key& k, const choice_t& p, Visitor& v ) // const overload: no validation call
+    {
+        comma::visiting::apply( v, static_cast< const Base& >( p ) );
+    }
+};
+
+} } // namespace comma { namespace visiting {
diff --git a/sync/test/CMakeLists.txt b/sync/test/CMakeLists.txt
index 5e759ecd1..049903f49 100644
--- a/sync/test/CMakeLists.txt
+++ b/sync/test/CMakeLists.txt
@@ -1,15 +1,13 @@
-SET( KIT sync )
-SET( DIR ${SOURCE_CODE_BASE_DIR}/${KIT}/test )
-FILE( GLOB source ${DIR}/*_test.cpp )
-FILE( GLOB extras ${DIR}/*.cpp ${DIR}/*.h )
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# unit tests for the sync kit, built from ${SOURCE_CODE_BASE_DIR}/sync/test/*test.cpp
+set( KIT sync )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} pthread )
+# ctest runs the test executable from the bin directory of the build tree
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# the test executable is installed only on request
+if( INSTALL_TESTS )
+    # install( TARGETS ... ) applies the default executable permissions, hence no explicit PERMISSIONS list
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/sync/test/lazy_test.cpp b/sync/test/lazy_test.cpp
index 49de0cfd3..5ae86f9d8 100644
--- a/sync/test/lazy_test.cpp
+++ b/sync/test/lazy_test.cpp
@@ -28,7 +28,7 @@
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 #include <gtest/gtest.h>
-#include <boost/bind.hpp>
+#include <boost/bind/bind.hpp>
 #include "../lazy.h"
 
 namespace comma { namespace sync { namespace test {
diff --git a/system/ansible/install.yml b/system/ansible/install.yml
index 2ddad404c..4ede9cf02 100644
--- a/system/ansible/install.yml
+++ b/system/ansible/install.yml
@@ -6,47 +6,42 @@
   vars:
     - base: "{{ ansible_env.HOME }}"
     - make_j: 6
-    - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF"
+    - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
 
   tasks:
   - name: "install comma dependencies"
     become: true
-    apt: pkg={{ item }} state=present update_cache=yes
-    with_items:
-      - build-essential 
-      - git
-      - cmake-curses-gui
-      - cmake
-      - perl
-      - python
-      - libboost-all-dev
-      - socat
-      - libzmq3-dev
-      - libgtest-dev
-      - python-dev
-      - python-numpy
-      - libprocps-dev
-      - recode
-      
+    apt:
+        pkg: ['build-essential', 'git', 'cmake-curses-gui', 'cmake', 'gawk', 'perl', 'python3', 'libboost-all-dev', 'socat', 'libzmq3-dev', 'libgtest-dev', 'python3-dev', 'python3-pip', 'python3-numpy', 'libproc2-dev', 'libyaml-dev', 'recode']
+        state: present
+        update_cache: yes
+
+  - name: "install comma regressions test dependencies"
+    become: true
+    apt:
+        pkg: ['moreutils', 'net-tools', 'pv']
+        state: present
+        update_cache: yes
+
   - name: "comma: make source directory at {{ base }}"
     file: path={{ base }}/{{ item }} state=directory
     with_items:
         - src
         - build
-    
+
   - name: "comma: clone"
     git:
         repo: "https://gitlab.com/orthographic/comma.git"
         dest: "{{ base }}/src/comma"
         clone: yes
         update: yes
-        
+
   - name: "comma: make build directory at {{ base }}"
     file: dest="{{ base }}/build/comma" state=directory
 
   - name: "comma: cmake"
     vars:
-        - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -Dcomma_INSTALL_WEB_SHELL=OFF"
+        - comma_cmake_options: "-DBUILD_TESTS=ON -DINSTALL_TESTS=ON -DINSTALL_BASH_COMPLETION=ON -Dcomma_BUILD_XML=ON -Dcomma_BUILD_ZEROMQ=ON -DBUILD_PYTHON_PACKAGES=ON -Dcomma_INSTALL_WEB_SHELL=OFF -DPYTHON=/usr/bin/python3"
     shell: "/usr/bin/cmake {{ comma_cmake_options }} {{ base }}/src/comma chdir={{ base }}/build/comma"
 
   - name: "comma: make"
diff --git a/system/launchpad/comma-launchpad-test b/system/launchpad/comma-launchpad-test
new file mode 100755
index 000000000..f02be1f81
--- /dev/null
+++ b/system/launchpad/comma-launchpad-test
@@ -0,0 +1,36 @@
+#!/bin/bash
+# smoke test of the comma ppa: installs comma with apt and comma-py with pip3, then runs a few basic checks
+function say() { echo "$0: $*" >&2; }; function die() { say "$@"; exit 1; }
+
+comma_py_version='1.0.0'
+
+add-apt-repository -y ppa:orthographic/comma || die "add-apt-repository ppa:orthographic/comma failed"
+add-apt-repository -y multiverse || die "add-apt-repository multiverse failed"
+apt-get update || die "apt-get update failed"
+apt-get -y install comma || die "apt-get install comma failed"
+pip3 install comma-py==$comma_py_version || die "pip3 install comma-py==$comma_py_version failed"
+
+say "testing basic csv utilities..."
+output=$( csv-paste line-number | head | csv-to-bin ui | csv-from-bin ui ) || die "failed: failed to run"
+expected=$( seq 0 9 )
+[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
+say "testing basic csv utilities: done"
+
+say "testing bash utils..."
+type -p comma-application-util || die "failed: comma-application-util not found"
+say "testing bash utils: done"
+
+say "running csv-eval --help (for reference)"
+csv-eval --help
+
+say "testing comma-py..."
+output=$( python3 -c "import comma; print( comma.version.__version__ )" ) || die "failed: failed to run"
+expected=$comma_py_version
+[[ "$output" == "$expected" ]] || die "failed: expected: $expected; got: $output"
+say "testing comma-py: done"
+
+say "testing csv-eval..."
+output=$( seq 0 9 | csv-eval --fields a "a+=1" ) || die "failed: failed to run" # the substitution already returns the exit status of csv-eval
+expected=$( seq 1 10 )
+[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
+say "testing csv-eval: done"
diff --git a/system/launchpad/comma-launchpad-upload b/system/launchpad/comma-launchpad-upload
new file mode 100755
index 000000000..e5db5a449
--- /dev/null
+++ b/system/launchpad/comma-launchpad-upload
@@ -0,0 +1,27 @@
+#!/bin/bash
+# builds a source package from ./comma with debuild and uploads it to ppa:orthographic/comma with dput
+# todo
+#   - !!! script to build in docker (how to manage signature and dput in docker?)
+#   - manual steps (automate if possible)
+#     - update changelog
+#       - version
+#       - changes
+#       - date
+#     - cmake: update default version
+#     - commit
+#     - tag repo with version
+#     - push
+
+function say() { echo "$0: $*" >&2; }; function die() { echo "$0: error: $*" >&2; exit 1; }
+type -p debuild >/dev/null || sudo apt install devscripts || die "failed to install devscripts (provides debuild)"
+[[ -n "$2" ]] || { echo "usage: $0 <what> <comma-version>; <what>: orig or update" >&2; exit 1; }
+what=$1
+comma_version=$2
+name=comma_${comma_version}
+[[ -d comma ]] || die "comma directory not found; please run in something like ~/src"
+tar -acf "$name.orig.tar.gz" comma || die "tar failed"
+if [[ "$what" == "orig" ]]; then rm -f comma/debian/files; what_option='a' # debuild -sa: include the original source in the upload
+elif [[ "$what" == "update" ]]; then what_option='d' # debuild -sd: upload the diff only
+else die "expected <what>: orig or update; got \"$what\""; fi
+( cd comma && debuild -S -s"$what_option" ) || die "debuild failed"
+dput ppa:orthographic/comma "$name-0ppa0_source.changes" || die "dput failed"
diff --git a/system/launchpad/readme b/system/launchpad/readme
new file mode 100644
index 000000000..7f469bb8a
--- /dev/null
+++ b/system/launchpad/readme
@@ -0,0 +1,57 @@
+uploading to launchpad
+
+- update comma/debian/changelog; see https://www.debian.org/doc/debian-policy/ch-source.html#debian-changelog-debian-changelog
+  - ubuntu version (currently jammy)
+  - version, e.g. 1.2.3
+  - changes
+  - date
+- update default version in comma/CMakeLists.txt
+- run:
+      cd ~/src/comma
+      git tag -a 1.2.3 -m 'your comments for version 1.2.3'
+      cd ..
+      comma/system/launchpad/comma-launchpad-upload update 1.2.3
+- sign gpg as snaky gpg (as opposed to dromedary)
+- once build in launchpad succeeds, commit and push
+- if there were changes in comma/python, release them into pypi
+- notify interested parties
+
+verifying ppa in docker
+
+uploading to pypi (i know, wrong place; todo: script)
+
+cd comma/python
+# version.py: bump up version
+# setup.py: uncomment install_requires (commented out since it messes up installation for those who use apt to install python3 packages, e.g. numpy)
+rm -rf dist
+python3 setup.py sdist bdist_wheel
+twine upload --repository-url https://test.pypi.org/legacy/ dist/* # test
+twine upload dist/*
+
+update of 20240205
+- pypi requires 2FA now (set e.g. with google authenticator on a mobile)
+- legacy twine upload dist/* does not work: 
+    HTTPError: 403 Forbidden from https://upload.pypi.org/legacy/
+    Username/Password authentication is no longer supported. Migrate to API Tokens or Trusted Publishers instead. See https://pypi.org/help/#apitoken and https://pypi.org/help/#trusted-publishers
+- follow instructions in the link above to set up api token and rc file (which are really vague: e.g. it seems that PROJECT_NAME should be left as is, NOT replaced with comma-py)
+- then run: twine upload --repository PROJECT_NAME dist/* or twine upload dist/*
+- it may exit with a very obscure HTTP error 403 or 400, but it seems to upload the repo nevertheless...
+
+todo
+  - document
+    - uploading to launchpad
+    - verifying in docker
+      add-apt-repository ppa:orthographic/ppa
+      apt-get update
+      add-apt-repository multiverse
+      apt-get update
+      apt-get install comma
+
+  - move docker out of system/package/cpack (can symlink it back)
+
+useful links
+  - generous tutorial: http://schneegans.github.io/lessons/2011/11/02/ppa-launchpad-cmake
+  - adding gpg-key and setting it in launchpad: https://help.launchpad.net/YourAccount/ImportingYourPGPKey
+  - debian package policy, all necessary files: https://www.debian.org/doc/debian-policy/ch-controlfields.html
+  - building ppa: https://www.ebower.com/docs/ubuntu-ppa/
+  - using ppa: https://itsfoss.com/ppa-guide/
diff --git a/system/package/cpack/Dockerfile b/system/package/cpack/Dockerfile
new file mode 100644
index 000000000..4c73eafa0
--- /dev/null
+++ b/system/package/cpack/Dockerfile
@@ -0,0 +1,10 @@
+ARG version
+FROM ubuntu:${version}
+ENV DEBIAN_FRONTEND="noninteractive"
+RUN apt-get update \
+    && apt-get install --yes apt-utils \
+    && apt-get install --yes software-properties-common \
+    && apt-get install --yes ansible git build-essential cmake cmake-curses-gui python3-pip devscripts \
+    && apt-get install --yes python3-stdeb python3-all dh-python \
+    && apt-get install --yes libboost-all-dev libzmq3-dev libprocps-dev libc-dev socat recode
+# && apt-add-repository --yes --update ppa:ansible/ansible \
diff --git a/system/package/cpack/changelog.gz b/system/package/cpack/changelog.gz
new file mode 100644
index 000000000..185c51ea2
Binary files /dev/null and b/system/package/cpack/changelog.gz differ
diff --git a/system/package/cpack/comma-package-docker-build b/system/package/cpack/comma-package-docker-build
new file mode 100755
index 000000000..363fd4f54
--- /dev/null
+++ b/system/package/cpack/comma-package-docker-build
@@ -0,0 +1,9 @@
+#!/bin/bash
+version=$1
+comma_dir="$2"
+[[ -n "$version" ]] || { echo "usage: $0 <ubuntu version> [<comma dir>]; e.g. $0 20.04" >&2; exit 1; }
+[[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
+[[ -d "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly (since you seem to either run with sudo or have comma not in '$comma_dir')" >&2; exit 1; }
+echo "$0: running:" >&2
+echo "docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f '$comma_dir/system/package/cpack/Dockerfile' ." >&2
+docker build -t ubuntu.$version.build.basics --build-arg version=$version --no-cache -f "$comma_dir/system/package/cpack/Dockerfile" .
diff --git a/system/package/cpack/comma-package-docker-run b/system/package/cpack/comma-package-docker-run
new file mode 100755
index 000000000..57cd148de
--- /dev/null
+++ b/system/package/cpack/comma-package-docker-run
@@ -0,0 +1,16 @@
+#!/bin/bash
+
+ubuntu_version=$1
+comma_version_major=$2
+comma_version_minor=$3
+comma_version_patch=$4
+comma_dir="$5"
+[[ -n "$comma_version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
+[[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
+[[ -d "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly (since you seem to either run with sudo or have comma not in '$comma_dir')" >&2; exit 1; }
+
+docker run \
+       --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
+       --mount "type=bind,source=$( pwd ),target=/root/output" \
+       ubuntu.$ubuntu_version.build.basics \
+       /mnt/comma/system/package/cpack/comma-package-make $ubuntu_version $comma_version_major $comma_version_minor $comma_version_patch /mnt/comma || { echo "$0: failed" >&2; exit 1; }
diff --git a/system/package/cpack/comma-package-docker-test b/system/package/cpack/comma-package-docker-test
new file mode 100755
index 000000000..f399e1ed9
--- /dev/null
+++ b/system/package/cpack/comma-package-docker-test
@@ -0,0 +1,21 @@
+#!/bin/bash
+
+function die() { echo "$0: $@" >&2; exit 1; }
+
+ubuntu_version="$1"
+package="$2"
+python_package="$3"
+comma_dir="$4"
+[[ -n "$python_package" ]] || { echo "usage: $0 <ubuntu version> <package> <python package> [<comma dir>]" >&2; exit 1; }
+[[ -s "$package" ]] || die "file not found or empty: '$package'"
+[[ -s "$python_package" ]] || die "file not found or empty: '$python_package'"
+[[ -n "$comma_dir" ]] || comma_dir="$( realpath ~/src/comma )"
+package_dir=$( dirname "$( realpath "$package" )" )
+[[ -d "$comma_dir" ]] || { echo "usage: $0 please specify <comma dir> explicitly (since you seem to either run with sudo or have comma not in '$comma_dir')" >&2; exit 1; }
+# todo: optionally run full regression test
+
+docker run \
+       --mount "type=bind,source=$comma_dir,target=/mnt/comma" \
+       --mount "type=bind,source=$package_dir,target=/mnt/package" \
+       ubuntu.$ubuntu_version.build.basics \
+       /mnt/comma/system/package/cpack/comma-package-test "/mnt/package/$( basename "$package" )" "/mnt/package/$( basename "$python_package" )" || { echo "$0: failed" >&2; exit 1; }
diff --git a/system/package/cpack/comma-package-make b/system/package/cpack/comma-package-make
new file mode 100755
index 000000000..f49068e93
--- /dev/null
+++ b/system/package/cpack/comma-package-make
@@ -0,0 +1,103 @@
+#!/bin/bash
+
+function die() { echo "$0: $@" >&2; exit 1; }
+
+ubuntu_version=$1
+version_major=$2
+version_minor=$3
+version_patch=$4
+comma_dir="$5"
+package_name="comma-$version_major.$version_minor.$version_patch-ubuntu.$ubuntu_version"
+[[ -n "$comma_dir" ]] || comma_dir=$( realpath ~/src/comma )
+[[ -n "$version_patch" ]] || { echo "usage: $0 <ubuntu version> <comma version major> <comma version minor> <comma version patch> [<comma dir>]" >&2; exit 1; }
+cd ~
+echo "$0: running ansible-playbook '$comma_dir/system/ansible/install.yml' in $( pwd )..." >&2
+#ansible-playbook "$comma_dir/system/ansible/install.yml" || die "ansible-playbook failed"
+case $ubuntu_version in
+    18.04) libproc_version="libprocps6 (>= 2:3.3.0)" ;;
+    20.04) libproc_version="libprocps8 (>= 1)" ;;
+    22.04) libproc_version="libprocps8 (>= 1)" ;;
+    *) libproc_version="libprocps8 (>= 1)" ;; # for now
+esac
+
+(
+    mkdir -p ~/build/comma || die "failed to create ~/build/comma"
+    cd ~/build/comma || die "failed to change directory to ~/build/comma"
+    echo "$0: running cmake in $( pwd )..." >&2
+    cmake "$comma_dir" \
+            -DCPACK_GENERATOR=DEB \
+            -DCPACK_PACKAGE_NAME="$package_name" \
+            -DBUILD_PYTHON_PACKAGES=OFF \
+            -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
+            -DBUILD_SHARED_LIBS=ON \
+            -DBUILD_TESTS=OFF \
+            -DCMAKE_BUILD_TYPE=Release \
+            -DCMAKE_INSTALL_PREFIX=/usr \
+            -DINSTALL_BASH_COMPLETION=OFF \
+            -DINSTALL_TESTS=OFF \
+            -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
+            -DCMAKE_PROJECT_VERSION_MAJOR=$version_major \
+            -DCMAKE_PROJECT_VERSION_MINOR=$version_minor \
+            -DCMAKE_PROJECT_VERSION_PATCH=$version_patch  \
+            -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
+            -Dcomma_BUILD_XML=OFF \
+            -Dcomma_build_io_rabbit_cat=OFF || die "cmake failed"
+    echo "$0: running cpack in $( pwd )..." >&2
+    cpack -j4 || die "cpack failed"
+    echo "$0: created package at $( realpath "$package_name.deb" )" >&2
+    # todo: optionally run full regression test
+    echo "$0: done" >&2
+) || exit 1 # die inside the subshell ends only the subshell, so propagate its failure to the script
+if [[ -d output ]]; then
+    cp ~/build/comma/"$package_name.deb" output || die "failed to copy $package_name.deb to output"
+    echo "$0: copied $( realpath ~/build/comma/"$package_name.deb" ) to $( realpath output )" >&2
+fi
+
+# (
+#     cd ~/src/comma/python
+#     echo "$0: setting up python in $( pwd )" >&2
+#     #python3 setup.py --command-packages=stdeb.command bdist_deb || die "failed"
+#     echo "$0: running python3 setup.py ..." >&2
+#     python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../COPYING --suite focal  || die "failed"
+#     # todo: mount gpg key
+#     # debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/comma-py_1.0.0-1.dsc
+#     # mkdir tmp
+#     # cd tmp
+#     # dpkg-source -x ../deb_dist/comma-py_1.0.0-1.dsc
+#     # cd comma-py-1.0.0
+#     # debuild -S -sa
+#     # dput ppa:orthographic/ppa ../comma-py_1.0.0-1_source.changes
+#     # ? debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 ../../deb_dist/comma-py_1.0.0-1_source.changes
+#     #
+#     # ...
+#     echo "$0: building package..." >&2
+#     cd deb_dist/comma-$version_major.$version_minor.$version_patch || die "failed"
+#     dpkg-buildpackage -rfakeroot -uc -us || die "failed"
+#     #https://shallowsky.com/blog/programming/packaging-launchpad-ppas.html
+#     # todo? or do all above outside of this script using something like (but also see above):
+#     #       debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-1.0.0-Linux.deb
+#     cd ~/build/comma
+#     echo "$0: running cmake in $( pwd )" >&2
+#     cmake . -DCPACK_GENERATOR=DEB \
+#             -DBUILD_PYTHON_PACKAGES=ON \
+#             -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
+#             -DBUILD_SHARED_LIBS=ON \
+#             -DBUILD_TESTS=OFF \
+#             -DCMAKE_BUILD_TYPE=Release \
+#             -DCMAKE_INSTALL_PREFIX=/usr \
+#             -DINSTALL_BASH_COMPLETION=OFF \
+#             -DINSTALL_TESTS=OFF \
+#             -DCPACK_DEPENDENCIES_LIBPROCPS="$libproc_version" \
+#             -DCPACK_PACKAGE_VERSION_MAJOR=$version_major \
+#             -DCPACK_PACKAGE_VERSION_MINOR=$version_minor \
+#             -DCPACK_PACKAGE_VERSION_PATCH=$version_patch  \
+#             -Dcomma_INSTALL_LIB_DIR=lib/x86_64-linux-gnu \
+#             -Dcomma_BUILD_XML=OFF \
+#             -Dcomma_build_io_rabbit_cat=OFF || die "failed"
+#     echo "$0: running cpack in $( pwd )" >&2
+#     cpack || die "failed"
+#     # todo: optionally run full regression test
+#     echo "$0: done" >&2
+# )
+# cp ~/build/comma/comma-$version_major.$version_minor.$version_patch-Linux.deb output
+# cp ~/src/comma/python/deb_dist/comma-py*.deb output
diff --git a/system/package/cpack/comma-package-test b/system/package/cpack/comma-package-test
new file mode 100755
index 000000000..89e4cf5e1
--- /dev/null
+++ b/system/package/cpack/comma-package-test
@@ -0,0 +1,29 @@
+#!/bin/bash
+
+function die() { echo "$0: $@" >&2; exit 1; }
+
+package="$1"
+python_package="$2"
+[[ -n "$python_package" ]] || { echo "usage: $0 <package> <python package>" >&2; exit 1; }
+#pip3 install numpy # todo! very unfortunate, but python deb package installs python3-numpy, which is wrong version and we gave up for now
+apt install --yes "$python_package" || die "failed to install package '$python_package'"
+apt install --yes "$package" || die "failed to install package '$package'"
+
+echo "$0: testing basic csv utilities..." >&2
+output=$( csv-paste line-number | head | csv-to-bin ui | csv-from-bin ui ) || die "failed: failed to run"
+expected=$( seq 0 9 )
+[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
+echo "$0: testing basic csv utilities: done" >&2
+
+echo "$0: testing bash utils..." >&2
+type -p comma-application-util || die "failed: failed"
+echo "$0: testing bash utils: done" >&2
+
+echo "$0: running csv-eval --help (for reference)..." >&2
+csv-eval --help
+
+echo "$0: testing csv-eval..." >&2
+output=$( seq 0 9 | csv-eval --fields a "a+=1" || exit ) || die "failed: failed to run"
+expected=$( seq 1 10 )
+[[ "$output" == "$expected" ]] || die "failed: unexpected output: $output"
+echo "$0: testing csv-eval: done" >&2
diff --git a/system/package/cpack/readme b/system/package/cpack/readme
new file mode 100644
index 000000000..0d4cc5446
--- /dev/null
+++ b/system/package/cpack/readme
@@ -0,0 +1,27 @@
+to build docker that has ansible, cmake, etc, run
+
+(you may need to run as sudo, unless you set up your docker running without sudo; see e.g: https://www.digitalocean.com/community/tutorials/how-to-install-and-use-docker-on-ubuntu-20-04)
+
+> ./comma-package-docker-build 18.04 # ubuntu 18.04
+> ./comma-package-docker-build 20.04 # ubuntu 20.04
+
+to build deb package e.g. for comma version 1.2.3 for ubuntu 20.04 run:
+
+> ./comma-package-docker-run 20.04 1 2 3
+
+if your comma repository is not in ~/src/comma, but e.g. in ~/my/src/comma, run (you also need to specify comma directory if you run as sudo, since default location is ~):
+
+> ./comma-package-docker-run 20.04 1 2 3 ~/my/src/comma
+
+debian package will be built in your current directory
+
+test that package is ok, e.g:
+
+> ./comma-package-docker-test 20.04 comma-1.2.3-Linux.deb comma-py_1.2.3-1_all.deb
+
+sign packages, e.g:
+
+> debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-1.0.0-Linux.deb
+> debsigs --sign=origin -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 comma-py_1.0.0-1_all.deb
+
+todo: fix lintian misplaced-extra-member-in-deb, which happens after gpg-signing
diff --git a/system/package/examples/make-debian-package b/system/package/examples/make-debian-package
new file mode 100755
index 000000000..359217e87
--- /dev/null
+++ b/system/package/examples/make-debian-package
@@ -0,0 +1,41 @@
+#!/bin/bash
+
+home=$1
+[[ -n "$home" ]] || { echo "usage: $0 <packaging-dir>" >&2; exit 1; }
+home=$( realpath "$home" ) || exit 1 # an empty $home would make the paths below start at /
+mkdir -p "$home/src" || exit 1
+cd "$home/src" || exit 1
+[[ -d comma ]] || git clone https://gitlab.com/orthographic/comma.git || exit 1 # reuse an existing clone when re-running
+build_dir="$home/src/comma/build"
+mkdir -p "$build_dir" || exit 1
+cd "$build_dir" || exit 1
+
+# if you want the library path to be lib/x86_64-linux-gnu
+# see target build in src/comma/debian/rules
+cmake "$home/src/comma" \
+    -DCMAKE_INSTALL_PREFIX="$build_dir/debian/tmp/usr" \
+    -DCMAKE_BUILD_TYPE=Release \
+    -DBUILD_SHARED_LIBS=ON \
+    -DBUILD_PYTHON_PACKAGES=OFF \
+    -DADD_PYTHON_PACKAGES_TO_RPM=OFF \
+    -DBUILD_TESTS=OFF \
+    -DINSTALL_BASH_COMPLETION=OFF \
+    -DINSTALL_TESTS=OFF \
+    -Dcomma_INSTALL_RUN_POST_INSTALL=OFF \
+    -Dcomma_BUILD_XML=OFF \
+    -Dcomma_BUILD_ZEROMQ=OFF \
+    -Dcomma_build_io_rabbit_cat=OFF || exit 1
+make -j || exit 1
+make install -j || exit 1
+
+# make voodoo debian directory
+mkdir -p "$build_dir/debian/tmp/DEBIAN" || exit 1
+
+# copy debian configuration files to our build directory for packaging
+cp -r "$home/src/comma/debian/control" "$home/src/comma/debian/changelog" "$home/src/comma/debian/copyright" "$build_dir/debian" || exit 1
+
+# generate the control file
+dpkg-gencontrol -pcomma || exit 1
+
+# build the package
+dpkg --build "$build_dir/debian/tmp" "$build_dir"
diff --git a/system/package/examples/package-python b/system/package/examples/package-python
new file mode 100755
index 000000000..2438cfff9
--- /dev/null
+++ b/system/package/examples/package-python
@@ -0,0 +1,12 @@
+#!/bin/bash
+
+cd ~/src/comma/python || exit 1 # never let the rm -rf below run in the caller's directory
+rm -rf deb_dist dist tmp
+python3 setup.py --command-packages=stdeb.command sdist_dsc --copyright-file ../copyright --suite focal --package comma-py --build-depends python3-numpy || exit 1
+debsign -k 79BF9724F37751A39B08698DB3CB85AF5FB6E9F1 deb_dist/comma-py_1.0.0-1.dsc || exit 1
+mkdir tmp || exit 1
+cd tmp || exit 1
+dpkg-source -x ../deb_dist/comma-py_1.0.0-1.dsc || exit 1
+cd comma-py-1.0.0 || exit 1
+debuild -S -sa || exit 1
+dput ppa:orthographic/test-ppa ../comma-py_1.0.0-1_source.changes #dput ppa:orthographic/ppa ../python3-comma_1.0.0-1_source.changes
diff --git a/timing/CMakeLists.txt b/timing/CMakeLists.txt
new file mode 100644
index 000000000..61fd19ea4
--- /dev/null
+++ b/timing/CMakeLists.txt
@@ -0,0 +1,20 @@
+# comma_timing library: built from the *.cpp and *.h files globbed from the timing source directory below
+SET( PROJECT "timing" )
+SET( TARGET_NAME comma_${PROJECT} )
+
+# NOTE: sources and headers are collected with FILE( GLOB ); re-run cmake after adding or removing files
+
+FILE( GLOB source   ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.cpp)
+FILE( GLOB includes ${SOURCE_CODE_BASE_DIR}/${PROJECT}/*.h)
+SOURCE_GROUP( ${PROJECT} FILES ${source} ${includes} )
+ADD_LIBRARY( ${TARGET_NAME} ${source} ${includes} )
+target_link_libraries( ${TARGET_NAME} comma_string ) # target_link_libraries( ${TARGET_NAME} comma_csv comma_name_value comma_string )
+SET_TARGET_PROPERTIES( ${TARGET_NAME} PROPERTIES ${comma_LIBRARY_PROPERTIES} )
+
+INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
+INSTALL(
+    TARGETS ${TARGET_NAME}
+    RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime     # .exe, .dll
+    LIBRARY DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Runtime     # .so, mod.dll
+    ARCHIVE DESTINATION ${comma_INSTALL_LIB_DIR} COMPONENT Development # .a, .lib
+)
diff --git a/timing/conversions.cpp b/timing/conversions.cpp
new file mode 100644
index 000000000..0e70f0acf
--- /dev/null
+++ b/timing/conversions.cpp
@@ -0,0 +1,19 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#include "../base/exception.h"
+#include "conversions.h"
+
+namespace comma { namespace timing {
+
+std::string to_iso_string( boost::posix_time::ptime t, unsigned int fraction_digits, bool strict ) // iso string with exactly fraction_digits second-fraction digits; special values: throw if strict, otherwise return boost's string as is
+{
+    std::string s = boost::posix_time::to_iso_string( t );
+    if( t.is_not_a_date_time() || t.is_neg_infinity() || t.is_infinity() ) { COMMA_THROW_IF( strict, "expected valid time; got: '" << s << "'" ); return s; }
+    if( fraction_digits > 0 && s.size() == 15 ) { s += '.'; } // YYYYMMDDTHHMMSS is 15 characters: boost drops the decimal point and the fraction altogether when the fraction is zero
+    s.resize( fraction_digits > 0 ? 16 + fraction_digits : 15, '0' ); return s; // resize() pads with '0' or truncates; no trailing decimal point when no fraction digits are requested
+}
+
+} } // namespace comma { namespace timing {
diff --git a/timing/conversions.h b/timing/conversions.h
new file mode 100644
index 000000000..1fa02a02a
--- /dev/null
+++ b/timing/conversions.h
@@ -0,0 +1,19 @@
+// Copyright (c) 2024 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <boost/date_time/posix_time/posix_time.hpp>
+#include "duration.h"
+
+namespace comma { namespace timing {
+
+/// same as boost::posix_time::to_iso_string, but pads second fractions with zeroes
+/// @param t: time
+/// @param fraction_digits: number of second fraction digits
+/// @param strict: throw on uninitialised time and infinity
+std::string to_iso_string( boost::posix_time::ptime t, unsigned int fraction_digits = 6, bool strict = false );
+
+} } // namespace comma { namespace timing {
diff --git a/timing/duration.cpp b/timing/duration.cpp
new file mode 100644
index 000000000..17e082d29
--- /dev/null
+++ b/timing/duration.cpp
@@ -0,0 +1,17 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#include "duration.h"
+
+namespace comma { namespace timing { namespace duration {
+
+boost::posix_time::time_duration from_seconds( double seconds )
+{
+    long long s = seconds;
+    int microseconds = ::ceil( ( seconds - s ) * 1000000 - 0.5 ); //int microseconds = ::round( ( d - seconds ) * 1000000 ); // although ::round() is slow, have to round, since lexical cast has floating point jitter, e.g. try: boost::lexical_cast< double >( "1369179610.752231000" );
+    return boost::posix_time::time_duration( boost::posix_time::seconds( s ) + boost::posix_time::microseconds( microseconds ) );
+}
+
+} } } // namespace comma { namespace timing { namespace duration {
diff --git a/timing/duration.h b/timing/duration.h
new file mode 100644
index 000000000..9a0e1edd6
--- /dev/null
+++ b/timing/duration.h
@@ -0,0 +1,15 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <boost/date_time/posix_time/posix_time.hpp>
+
+namespace comma { namespace timing { namespace duration {
+
+boost::posix_time::time_duration from_seconds( double seconds );
+
+} } } // namespace comma { namespace timing { namespace duration {
+
diff --git a/timing/epoch.cpp b/timing/epoch.cpp
new file mode 100644
index 000000000..4fe492da4
--- /dev/null
+++ b/timing/epoch.cpp
@@ -0,0 +1,16 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#include "duration.h"
+#include "epoch.h"
+
+namespace comma { namespace timing {
+
+boost::posix_time::ptime from_seconds_since_epoch( double seconds, boost::gregorian::date e )
+{
+    return boost::posix_time::ptime( e, duration::from_seconds( seconds ) );
+}
+
+} } // namespace comma { namespace timing {
diff --git a/timing/epoch.h b/timing/epoch.h
new file mode 100644
index 000000000..8592e5678
--- /dev/null
+++ b/timing/epoch.h
@@ -0,0 +1,17 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <boost/date_time/posix_time/posix_time.hpp>
+
+namespace comma { namespace timing {
+
+const boost::gregorian::date epoch( 1970, 1, 1 );
+
+boost::posix_time::ptime from_seconds_since_epoch( double seconds, boost::gregorian::date e = timing::epoch );
+
+} } // namespace comma { namespace timing {
+
diff --git a/timing/stats.cpp b/timing/stats.cpp
new file mode 100644
index 000000000..6e3e8a318
--- /dev/null
+++ b/timing/stats.cpp
@@ -0,0 +1,75 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+// introduces circular dependencies: #include "../csv/ascii.h" // quick and dirty
+#include "../name_value/ptree.h"
+#include "../timing/stats.h"
+//#include "../timing/traits.h"
+
+namespace comma { namespace timing {
+
+stats& stats::operator+=( const stats::time_type& t ) // registers timestamp t: the first one only sets the start time, each next one adds the interval since the previous timestamp
+{
+    if( _start.time_since_epoch() == std::chrono::seconds( 0 ) ) // _start still has its default (epoch) value: this is the first timestamp
+    {
+        _start = t;
+    }
+    else
+    {
+        const double d = double( std::chrono::duration_cast< std::chrono::microseconds >( t - _t ).count() ) / 1000000; // interval since the previous timestamp, seconds
+        if( _ema.count() == 0 ) { _min = _max = d; }
+        else { if( d < _min ) { _min = d; } else if( d > _max ) { _max = d; } }
+        _ema += d; // quick and dirty for now
+    }
+    _t = t;
+    return *this;
+}
+
+double stats::elapsed() const
+{ 
+    return double( std::chrono::duration_cast< std::chrono::microseconds >( _t - _start ).count() ) / 1000000;
+}
+
+void stats::output( std::ostream& os, const std::string& prefix, bool csv ) // todo: template on prefix
+{
+    // freaking hate chrono! os << prefix << "start=" << _start << ";elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << _ema() << std::endl;
+    const auto flags = os.flags(); // remember the caller's formatting flags to restore them before returning
+    const auto p = os.precision( 6 ); // sets 6 digits after the decimal point (fixed notation below), returns the previous precision
+    os.setf( std::ios::fixed, std::ios::floatfield );
+    os << prefix; // prefix is written exactly once for both csv and path-value output
+    if( csv ) // quick and dirty for now to avoid circular dependencies; todo? csv::timing::stats wrapper or something along those lines
+    {
+        //static comma::csv::ascii< stats > ascii; // introduces circular dependencies
+        //os << ascii.put( *this ) << std::endl;
+        os << elapsed() << ',' << count() << ',' << rate() << ',' << min() << ',' << max() << ',' << ema() << std::endl;
+    }
+    else
+    {
+        // todo! fix! to_ptree: eventually calls ptree.put() which does lexical cast at very high precision
+        //                      the solution: parametrize on precision and/or provide translator for putting value (or getting)
+        // boost::property_tree::ptree t;
+        // to_ptree to( t );
+        // visiting::apply( to, *this );
+        // comma::property_tree::to_path_value( os, t, comma::property_tree::disabled, '=', ';', xpath(), true );
+        // os << std::endl;
+        os << "elapsed=" << elapsed() << ";count=" << _ema.count() << ";rate=" << rate() << ";intervals/min=" << _min << ";intervals/max=" << _max << ";intervals/mean=" << ema() << std::endl;
+    }
+    os.flags( flags ); os.precision( p ); // todo! not exception-safe
+}
+
+void stats::output( unsigned int c, std::ostream& os, const std::string& prefix, bool csv ) // outputs stats whenever count() is a non-zero multiple of c
+{
+    if( c > 0 && count() > 0 && count() % c == 0 ) { output( os, prefix, csv ); } // c == 0 would be a division by zero: output nothing
+}
+
+void stats::output_every( const stats::duration_type& d, std::ostream& os, const std::string& prefix, bool csv )
+{
+    auto now = std::chrono::system_clock::now();
+    if( ( now - _previous_output_time ) < d ) { return; }
+    output( os, prefix, csv );
+    _previous_output_time = now;
+}
+
+} } // namespace comma { namespace timing {
diff --git a/timing/stats.h b/timing/stats.h
new file mode 100644
index 000000000..4b0865815
--- /dev/null
+++ b/timing/stats.h
@@ -0,0 +1,59 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include <chrono>
+#include <iostream>
+#include <string>
+#include "../math/exponential_moving_average.h"
+
+namespace comma { namespace timing {
+
+class stats // interval statistics over a sequence of timestamps: count, min, max, and exponential moving average of intervals in seconds
+{
+    public:
+        typedef std::chrono::time_point< std::chrono::system_clock > time_type;
+
+        typedef decltype( time_type() - time_type() ) duration_type;
+
+        stats( double ema_alpha = 0.5, comma::uint64 ema_initial_count = 1 ): _ema( ema_alpha, ema_initial_count ), _previous_output_time( std::chrono::system_clock::now() ) {}
+
+        stats& operator+=( const time_type& t ); // register timestamp t
+
+        stats& operator++() { return operator+=( std::chrono::system_clock::now() ); } // register current system time
+
+        stats& touch( const time_type& t ) { _t = t; return *this; } // set the latest timestamp without updating interval statistics
+
+        stats& touch() { return touch( std::chrono::system_clock::now() ); }
+
+        comma::uint64 count() const { return _ema.count(); }
+
+        double rate() const { return _ema.count() > 0 ? 1. / _ema() : 0; } // inverse of the mean interval; 0 if nothing counted yet
+
+        double ema() const { return _ema.count() > 0 ? _ema() : 0; }
+
+        double min() const { return _min; }
+
+        double max() const { return _max; }
+
+        double elapsed() const; // seconds between the first and the latest timestamp
+
+        void output( std::ostream& os = std::cerr, const std::string& prefix = "", bool csv = false );
+
+        void output( unsigned int count, std::ostream& os = std::cerr, const std::string& prefix = "", bool csv = false ); // count has no default: with one, output() was ambiguous with the overload above and would not compile
+
+        void output_every( const stats::duration_type& d, std::ostream& os = std::cerr, const std::string& prefix = "", bool csv = false );
+
+    private:
+        math::exponential_moving_average< double > _ema;
+        time_type _start;
+        time_type _t;
+        time_type _previous_output_time;
+        double _min{0};
+        double _max{0};
+};
+
+} } // namespace comma { namespace timing {
diff --git a/timing/tai.cpp b/timing/tai.cpp
new file mode 100644
index 000000000..39a45a369
--- /dev/null
+++ b/timing/tai.cpp
@@ -0,0 +1,107 @@
+// Copyright (c) 2024 Mission Systems Pty Ltd
+//
+// Data extracted from https://hpiers.obspm.fr/eoppc/bul/bulc/UTC-TAI.history
+// which is linked to from https://www.iers.org/IERS/EN/Publications/Bulletins/bulletins.html
+//
+// For an overview see https://en.wikipedia.org/wiki/Leap_second
+//
+// Note that boost::posix_time doesn't really support leap seconds. It treats
+// 19720630T235960 as identical to 19720701T000000. You can see this with:
+//   $ echo 19720630T235959 | csv-time --to seconds
+//   78796799
+//   $ echo 19720630T235960 | csv-time --to seconds
+//   78796800
+//   $ echo 19720701T000000 | csv-time --to seconds
+//   78796800
+//
+// There should be an extra second there
+//
+// Note that C++20 introduces std::chrono::tai_clock
+// https://en.cppreference.com/w/cpp/chrono/tai_clock
+
+/// @author dave jennings
+
+#include <utility>
+#include <vector>
+#include "tai.h"
+
+namespace comma { namespace timing { namespace tai {
+
+typedef std::pair< boost::posix_time::ptime, int > leap_seconds_entry;
+
+using boost::posix_time::ptime;
+using boost::gregorian::date;
+using boost::date_time::Jan;
+using boost::date_time::Jul;
+
+static std::vector< leap_seconds_entry > leap_seconds_table = {
+    leap_seconds_entry(  boost::date_time::neg_infin, 0 ),
+    leap_seconds_entry( ptime( date( 1972, Jan, 1 )), 10 ),
+    leap_seconds_entry( ptime( date( 1972, Jul, 1 )), 11 ),
+    leap_seconds_entry( ptime( date( 1973, Jan, 1 )), 12 ),
+    leap_seconds_entry( ptime( date( 1974, Jan, 1 )), 13 ),
+    leap_seconds_entry( ptime( date( 1975, Jan, 1 )), 14 ),
+    leap_seconds_entry( ptime( date( 1976, Jan, 1 )), 15 ),
+    leap_seconds_entry( ptime( date( 1977, Jan, 1 )), 16 ),
+    leap_seconds_entry( ptime( date( 1978, Jan, 1 )), 17 ),
+    leap_seconds_entry( ptime( date( 1979, Jan, 1 )), 18 ),
+    leap_seconds_entry( ptime( date( 1980, Jan, 1 )), 19 ),
+    leap_seconds_entry( ptime( date( 1981, Jul, 1 )), 20 ),
+    leap_seconds_entry( ptime( date( 1982, Jul, 1 )), 21 ),
+    leap_seconds_entry( ptime( date( 1983, Jul, 1 )), 22 ),
+    leap_seconds_entry( ptime( date( 1985, Jul, 1 )), 23 ),
+    leap_seconds_entry( ptime( date( 1988, Jan, 1 )), 24 ),
+    leap_seconds_entry( ptime( date( 1990, Jan, 1 )), 25 ),
+    leap_seconds_entry( ptime( date( 1991, Jan, 1 )), 26 ),
+    leap_seconds_entry( ptime( date( 1992, Jul, 1 )), 27 ),
+    leap_seconds_entry( ptime( date( 1993, Jul, 1 )), 28 ),
+    leap_seconds_entry( ptime( date( 1994, Jul, 1 )), 29 ),
+    leap_seconds_entry( ptime( date( 1996, Jan, 1 )), 30 ),
+    leap_seconds_entry( ptime( date( 1997, Jul, 1 )), 31 ),
+    leap_seconds_entry( ptime( date( 1999, Jan, 1 )), 32 ),
+    leap_seconds_entry( ptime( date( 2006, Jan, 1 )), 33 ),
+    leap_seconds_entry( ptime( date( 2009, Jan, 1 )), 34 ),
+    leap_seconds_entry( ptime( date( 2012, Jul, 1 )), 35 ),
+    leap_seconds_entry( ptime( date( 2015, Jul, 1 )), 36 ),
+    leap_seconds_entry( ptime( date( 2017, Jan, 1 )), 37 ),
+    leap_seconds_entry(  boost::date_time::pos_infin, 37 )
+};
+
+// The switch-over times are in UTC. That's how we get a time of 23:59:60.
+// So when working out the leap_second offset we need the UTC timestamp.
+// See https://en.wikipedia.org/wiki/Leap_second#Process
+static std::vector< leap_seconds_entry >::reverse_iterator lookup_table( const boost::posix_time::ptime& time, bool time_is_utc )
+{
+    // Timestamps are likely to be recent so look backwards through the table to
+    // find the right entry
+    std::vector< leap_seconds_entry >::reverse_iterator riter;
+    for( riter = leap_seconds_table.rbegin(); riter != leap_seconds_table.rend(); ++riter )
+    {
+        boost::posix_time::ptime utc = ( time_is_utc ? time : time - boost::posix_time::seconds( riter->second ));
+        if( utc >= riter->first ) { break; }
+    }
+    return riter;
+}
+
+int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc )
+{
+    return lookup_table( time, time_is_utc )->second;
+}
+
+std::pair< int, boost::posix_time::ptime > leap_seconds_with_valid_time( const boost::posix_time::ptime& time, bool time_is_utc ) // returns leap seconds for time and the utc time of the next table entry, up to which that value is valid
+{
+    std::vector< leap_seconds_entry >::reverse_iterator riter = lookup_table( time, time_is_utc );
+    return std::pair< int, boost::posix_time::ptime >( riter->second, ( riter == leap_seconds_table.rbegin() ? riter : riter - 1 )->first ); // the last table entry (e.g. matched by positive infinity) has no successor: report its own time instead of stepping before rbegin()
+}
+
+boost::posix_time::ptime from_utc( const boost::posix_time::ptime& utc )
+{
+    return utc + boost::posix_time::seconds( leap_seconds( utc, true ));
+}
+
+boost::posix_time::ptime to_utc( const boost::posix_time::ptime& tai )
+{
+    return tai - boost::posix_time::seconds( leap_seconds( tai, false ));
+}
+
+} } } // namespace comma { namespace timing { namespace tai {
diff --git a/timing/tai.h b/timing/tai.h
new file mode 100644
index 000000000..9650eee9c
--- /dev/null
+++ b/timing/tai.h
@@ -0,0 +1,32 @@
+// Copyright (c) 2024 Mission Systems Pty Ltd
+
+#pragma once
+
+#include <utility>
+#include <boost/date_time/posix_time/posix_time_types.hpp>
+
+namespace comma { namespace timing {
+
+namespace tai {
+
+// For conversion of fast streaming data you probably want to just get the leap
+// seconds once then apply that offset to all the data (utc = tai - leap_seconds).
+// This will not be accurate if the data crosses a leap-second boundary but is much faster.
+int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc = true );
+
+// If you want accurate time across a boundary, use this call, check your
+// timestamps and update the leap seconds when you go past the valid time.
+// Returns the pair < leap seconds, valid time >. Valid time is in UTC.
+std::pair< int, boost::posix_time::ptime > leap_seconds_with_valid_time( const boost::posix_time::ptime& time, bool time_is_utc = true );
+
+// Otherwise use the from/to functions which are accurate across boundaries.
+// Although note that boost doesn't understand UTC times of 23:59:60.
+// It thinks it's the same as 00:00:00 even if it aligns with a leap-second.
+boost::posix_time::ptime from_utc( const boost::posix_time::ptime& utc );
+boost::posix_time::ptime to_utc( const boost::posix_time::ptime& tai );
+
+} // namespace tai {
+
+inline int leap_seconds( const boost::posix_time::ptime& time, bool time_is_utc = true ) { return tai::leap_seconds( time, time_is_utc ); }
+
+} } // namespace comma { namespace timing {
diff --git a/io/publisher.cpp b/timing/timestamped.h
similarity index 66%
rename from io/publisher.cpp
rename to timing/timestamped.h
index 486780099..988e38cfa 100644
--- a/io/publisher.cpp
+++ b/timing/timestamped.h
@@ -1,4 +1,3 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
 // All rights reserved.
 //
@@ -27,25 +26,36 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
+#pragma once
 
-/// @author vsevolod vlaskine
+#include <type_traits>
+#include <utility>
+#include <boost/date_time/posix_time/posix_time.hpp>
 
-#include "publisher.h"
+namespace comma {
 
-namespace comma { namespace io {
+/// a value of type T paired with a timestamp; constructors that do not take a timestamp use the current universal time
+template < typename T >
+struct timestamped
+{
+    boost::posix_time::ptime t;
 
-publisher::publisher( const std::string& name, comma::io::mode::value mode, bool blocking, bool flush ) : pimpl_( new impl::publisher( name, mode, blocking, flush ) ) {}
+    T data;
 
-publisher::~publisher() { delete pimpl_; }
+    timestamped() {}
 
-std::size_t publisher::write( const char* buf, std::size_t size, bool do_accept ) { return pimpl_->write( buf, size, do_accept ); }
+    timestamped( const T& data ) : t( boost::posix_time::microsec_clock::universal_time() ), data( data ) {}
 
-unsigned int publisher::accept() { return pimpl_->accept(); }
+    timestamped( T&& data ) : t( boost::posix_time::microsec_clock::universal_time() ), data( std::move( data ) ) {} // a named rvalue reference is an lvalue: move explicitly, otherwise it is copied
 
-void publisher::close() { pimpl_->close(); }
+    timestamped( boost::posix_time::ptime t, const T& data ) : t( t ), data( data ) {}
 
-std::size_t publisher::size() const { return pimpl_->size(); }
+    timestamped( boost::posix_time::ptime t, T&& data ) : t( t ), data( std::move( data ) ) {}
+};
 
-file_descriptor publisher::acceptor_file_descriptor() const { return pimpl_->acceptor_ ? pimpl_->acceptor().fd() : comma::io::invalid_file_descriptor; }
+/// make timestamped value; T is a forwarding reference, hence decay it so that lvalue arguments give timestamped< U > rather than ill-formed timestamped< U& >
+template < typename T > inline timestamped< typename std::decay< T >::type > make_timestamped( T&& data ) { return timestamped< typename std::decay< T >::type >( std::forward< T >( data ) ); }
 
-} } // namespace comma { namespace io {
+template < typename T > inline timestamped< typename std::decay< T >::type > make_timestamped( boost::posix_time::ptime t, T&& data ) { return timestamped< typename std::decay< T >::type >( t, std::forward< T >( data ) ); }
+
+} // namespace comma {
diff --git a/timing/traits.h b/timing/traits.h
new file mode 100644
index 000000000..7ba90b210
--- /dev/null
+++ b/timing/traits.h
@@ -0,0 +1,42 @@
+// Copyright (c) 2023 Vsevolod Vlaskine
+// All rights reserved.
+
+/// @author vsevolod vlaskine
+
+#pragma once
+
+#include "../timing/stats.h"
+#include "../timing/timestamped.h"
+#include "../visiting/traits.h"
+
+namespace comma { namespace visiting {
+
+template <> struct traits< comma::timing::stats > // quick and dirty
+{
+    template < typename Key, class Visitor > static void visit( const Key&, const comma::timing::stats& p, Visitor& v ) // read-only visit: applies the visitor to values returned by stats accessors
+    {
+        v.apply( "elapsed", p.elapsed() );
+        v.apply( "count", p.count() );
+        v.apply( "rate", p.rate() );
+        v.apply( "min", p.min() );
+        v.apply( "max", p.max() );
+        v.apply( "mean", p.ema() ); // NOTE(review): field named "mean" is populated from ema() - confirm this is intended
+    }
+};
+
+template < typename T > struct traits< comma::timestamped< T > > // visits fields "t" and "data"
+{
+    template< typename K, typename V > static void visit( const K&, comma::timestamped< T >& p, V& v )
+    {
+        v.apply( "t", p.t );
+        v.apply( "data", p.data );
+    }
+
+    template< typename K, typename V > static void visit( const K&, const comma::timestamped< T >& p, V& v )
+    {
+        v.apply( "t", p.t );
+        v.apply( "data", p.data );
+    }
+};
+
+} } // namespace comma { namespace visiting {
diff --git a/util/applications/CMakeLists.txt b/util/applications/CMakeLists.txt
index daffc41a6..7486763b7 100644
--- a/util/applications/CMakeLists.txt
+++ b/util/applications/CMakeLists.txt
@@ -1,6 +1,7 @@
 add_executable( comma-progress comma-progress.cpp )
 target_link_libraries(comma-progress ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_name_value )
-INSTALL( TARGETS comma-progress RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+set_target_properties( comma-progress PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS comma-progress RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
 if( NOT WIN32 )
     # It is too troublesome to cross compile PROCPS
@@ -17,21 +18,27 @@ if( NOT WIN32 )
             if( HAVE_PROCPS_SYSTEMD )
                 set_source_files_properties( comma-timeout-group.cpp PROPERTIES COMPILE_FLAGS "-DHAVE_PROCPS_DEV -DWITH_SYSTEMD" )
             endif( HAVE_PROCPS_SYSTEMD )
+        else()
+            # unset the cached result, so that we check again next time, in case the library is installed
+            unset( HAVE_PROCPS_DEV CACHE )
         endif( HAVE_PROCPS_DEV )
-        target_link_libraries(comma-timeout-group ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_name_value ${LIBPROCPS} )
-        INSTALL( TARGETS comma-timeout-group RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+        target_link_libraries( comma-timeout-group ${comma_ALL_EXTERNAL_LIBRARIES} comma_csv comma_xpath comma_name_value ${LIBPROCPS} )
+        set_target_properties( comma-timeout-group PROPERTIES LINK_FLAGS_RELEASE -s )
+        install( TARGETS comma-timeout-group RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
     endif( NOT NO_PROCPS )
 endif( NOT WIN32 )
 
-add_executable(comma-nap comma-nap.cpp )
-target_link_libraries(comma-nap ${comma_ALL_EXTERNAL_LIBRARIES} )
-INSTALL( TARGETS comma-nap RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
+add_executable( comma-nap comma-nap.cpp )
+target_link_libraries( comma-nap ${comma_ALL_EXTERNAL_LIBRARIES} )
+set_target_properties( comma-nap PROPERTIES LINK_FLAGS_RELEASE -s )
+install( TARGETS comma-nap RUNTIME DESTINATION ${comma_INSTALL_BIN_DIR} COMPONENT Runtime )
 
-INSTALL( PROGRAMS comma-build DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-profile-graph DESTINATION ${comma_INSTALL_BIN_DIR} )
-INSTALL( PROGRAMS comma-repeat DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-build DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-profile-graph DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-repeat DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-enforce DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-match DESTINATION ${comma_INSTALL_BIN_DIR} )
+install( PROGRAMS comma-test-query DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-run DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-util DESTINATION ${comma_INSTALL_BIN_DIR} )
 install( PROGRAMS comma-test-resources DESTINATION ${comma_INSTALL_BIN_DIR} )
diff --git a/util/applications/comma-build b/util/applications/comma-build
index 0f1ea188b..e1f4ed709 100755
--- a/util/applications/comma-build
+++ b/util/applications/comma-build
@@ -33,6 +33,9 @@
 
 source $( type -p comma-application-util ) || { echo "$basename: cannot source 'comma-application-util'" >&2; exit 1; }
 
+function say() { echo "comma-build: $*" >&2; } # print all arguments as one message to stderr, prefixed with the application name
+function die() { say "$@"; exit 1; } # print message and exit with status 1; arguments are quoted, so that whitespace is preserved and globs are not expanded
+
 function description()
 {
     cat <<eof
@@ -167,6 +170,7 @@ list-commits
 pack
 pull
 push
+sudo-install
 eof
 }
 
@@ -216,12 +220,29 @@ function sudo_make_install() { cmake "../../src/$( basename $( pwd ) )" $@ && ma
 
 function run_build_command()
 {
-    local build_dir="../../build/$1"
     local src_dir="../../src/$1"
     local command=$2
-    mkdir "$build_dir" -p || { echo "comma-build: $command: failed to create '$build_dir'" >&2 ; exit 1 ; }
-    echo "comma-build: $command: running in $build_dir: ${@:2}" >&2
-    ( cd "$build_dir" && ${@:2} )
+    if [[ -f "$src_dir/CMakeLists.txt" ]]; then
+        local build_dir="../../build/$1"
+        mkdir "$build_dir" -p || { echo "comma-build: $command: failed to create '$build_dir'" >&2 ; exit 1 ; }
+        echo "comma-build: $command: running in $build_dir: ${@:2}" >&2
+        ( cd "$build_dir" && ${@:2} )
+    elif [[ -f "$src_dir/setup.py" ]]; then # quick and dirty
+        case "$command" in
+            make_install) echo "comma-build: $command: running in $src_dir on python3 setup: ${@:2}" >&2
+                          ( cd "$src_dir" && python3 setup.py install ) 
+                          ;;
+            make_only) echo "comma-build: $command: no CMakeLists.txt in $src_dir, but found setup.py; skipped" >&2
+                       ;;
+            sudo_make_install) echo "comma-build: $command: running in $src_dir on python3 setup: ${@:2}" >&2
+                               ( cd "$src_dir" && sudo python3 setup.py install ) 
+                               ;;
+            *) die "$command: on $src_dir: do not know how to handle command for python3 installations"
+               ;;
+        esac
+    else
+        die "$command: on $src_dir: CMakeLists.txt or setup.py not found; don't know how to handle"
+    fi
 }
 
 function run_cmake()
@@ -312,13 +333,13 @@ function run_pack() # quick and dirty
         [[ ! -f $src_dir/dependencies.cmake-cache ]] || cmake_options+=( -C$src_dir/dependencies.cmake-cache )
         comma-build install ${cmake_options[@]}
         if [[ -f $src_dir/dependencies.cpack-options ]]; then
-		cpack_make_opts=$(cat $src_dir/dependencies.cpack-options )
-		# The user specified different options for packing. Re-run the make so that the Cmake files are regenerated.
-		# This is primarily done so that software can be built as a standard user, and installations that would otherwise go into system directories (eg /etc/systemd) can be redirected to /usr/local/...
-		# When the software is packed however, you'd want it to go to install location (/etc).
-		comma-build make ${cpack_make_opts}
-	fi		
-	comma-build cpack -G RPM ${@:3} || exit 1 #-D CPACK_RPM_PACKAGE_RELOCATABLE=ON || exit 1 #-D CPACK_PACKAGING_INSTALL_PREFIX=$pack_dir/rpm
+            cpack_make_opts=$(cat $src_dir/dependencies.cpack-options )
+            # The user specified different options for packing. Re-run the make so that the Cmake files are regenerated.
+            # This is primarily done so that software can be built as a standard user, and installations that would otherwise go into system directories (eg /etc/systemd) can be redirected to /usr/local/...
+            # When the software is packed however, you'd want it to go to install location (/etc).
+            comma-build make ${cpack_make_opts}
+        fi
+        comma-build cpack -G RPM ${@:3} || exit 1 #-D CPACK_RPM_PACKAGE_RELOCATABLE=ON || exit 1 #-D CPACK_PACKAGING_INSTALL_PREFIX=$pack_dir/rpm
     ) || { echo "comma-build: pack failed" >&2 ; exit 1 ; }
     cat dependencies.commits | while IFS=, read what commit ; do cp $pack_dir/build/$what/*.rpm $pack_dir/rpm ; done
     cp $pack_dir/build/$top_repository/*.rpm $pack_dir/rpm
diff --git a/util/applications/comma-progress.cpp b/util/applications/comma-progress.cpp
index c9e0b86d7..43127b312 100644
--- a/util/applications/comma-progress.cpp
+++ b/util/applications/comma-progress.cpp
@@ -27,23 +27,19 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-#include <boost/date_time/posix_time/ptime.hpp>
-#include <vector>
-#include <boost/unordered_map.hpp>
 #include <deque>
-#include <boost/unordered_set.hpp>
 #include <functional>
-#include <boost/functional.hpp>
+#include <vector>
+#include <boost/date_time/posix_time/ptime.hpp>
 #include <boost/math/special_functions/round.hpp>
+#include <boost/unordered_map.hpp>
+#include <boost/unordered_set.hpp>
 #include "../../csv/stream.h"
 #include "../../visiting/traits.h"
 #include "../../application/command_line_options.h"
 #include "../../name_value/ptree.h"
 
-static const std::string& name() {
-    static const std::string name = "comma-progress";
-    return name;
-}
+static const char* name() { return "comma-progress"; }
 
 static char delimiter = ';';
 static const char equal_sign = '=';
@@ -85,37 +81,82 @@ template < > struct traits< impl_::log > {
     
 } } // namespace comma { namespace visiting { 
 
-
-static void usage( bool verbose=false )
+static void usage( bool verbose )
 {
-    std::cerr << std::endl;
-    std::cerr << "cat progress.csv | " << name() << " [<options>] > stat.csv" << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "Example: cat progress.csv | comma-progress --elapsed | comma-progress --ratio run_all/application"  << std::endl;
-    std::cerr << "         In this example, every 'ratio' value is compared against time of run_all/application, instead" << std::endl;
-    std::cerr << "         of total time." << std::endl;
-    std::cerr << std::endl;
-    std::cerr << "modes" << std::endl;
-    std::cerr << "    These are mutually exclusive." << std::endl;
-    std::cerr << "    <no option>: Outputs path value for input data: " << comma::join( comma::csv::names< impl_::log >(), ',' )  << std::endl;
-    std::cerr << "                 Output format is 'path/{begin,end}=<ISO timestamp>'" << std::endl;
-    std::cerr << "    --elapsed [ --from-path-value|--from-pv ]" << std::endl;
-    std::cerr << "                 Outputs path value with 'elapsed' time, input data format: " << comma::join( comma::csv::names< impl_::log >(), ',' )  << std::endl;
-    std::cerr << "                 If '--from-path-value|--from-pv' is given, it takes inputs from outputs of < no option >" << std::endl;
-    std::cerr << "                 Output format is 'path/elapsed=<duration in second>'" << std::endl;
-    std::cerr << "    --sum [--mean] [--count] [--ratio ] [-P|--percentage] " << std::endl;
-    std::cerr << "                 Outputs path value with summed 'elapsed' time, taking input data from --elapsed mode." << std::endl;
-    std::cerr << "                 Elapsed duration is duration sum of runs with the same <path> key, where one application was called multiple times." << std::endl;
-    std::cerr << "                 Output format is '<path>/elapsed=<duration in second>'" << std::endl;
-    std::cerr << "                 --mean  adds '<path>/mean=< mean duration in second >' for items that ran more than once - duplicated elapsed path/keys." << std::endl;
-    std::cerr << "                 --mean  adds '<path>/count=< occurances of <path>/elapsed >', where mean=( elapsed / count )." << std::endl;
-    std::cerr << "                 --ratio adds '<path>/ratio=< ratio to total time or time of [path] if given >', " << std::endl;
-    std::cerr << "                 --ratio with -P|--percentage, a percentage is the value for <path>/ratio, rounded to 3 decimal places." << std::endl;
-    std::cerr << "options" << std::endl;
-    std::cerr << "    --help,-h:   Print this message.." << std::endl;
-    std::cerr << std::endl;
+    std::cerr << "\nsummarise timestamped elapsed time data";
+    std::cerr << "\n";
+    std::cerr << "\nusage: cat progress.csv | " << name() << " [<options>] > stat.csv";
+    std::cerr << "\n";
+    std::cerr << "\noptions:";
+    std::cerr << "\n    --help,-h:     display this help message and exit";
+    std::cerr << "\n    --verbose,-v:  more output";
+    std::cerr << "\n    --elapsed:     output path value with elapsed time";
+    std::cerr << "\n    --sum          output path value with summed elapsed time";
+    std::cerr << "\n";
+    std::cerr << "\nelapsed options:";
+    std::cerr << "\n    --from-path-value,--from-pv: take input from output of <no option>";
+    std::cerr << "\n";
+    std::cerr << "\nsum options:";
+    std::cerr << "\n    --count:          adds number of occurrences of <path> (requires --mean)";
+    std::cerr << "\n    --mean:           adds mean duration for duplicate paths";
+    std::cerr << "\n    --percentage,-P:  express --ratio as a percentage";
+    std::cerr << "\n    --ratio [<path>]: adds ratio to total time or time of [path] if given";
+    std::cerr << "\n";
+    std::cerr << "\nmodes:";
+    std::cerr << "\n    with no option comma-progress takes " << comma::join( comma::csv::names< impl_::log >(), ',' ) << " and converts to";
+    std::cerr << "\n    path-value format of 'path/{begin,end}=<ISO timestamp>'";
+    std::cerr << "\n";
+    std::cerr << "\n    --elapsed";
+    std::cerr << "\n        input data format: " << comma::join( comma::csv::names< impl_::log >(), ',' );
+    std::cerr << "\n        output format: 'path/elapsed=<duration in second>'";
+    std::cerr << "\n        if --from-path-value is given input format is <no option> output";
+    std::cerr << "\n";
+    std::cerr << "\n    --sum";
+    std::cerr << "\n        input: data in format from --elapsed mode";
+    std::cerr << "\n        output: path-value with summed 'elapsed' time";
+    std::cerr << "\n        elapsed duration sums of runs with the same <path>";
+    std::cerr << "\n        additional accumulation stats can be added with --mean, --count, --ratio";
+    std::cerr << "\n        options in the format <path>/<stat>=<value>";
+    std::cerr << "\n";
+    if( verbose )
+    {
+        std::cerr << "\nexamples:";
+        std::cerr << "\n    --- create input data ---";
+        std::cerr << "\n    cat <<-EOF > data.csv";
+        std::cerr << "\n\t20230101T120000,main,begin";
+        std::cerr << "\n\t20230101T120100,sub_a,begin";
+        std::cerr << "\n\t20230101T120200,sub_a,end";
+        std::cerr << "\n\t20230101T120200,sub_b,begin";
+        std::cerr << "\n\t20230101T120600,sub_b,end";
+        std::cerr << "\n\t20230101T120600,sub_a,begin";
+        std::cerr << "\n\t20230101T120800,sub_a,end";
+        std::cerr << "\n\t20230101T121000,main,end";
+        std::cerr << "\n\tEOF";
+        std::cerr << "\n";
+        std::cerr << "\n    --- create path/value data ---";
+        std::cerr << "\n    cat data.csv | comma-progress";
+        std::cerr << "\n";
+        std::cerr << "\n    --- calculate elapsed times ---";
+        std::cerr << "\n    cat data.csv | comma-progress --elapsed";
+        std::cerr << "\n    cat data.csv | comma-progress | comma-progress --elapsed --from-path-value";
+        std::cerr << "\n";
+        std::cerr << "\n    --- sum up repeated entries ---";
+        std::cerr << "\n    cat data.csv | comma-progress --elapsed > elapsed.csv";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --mean";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --mean --count";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --ratio";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --ratio --percentage";
+        std::cerr << "\n    cat elapsed.csv | comma-progress --sum --ratio main/sub_b";
+    }
+    else
+    {
+        std::cerr << "\nsee comma-progress --help --verbose for examples";
+    }
+    std::cerr << "\n" << std::endl;
     exit( 1 );
 }
+
 static const std::string start = "begin";
 static const std::string finished = "end";
 
@@ -306,12 +347,10 @@ void process_begin_end( L get_log, O output )
 
 int main( int ac, char** av )
 {
-    comma::command_line_options options( ac, av );
-    
-    if( options.exists( "-h,--help" ) ) { usage(); }
-    
     try
     {
+        comma::command_line_options options( ac, av, usage );
+
         if( options.exists( "--sum" ) )
         {
             
@@ -379,8 +418,8 @@ int main( int ac, char** av )
         }
         else if( options.exists( "--elapsed" ) )
         {
-            boost::function< void( const impl_::log&, const impl_::log&, const std::string&) > outputting( &output_elapsed );
-            boost::function< const impl_::log*() > extractor( &get_log );
+            std::function< void( const impl_::log&, const impl_::log&, const std::string&) > outputting( &output_elapsed );
+            std::function< const impl_::log*() > extractor( &get_log );
             if( options.exists( "--from-path-value,--from-pv" ) )
             {
                 extractor = &get_log_path_value;
@@ -391,18 +430,16 @@ int main( int ac, char** av )
         }
         else
         {
-            boost::function< const impl_::log*() > extractor( &get_log );
-            boost::function< void( const impl_::log&, const impl_::log&, const std::string&) > outputting( &output );
+            std::function< const impl_::log*() > extractor( &get_log );
+            std::function< void( const impl_::log&, const impl_::log&, const std::string&) > outputting( &output );
             impl_::process_begin_end< impl_::log >( extractor , outputting );
             
             return 0;
         }
         
     }
-    catch( std::exception& e ) {
-        std::cerr << name() << ": exception caught - " << e.what() << std::endl;
-    }
-    catch(...) {
-        std::cerr << name() << ": unknown exception caught, terminating." << std::endl;
-    }
+    catch( std::exception& e ) { comma::say() << "exception caught - " << e.what() << std::endl; }
+    catch(...) { comma::say() << "unknown exception" << std::endl; }
+    return 1;
 }
+
diff --git a/util/applications/comma-test-query b/util/applications/comma-test-query
new file mode 100755
index 000000000..41ce0aef2
--- /dev/null
+++ b/util/applications/comma-test-query
@@ -0,0 +1,86 @@
+#!/usr/bin/env python3
+
+# Copyright (c) 2024 Vsevolod Vlaskine
+
+import argparse, collections.abc, comma, json, os, sys
+
+def _find( what, dir, absolute=False ): # returns ( dir, sorted list of found paths ), the paths with the dir prefix stripped unless absolute is set
+    if dir == '-': raise Exception( 'comma-test-query: --dir="-": reading directories from stdin: todo, just ask' )
+    w = comma.filesystem.walk( dir, followlinks=True, followmounts=False )
+    f = comma.filesystem.find( what, w, find_children=True )
+    r = sorted( [ i[0] for i in f ] ) # keep only the first element of each find result
+    if not absolute: offset = len( dir ) + 1; r = [ p[offset:] for p in r ] # NOTE(review): assumes each path starts with dir plus exactly one separator; presumably breaks if dir ends with '/' - confirm
+    return dir, r
+
+def _list( args ): # 'list' sub-command: print paths found for args.what under args.dir, one per line
+    _, paths = _find( args.what if isinstance( args.what, list ) else [ args.what ], args.dir ) # accept both a single name and a list of names
+    for p in paths: print( f'{p}' )
+
+def _transpose( args ):
+    # 'transpose' sub-command: regroup json files found under args.dir by the value(s) of args.key in each file
+    #   --output=all: set (via comma.dictionary.set) the loaded file contents at <key>/<value>/<path>
+    #   --output=paths: set at <key>/<value> a dictionary with the list 'paths' of directories having that value
+    # files without <key> are skipped, or KeyError is raised if --strict is given
+    root, paths = _find( args.what, args.dir )
+    d = {}
+    for path in paths:
+        for w in args.what:
+            what = f'{root}/{path}/{w}'
+            if not os.path.isfile( what ): continue
+            with open( what ) as f: r = json.load( f )
+            if args.key not in r:
+                if args.strict: raise KeyError( f'{args.key} not found in {what}' )
+                continue
+            # the value under <key> may be a single value or a list of values: handle both uniformly
+            keys = r[args.key] if isinstance( r[args.key], list ) else [ r[args.key] ]
+            for k in keys:
+                if args.output == 'all':
+                    comma.dictionary.set( d, f'{args.key}/{k}/{path}', r ) # todo! quick and dirty, super-overfit!
+                elif args.output == 'paths':
+                    p = f'{args.key}/{k}/paths'
+                    # append to the list of paths already stored, if any, otherwise start a new list
+                    comma.dictionary.set( d, f'{args.key}/{k}', { 'paths': comma.dictionary.at( d, p ) + [ path ] if comma.dictionary.has( d, p ) else [ path ] } ) # todo! quick and dirty, super-overfit!
+    # keys are sorted on output
+    json.dump( d, sys.stdout, sort_keys=True, indent = None if args.minify else 4 )
+
+def _traverse( args ): # 'traverse' sub-command: load each <what> file found under args.dir as json and output all of them as one json
+    d = {}
+    root, paths = _find( args.what, args.dir )
+    if args.verbose: print( f'a: {root=}', file=sys.stderr ) # debug output: only on --verbose, to keep stderr clean otherwise
+    if args.verbose: print( f'b: {paths=}', file=sys.stderr )
+    for path in paths:
+        for w in args.what:
+            what = f'{root}/{path}/{w}'
+            if args.verbose: print( f'c: {what=}', file=sys.stderr )
+            if os.path.isfile( what ):
+                with open( what ) as f: comma.dictionary.set( d, path, json.load( f ) ) # todo: fix overfitting on loading files of various types
+    json.dump( d, sys.stdout, indent = None if args.minify else 4 )
+
+def make_args(): # build the command line parser with sub-commands list, transpose, traverse and return the parsed arguments
+    description = 'usage: todo'
+    epilog = 'examples: todo'
+    parser = argparse.ArgumentParser( description=description, epilog=epilog, formatter_class=argparse.RawDescriptionHelpFormatter )
+    parser.add_argument( 'what', type=str, help='what to look for, e.g. readme.json' )
+    parser.add_argument( '--dir', default='.', type=str, help='directory to traverse; default: current directory, "-": read paths from stdin (todo)' )
+    parser.add_argument( '--verbose', '-v', help='more human-readable output', action='store_true' )
+    subparsers = parser.add_subparsers( dest='command', required=True, help='sub-command help' ) # sub-command is mandatory: without it args.func is not set and main() would fail with AttributeError
+    list_parser = subparsers.add_parser( 'list', help='print subdirectories containing test or <what>, following symlinks, but skipping mounted drives (for now)' )
+    #list_parser.add_argument( '--absolute', help='output absolute path', action='store_true' )
+    list_parser.set_defaults( func=_list )
+    transpose_parser = subparsers.add_parser( 'transpose', help='transpose into the given primary key' )
+    transpose_parser.add_argument( 'key', type=str, help='field name vs which to transpose' )
+    transpose_parser.add_argument( '--minify', help='output one-line json', action='store_true' )
+    transpose_parser.add_argument( '--output', default='all', type=str, choices=['all', 'paths'], help='what to output' )
+    transpose_parser.add_argument( '--strict', help='fail if one of files does not have desired <key>', action='store_true' )
+    transpose_parser.set_defaults( func=_transpose )
+    traverse_parser = subparsers.add_parser( 'traverse', help='traverse subdirectories, following symlinks, find <what>, output combined json' )
+    traverse_parser.add_argument( '--minify', help='output one-line json', action='store_true' )
+    traverse_parser.set_defaults( func=_traverse )
+    return parser.parse_args()
+
+def main(): # parse the command line and run the handler of the selected sub-command
+    args = make_args()
+    args.what = args.what.split( ',' ) # <what> may be a comma-separated list of names
+    args.func( args ) # func is set through set_defaults() of the sub-command parsers
+
+if __name__ == '__main__': main()
diff --git a/util/applications/comma-test-run b/util/applications/comma-test-run
index 9aaa742e6..34e958dc0 100755
--- a/util/applications/comma-test-run
+++ b/util/applications/comma-test-run
@@ -1,33 +1,6 @@
 #!/bin/bash
 
-# This file is part of comma, a generic and flexible library
 # Copyright (c) 2011 The University of Sydney
-# All rights reserved.
-#
-# Redistribution and use in source and binary forms, with or without
-# modification, are permitted provided that the following conditions are met:
-# 1. Redistributions of source code must retain the above copyright
-#    notice, this list of conditions and the following disclaimer.
-# 2. Redistributions in binary form must reproduce the above copyright
-#    notice, this list of conditions and the following disclaimer in the
-#    documentation and/or other materials provided with the distribution.
-# 3. Neither the name of the University of Sydney nor the
-#    names of its contributors may be used to endorse or promote products
-#    derived from this software without specific prior written permission.
-#
-# NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-# GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-# HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-# WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-# MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-# BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-# WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-# OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-# IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 name=$( basename $0 )
 
@@ -85,12 +58,17 @@ function description_test_selection()
 --black-list=[<file>]; do not run these tests mentioned in <file>, e.g. a lists of sub-directories in white list
   to be excluded; see '--white-list' below for file format.
 --end=[<dir>]; run tests up to a given test, the latter excluded, where test directories are ordered lexicographically
+--followsymlinks,-L; follow symlinks when looking for test directories, same as find -L
+--followmounts; search mounted filesystems when looking for test directories, same as find without -mount
 --from,--begin=[<dir>]; run tests starting from a given test, where test directories are ordered lexicographically
 --run-disabled; run disabled tests
 --run-optional,--optional; run tests having file called "optional" (same logic as for --run-disabled)
 --stdin; read paths from stdin e.g. run test in hello/world: echo hello/world | comma-test-run --stdin
+--tags=[<tags>]; |-separated tags or regular expressions, run only tests with given tags (see below)
+--tags-excluded=[<tags>]; |-separated tags or regular expressions, do not run tests with given tags (see below)
+--tags-list; list tags for all subdirectories as <dir>,<tags>
 --to=[<dir>]; run tests up to a given test, the latter included, where test directories are ordered lexicographically
---until-first-failure; exit after the first failure (works only when tests run serially)
+--until-first-failure,--assert-status; exit after the first failure i.e. test script or command returning non-zero (works only when tests run serially)
 --white-list=[<file>]; only run these tests mentioned in the <file>, applied first before black list;
   comment lines starting with # are ignored; each entry in the list matches to a sub-directory or
   directories name using pattern ^<subdir>; see examples
@@ -109,7 +87,7 @@ function description_resources()
 --max-run-time=[<time>]; maximal time to wait for a test completion before failing it by force, default: ${max_run_time}
 --max-resources=[<file>]; specify limits for all resources in path-value format; see config files in verbose help;
   explicit options above have precedence
---parallel; run tests in parallel; default: run serially
+--parallel,-p; run tests in parallel; default: run serially
 EOF
 }
 
@@ -122,10 +100,12 @@ function description_others()
   'expected' file; pass multiple global files by invoking this option several times
 --debug; much more debug output
 --document,--doc; do not run tests, only output to stdout a collated test documentation in informal way, if --junit present, produce junit-like output (todo)
---junit=[<file>]; output to file junit record compatible with jenkins for each test
 --no-ansiterm-control-characters,--no-control-characters,--raw; unstyled output (no ANSIterm control characters)
 --output-directories,--dry-run,--dry; output list of test directories intended to run and exit
+--output-junit,--junit=[<file>]; output to file junit record compatible with jenkins for each test
+--output-stdout,--stdout; output test results to stdout as <dir>,<status>, <status>: success, failed, timeout, disabled
 --path=[<dir>]; data-storage directory for tests, default: none, let the tests define it
+--root-path,--root=[<dir>]; todo: do not ascend beyond this path while searching for specially-named files, e.g. 'test' or 'config'
 --test-option=[<option>]; extra command line argument(s) pass to "test" script
 
 --quiet,-q; minimize output
@@ -236,7 +216,7 @@ ${brown}Running tests in parallel${none}
         as are available on the system. This is ${red}not recommended${none} for resource-heavy tests
         unless additional configuration files are provided as explained below.
 
-${brown}Config files${none}
+${brown}config files${none}
     The way a test is run can be controlled using a file named ${brown}config${none} in the test directory,
     which may contain the following parameters:
 
@@ -262,6 +242,12 @@ ${brown}Config files${none}
     run/max_time=<seconds>
         Test will be terminated and fail if it has not completed in the specified time (seconds).
         Overrides option '--max-run-time'.
+    
+    tags=<tags>
+        <tags>: comma-separated list of tags applied to the current directory and subdirectories
+                that do not have their own config containing 'tags' entry or a file named 'tags'
+                containing comma-separated list of arbitrary key words (tags); tests can be filtered
+                by tags using --tags and/or --tags-excluded command line options
 
     Example config:
         resources/cpus=4
@@ -269,6 +255,11 @@ ${brown}Config files${none}
         resources/serial=\"true\"
         run/max_time=600
 
+${brown}tags files${none}
+    If a file named 'tags' is present in the current directory or in one of its parent directories,
+    this file is expected to contain a comma-separated list of arbitrary key words (tags); tests can be
+    filtered by tags using --tags and/or --tags-excluded command line options
+
 ${brown}White(and black)-listing tests${none}
     The test names in the white/black list file shall match ${brown}exactly${none} the corresponding
     names in '--dry-run' output, e.g.
@@ -281,6 +272,9 @@ ${brown}White(and black)-listing tests${none}
         comma-test-run --white-list=white.list
     Do not remove leading dots or append input file names or anything similar.
 
+    This can also be done with an on-the-fly generated file:
+        comma-test-run --black-list <( echo ./exclude-me )
+
 ${brown}White(and black)-listing pro hint${none}
     Assume some tests failed:
         comma-test-run > comma-test-run.log 2>&1 ; echo \$?
@@ -301,7 +295,7 @@ function error_()
         local bold=$( tput bold )
         local red=$( tput setaf 1 )
         local normal=$( tput sgr0 )
-        echo -e "$bold$red$*$normal" >&2
+        echo -e "${bold}${red}$*${normal}" >&2
     fi
 }
 export -f error_
@@ -309,10 +303,10 @@ export -f error_
 function error_and_junit_()
 {
     local -r error_and_junit_formatted=$( echo -e "$1" )
-    error_ $( head -1 <<< "$error_and_junit_formatted" )
+    error_ $( head -1 <<< "comma-test-run: $error_and_junit_formatted" )
     local -r error_and_junit_formatted_tail="$( tail -n +2 <<< "$error_and_junit_formatted" )"
     [[ -z "$error_and_junit_formatted_tail" ]] || cat >&2 <<< "$error_and_junit_formatted_tail"
-    if [[ -n "$options_junit" && -d 'output' ]] ; then cat >> 'output/junit.failure.log' <<< "$error_and_junit_formatted" ; fi
+    if [[ -n "$options_output_junit" && -d 'output' ]] ; then cat >> 'output/junit.failure.log' <<< "$error_and_junit_formatted" ; fi
 }
 export -f error_and_junit_
 
@@ -360,6 +354,7 @@ function disabled_()
         if [[ "$verbose" == "--verbose" ]]; then
             if [[ -s $dir/$filename ]] ; then warning_ "$name: test $counter: $dir: $filename:" ; cat $dir/$filename | sed 's/^/    /' >&2
             else error_ "$name: test $counter: $dir: $filename (with no explanation)" ; fi
+            (( !options_output_stdout )) || echo "$dir,disabled" # todo? put it in message_
         fi
         return 0
     fi
@@ -412,19 +407,15 @@ function closest_file_in_path()
 {
     local path="$1"
     local file="$2"
-    
-    # sanity check (and avoid infinite loop)
-    if [[ -z "$path" || -z "$file" ]]; then echo "$name: error: empty path in closest_file_in_path()" >&2; exit 1; fi
-    # get canonical name (so path always starts with "/")
-    path=$( readlink -e "$path" )
-
+    [[ -n "$path" && -n "$file" ]] || { echo "$name: error: empty path in closest_file_in_path()" >&2; exit 1; }
+    path=$( readlink -e "$path" ) # get canonical name (so path always starts with "/")
     while true; do
         if [[ -d "$path/$file" ]]; then
-            echo "$name: warning: \"$path/$file\" is a directory (expected an executable script); ignoring" >&2
+            echo "$name: warning: '$path/$file' is a directory (expected an executable script); ignoring" >&2
         elif [[ -f "$path/$file" ]]; then
-            if [[ $file == "test" && ! -x "$path/$file" ]]; then echo "$name: warning: \"$path/$file\" is not executable; ignoring" >&2 
-            else echo $path/$file; break; fi
-        elif [[ $path == "/" ]]; then break
+            if [[ $file == "test" && ! -x "$path/$file" ]]; then echo "$name: warning: '$path/$file' is not executable; ignoring" >&2 
+            else echo "$path/$file"; break; fi
+        elif [[ "$path" == "/" || -d "$path/.git" ]]; then break # super-quick and dirty: stop on .git directory, otherwise it leads to bizarre errors, e.g. when there is a file 'config' or 'test' outside of git repository 
         fi
         path=$( dirname "$path" )
     done
@@ -492,7 +483,7 @@ function stats_finalize()
 {
     [[ -f "$stats_progress_csv" ]] || return
     cat "$stats_progress_csv" | comma-progress --elapsed > "$stats_elapsed_path_value"
-    [[ -z "$options_junit" ]] || junit_finalize > "$options_junit"
+    [[ -z "$options_output_junit" ]] || junit_finalize > "$options_output_junit"
 }
 
 function resources_limits()
@@ -617,8 +608,8 @@ function run_and_match_test()
 
     local env_variables="PYTHONPATH,XDG_RUNTIME_DIR,DISPLAY"
     
-    rm -rf output || { error_and_junit_ "Unable to remove 'output' directory" ; return 1 ; }
-    mkdir -p output || { error_and_junit_ "Unable to make 'output' directory" ; return 1 ; }
+    rm -rf output || { error_and_junit_ "unable to remove 'output' directory" ; return 1 ; }
+    mkdir -p output || { error_and_junit_ "unable to make 'output' directory" ; return 1 ; }
 
     {
         if [[ -f ./input ]] ; then cat ./input ; fi | comma_env --import "$env_variables" "$test_exec" "$path" $verbose $options_test_option
@@ -637,7 +628,7 @@ function run_and_match_test()
         
         function junit_log_error() # quick and dirty; todo: move all junit stuff to one location
         {
-            [[ -n "$options_junit" ]] || return
+            [[ -n "$options_output_junit" ]] || return
             local dir=$1
             mkdir -p $dir
             touch $dir/junit.failure.log
@@ -658,7 +649,7 @@ function run_and_match_test()
                     (( options_verbose )) && message_ "$name: match expectations in '$extra'"
                     local extra_match_output=$( comma-test-match "$extra" < 'output/stdout.log' )
                     [[ $is_global ]] || junit_log_error output/$( sed 's#^\./expected/##' <<< "$extra" ) "$extra_match_output"
-                    [[ -z "$extra_match_output" ]] || match_output=$( [[ -n "$match_output" ]] && echo "$match_output"; echo "$extra_match_output" | sed "s#^#$extra:#" 2>&1 )
+                    [[ -z "$extra_match_output" ]] || match_output=$( [[ -n "$match_output" ]] && echo "$match_output"; echo "$extra_match_output" | sed "s#^#$extra:#" )
                 done
             fi
         }
@@ -670,9 +661,9 @@ function run_and_match_test()
         if [[ -n "$options_always_expected" ]] ; then
             for global_expected in $options_always_expected ; do match_expected "$global_expected" "is_global" ; done
         fi
-        echo -e '\n# After comma-test-match in comma-test-run' >> 'output/stdout.log'
+        echo -e '\n# after comma-test-match in comma-test-run' >> 'output/stdout.log'
         if [[ -n "$match_output" ]]; then
-            error_and_junit_ "Test output does not match expected:\nexpected output:\n$match_output"
+            error_and_junit_ "test output does not match expected:\nexpected output:\n$match_output"
             return 1
         fi
     }
@@ -808,11 +799,11 @@ function run_single_test()
     # say something so that the user is not guessing what is going on
     (
         flock -x 9
-        message_ "$name: test $counter: $dir: started..."
+        message_ "$name: test $counter: $dir: launching..."
     ) 9>>"$comma_test_run_output_flock"
 
     # do not touch this equilibristics with file descriptors
-    exec 3>&1 4>&2 1>"$our_stderrout_log" 2>&1
+    exec 3>&1 4>&2 1>"$our_stderrout_log" # exec 3>&1 4>&2 1>"$our_stderrout_log" 2>&1
 
     local test_exec basedir outcome
     local result=0
@@ -823,13 +814,11 @@ function run_single_test()
     elif disabled_ "optional" "$dir" "$options_run_optional" ; then
         warning_ "$name: test $counter: $dir: optional, skipped"
     else
-        test_exec=$( closest_file_in_path "$dir" "test" )
+        test_exec=$( closest_file_in_path "$dir" test )
         if [[ -z "$test_exec" ]]; then
             error_ "$name: error: no \"test\" script found in any parent directory of $dir"
             result=1
         else
-            message_ "$name: test $counter: $dir: running..."
-
             basedir=$( pwd )
 
             ## Comment out for now: the exact usage to be discussed, it is confusing and can be taken as a sign of error
@@ -845,6 +834,7 @@ function run_single_test()
                     report_end_of_wait
                     local error_files test_failed
                     find . -name out_of_shared_memory | xargs rm -f
+                    message_ "$name: test $counter: $dir: running..."
                     comma_progress_named "$our_stats_progress" "$dir" run_test_with_timeout
                     test_failed=$?
                     comma_locked "$comma_test_run_resources_flock" comma_release_resources "$request" "$comma_test_run_resources_counter" "$worker_id"
@@ -853,6 +843,7 @@ function run_single_test()
                         comma_locked "$comma_test_run_resources_flock" comma_release_resources "$request" "$comma_test_run_resources_counter" "$worker_id"
                         (( $? == 0 )) || {
                             error_ "$name: test $counter: $dir: repeated internal error on release_resources, terminate the test run PID '$comma_test_run_top_pid'"
+                            (( !options_output_stdout )) || echo "$dir,timeout" # todo? put it in message_; disambiguate timeout status
                             kill -TERM $comma_test_run_top_pid
                         }
                     }
@@ -864,10 +855,12 @@ function run_single_test()
                     }
                     [[ "$test_failed" == "0" ]] && {
                         message_ "$name: test $counter: $dir: succeeded"
+                        (( !options_output_stdout )) || echo "$dir,succeeded" # todo? put it in message_
                     } || {
                         result=1
                         error_ "$name: $dir: failed$( (( $test_failed == 124 )) && echo ' (likely timed out)' )"
-                        [[ -n "$options_junit" && $test_failed == 124 ]] && echo "likely timed out" >> "output/junit.failure.log"
+                        (( !options_output_stdout )) || echo "$dir,failed" # todo? put it in message_
+                        [[ -n "$options_output_junit" && $test_failed == 124 ]] && echo "likely timed out" >> "output/junit.failure.log"
                     }
                     break
                 else
@@ -876,6 +869,7 @@ function run_single_test()
                         [[ "$max_wait_time" != "forever" ]] && {
                             if gawk '{ a=$1 > $2; exit !a }' < <( echo $wait_time $max_wait_time ) ; then
                                 echo "$name: in '$dir', could not get requested resources for ${wait_time}s, failed to run" >&2
+                                (( !options_output_stdout )) || echo "$dir,timeout" # todo? put it in message_
                                 result=1
                                 break
                             fi
@@ -893,13 +887,14 @@ function run_single_test()
                             sleep 1  # do not count as waiting time, for simplicity
                             continue
                         else
-                            error_ "$name: terminate the test run with PID '$comma_test_run_top_pid'"
+                            error_ "$name: $dir: terminate the test run with PID '$comma_test_run_top_pid'"
                             kill -TERM $comma_test_run_top_pid
+                            (( !options_output_stdout )) || echo "$dir,timeout" # todo? put it in message_; disambiguate timeout status
                         fi
                     fi
                 fi
             done
-            [[ -n "$options_junit" && $result != 0 && ! -f "output/junit.failure.log" ]] && echo "internal error, see detailed log" >> "output/junit.failure.log"
+            [[ -n "$options_output_junit" && $result != 0 && ! -f "output/junit.failure.log" ]] && echo "internal error, see detailed log" >> "output/junit.failure.log"
             cd "$basedir"
         fi
     fi
@@ -1037,6 +1032,7 @@ comma_path_value_to_var --export --prefix=options < <( default_options )
 options_path_value="$( description | comma-options-to-name-value $@ )"
 comma_path_value_to_var --export --prefix=options <<<"$options_path_value"
 
+[[ -z "$options_root_path" ]] || { error_ "$name: --root-path: todo, just ask"; exit 1; }
 options_test_option=$( echo "$options_path_value" |  grep "^test-option=" | cut -d'=' -f2- | sed 's#^"##;s#"$##' | tr '\n' ' ' )
 
 # and perform sanity check
@@ -1056,9 +1052,9 @@ have_max_parallel=$(( have_max_parallel_equal > 0 || have_max_parallel_space > 0
 [[ "$options_parallel" != "0" && "$options_estimate_resources" == "1" ]] && { error_ "$name: resource estimation shall be serial"; exit 1; }
 if [[ "$options_debug" != "0" ]] ; then verbose="--verbose" ; fi
 (( options_verbose )) && verbose="--verbose"
-if [[ -n "$options_junit" ]] ; then
+if [[ -n "$options_output_junit" ]] ; then
     type -p recode >/dev/null || { error_ "$name: --junit given, but recode is not found; please install recode; e.g. run: sudo apt-get install recode"; exit 1; }
-    rm -f "$options_junit"
+    rm -f "$options_output_junit"
 fi
 [[ -n "$options_also_expected" ]] && {
     [[ -f "$options_also_expected" ]] || { error_ "$name: global expected file '$options_also_expected' not found"; exit 1; }
@@ -1086,20 +1082,59 @@ function apply_black_list() { if [[ -n "$options_black_list" ]] ; then grep -vE
 
 function apply_white_black_list() { apply_white_list | apply_black_list ; }
 
+function tags-get() # output tags for the current directory: 'tags' entry of the closest 'config' or content of the closest 'tags' file, whichever is closer
+{
+    local config tags dc dt tt tc
+    config=$( closest_file_in_path "." "config" )
+    tags=$( closest_file_in_path "." "tags" )
+    [[ -f "$tags" || -f "$config" ]] || return
+    if [[ -f "$config" ]]; then tc="$( name-value-get tags < "$config" )"; fi
+    if [[ -f "$tags" ]]; then tt="$( cat "$tags" | grep -v '^#' | grep -v '^$' )"; fi # comment and empty lines in 'tags' file are ignored
+    if [[ -n "$tc" && -n "$tt" ]]; then
+        dc="$( dirname "$config" )"
+        dt="$( dirname "$tags" )"
+        if (( ${#dc} > ${#dt} )); then echo "$tc"; else echo "$tt"; fi # both directories are on the path from '.' upwards, thus the longer one is closer; on a tie, 'tags' file wins
+    elif [[ -n "$tc" ]]; then echo "$tc"
+    elif [[ -n "$tt" ]]; then echo "$tt"
+    fi
+}
+export -f tags-get
+
+function tags-apply() # filter directories on stdin by --tags and --tags-excluded; todo! getting tags for each subdirectory is very slow; get tags for the root, then list all tags, then join matching/not-matching
+{
+    [[ -n "$options_tags" || -n "$options_tags_excluded" ]] || { cat; return; } # no tag options given: pass directories through unchanged
+    local d tags; while read -r d; do
+        tags="$( cd "$d" && tags-get | tr ',' '\n' )" # one tag per line
+        if [[ -n "$tags" ]]; then
+            if [[ -n "$options_tags_excluded" ]]; then if egrep --quiet -e "^($options_tags_excluded)\$" <<< "$tags"; then continue; fi; fi # match whole tags, same as for --tags below
+            csv-paste <( echo "$tags" ) value="$d"; else echo ",$d" # <tag>,<dir> for each tag; ,<dir> for untagged directories
+        fi
+    done \
+        | if [[ -n "$options_tags" ]]; then egrep -e "^($options_tags),"; else cat; fi \
+        | cut -d, -f2- | uniq # keep the whole directory name; output a directory once, even if it has several (matching) tags
+}
+
+function tags-list() # for each directory on stdin, output one line: <dir>,<tags>, where <tags> is a comma-separated list, empty if directory has no tags
+{
+    local d; while read -r d; do echo "$d,$( cd "$d" && tags-get | paste -s -d, - )"; done # paste joins multi-line tags into a single comma-separated record
+}
+
 # to run, search for directories containing either "test", "input" or "expected";
 # if "test" is absent, use the "test" in the closest parent directory
 function test_directories()
 {
-    if [[ -n "$options_white_list" && -f "$options_white_list" ]]; then
+    if [[ -n "$options_white_list" && -e "$options_white_list" && ! -d "$options_white_list" ]]; then
         message_ "$name: applying white list from file '$options_white_list'"
         options_white_list="^(\./)?($( sed 's#\./##' <$options_white_list | grep -v ^# | grep -v ^$ | tr \\n '|' | sed 's/|$//'  ))";
     fi
-    if [[ -n "$options_black_list" && -f "$options_black_list" ]]; then
+    if [[ -n "$options_black_list" && -e "$options_black_list" && ! -d "$options_black_list" ]]; then
         message_ "$name: applying black list from file '$options_black_list'"
         options_black_list="^(\./)?($( sed 's#\./##' <$options_black_list | grep -v ^# | grep -v ^$ | tr \\n '|' | sed 's/|$//' ))";
     fi
-
-    test_script_dirs_all=( $( exclude_generic_tests $( get_dirnames $( find . -name "test" -or -name "input" -or -name "expected" | grep -v "/\." ) 2>/dev/null | sort -u ) | apply_white_black_list ) )
+    local followsymlinks followmounts="-mount"
+    (( ! options_followsymlinks )) || followsymlinks="-L"
+    (( ! options_followmounts )) || followmounts=
+    test_script_dirs_all=( $( exclude_generic_tests $( get_dirnames $( find $followsymlinks . $followmounts -name "test" -or -name "input" -or -name "expected" | grep -v "/\." ) 2>/dev/null | sort -u ) | apply_white_black_list | tags-apply ) )
     [[ -n "$options_from" || -n "$options_to" || -n "$options_end" ]] || { echo ${test_script_dirs_all[@]} ; return ; }
     [[ -z "$options_from" ]] || { local from="${options_from#\.\/}" ; }
     [[ -z "$options_to" ]] || { local to="${options_to#\.\/}" ; }
@@ -1123,6 +1158,7 @@ else
     done
 fi
 [[ -z "$options_output_directories" ]] || { echo ${test_script_dirs[@]} | tr ' ' '\n' ; exit 0 ; }
+[[ -z "$options_tags_list" ]] || { echo ${test_script_dirs[@]} | tr ' ' '\n' | tags-list ; exit 0 ; }
 [[ -z "$options_document" ]] || { for d in ${test_script_dirs[@]} ; do document_test $d ; done ; exit 0 ; }
 export test_scripts_count=${#test_script_dirs[@]}
 
diff --git a/util/applications/comma-test-util b/util/applications/comma-test-util
index 3dd6d3272..69393582d 100644
--- a/util/applications/comma-test-util
+++ b/util/applications/comma-test-util
@@ -39,6 +39,114 @@ readonly comma_test_util_include_guard_=1
 
 source $( type -p comma-name-value-util )
 
+function _comma_test_util_unquote() # output python3 code that, for each line on stdin, strips whitespace and the enclosing double quotes
+{
+    cat <<eof
+import sys
+for v in sys.stdin.readlines():
+    v = v.strip()
+    assert v.startswith( '"' ), f'comma-string-unquote: expected string starting with double quote; got: {v}'
+    assert v.endswith( '"' ), f'comma-string-unquote: expected string ending with double quote; got: {v}'
+    print( v[1:-1] )
+eof
+}
+
+function _comma_test_util_strip()
+{
+    cat <<eof
+import sys
+for line in sys.stdin.readlines(): print( line.strip() )
+eof
+}
+
+function _comma_test_util_test_case_name()
+{
+     cat <<eof
+import sys
+import re
+for line in sys.stdin:
+    match = re.match(r'(?:\S+\s+)?([^\s=]+)/command$', line)
+    if match:
+        print(match.group(1))
+eof
+}
+
+function _comma_test_util_test_name_parse()
+{
+    cat <<eof
+import sys
+import re
+test_case_name = sys.argv[1]
+lines = sys.stdin.read().splitlines()
+for line in lines:
+    match = re.match(r'(?:(\S+)\s+)?(' + re.escape(test_case_name) + r')/(.+?)=(.*)', line)
+    if match:
+        predicate = match.group(1)
+        key = match.group(3)
+        val = match.group(4)
+        prefix = (predicate + ' ') if predicate else ''
+        print(f'{prefix}{key}={val}')
+eof
+}
+
+readonly _comma_test_util_strip_command="$( _comma_test_util_strip )"; export _comma_test_util_strip_command # exported, since comma-string-strip is exported and reads it
+readonly _comma_test_util_unquote_command="$( _comma_test_util_unquote )"; export _comma_test_util_unquote_command # exported, since comma-string-unquote is exported and reads it
+readonly _comma_test_util_test_case_name_command="$( _comma_test_util_test_case_name )"
+readonly _comma_test_util_test_name_parse_command="$( _comma_test_util_test_name_parse )"
+
+function comma-string-strip() { python3 -c "$_comma_test_util_strip_command"; } # todo: add comma-string-util, parametrise on strip characters
+
+export -f comma-string-strip
+
+function comma-string-unquote() { python3 -c "$_comma_test_util_unquote_command"; } # todo: add comma-string-util, parametrise on strip characters
+
+export -f comma-string-unquote
+
+function _comma_test_case_name() { python3 -c "$_comma_test_util_test_case_name_command"; } # todo: add comma-string-util, parametrise on strip characters
+
+function _comma_test_name_parse() { local name="$1"; python3 -c "$_comma_test_util_test_name_parse_command" "$name"; } # todo: add comma-string-util, parametrise on strip characters
+
+function _comma_test_command_impl() # usage: _comma_test_command_impl <key> <double-quoted command>; run command, output <key>/output..., return command status; uses 'fields' of the caller, if set
+{
+    local key="$1" value="$2" output status # output and status are local, so that they do not leak into the caller
+    key=$( comma-string-strip <<< "$key" )
+    value=$( comma-string-unquote <<< "$value" )
+    output=$( eval "$value" )
+    status=$? # eval and bash -c both returns one error code, PIPESTATUS has only one value
+    if (( $( wc -l <<< "$output" ) > 1 )); then # a separate case for backward compatibility
+        local count=0 line
+        while read line; do
+            if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output/line[$count]" <<< "$line" # todo? escape quote? ${line//\"/\\\"}, otherwise they get removed by bash
+            else echo "$key/output/line[$count]=\"$line\""; fi
+            (( ++count ))
+        done <<< "$output"
+    else
+        if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output" <<< "$output" # todo? escape quotes, otherwise they get removed by bash
+        else echo "$key/output=\"$output\""; fi
+    fi
+    return $status
+}
+
+export -f _comma_test_command_impl
+
+function _comma_test_commands_impl() # usage: _comma_test_commands_impl <until_first_failure> [<fields>]; run commands given on stdin as [<predicate>] <test_name>=<command>
+{
+    local lhs key value status output until_first_failure=$1 fields=$2 predicate
+    while IFS='=' read lhs value ; do
+        [[ -n "$lhs" && ! "$lhs" =~ \#.* ]] || continue # skip lines with empty left-hand side or with '#' anywhere in it
+        local a=( $lhs )
+        if (( ${#a[@]} == 1 )); then predicate=; key=${a[0]}
+        elif (( ${#a[@]} == 2 )); then predicate=${a[0]}; key=${a[1]}
+        else echo "$0: expected [<predicate>] <test_name>=<command>, got: '$lhs=$value'" >&2; return 1; fi
+        _comma_test_command_impl "$key" "$value"
+        status=$?
+        echo "$key/status=$status"
+        (( status != 0 )) || continue # command succeeded: go to the next one
+        if (( until_first_failure )); then return 1; fi # do not run the remaining commands after a failure
+        if [[ "$predicate" == 'assert' ]]; then return 1; fi # failed command marked with 'assert': do not run the remaining commands
+    done < <( grep '=' ; grep -v '^#' ) # NOTE(review): the second grep starts only after the first one has read stdin to the end, so it presumably outputs nothing - confirm
+}
+
 # a helper to write tests in the comma-test-run style
 #
 # take line by line on stdin: <test name>="<command>"
@@ -55,7 +163,6 @@ source $( type -p comma-name-value-util )
 #
 # if output fields are specified then the output will be split by field
 #
-#
 # e.g:
 # 
 # source $( type -p comma-test-util )
@@ -68,35 +175,27 @@ source $( type -p comma-name-value-util )
 # my_basic_test[1]/for/something/output/b="4"
 # my_basic_test[1]/for/something/output=0
 #
-function comma_test_commands()
-{
-    local key
-    local value
-    local status
-    local output
-    local fields=$1
-    while IFS='=' read key value ; do
-        [[ -n "$key" && ! "$key" =~ \#.* ]] || continue
-        value="${value/#\"}"
-        value="${value/%\"}"
-        output=$( eval "$value" )
-        status=$?       # eval and bash -c both returns one error code, PIPESTATUS has only one value
-        if (( $( wc -l <<< "$output" ) > 1 )); then # a separate case for backward compatibility
-            local count=0
-            while read line; do
-                if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output/line[$count]" <<< "$line" # todo? escape quote? ${line//\"/\\\"}, otherwise they get removed by bash
-                else echo "$key/output/line[$count]=\"$line\""; fi
-                (( ++count ))
-            done <<< "$output"
-        else
-            if [[ -n "$fields" ]]; then name-value-from-csv "$fields" --prefix "$key/output" <<< "$output" # todo? escape quotes, otherwise they get removed by bash
-            else echo "$key/output=\"$output\""; fi
-        fi
-        echo "$key/status=$status"
-    done < <( grep '=' ; grep -v '^#' )
-}
+# 'assert' keyword: if present, do not run the remaining tests in the input file
+#
+# e.g, in the following example, the second test case my/test[1] does NOT run because
+#      the first failing test case my/test[0] has 'assert' in front of it
+#
+# source $( type -p comma-test-util )
+# ( echo 'assert my/test[0]="ls non-existent"'; echo 'my/test[1]="ls ."' ) | comma_test_commands
+# ls: cannot access 'non-existent': No such file or directory
+# my/test[0]/output=""
+# my/test[0]/status=2
 
-# run interactive test, something like
+function comma_test_commands() { _comma_test_commands_impl 0 "$@" ; }
+function comma_test_commands_until_first_failure() { _comma_test_commands_impl 1 "$@" ; }
+
+# run interactive test
+#
+# usage: comma_test_interactive_commands [<until_first_failure>]
+#        <until_first_failure>: 0 (i.e. false) or 1 (i.e. true); default: 0
+#
+# it works as something like
+#
 # > cat input
 # 
 # default/instruction=
@@ -114,50 +213,100 @@ function comma_test_commands()
 #
 # comma_test_interactive_commands
 #
+# if a test case has neither instruction nor expected, it is deemed non-interactive
+#
 # see for an example: e.g. snark/graphics/applications/test/view-points/colour/scalar/options
+#
+# 'assert' keyword: if present, do not run the remaining tests in the input file
+# predicates (like assert) are individually associated with command | instruction | expected
+#
+# in the following example, my/test[1] will NOT run if
+#   - command returns non-zero status (assert command)
+#   - zenity prompt returns non-zero status (assert expected)
+# there is currently no implementation for assert instruction
+# 
+# > cat input
+# 
+# assert my/test[0]/command=<command>
+# my/test[0]/instruction=<instruction>
+# assert my/test[0]/expected=<expected>
+# my/test[1]/command=<command>
 function comma_test_interactive_commands()
 {
-    (
+    local until_first_failure=${1:-0} # optional argument: 0 (false, default) or 1 (true), as documented in the usage
+    if [[ "$until_first_failure" == "0" ]]; then until_first_failure=0; else until_first_failure=1; fi # explicit 0 now means false; any other non-empty value means true, as before
+    (   
         function comma_test_interactive_test_case()
-        {
-            local name=$1
-            local command instruction expected dialog
-            eval $( comma_path_value_mangle | sed 's/^/local /' )
-            [[ -n "$command" ]] || { echo "$name/command not specified" >&2 ; echo "$name/status=1"; return 1 ; }
-            eval "$command" &
-            local eval_pid=$!
-            [[ $instruction ]] && dialog="$name: $instruction\n\n"
-            dialog+="do you see $expected?"
-            zenity --question --text="$dialog"
-            result=$?
+        {   
+            local name="$1" testcase_number=$2 number_of_testcases=$3
+            declare -A interactive_test
+            local lhs value dialog zenity_pid command_result zenity_result result
+            while IFS='=' read lhs value; do
+                local a predicate key
+                a=( $lhs )
+                if (( ${#a[@]} == 1 )); then predicate=""; key=${a[0]};
+                elif (( ${#a[@]} == 2 )); then predicate=${a[0]}; key=${a[1]};
+                else echo "$0: expected [<predicate>] <key>=<value>, got: '$lhs=$value'" >&2; return 1; fi
+                key=$( comma-string-strip <<< "$key" )
+                case "$key" in
+                    command|instruction|expected)
+                        if [[ "$key" == "instruction" || "$key" == "expected" ]]; then value=$(echo "$value" | sed -E "s/^(['\"])(.*)\1$/\2/"); fi
+                        interactive_test["$key"]="$value"
+                        interactive_test["${key}_predicate"]="$predicate"
+                        ;;
+                    *)
+                        echo "$0: test '$name': expected 'command', 'instruction', or 'expected', got: '$key'" >&2; 
+                        return 2
+                        ;;
+                esac
+            done
+
+            [[ -n "${interactive_test[command]}" ]] || { echo "$0: $name/command not specified" >&2; return 3; }
+            if [[ -n "${interactive_test[instruction]}" || -n "${interactive_test[expected]}" ]]; then
+                [[ -z "${interactive_test[instruction]}" ]] || dialog+="${interactive_test[instruction]}\n\n"
+                if [[ -n "${interactive_test[expected]}" ]]; then dialog+="do you see: ${interactive_test[expected]}?"; else dialog+="does it look good?"; fi
+                zenity --question --title="testcase $testcase_number of $number_of_testcases: $name" --text="$dialog" --width=600 &
+                zenity_pid=$!
+            fi
+
+            _comma_test_command_impl "$name" "${interactive_test[command]}"
+            command_result=$?
+            if [[ -n "$zenity_pid" ]]; then
+                wait $zenity_pid
+                zenity_result=$?
+                result=$(( command_result != 0 || zenity_result != 0 ? 1 : 0 ))
+            else
+                result=$command_result
+            fi
             echo "$name/status=$result"
-            kill $( pgrep -P $eval_pid )
-            wait $eval_pid
-            return $result
+            
+            (( result != 0 )) || return $result
+            if (( until_first_failure )); then return 4; fi
+            if [[ "${interactive_test[command_predicate]}" == "assert" ]]; then
+                (( command_result != 0 )) && return 5
+            fi
+            [[ -n "$zenity_result" ]] || return 0
+            if [[ "${interactive_test[expected_predicate]}" == "assert" ]]; then
+                (( zenity_result != 0 )) && return 6
+            fi
+            return 0
         }
 
-        local test_case
-        local test_name
-        local path
-        while read line ; do
-            [[ "$line" =~ ^# ]] && continue
-            local p=$( cut -d= -f1 <<< "$line" )
-            [[ -n "$p" ]] || continue
-            local n=$( dirname $p )
-            if [[ "$n" != "$test_name" ]] ; then
-                [[ -z "$test_name" ]] || comma_test_interactive_test_case $test_name <<< "$test_case"
-                test_name=$n
-                test_case=
-            fi
-            n=${n//[/\\[}
-            n=${n//]/\\]}
-            test_case=$( echo "$test_case" ; sed "s#^$n/##" <<< "$line" )
-        done
-        if [[ -n "$test_case" ]] ; then comma_test_interactive_test_case $test_name <<< "$test_case" ; fi
-        return $?
+        local lines=$( cat ); # read the whole input upfront, since it is scanned once for test case names and then once per test case
+        local test_cases=$( cut -d= -f1 <<< "$lines" | grep -v '^#' | comma-string-strip | grep '/command$' | egrep '^[a-zA-Z0-9_]' | _comma_test_case_name )
+        [[ -n "$test_cases" ]] || return 0 # no test cases on input: nothing to run; otherwise the here-string below would yield one test case with empty name
+        local number_of_testcases=$( wc -l <<< "$test_cases" ) testcase_number=1 test_case_name # testcase_number is 1-based: it is shown to the user as 'testcase <number> of <total>'
+        while read test_case_name; do
+            local test_case=$(_comma_test_name_parse "$test_case_name" <<< "$lines")
+            comma_test_interactive_test_case "$test_case_name" $testcase_number $number_of_testcases <<< "$test_case"
+            local r=$?
+            (( r == 0 )) || return $r; # non-zero means: do not run the remaining test cases
+            (( ++testcase_number ))
+        done <<< "$test_cases"
     )
 }
 
+function comma_test_interactive_commands_until_first_failure() { comma_test_interactive_commands 1; }
 
 # the tmp directory cleanup for comma_test_run_tarball
 function comma_test_run_tarball_cleanup()
diff --git a/util/applications/comma-timeout-group.cpp b/util/applications/comma-timeout-group.cpp
index 47fcf3d42..104f791c9 100644
--- a/util/applications/comma-timeout-group.cpp
+++ b/util/applications/comma-timeout-group.cpp
@@ -1,32 +1,4 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
 
 /// @author dmitry mikhin
 
@@ -47,7 +19,6 @@
 #include <boost/lexical_cast.hpp>
 #include <boost/assign/list_of.hpp>
 
-#include "../../application/contact_info.h"
 #include "../../application/command_line_options.h"
 #include "../../base/exception.h"
 #include "../../base/types.h"
@@ -57,68 +28,99 @@ namespace {
 void usage( bool )
 {
     static char const * const msg_general =
-        "\nRun a given command with its arguments. Kill the command if it is still running after the given"
-        "\ntime duration."
+        "\nRun a given command with its arguments. Kill the command if it is still running"
+        "\nafter the given time duration."
         "\n"
-        "\nUsage:"
-        "\n    comma-timeout-group <options> duration command <args>"
+        "\nUsage: comma-timeout-group <options> duration command <args>"
         "\n"
-        "\nA drop-in replacement of the standard timeout(1) utility for most common usage patterns."
-        "\nThe capability to wait for all processes in a process group added."
+        "\nA drop-in replacement of the standard timeout(1) utility for most common usage"
+        "\npatterns. The capability to wait for all processes in a process group added."
 #ifndef HAVE_PROCPS_DEV
-        "\nWARNING: this new capability is not available in this build. Install procps (or procps-ng)"
-        "\ndevelopment package (containing headers and library) and recompile comma-timeout-group."
+        "\n"
+        "\nWARNING: this new capability is not available in this build. Install procps"
+        "\n(or procps-ng) development package (containing headers and library) and"
+        "\nrecompile comma-timeout-group."
 #endif
-        "\nSome options of timeout (1) are not supported, and, if given, this utility exits in error."
+        "\n"
+        "\nSome options of timeout(1) are not supported, and, if given, this utility exits"
+        "\nin error."
         "\n"
         "\nOptions:"
-        "\n    -h,--help, print this help and exit"
-        "\n    -v,--verbose, chat more"
-        "\n    --report-timeout, run silently but print a message if a command times out"
-        "\n    --verbose-signal-handler, print messages on stderr when sending signals within signal handler;"
-        "\n        WARNING: generally output routines are not re-entrant and shall not be invoked in signal"
-        "\n        handlers; use for debugging but not in production code"
-        "\n    --preserve-status, exit with the same status as <command>, even when the command timed out"
-        "\n    --foreground, not supported"
-        "\n    -k, --kill-after=duration, if the command is still running this long after the initial"
-        "\n        signal was sent, send the KILL signal to finish it off"
-        "\n    --wait-for-process-group=duration, after the initial signal, wait this time for all the processes"
-        "\n        in the current process group to finish; if some processes are still left, send the KILL signal"
-        "\n        to finish them off (same as -k duration); if both this option and '-k' is given, the duration"
-        "\n        specified by '-k' takes precedence"
+        "\n    -h,--help:                 print this help and exit"
+        "\n    -v,--verbose:              chat more"
+        "\n    --report-timeout:          run silently but print a message if a command"
+        "\n                               times out"
+        "\n    --verbose-signal-handler:  print messages on stderr when sending signals"
+        "\n                               within signal handler"
+        "\n"
+        "\n               WARNING: generally output routines are not re-entrant and should"
+        "\n               not be invoked in signal handlers; use for debugging but not in"
+        "\n               production code"
+        "\n"
+        "\n    --preserve-status:         exit with the same status as <command>, even when"
+        "\n                               the command timed out"
+        "\n    --foreground:              not supported"
+        "\n    -k, --kill-after=duration: if the command is still running this long after"
+        "\n                               the initial signal was sent, send the KILL"
+        "\n                               signal to finish it off"
+        "\n    --wait-for-process-group=<duration>:"
+        "\n                               after the initial signal, wait this time for all"
+        "\n                               the processes in the current process group to"
+        "\n                               finish; if some processes are still left send"
+        "\n                               the KILL signal to finish them off (same as -k"
+        "\n                               duration); if both this option and -k are given,"
+        "\n                               the duration specified by -k takes precedence"
 #ifndef HAVE_PROCPS_DEV
-        "\n        WARNING: your version of comma-timeout-group is built without procps support, the capability to"
-        "\n        wait for process group is not available, and this options is a synonym to '-k'"
+        "\n"
+        "\n               WARNING: your version of comma-timeout-group is built without"
+        "\n               procps support, the capability to wait for process group is not"
+        "\n               available, and this option is a synonym for -k"
+        "\n"
 #endif
-        "\n    --enforce-group, enforce waiting for process groups; if comma-timeout-group is built without procps"
-        "\n        support, '--wait-for-process-group' would exit in error rather then become a synonym to '-k';"
-        "\n        this option does nothing if procps support is built in"
-        "\n    --wait-for-process-group-delay=value, when waiting for all processes in the group to finish, a delay"
-        "\n        is inserted between each parsing of the process tree; the value in microseconds is passed to"
-        "\n        usleep (2), default is 100000 (0.1 s); note that low delay values make the program more"
-        "\n        responsive at the cost of higher CPU load when parsing the process tree"
+        "\n    --enforce-group:           enforce waiting for process groups; if"
+        "\n                               comma-timeout-group is built without procps"
+        "\n                               support, --wait-for-process-group would exit in"
+        "\n                               error rather than become a synonym to -k; this"
+        "\n                               option does nothing if procps support is built in"
+        "\n    --wait-for-process-group-delay=<value>:"
+        "\n                               when waiting for all processes in the group to"
+        "\n                               finish, a delay is inserted between each parsing"
+        "\n                               of the process tree; the value in microseconds is"
+        "\n                               passed to usleep(2), default is 100000 (0.1s);"
+        "\n                               note that low delay values make the program more"
+        "\n                               responsive at the cost of higher CPU load when"
+        "\n                               parsing the process tree"
 #ifndef HAVE_PROCPS_DEV
-        "\n        WARNING: your version of comma-timeout-group is built without procps support, this option"
-        "\n        has no effect"
+        "\n"
+        "\n               WARNING: your version of comma-timeout-group is built without"
+        "\n               procps support, this option has no effect"
+        "\n"
 #endif
-        "\n    -s, --signal=signal, the signal to be sent on timeout, given as a name (HUP, SIGHUP) or number;"
-        "\n        only a sub-set of all available signal names is supported, use '--list-known-signals' to list;"
-        "\n        arbitrary signal to use can be specified as a number, see 'kill -l' for the values;"
-        "\n        by default, use SIGTERM"
-        "\n    --list-known-signals, list the supported signals, one per line, and exit"
-        "\n    --can-wait-for-process-group, if built with procps library and can wait for process groups, exit"
-        "\n        with status success, otherwise, exit with failure"
+        "\n    -s, --signal=<signal>:     the signal to be sent on timeout, given as a name"
+        "\n                               (HUP, SIGHUP) or number; only a sub-set of all"
+        "\n                               available signal names is supported, use"
+        "\n                               --list-known-signals to list; arbitrary signal"
+        "\n                               to use can be specified as a number, see"
+        "\n                               'kill -l' for the values; by default, use SIGTERM"
+        "\n    --list-known-signals:      list the supported signals and exit"
+        "\n    --can-wait-for-process-group:"
+        "\n                               if built with procps library and can wait for"
+        "\n                               process groups, exit with status success,"
+        "\n                               otherwise, exit with failure"
         "\n"
-        "\nAll the timeout durations are specified as floating point numbers with optional suffixes 's' for seconds,"
-        "\n(default), 'm' for minutes, 'h' for hours, and 'd' for days. The '--wait-for-process-group' option also"
-        "\n accepts special duration 'forever' (equal to max double) given as a literal string (no quotes). If both"
-        "\n'--kill-after and --wait-for-process-group' durations are specified, the former takes precedence."
+        "\n    All the timeout durations are specified as floating point numbers with"
+        "\n    optional suffixes 's' for seconds (default), 'm' for minutes, 'h' for hours,"
+        "\n    and 'd' for days. The --wait-for-process-group option also accepts special"
+        "\n    duration 'forever' (equal to max double) as a literal string (no quotes)."
+        "\n"
+        "\n    If both --kill-after and --wait-for-process-group durations are specified,"
+        "\n    the former takes precedence."
         "\n"
         "\nReturn value:"
-        "\n    - if the command times out, exit with status 124"
-        "\n    - if the command does not exit on the first signal, and the KILL signal is sent, exit with"
-        "\n      status 128+9"
-        "\n    - otherwise, exit with the status of command"
+        "\n    * if the command times out, exit with status 124"
+        "\n    * if the command does not exit on the first signal, and the KILL signal is"
+        "\n      sent, exit with status 128+9"
+        "\n    * otherwise, exit with the status of command"
         "\n"
         "\nExamples:"
         "\n    Run an application:"
@@ -131,44 +133,46 @@ void usage( bool )
         "\n"
         "\n    Run an application, send KILL signal in 5 seconds if does not die:"
         "\n        comma-timeout-group -k 5 10 sleep 3"
-        "\n            if the application does not exit within 5 s in response to the first signal (TERM,"
-        "\n            default), send KILL signal"
+        "\n            if the application does not exit within 5 s in response to the first"
+        "\n            signal (TERM, default), send KILL signal"
         "\n"
         "\n    Pass custom signal:"
         "\n        comma-timeout-group --signal=USR1 10 sleep 3"
-        "\n            send USR1 after 10 s timeout"
-        "\n            send the bash process the USR1 signal if it is still running in 10 s after start"
-        "\n            send the entire process group the KILL signal if it is still running after another 5 s"
+        "\n            * send USR1 after 10s timeout"
+        "\n            * send the bash process the USR1 signal if it is still running 10s"
+        "\n              after start"
+        "\n            * send the entire process group the KILL signal if it is still"
+        "\n              running after another 5s"
         "\n"
         "\n    Wait for all processes in the group:"
-        "\n        comma-timeout-group --wait-for-process-group=5 10 application"
-        "\n            or"
-        "\n        comma-timeout-group --wait-for-process-group=5 10 application"
-        "\n            wait for 5 s for all processes in the group to exit; if some are left, send KILL"
-        "\n            if your version is built without procps support, however, the call above"
-        "\n"
-        "\n";
-    std::cerr << msg_general << comma::contact_info << std::endl << std::endl;
+        "\n        comma-timeout-group --wait-for-process-group=5 10 cmd"
+        "\n            wait for 5 s for all processes in the group to exit; if some are"
+        "\n            left, send KILL"
+        "\n        -or-"
+        "\n        comma-timeout-group --wait-for-process-group=5 --enforce-group 10 cmd"
+        "\n            as above, but if comma-timeout-group is built without procps support"
+        "\n            exit with error";
+    std::cerr << msg_general << std::endl;
     exit( 0 );
 }
 
 // many values are used in the signal handler, no way to pass via arguments, hence, global
 // the rest just moved here to keep all in one place
-sig_atomic_t timed_out = 0;
-int signal_to_use = SIGTERM;  // same default as kill and timeout commands
-int child_pid = 0;
-bool verbose = false;
-bool verbose_signal_handler = false;
-bool report_timeout = false;
-bool preserve_status = false;
-double timeout = 0.0;
-double kill_after = 0.0;
+static sig_atomic_t timed_out = 0;
+static int signal_to_use = SIGTERM;  // same default as kill and timeout commands
+static int child_pid = 0;
+static bool verbose = false;
+static bool verbose_signal_handler = false;
+static bool report_timeout = false;
+static bool preserve_status = false;
+static double timeout = 0.0;
+static double kill_after = 0.0;
 #ifdef HAVE_PROCPS_DEV
-bool wait_for_process_group = false;
-const bool can_wait_for_process_group = true;
-unsigned int wait_for_process_group_delay = 100000;
+static bool wait_for_process_group = false;
+static const bool can_wait_for_process_group = true;
+static unsigned int wait_for_process_group_delay = 100000;
 #else
-const bool can_wait_for_process_group = false;
+static const bool can_wait_for_process_group = false;
 #endif
 
 double seconds_from_string( const std::string& s, bool allow_forever = false )
@@ -272,9 +276,10 @@ int parse_process_tree( bool verbose = false )
     int count = 0;
     while ( readproc( proc, &proc_info ) != NULL ) {
         if ( proc_info.pgrp == ownpid ) {
-            if ( first && verbose ) { std::cerr << "extant processes in group " << ownpid << std::endl; first = 0; }
-            ++count;
-            if ( verbose ) { std::cerr << "    " << proc_info.cmd << ":\t" << proc_info.tid << "\t" << proc_info.pgrp << "\t" << proc_info.state << "\t" << proc_info.start_time << std::endl; }
+            if ( first && verbose ) { comma::say() << "extant processes in group " << ownpid << std::endl; first = 0; }
+            if( proc_info.state == 'Z' ) { comma::say() << "    " << proc_info.cmd << " (pid " << proc_info.tid << ") is a zombie process - ignoring" << std::endl; }
+            else { ++count; }
+            if ( verbose ) { comma::say() << "    " << proc_info.cmd << ":\t" << proc_info.tid << "\t" << proc_info.pgrp << "\t" << proc_info.state << "\t" << proc_info.start_time << std::endl; }
         }
     }
     closeproc(proc);
diff --git a/util/applications/comma-top b/util/applications/comma-top
index 55cf66aef..bf55b082d 100755
--- a/util/applications/comma-top
+++ b/util/applications/comma-top
@@ -29,62 +29,50 @@
 # OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 # IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-name=$( basename $0 )
+source $( type -p comma-application-util ) 2>/dev/null || { echo "comma-top: could not source 'comma-application-util'" >&2; exit 1; }
 
-source $( which comma-application-util ) 2>/dev/null || { echo "$name: could not source 'comma-application-util'" >&2; exit 1; }
-
-function description()
+function prologue()
 {
-    cat <<EOF
---help,-h; show this help
---accumulated; if present for --io, passed to iotop
---debug; much more debug output
---io; if present, run iotop instead of top
---output-fields; output the field names to stdout and exit
---num-procs=[<N>]; output the top N processes (default: totals)
---num-samples=[<N>]; number of samples to take, default: forever, until terminated
---sampling-interval,--delay=[<time>]; sampling interval, see '-d' option of top (1), default: defined by top (1)
---top-options=[<options>]; extra command line argument(s) pass to the top (1) utility
-EOF
-}
-
-function usage()
-{
-    cat >&2 <<EOF
+    cat <<eof
 Invokes the performance monitoring utility top (1) or iotop in continuous mode, parses
-top (1) output, and collects the results into CVS file (sent to stdout).
+top (1) output, and collects the results into a CSV file (sent to stdout).
 
-Usage: ${name} <options> [ > output_file.csv ]
-
 Note: top (1) output is affected by its global and user configuration files.
 There is no option to ignore those files. This utility assumes the default format
 of top (1) output and will fail if alternative output layout is enforced through
 the configuration file(s). It shall be possible to explicitly mandate the desired
 output layout through command-line switches to top that override configuration
 files. This is a possible future extension.
+eof
+}
 
-Options:
-EOF
-    description | sed 's/^/    /g' >&2
-    cat >&2 <<EOF
-
-Examples:
-
-    Collect data until terminated by the user:
-
-        $name > results.csv
-
-    Take 1000 samples and quit (default sampling interval of top (1) is 3s; thus,
+function epilogue()
+{ # prints the 'examples' section of the help text on stdout
+    cat << eof
+examples
+    collect data until terminated by the user:
+        comma-top > results.csv
+    take 1000 samples and quit (default sampling interval of top (1) is 3s; thus,
     collect 3000s of data):
+        comma-top --num-samples=1000 > results.csv
+    facilitate parsing comma-top output:
+        comma-top --output-fields
+eof
+}
 
-        $name --num-samples=1000 > results.csv
-
-    Facilitate parsing $name output:
-
-        $name --output-fields
-
-EOF
-    exit 0
+function options-description()
+{
+    cat <<eof
+--help,-h; show this help
+--accumulated; if present for --io, passed to iotop
+--debug; much more debug output
+--io; if present, run iotop instead of top
+--num-procs,--number-of-processes,--processes=[<N>]; output the top N processes (default: totals)
+--num-samples,--number-of-samples,--samples=[<N>]; number of samples to take, default: forever, until terminated
+--output-fields; output the field names to stdout and exit
+--sampling-interval,--delay=[<time>]; sampling interval, see '-d' option of top (1), default: defined by top (1)
+--top-options=[<options>]; extra command line argument(s) pass to the top (1) utility
+eof
 }
 
 function feeder()
@@ -93,9 +81,7 @@ function feeder()
     local extra_opts=$2
     local top_opts="-b $extra_opts"
     [[ -n "$num" ]] && top_opts="$top_opts -n $num"
-    
-    # make all buffering per-line
-    stdbuf -oL -eL top $top_opts 
+    stdbuf -oL -eL top $top_opts # make all buffering per-line
 }
 
 function extract_cpus()
@@ -120,9 +106,8 @@ function extract_mem()
 function parser_totals()
 {
     shopt -s extglob
-    local timestamp line first shared
-    first="true"
+    local timestamp line first="true" shared
     grep --line-buffered -A 4 '^top' \
     | while true ; do
         read line
         [[ -z "$line" ]] && break
@@ -131,38 +116,38 @@ function parser_totals()
             first="false"
         }
         [[ "$line" = "%Cpu(s)"* ]]  && extract_cpus "$line"
-        [[ "$line" = "KiB Mem"* ]]  && { extract_mem  "$line" ; echo -n ",$shared" ; }
-        # swap is last, finish the line
-        [[ "$line" = "KiB Swap"* ]] && { extract_mem  "$line" ; echo ; }
+        [[ "$line" = [KMG]"iB Mem"* ]]  && { extract_mem  "$line" ; echo -n ",$shared" ; } # unit prefix may be KiB, MiB or GiB
+        [[ "$line" = [KMG]"iB Swap"* ]] && { extract_mem  "$line" ; echo ; } # swap is last, finish the line
         [[ "$line" = "--" ]] && first="true"
     done \
     | sed -u -n '1!p'
 }
 
 function parser_num_procs()
 {
-    grep --line-buffered -E -A $((num_procs + 1)) '^[ ]+PID ' \
-    | sed -r -u -n 's/[[:blank:]]+/,/g ; s/^,// ; /^[0-9]+,/p'
+    grep --line-buffered -E -A $((options_num_procs + 1)) '^[ ]+PID ' \
+        | sed -r -u -n 's/[[:blank:]]+/,/g ; s/^,// ; /^[0-9]+,/p'
 }
 
 io_payload_fields="total/read,total/write,actual/read,actual/write"
 io_fields="timestamp,$io_payload_fields"
-total_fields="timestamp,cpu/user,cpu/system,cpu/total,memory/ram,memory/shared,memory/swap"
+all_fields="timestamp,cpu/user,cpu/system,cpu/total,memory/ram,memory/shared,memory/swap"
 procs_fields="timestamp,pid,user,priority,nice,memory/virtual,memory/physical,memory/shared,status,cpu/percent,memory/percent,uptime,command"
 
-function output_fields()
+function maybe_output_fields()
 {
-    if (( $( comma_options_has --io $@ ) )) ; then echo $io_fields
-    elif (( $(comma_options_has --num-procs $@ ) )); then echo $procs_fields
-    else echo "$total_fields" ; fi
+    (( options_output_fields )) || return
+    if (( options_io )) ; then echo $io_fields; exit; fi
+    if (( options_num_procs )); then echo $procs_fields; exit; fi
+    echo "$all_fields"; exit
 }
 
 function run_iotop()
 {
     local total actual
-    [[ -z "$sampling_interval" ]] || delay="--delay=$sampling_interval"
-    [[ -z "$accumulated" ]] || accumulated="--accumulated"
-    sudo iotop --batch --kilobytes -o $delay $accumulated $top_options \
+    [[ -z "$options_sampling_interval" ]] || delay="--delay=$options_sampling_interval"
+    [[ -z "$options_accumulated" ]] || options_accumulated="--accumulated"
+    sudo iotop --batch --kilobytes -o $delay $options_accumulated $options_top_options \
         | egrep -e 'Total DISK|Actual DISK' --line-buffered \
         | sed -u -e 's#[a-zA-Z:/ ]##g' -e 's/|/,/g' \
         | while read total ; do
@@ -173,22 +161,16 @@ function run_iotop()
         | csv-time-stamp 2>/dev/null
 }
 
-if (( $( comma_options_has --help "$@" ) || $( comma_options_has -h "$@" ) )) ; then usage ; exit ; fi
-if (( $( comma_options_has --output-fields "$@" ) )) ; then output_fields "$@" ; exit ; fi
-
-debug=0
-
-description | comma-options-validate "$@"
-comma_path_value_to_var --export < <( description | comma-options-to-name-value "$@" )
-
-if [[ -n "$io" ]] ; then
+comma-application-init "$@" < <( options-description ) || die "failed" # "$@" quoted so option values containing spaces stay single arguments
+maybe_output_fields
+if [[ -n "$options_io" ]] ; then
     [[ -n "$( sudo which iotop )" ]] || { echo "comma-top: make sure iotop installed" >&2 ; exit 1 ; }
     run_iotop
 else
     feeder_opts=""
-    [[ -n "$sampling_interval" ]] && feeder_opts="-d $sampling_interval"
-    [[ -n "$top_options" ]] && feeder_opts="$feeder_opts $top_options"
-    [[ -n "$num_samples" && -z "$num_procs" ]] && (( ++num_samples )) # first line will be ignored, leaving num_samples lines
-    if [[ -n "$num_procs" ]]; then parser="parser_num_procs"; else parser="parser_totals"; fi
-    feeder "$num_samples" "$feeder_opts" "$num_procs" | $parser | csv-time-stamp 2>/dev/null 
+    [[ -n "$options_sampling_interval" ]] && feeder_opts="-d $options_sampling_interval"
+    [[ -n "$options_top_options" ]] && feeder_opts="$feeder_opts $options_top_options"
+    [[ -n "$options_num_samples" && -z "$options_num_procs" ]] && (( ++options_num_samples )) # first line will be ignored, leaving options_num_samples lines
+    if [[ -n "$options_num_procs" ]]; then parser="parser_num_procs"; else parser="parser_totals"; fi
+    feeder "$options_num_samples" "$feeder_opts" "$options_num_procs" | $parser | csv-time-stamp 2>/dev/null
 fi
diff --git a/util/examples/comma-profile-graph-example b/util/examples/comma-profile-graph-example
new file mode 100755
index 000000000..fc47cc709
--- /dev/null
+++ b/util/examples/comma-profile-graph-example
@@ -0,0 +1,55 @@
+#!/bin/bash
+
+scriptname=$( basename $0 )
+
+source $( type -p comma-progress-util ) || { echo "$scriptname: cannot source 'comma-progress-util'" >&2; exit 1; }
+
+elapsed_csv=elapsed.csv
+profile_svg=profile.svg
+
+function usage()
+{
+    cat <<EOF
+
+usage: $scriptname <make|view>
+
+make - create profile data in $elapsed_csv
+view - visualise $elapsed_csv in $profile_svg
+
+EOF
+}
+
+function profile()
+{
+    local fn=$1
+    comma_progress_named $elapsed_csv $fn $fn
+}
+
+function func_a() { profile func_b; profile func_d; sleep 1.5; }
+function func_b() { for i in {0..2}; do profile func_c; done; sleep 0.1; }
+function func_c() { sleep 0.4; }
+function func_d() { sleep 0.2; }
+function func_e() { profile func_b; }
+function func_f() { profile func_d; }
+
+function make()
+{
+    [[ -f $elapsed_csv ]] && rm $elapsed_csv
+    profile func_a
+    profile func_e
+    profile func_f
+}
+
+function view()
+{
+    cat $elapsed_csv | comma-progress --elapsed | comma-profile-graph | dot -Tsvg > $profile_svg
+    eog $profile_svg
+}
+
+[[ $1 == "-h" || $1 == "--help" ]] && { usage; exit 0; } # asking for help is not an error
+
+case $1 in
+    make) make ;;
+    view) view ;;
+    *)    usage >&2; exit 1 ;; # missing or unknown command: report usage on stderr and fail
+esac
diff --git a/util/test/test_run/black_subdirs/test.2/expected b/util/test/test_run/black_subdirs/test.2/expected
index 6c0055604..936856dee 100644
--- a/util/test/test_run/black_subdirs/test.2/expected
+++ b/util/test/test_run/black_subdirs/test.2/expected
@@ -1,5 +1,5 @@
 #python
 
 expect len(expected) == 9
-expect locals().has_key('output') == False
-expect locals().has_key('stdout_log') == False
+expect ( 'output' in locals() ) == False
+expect ( 'stdout_log' in locals() ) == False
diff --git a/util/test/test_run/interactive/disabled b/util/test/test_run/interactive/disabled
index bdee1f276..2808ba79e 100644
--- a/util/test/test_run/interactive/disabled
+++ b/util/test/test_run/interactive/disabled
@@ -1 +1 @@
-this test must be run manually using --interactive mode
+this is an interactive test that is run manually as needed
diff --git a/util/test/test_run/interactive/expected b/util/test/test_run/interactive/expected
new file mode 100644
index 000000000..9c98c5705
--- /dev/null
+++ b/util/test/test_run/interactive/expected
@@ -0,0 +1,25 @@
+interactive/success/output/line[0]="input"
+interactive/success/output/line[1]="test"
+interactive/success/status=0
+
+interactive/failure/by_user/output/line[0]="input"
+interactive/failure/by_user/output/line[1]="test"
+interactive/failure/by_user/status=1
+
+interactive/failure/by_expected/output/line[0]="blah"
+interactive/failure/by_expected/output/line[1]="blah"
+interactive/failure/by_expected/status=0
+
+non_interactive/success[0]/output/line[0]="input"
+non_interactive/success[0]/output/line[1]="test"
+non_interactive/success[0]/status=0
+
+non_interactive/success[1]/output/line[0]="input"
+non_interactive/success[1]/output/line[1]="test"
+non_interactive/success[1]/status=0
+
+non_interactive/failure[0]/output=""
+non_interactive/failure[0]/status=2
+
+non_interactive/failure[1]/output=""
+non_interactive/failure[1]/status=2
diff --git a/util/test/test_run/interactive/input b/util/test/test_run/interactive/input
new file mode 100644
index 000000000..b5cf8d733
--- /dev/null
+++ b/util/test/test_run/interactive/input
@@ -0,0 +1,16 @@
+interactive/success/command="ls input test"
+interactive/success/instruction="will run ls on current directory, press YES for the test to succeed"
+interactive/success/expected="list of files in current directory"
+
+interactive/failure/by_user/command="ls input test"
+interactive/failure/by_user/instruction="will run ls on current directory, press NO for the test to fail"
+interactive/failure/by_user/expected="list of files in current directory"
+
+interactive/failure/by_expected/command="ls input test"
+interactive/failure/by_expected/instruction="will run ls on current directory, press YES, the test still should fail on actual/expected mismatch"
+interactive/failure/by_expected/expected="list of files in current directory"
+
+non_interactive/success[0]/command="ls input test"
+non_interactive/success[1]/command="ls input test"
+non_interactive/failure[0]/command="ls non-existent-file"
+non_interactive/failure[1]/command="ls non-existent-file"
diff --git a/util/test/test_run/interactive/test b/util/test/test_run/interactive/test
index 764e581bc..f70da7533 100755
--- a/util/test/test_run/interactive/test
+++ b/util/test/test_run/interactive/test
@@ -1,7 +1,7 @@
 #!/bin/bash
 
 source $(type -p comma-application-util)
-source $(type -p comma-process-util)
+source $(type -p comma-test-util)
+
+comma_test_interactive_commands
 
-zenity --question --text="Do you want the test to succeed?"
-comma_status_ok || exit 1
diff --git a/util/test/test_util/commands/assert/expected b/util/test/test_util/commands/assert/expected
new file mode 100644
index 000000000..444ca4026
--- /dev/null
+++ b/util/test/test_util/commands/assert/expected
@@ -0,0 +1,6 @@
+basics[0]/output=""
+basics[0]/status=2
+basics[1]/output=""
+basics[1]/status=2
+status=1
+output/lines/count=4
diff --git a/util/test/test_util/commands/assert/input b/util/test/test_util/commands/assert/input
new file mode 100644
index 000000000..71d7b29b0
--- /dev/null
+++ b/util/test/test_util/commands/assert/input
@@ -0,0 +1,4 @@
+basics[0]="ls ./non-existent-file"
+assert basics[1]="ls ./non-existent-file"
+basics[1]="ls"
+basics[2]="ls ./non-existent-file"
diff --git a/util/test/test_util/commands/assert/test b/util/test/test_util/commands/assert/test
new file mode 100755
index 000000000..1a4e681a8
--- /dev/null
+++ b/util/test/test_util/commands/assert/test
@@ -0,0 +1,10 @@
+#!/bin/bash
+
+source "$( type -p comma-application-util )" || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source "$( type -p comma-test-util )" || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+# capture stdout and exit status of comma_test_commands, then report both, plus the number of captured lines
+output=$( comma_test_commands )
+status=$?
+echo "$output"
+echo "status=$status"
+echo "output/lines/count=$( wc -l <<< "$output" )"
diff --git a/util/test/test_util/commands/quoting/expected b/util/test/test_util/commands/quoting/expected
new file mode 100644
index 000000000..905e619f1
--- /dev/null
+++ b/util/test/test_util/commands/quoting/expected
@@ -0,0 +1,23 @@
+basic/output/line[0]="input"
+basic/output/line[1]="test"
+basic/status=0
+quoted/single[0]/output/line[0]="input"
+quoted/single[0]/output/line[1]="test"
+quoted/single[0]/status=0
+quoted/single[1]/output/line[0]="input"
+quoted/single[1]/output/line[1]="test"
+quoted/single[1]/status=0
+quoted/single[2]/output/line[0]="input"
+quoted/single[2]/output/line[1]="test"
+quoted/single[2]/status=0
+quoted/single[3]/output/line[0]="input"
+quoted/single[3]/output/line[1]="test"
+quoted/single[3]/status=0
+quoted/double[0]/output/line[0]="input"
+quoted/double[0]/output/line[1]="test"
+quoted/double[0]/status=0
+quoted/double[1]/output/line[0]="input"
+quoted/double[1]/output/line[1]="test"
+quoted/double[1]/status=0
+trailing_spaces/output="input"
+trailing_spaces/status=0
diff --git a/util/test/test_util/commands/quoting/input b/util/test/test_util/commands/quoting/input
new file mode 100644
index 000000000..11ba21a3f
--- /dev/null
+++ b/util/test/test_util/commands/quoting/input
@@ -0,0 +1,9 @@
+basic="ls input test"
+quoted/single[0]="ls 'input' 'test'"
+quoted/single[1]=" ls 'input' 'test' "
+quoted/single[2]=    " ls 'input' 'test' "
+quoted/single[3] =    " ls 'input' 'test' "
+quoted/double[0]="ls \"input\" \"test\""
+quoted/double[1]=" ls \"input\" \"test\" "
+trailing_spaces="ls input"   
+# commented_test="exit 1" # todo: add checks to expected
\ No newline at end of file
diff --git a/util/test/test_util/commands/quoting/test b/util/test/test_util/commands/quoting/test
new file mode 100755
index 000000000..90d7cb1fc
--- /dev/null
+++ b/util/test/test_util/commands/quoting/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+# source the required comma utilities, bailing out on the first one that cannot be sourced, then run the commands
+for _util_name in comma-application-util comma-test-util ; do
+    source $( type -p $_util_name ) || { echo "$0: failed to source $_util_name" >&2 ; exit 1 ; }
+done ; unset _util_name
+comma_test_commands
diff --git a/util/test/test_util/interactive_commands/assert/expected b/util/test/test_util/interactive_commands/assert/expected
new file mode 100644
index 000000000..cac43217b
--- /dev/null
+++ b/util/test/test_util/interactive_commands/assert/expected
@@ -0,0 +1,6 @@
+basics[0]/output=""
+basics[0]/status=1
+basics[1]/output=""
+basics[1]/status=2
+status=5
+output/lines/count=4
diff --git a/util/test/test_util/interactive_commands/assert/input b/util/test/test_util/interactive_commands/assert/input
new file mode 100644
index 000000000..35ea63842
--- /dev/null
+++ b/util/test/test_util/interactive_commands/assert/input
@@ -0,0 +1,6 @@
+basics[0]/command="ls ./non-existent-file"
+basics[0]/instruction="this test command will FAIL safely, press YES for the user test to pass"
+assert basics[0]/expected="'ls: cannot access 'non-existent': No such file or directory'"
+assert basics[1]/command="ls ./non-existent-file"
+basics[2]/command="ls"
+basics[3]/command="ls ./non-existent-file"
diff --git a/util/test/test_util/interactive_commands/assert/optional b/util/test/test_util/interactive_commands/assert/optional
new file mode 100644
index 000000000..2808ba79e
--- /dev/null
+++ b/util/test/test_util/interactive_commands/assert/optional
@@ -0,0 +1 @@
+this is an interactive test that is run manually as needed
diff --git a/util/test/test_util/interactive_commands/assert/test b/util/test/test_util/interactive_commands/assert/test
new file mode 100755
index 000000000..78a402201
--- /dev/null
+++ b/util/test/test_util/interactive_commands/assert/test
@@ -0,0 +1,10 @@
+#!/bin/bash
+
+source "$( type -p comma-application-util )" || { echo "$0: failed to source comma-application-util" >&2 ; exit 1 ; }
+source "$( type -p comma-test-util )" || { echo "$0: failed to source comma-test-util" >&2 ; exit 1 ; }
+# capture stdout and exit status of comma_test_interactive_commands, then report both, plus the number of captured lines
+output=$( comma_test_interactive_commands )
+status=$?
+echo "$output"
+echo "status=$status"
+echo "output/lines/count=$( wc -l <<< "$output" )"
diff --git a/util/test/test_util/interactive_commands/command/expected b/util/test/test_util/interactive_commands/command/expected
new file mode 100644
index 000000000..7407a7975
--- /dev/null
+++ b/util/test/test_util/interactive_commands/command/expected
@@ -0,0 +1,26 @@
+basic/output/line[0]="input"
+basic/output/line[1]="test"
+basic/status=0
+quoted/single[0]/output/line[0]="input"
+quoted/single[0]/output/line[1]="test"
+quoted/single[0]/status=0
+quoted/single[1]/output/line[0]="input"
+quoted/single[1]/output/line[1]="test"
+quoted/single[1]/status=0
+quoted/single[2]/output/line[0]="input"
+quoted/single[2]/output/line[1]="test"
+quoted/single[2]/status=0
+quoted/single[3]/output/line[0]="input"
+quoted/single[3]/output/line[1]="test"
+quoted/single[3]/status=0
+quoted/single[4]/output/line[0]="input"
+quoted/single[4]/output/line[1]="test"
+quoted/single[4]/status=0
+quoted/double[0]/output/line[0]="input"
+quoted/double[0]/output/line[1]="test"
+quoted/double[0]/status=0
+quoted/double[1]/output/line[0]="input"
+quoted/double[1]/output/line[1]="test"
+quoted/double[1]/status=0
+trailing_spaces/output="input"
+trailing_spaces/status=0
diff --git a/util/test/test_util/interactive_commands/command/input b/util/test/test_util/interactive_commands/command/input
new file mode 100644
index 000000000..f4e02c174
--- /dev/null
+++ b/util/test/test_util/interactive_commands/command/input
@@ -0,0 +1,10 @@
+basic/command="ls input test"
+quoted/single[0]/command="ls 'input' 'test'"
+quoted/single[1]/command=" ls 'input' 'test' "
+quoted/single[2]/command= " ls 'input' 'test' "
+quoted/single[3]/command =" ls 'input' 'test' "
+quoted/single[4]/command = " ls 'input' 'test' "
+quoted/double[0]/command="ls \"input\" \"test\""
+quoted/double[1]/command=" ls \"input\" \"test\" "
+trailing_spaces/command="ls input"
+# commented_test/command="exit 1"  # todo: add checks to expected
diff --git a/util/test/test_util/interactive_commands/command/test b/util/test/test_util/interactive_commands/command/test
new file mode 100755
index 000000000..8b1bfde81
--- /dev/null
+++ b/util/test/test_util/interactive_commands/command/test
@@ -0,0 +1,6 @@
+#!/bin/bash
+# source the required comma utilities, bailing out on the first one that cannot be sourced, then run the commands
+for _util_name in comma-application-util comma-test-util ; do
+    source $( type -p $_util_name ) || { echo "$0: failed to source $_util_name" >&2 ; exit 1 ; }
+done ; unset _util_name
+comma_test_interactive_commands
diff --git a/visiting/CMakeLists.txt b/visiting/CMakeLists.txt
index bb08d565b..32339a5ba 100644
--- a/visiting/CMakeLists.txt
+++ b/visiting/CMakeLists.txt
@@ -7,7 +7,6 @@ SOURCE_GROUP( ${TARGET_NAME} FILES ${source} ${includes} )
 ADD_CUSTOM_TARGET( ${TARGET_NAME} ${source} ${includes} )
 
 INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT} )
-INSTALL( FILES ${includes} DESTINATION ${comma_INSTALL_INCLUDE_DIR}/${PROJECT}/Visitors )
                                            
 IF( comma_BUILD_TESTS )
     ADD_SUBDIRECTORY( test )
diff --git a/visiting/test/CMakeLists.txt b/visiting/test/CMakeLists.txt
index 8483176a1..398724ecd 100644
--- a/visiting/test/CMakeLists.txt
+++ b/visiting/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET(KIT visiting)
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_base ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# gtest executable for the visiting kit, built from the sources matching ${SOURCE_CODE_BASE_DIR}/visiting/test/*test.cpp
+set( KIT visiting )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} ${comma_ALL_EXTERNAL_LIBRARIES} ${GTEST_BOTH_LIBRARIES} pthread ) # comma_name_value comma_xpath
+# COMMAND names the executable target, so cmake substitutes the location of the built binary
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+if( INSTALL_TESTS )
+    # install the built target itself rather than a hard-coded path under ${PROJECT_BINARY_DIR}/bin;
+    # this supersedes the former install( FILES ... PERMISSIONS ... ) rule for the same binary
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()
diff --git a/visiting/test/visiting_test.cpp b/visiting/test/visiting_test.cpp
index 02aa44ed7..97e66537b 100644
--- a/visiting/test/visiting_test.cpp
+++ b/visiting/test/visiting_test.cpp
@@ -1,32 +1,5 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 #include <gtest/gtest.h>
 #include <sstream>
@@ -37,7 +10,9 @@
 #include <vector>
 #include <boost/array.hpp>
 #include <boost/noncopyable.hpp>
+#include "../../base/optional.h"
 #include "../../base/types.h"
+//#include "../../name_value/serialize.h"
 #include "../apply.h"
 #include "../visit.h"
 
@@ -75,6 +50,7 @@ class o_stream_visitor : public boost::noncopyable
     private:
         std::ostream& m_stream;
         bool empty( const char* name ) { return *name == 0; }
+        bool empty( const std::string& name ) { return name.empty(); }
         bool empty( std::size_t ) { return false; }
 };
 
@@ -110,13 +86,18 @@ struct old_plain
     nested world;
 };
 
+struct optionals // fixture with two comma::optional members, used by TEST( visiting, optional )
+{
+    comma::optional< int > a; // optional holding a fundamental type
+    comma::optional< std::pair< int, int > > b; // optional holding a pair, which is visited as a nested object
+};
+
 } } } // namespace comma { namespace visiting { namespace test {
 
 namespace comma { namespace visiting {
 
 /// traits specialization for old_plain
-template <>
-struct traits< test::old_plain >
+template <> struct traits< test::old_plain >
 {
     template < typename Key, typename visitor >
     static void visit( const Key&, const test::old_plain& p, visitor& v )
@@ -128,8 +109,7 @@ struct traits< test::old_plain >
 };
 
 /// traits specialization for old_plain::nested
-template <>
-struct traits< test::old_plain::nested >
+template <> struct traits< test::old_plain::nested >
 {
     template < typename Key, typename visitor >
     static void visit( const Key&, const test::old_plain::nested& p, visitor& v )
@@ -140,6 +120,16 @@ struct traits< test::old_plain::nested >
     }
 };
 
+/// traits specialization for optionals: hands both members to the visitor by name (const access only)
+template <> struct traits< test::optionals >
+{
+    template < typename Key, typename visitor > static void visit( const Key&, const test::optionals& o, visitor& v )
+    {
+        v.apply( "a", o.a );
+        v.apply( "b", o.b );
+    }
+};
+
 } } // namespace comma { namespace visiting {
 
 namespace comma { namespace visiting { namespace test {
@@ -225,6 +215,94 @@ TEST( visiting, container )
     }
 }
 
+TEST( visiting, tuple )
+{
+    std::tuple< int, double, std::string > values{ 5, 10, "hello" };
+    std::ostringstream stream;
+    o_stream_visitor visitor( stream );
+    visiting::apply( visitor, values );
+    EXPECT_EQ( stream.str(), "{ int:0=5 double:1=10 string:2=\"hello\" }" ); // tuple elements are keyed by their numeric index
+}
+
+TEST( visiting, optional )
+{
+    // value fields are assigned by hand (quick and dirty), presumably so that unset optionals print a known value
+    auto zero_values = []( test::optionals& o ) { o.a.value = 0; o.b.value = { 0, 0 }; };
+    auto printed = []( test::optionals& o ) -> std::string // text produced by o_stream_visitor for the given object
+    {
+        std::ostringstream oss;
+        o_stream_visitor v( oss );
+        visiting::apply( v, o );
+        return oss.str();
+    };
+    // neither optional is set
+    {
+        test::optionals o;
+        zero_values( o );
+        EXPECT_EQ( printed( o ), "{ object:a={ int:value=0 bool:is_set=false } object:b={ object:value={ int:first=0 int:second=0 } bool:is_set=false } }" );
+    }
+    // only a is set
+    {
+        test::optionals o;
+        zero_values( o );
+        o.a = 5;
+        EXPECT_EQ( printed( o ), "{ object:a={ int:value=5 bool:is_set=true } object:b={ object:value={ int:first=0 int:second=0 } bool:is_set=false } }" );
+    }
+    // only b is set
+    {
+        test::optionals o;
+        zero_values( o );
+        o.b = std::make_pair( 3, 4 );
+        EXPECT_EQ( printed( o ), "{ object:a={ int:value=0 bool:is_set=false } object:b={ object:value={ int:first=3 int:second=4 } bool:is_set=true } }" );
+    }
+}
+
+struct some_struct // fixture for TEST( visiting, named_variant ): a struct with a single named_variant member
+{
+    struct naming { static std::array< std::string, 3 > names() { return { "a", "b", "c" }; } }; // one name per variant type, in the same order
+    typedef comma::named_variant< naming, int, std::pair< std::string, float >, double > named_variant_t;
+    named_variant_t variant;
+};
+
+} } } /// namespace comma { namespace visiting { namespace test {
+
+namespace comma { namespace visiting {
+
+template <> struct traits< test::some_struct > // visiting traits for the fixture: the only member is visited under the name "variant"
+{
+    template < typename Key, typename visitor > static void visit( const Key&,       test::some_struct& p, visitor& v ) { v.apply( "variant", p.variant ); } // mutable access
+    template < typename Key, typename visitor > static void visit( const Key&, const test::some_struct& p, visitor& v ) { v.apply( "variant", p.variant ); } // read-only access
+};
+
+} } // namespace comma { namespace visiting {
+
+namespace comma { namespace visiting { namespace test {
+
+TEST( visiting, named_variant )
+{
+    { // default-constructed variant: the expected output below shows an empty object, i.e. no alternative gets visited
+        test::some_struct t;
+        std::ostringstream oss;
+        o_stream_visitor v( oss );
+        visiting::apply( v, t );
+        EXPECT_EQ( oss.str(), "{ object:variant={ } }" );
+    }
+    { // disabled draft of a case with one alternative set; kept commented out until serialization is covered (see todo below)
+        // test::some_struct t;
+        // t.variant.set( std::pair< std::string, float >( "hello", 5 ) );
+        // std::ostringstream oss;
+        // o_stream_visitor v( oss );
+        // visiting::apply( v, t );
+        // //EXPECT_EQ( oss.str(), "{ object:variant={ } }" );
+        // std::cerr << "=============" << std::endl;
+        // std::cerr << oss.str() << std::endl;
+        // std::cerr << "=============" << std::endl;
+        // write_json( t, std::cerr );
+        // std::cerr << "=============" << std::endl;
+    }
+    // todo! test serialization and deserialization! make test dependent on name_value?
+}
+
 } } } /// namespace comma { namespace visiting { namespace test {
 
 int main( int argc, char* argv[] )
diff --git a/visiting/traits.h b/visiting/traits.h
index 20a8c5146..2d96b5b35 100644
--- a/visiting/traits.h
+++ b/visiting/traits.h
@@ -1,47 +1,27 @@
-// This file is part of comma, a generic and flexible library
 // Copyright (c) 2011 The University of Sydney
-// All rights reserved.
-//
-// Redistribution and use in source and binary forms, with or without
-// modification, are permitted provided that the following conditions are met:
-// 1. Redistributions of source code must retain the above copyright
-//    notice, this list of conditions and the following disclaimer.
-// 2. Redistributions in binary form must reproduce the above copyright
-//    notice, this list of conditions and the following disclaimer in the
-//    documentation and/or other materials provided with the distribution.
-// 3. Neither the name of the University of Sydney nor the
-//    names of its contributors may be used to endorse or promote products
-//    derived from this software without specific prior written permission.
-//
-// NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE
-// GRANTED BY THIS LICENSE.  THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT
-// HOLDERS AND CONTRIBUTORS \"AS IS\" AND ANY EXPRESS OR IMPLIED
-// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
-// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
-// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
-// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
-// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
-// BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
-// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
-// OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
-// IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-
+// Copyright (c) 2022 Vsevolod Vlaskine
 
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_VISITING_TRAITS_HEADER_GUARD_
-#define COMMA_VISITING_TRAITS_HEADER_GUARD_
+#pragma once
 
 #ifndef WIN32
 #include <stdlib.h>
 #endif
 #include <array>
+#include <complex>
 #include <map>
 #include <set>
 #include <string>
+#include <tuple>
+#include <unordered_map>
+#include <unordered_set>
 #include <vector>
 #include <boost/array.hpp>
+#include "../base/exception.h"
+#include "../base/none.h"
+#include "../base/optional.h"
+#include "../base/variant.h"
 
 namespace comma { namespace visiting {
 
@@ -50,22 +30,25 @@ namespace comma { namespace visiting {
 template < typename T >
 struct traits
 {
-    /// visit arbitrary type
     template < typename K, typename V > static void visit( const K& key, T& t, V& v );
+    template < typename K, typename V > static void visit( const K& key, const T& t, V& v );
+};
+
+template <> struct traits< comma::none > // comma::none has nothing to visit: both overloads are no-ops
+{
+    template < typename K, typename V > static void visit( const K&, comma::none&, V& ) {}
+    template < typename K, typename V > static void visit( const K&, const comma::none&, V& ) {}
 };
 
-/// std::pair visiting traits; todo: better semantics?
 template < typename T, typename S >
 struct traits< std::pair< T, S > >
 {
-    /// visit
     template < typename K, typename V > static void visit( const K& key, std::pair< T, S >& t, V& v )
     {
         v.apply( "first", t.first );
         v.apply( "second", t.second );
     }
     
-    /// visit const
     template < typename K, typename V > static void visit( const K&, const std::pair< T, S >& t, V& v )
     {
         v.apply( "first", t.first );
@@ -73,26 +56,255 @@ struct traits< std::pair< T, S > >
     }    
 };
 
-namespace Impl {
+template < typename T >
+struct traits< comma::optional< T > >
+{
+    // both overloads hand the same two fields to the visitor: the stored value and the flag telling whether it is set
+    template < typename K, typename V > static void visit( const K&, comma::optional< T >& t, V& v ) { _visit( t, v ); }
+    template < typename K, typename V > static void visit( const K&, const comma::optional< T >& t, V& v ) { _visit( t, v ); }
+
+    private:
+        // O is either comma::optional< T > or const comma::optional< T >, so constness is carried through to the visitor
+        template < typename O, typename V > static void _visit( O& o, V& v )
+        {
+            v.apply( "value", o.value );
+            v.apply( "is_set", o.is_set );
+        }
+};
+
+template < typename... Args >
+struct traits< comma::variant< Args... > > // todo? should it be in the visitors instead? todo!
+{
+    typedef comma::variant< Args... > variant_t;
+
+    template < typename... > struct _variant_traits // end of recursion: no variant types left to try
+    {
+        template < typename K, typename V > static void visit( const K&, variant_t&, V&, bool ) {}
+        template < typename K, typename V > static void visit( const K&, const variant_t&, V& ) {}
+    };
+
+    template < typename S, typename... Rest > struct _variant_traits< S, Rest... > // todo; tries S, then recurses into Rest
+    {
+        template < typename K, typename V > static void visit( const K& key, variant_t& t, V& v, bool is_set )
+        {
+            boost::optional< S > s = t.template optional< S >();
+            traits< boost::optional< S > >::visit( key, s, v ); // NOTE(review): relies on traits< boost::optional< S > > being defined elsewhere - confirm
+            COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+            if( s ) { t.set( s ); }
+            _variant_traits< Rest... >::visit( key, t, v, is_set || bool( s ) ); // carry over any earlier hit, not only the latest one
+        }
+        template < typename K, typename V > static void visit( const K& key, const variant_t& t, V& v )
+        {
+            const boost::optional< S >& s = t.template optional< S >();
+            if( s ) { traits< S >::visit( key, *s, v ); } else { _variant_traits< Rest... >::visit( key, t, v ); }
+        }
+    };
+
+    // entry points: start from the first variant type, with no type seen as set so far
+    template < typename K, typename V > static void visit( const K& key, variant_t& t, V& v ) { _variant_traits< Args... >::visit( key, t, v, false ); }
+    template < typename K, typename V > static void visit( const K& key, const variant_t& t, V& v ) { _variant_traits< Args... >::visit( key, t, v ); }
+};
+
+template < typename T >
+struct traits< comma::variant< T > >
+{
+    typedef comma::variant< T > variant_t;
+    // helper members are static and named visit, so that the calls from the entry points below resolve
+    template < typename S > struct _variant_traits // todo
+    {
+        template < typename K, typename V > static void visit( const K& key, variant_t& t, V& v, bool is_set )
+        {
+            boost::optional< S > s = t.template optional< S >();
+            traits< boost::optional< S > >::visit( key, s, v ); // NOTE(review): relies on traits< boost::optional< S > > being defined elsewhere - confirm
+            COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+            if( s ) { t.set( s ); }
+        }
+        template < typename K, typename V > static void visit( const K& key, const variant_t& t, V& v )
+        {
+            const boost::optional< S >& s = t.template optional< S >();
+            if( s ) { traits< S >::visit( key, *s, v ); }
+        }
+    };
+
+    template < typename K, typename V > static void visit( const K& key, variant_t& t, V& v )
+    {
+        _variant_traits< T >::visit( key, t, v, false );
+    }
+
+    template < typename K, typename V > static void visit( const K& key, const variant_t& t, V& v )
+    {
+        _variant_traits< T >::visit( key, t, v );
+    }
+};
+
+template < typename Names, typename... NArgs >
+struct traits< comma::named_variant< Names, NArgs... > > // todo? should it be in the visitors instead?
+{
+    typedef comma::named_variant< Names, NArgs... > named_variant_t;
+    typedef comma::variant< NArgs... > variant_t;
+    // S: variant type being tried; Args: types still to try; i: index of S, used to look up its name
+    template < typename S, typename... Args > struct _variant_traits
+    {
+        template < typename V > static void visit( variant_t& t, V& v, unsigned int i, bool is_set )
+        {
+            boost::optional< S > s = t.template optional< S >();
+            v.apply( named_variant_t::names()[i], s );
+            COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+            if( s ) { t.set( s ); }
+            _variant_traits< Args... >::visit( t, v, i + 1, is_set || bool( s ) ); // carry over any earlier hit, so that non-adjacent duplicates are caught, too
+        }
+        template < typename V > static void visit( const variant_t& t, V& v, unsigned int i )
+        {
+            const boost::optional< S >& s = t.template optional< S >();
+            if( s ) { v.apply( named_variant_t::names()[i], *s ); } else { _variant_traits< Args... >::visit( t, v, i + 1 ); }
+        }
+    };
+    // last variant type: same as above, but with nothing left to recurse into
+    template < typename S > struct _variant_traits< S >
+    {
+        template < typename V > static void visit( variant_t& t, V& v, unsigned int i, bool is_set )
+        {
+            boost::optional< S > s = t.template optional< S >();
+            v.apply( named_variant_t::names()[i], s );
+            COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+            if( s ) { t.set( s ); }
+        }
+        template < typename V > static void visit( const variant_t& t, V& v, unsigned int i )
+        {
+            const boost::optional< S >& s = t.template optional< S >();
+            if( s ) { v.apply( named_variant_t::names()[i], *s ); }
+        }
+    };
+    // mutable visiting: every type is offered to the visitor under its name; at most one may end up set
+    template < typename K, typename V > static void visit( const K&, named_variant_t& t, V& v )
+    {
+        _variant_traits< NArgs... >::visit( static_cast< variant_t& >( t ), v, 0, false );
+    }
+    // const visiting: only the first type found set (if any) is passed to the visitor
+    template < typename K, typename V > static void visit( const K&, const named_variant_t& t, V& v )
+    {
+        _variant_traits< NArgs... >::visit( static_cast< const variant_t& >( t ), v, 0 );
+    }
+};
+
+// template < typename Names, typename T >
+// struct traits< comma::named_variant< T > >
+// {
+//     typedef typename comma::variant< T >::variant_t variant_t;
+
+//     template < typename S > struct _variant_traits // todo
+//     {
+//         template < typename K, typename V > void _visit( const K& key, variant_t& t, V& v, bool is_set, unsigned int i )
+//         {
+//             boost::optional< S > s = t.template optional< S >();
+//             v.apply( variant_t::names()[i], s );
+//             COMMA_ASSERT( !s || !is_set, "variant: ambiguous: expected not more than one variant type set; got at least two variant types set" );
+//             if( s ) { t.set( s ); }
+//         }
+//         template < typename K, typename V > void _visit( const K& key, const variant_t& t, V& v, unsigned int i )
+//         {
+//             const boost::optional< S >& s = t.template optional< S >();
+//             if( s ) { v.apply( variant_t::names()[i], *s ); }
+//         }
+//     };
+
+//     template < typename K, typename V > static void visit( const K& key, variant_t& t, V& v )
+//     {
+//         _variant_traits< T >::visit( key, t, v, false );
+//     }
+    
+//     template < typename K, typename V > static void visit( const K& key, const variant_t& t, V& v )
+//     {
+//         _variant_traits< T >::visit( key, t, v );
+//     }
+// };
+
+template < typename T >
+struct traits< std::complex< T > >
+{
+    // real() and imag() return copies, hence each part is copied out, visited, and written back through the setter
+    template < typename K, typename V > static void visit( const K&, std::complex< T >& t, V& v )
+    {
+        T real = t.real();
+        v.apply( "real", real );
+        t.real( real );
+        T imag = t.imag();
+        v.apply( "imag", imag );
+        t.imag( imag );
+    }
+    template < typename K, typename V > static void visit( const K&, const std::complex< T >& t, V& v )
+    {
+        v.apply( "real", t.real() );
+        v.apply( "imag", t.imag() );
+    }
+};
+
+namespace detail {
+
+// template < unsigned int I > const char* element_name(); // super-quick and dirty for now, it would be better to use numeric indices, but then all visitors need to support tuple correctly
+// template <> inline const char* element_name< 0 >() { return "first"; }
+// template <> inline const char* element_name< 1 >() { return "second"; }
+// template <> inline const char* element_name< 2 >() { return "third"; }
+// template <> inline const char* element_name< 3 >() { return "fourth"; }
+// template <> inline const char* element_name< 4 >() { return "fifth"; }
+// template <> inline const char* element_name< 5 >() { return "sixth"; }
+// template <> inline const char* element_name< 6 >() { return "seventh"; }
+// template <> inline const char* element_name< 7 >() { return "eighth"; }
+
+// template < unsigned int I, unsigned int Size > struct elementwise
+// {
+//     template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( element_name< Size - I >(), std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+//     template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( element_name< Size - I >(), std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+// };
+
+// template < unsigned int Size > struct elementwise< 1, Size >
+// {
+//     template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( element_name< Size - 1 >(), std::get< Size - 1 >( t ) ); }
+//     template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( element_name< Size - 1 >(), std::get< Size - 1 >( t ) ); }
+// };
+
+template < unsigned int I, unsigned int Size > struct elementwise // todo! add tuple support to all visitors
+{ // I counts down from Size to 1; each step visits element Size - I under that numeric key, so elements go in ascending order
+    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( Size - I, std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( Size - I, std::get< Size - I >( t ) ); elementwise< I - 1, Size >::visit( t, v ); }
+};
+
+template < unsigned int Size > struct elementwise< 1, Size >
+{ // last step (I == 1): visits element Size - 1 and ends the recursion
+    template < typename T, typename V > static void visit( T& t, V& v ) { v.apply( Size - 1, std::get< Size - 1 >( t ) ); }
+    template < typename T, typename V > static void visit( const T& t, V& v ) { v.apply( Size - 1, std::get< Size - 1 >( t ) ); }
+};
+
+} // namespace detail {
+
+template < typename... T >
+struct traits< std::tuple< T... > >
+{
+    typedef std::tuple< T... > tuple_t;
+
+    static const unsigned int size{ std::tuple_size< tuple_t >::value };
+    // detail::elementwise ends its recursion at the last element only, so an empty tuple cannot be visited
+    static_assert( size > 0, "visiting traits for std::tuple: empty tuple is not supported" ); // explicit message: message-less form is c++17 only
+
+    template < typename K, typename V > static void visit( const K& key, tuple_t& t, V& v ) { detail::elementwise< size, size >::visit( t, v ); }
+    // elements are visited in order, each under its numeric index
+    template < typename K, typename V > static void visit( const K&, const tuple_t& t, V& v ) { detail::elementwise< size, size >::visit( t, v ); }
+};
+
+namespace impl {
 
 template < typename K, typename V, typename Visitor >
 inline void visit_non_associative_container( const K&, const V& c, Visitor& v )
 {
     std::size_t index = 0;
-    for( typename V::const_iterator it = c.begin(); it != c.end(); ++it, ++index )
-    {
-        v.apply( index, *it );
-    }
+    for( typename V::const_iterator it = c.begin(); it != c.end(); ++it, ++index ) { v.apply( index, *it ); }
 }
 
 template < typename K, typename V, typename Visitor >
 inline void visit_non_associative_container( const K&, V& c, Visitor& v )
 {
     std::size_t index = 0;
-    for( typename V::iterator it = c.begin(); it != c.end(); ++it, ++index )
-    {
-        v.apply( index, *it );
-    }
+    for( typename V::iterator it = c.begin(); it != c.end(); ++it, ++index ) { v.apply( index, *it ); }
 }
 
 template < typename T, typename Visitor >
@@ -110,110 +322,59 @@ inline void visit_associative_container_key( const K& k, const T& t, Visitor& v
 template < typename K, typename M, typename Visitor >
 inline void visit_associative_container( const K&, M& c, Visitor& v )
 {
-    for( typename M::iterator it = c.begin(); it != c.end(); ++it )
-    {
-        visit_associative_container_key( it->first, it->second, v );
-    }
+    for( typename M::iterator it = c.begin(); it != c.end(); ++it ) { visit_associative_container_key( it->first, it->second, v ); } // every entry is handed over as a (key, value) pair
 }
 
 template < typename K, typename M, typename Visitor >
 inline void visit_associative_container( const K&, const M& c, Visitor& v )
 {
-    for( typename M::const_iterator it = c.begin(); it != c.end(); ++it )
-    {
-        visit_associative_container_key( it->first, it->second, v );
-    }
+    for( typename M::const_iterator it = c.begin(); it != c.end(); ++it ) { visit_associative_container_key( it->first, it->second, v ); } // every entry is handed over as a (key, value) pair
 }
 
-} // namespace Impl {
+} // namespace impl {
 
-/// vector visiting traits
-template < typename T, typename A >
-struct traits< std::vector< T, A > >
+template < typename T, typename A > struct traits< std::vector< T, A > > // std::vector with any allocator: elements are visited by index
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, std::vector< T, A >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
-    
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const std::vector< T, A >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }    
+    template < typename K, typename V > static void visit( const K& key, std::vector< T, A >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::vector< T, A >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }    
 };
 
-/// set visiting traits
-template < typename T >
-struct traits< std::set< T > >
+template < typename T > struct traits< std::set< T > > // std::set with the default comparator and allocator only: elements are visited by index in iteration order
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, std::set< T >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
-    
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const std::set< T >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }    
+    template < typename K, typename V > static void visit( const K& key, std::set< T >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::set< T >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }    
 };
 
-/// std array visiting traits
-template < typename T, std::size_t S >
-struct traits< std::array< T, S > >
+template < typename T > struct traits< std::unordered_set< T > > // matches only the default hash, equality and allocator; elements are visited by index in iteration order
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, std::array< T, S >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
+    template < typename K, typename V > static void visit( const K& key, std::unordered_set< T >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::unordered_set< T >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }    
+};
 
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const std::array< T, S >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
+template < typename T, std::size_t S > struct traits< std::array< T, S > > // std::array: elements are visited by index
+{
+    template < typename K, typename V > static void visit( const K& key, std::array< T, S >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::array< T, S >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
 };
 
-/// boost array visiting traits
-template < typename T, std::size_t S >
-struct traits< boost::array< T, S > >
+template < typename T, std::size_t S > struct traits< boost::array< T, S > > // boost::array: elements are visited by index
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, boost::array< T, S >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }
-    
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const boost::array< T, S >& t, V& v )
-    {
-        Impl::visit_non_associative_container( key, t, v );
-    }    
+    template < typename K, typename V > static void visit( const K& key, boost::array< T, S >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const boost::array< T, S >& t, V& v ) { impl::visit_non_associative_container( key, t, v ); }    
 };
 
-/// map visiting traits
-template < typename T, typename S >
-struct traits< std::map< T, S > >
+template < typename T, typename S > struct traits< std::map< T, S > > // std::map with the default comparator and allocator only: entries are visited as (key, value) pairs
 {
-    /// visit
-    template < typename K, typename V > static void visit( const K& key, std::map< T, S >& t, V& v )
-    {
-        Impl::visit_associative_container( key, t, v );
-    }
-    
-    /// visit const
-    template < typename K, typename V > static void visit( const K& key, const std::map< T, S >& t, V& v )
-    {
-        Impl::visit_associative_container( key, t, v );
-    }    
+    template < typename K, typename V > static void visit( const K& key, std::map< T, S >& t, V& v ) { impl::visit_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::map< T, S >& t, V& v ) { impl::visit_associative_container( key, t, v ); }    
+};
+
+template < typename T, typename S > struct traits< std::unordered_map< T, S > > // matches only the default hash, equality and allocator; entries are visited as (key, value) pairs
+{
+    template < typename K, typename V > static void visit( const K& key, std::unordered_map< T, S >& t, V& v ) { impl::visit_associative_container( key, t, v ); }
+    template < typename K, typename V > static void visit( const K& key, const std::unordered_map< T, S >& t, V& v ) { impl::visit_associative_container( key, t, v ); }    
 };
 
 /// @todo add more types as needed
 
 } } // namespace comma { namespace visiting {
-
-#endif // COMMA_VISITING_TRAITS_HEADER_GUARD_
diff --git a/visiting/visit.h b/visiting/visit.h
index 09d23246b..f799b3ccf 100644
--- a/visiting/visit.h
+++ b/visiting/visit.h
@@ -27,24 +27,18 @@
 // OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN
 // IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
-
 /// @author vsevolod vlaskine
 
-#ifndef COMMA_VISITING_VISIT_HEADER_GUARD_
-#define COMMA_VISITING_VISIT_HEADER_GUARD_
+#pragma once
 
 #include "traits.h"
 
 namespace comma { namespace visiting {
     
-/// visit
 template < typename K, typename T, typename V >
 inline void visit( const K& key, T& t, V& v ) { traits< T >::visit( key, t, v ); }
 
-/// visit const
 template < typename K, typename T, typename V >
 inline void visit( const K& key, const T& t, V& v ) { traits< T >::visit( key, t, v ); }
     
 } } // namespace comma { namespace visiting {
-
-#endif // COMMA_VISITING_VISIT_HEADER_GUARD_
diff --git a/xml/applications/xml-split.cpp b/xml/applications/xml-split.cpp
index 0f5fbd4fb..1d215c7ce 100644
--- a/xml/applications/xml-split.cpp
+++ b/xml/applications/xml-split.cpp
@@ -40,14 +40,11 @@
 
 #include <expat.h>
 
-#include <boost/filesystem.hpp>
-
 #include "../../application/command_line_options.h"
+#include "../../io/impl/filesystem.h"
 #include "../../xpath/xpath.h"
 #include "expat_util.h"
 
-namespace FS = boost::filesystem;
-
 #define CMDNAME "xml-split"
 
 static unsigned TOTAL_MAX = std::numeric_limits<unsigned>::max() - 1;
@@ -190,14 +187,14 @@ output_wrapper::start()
     
     if (0 == _total_count)
     {
-        if (FS::exists(oss.str()))
+        if (comma::filesystem::exists(oss.str()))
         {
             std::cerr << CMDNAME ": Error: Output Directory Name '" << oss.str() << "' Already Exists on Filesystem. Abort!" << std::endl;
             exit(1);
         }
         else
         {
-            if (! FS::create_directory(oss.str()))
+            if (! comma::filesystem::create_directory(oss.str()))
             {
                 std::cerr << CMDNAME ": Error: Could not Create Output Directory '" << oss.str() << "'. Abort!" << std::endl;
                 return _destination;
diff --git a/xpath/test/CMakeLists.txt b/xpath/test/CMakeLists.txt
index 10216ab48..d94d2e0d0 100644
--- a/xpath/test/CMakeLists.txt
+++ b/xpath/test/CMakeLists.txt
@@ -1,16 +1,13 @@
-SET(KIT xpath)
-
-FILE( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
-
-ADD_EXECUTABLE( ${CMAKE_PROJECT_NAME}_test_${KIT} ${source} )
-
-TARGET_LINK_LIBRARIES( ${CMAKE_PROJECT_NAME}_test_${KIT} comma_xpath comma_string ${GTEST_BOTH_LIBRARIES} pthread )
-
-IF( INSTALL_TESTS )
-INSTALL ( 
-    FILES ${PROJECT_BINARY_DIR}/bin/${CMAKE_PROJECT_NAME}_test_${KIT}
-    PERMISSIONS WORLD_READ GROUP_READ OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_EXECUTE WORLD_EXECUTE
-    DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} )
-ENDIF( INSTALL_TESTS )
-
-add_test( NAME ${CMAKE_PROJECT_NAME}_test_${KIT} COMMAND ${CMAKE_PROJECT_NAME}_test_${KIT} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# gtest-based unit tests for the xpath kit; sources are every *test.cpp found in the kit's test directory
+set( KIT xpath )
+set( test_name ${CMAKE_PROJECT_NAME}_test_${KIT} )
+file( GLOB source ${SOURCE_CODE_BASE_DIR}/${KIT}/test/*test.cpp )
+add_executable( ${test_name} ${source} )
+target_link_libraries( ${test_name} comma_base comma_xpath ${GTEST_BOTH_LIBRARIES} pthread )
+# COMMAND names the executable target, so cmake substitutes the location of the built binary
+add_test( NAME ${test_name} COMMAND ${test_name} WORKING_DIRECTORY ${PROJECT_BINARY_DIR}/bin )
+# the test binary is installed only when INSTALL_TESTS is set
+if( INSTALL_TESTS )
+    # install( TARGETS ) follows the target's actual output location instead of a hard-coded bin path
+    install( TARGETS ${test_name} RUNTIME DESTINATION ${comma_CPP_TESTS_INSTALL_DIR} COMPONENT Runtime )
+endif()