lumiera_/src/lib/stat/data.hpp

/*
  DATA.hpp  -  read and write a table with CSV data

   Copyright (C)
     2022,            Hermann Vosseler <Ichthyostega@web.de>

  **Lumiera** is free software; you can redistribute it and/or modify it
  under the terms of the GNU General Public License as published by the
  Free Software Foundation; either version 2 of the License, or (at your
  option) any later version. See the file COPYING for further details.

*/


/** @file data.hpp
 ** Manage a table with data records, stored persistently as CSV.
 ** In the context of observations, configuration, calibration and QA, a series
 ** of measurement data taken over time is often evaluated statistically, to distill
 ** typical averages, variances and trends. Short of using a database, a modest
 ** amount of numeric data can be maintained in CSV files, which also allows for
 ** further manual evaluation within a spreadsheet or statistics application.
 ** The CSV format as such can be quite elaborate, yet for the purpose of
 ** saving and later reading back some values generated by the application
 ** itself, supporting a limited format flavour is sufficient:
 ** - first line is a header line and used to verify the storage format
 ** - one record per line, embedded line breaks prohibited
 ** - fields separated by comma, semicolon tolerated
 ** - fields are trimmed and may be empty
 ** - a field may be double quoted
 ** - only quoted fields may contain whitespace or comma
 ** - no escaping of quotes, i.e. no quotes within quotes
 ** 
 ** As a fundamental building block, this header provides a data table template
 ** with flexible column configuration to hold arbitrary, explicitly typed values.
 ** This solution is statically typed and does not carry any runtime type information;
 ** the actual data table object is then defined and accessed by means of _accessor_
 ** components for each column of data. A tuple of _current values_ corresponding to
 ** the most recent row of data can be accessed directly through these sub-components.
 ** 
 ** # Usage
 ** Create an actual instantiation of the DataTable template, passing a structure
 ** with lib::stat::Column descriptors. You may then directly access the values of the
 ** _actual column_ or save/load from a persistent CSV file.
 ** @note mandatory to define a method `allColumns()`
 ** \code
 ** struct Storage
 **   {
 **     Column<string> name{"theName"};
 **     Column<int>    n{"counter"};
 **     Column<double> x{"X value"};
 **     Column<double> y{"Y value"};
 **
 **     auto allColumns(){ return std::tie(name,n,x,y); }
 **   };
 ** 
 ** using Dataz = lib::stat::DataTable<Storage>;
 ** 
 ** Dataz daz("filename.csv");
 ** 
 ** daz.x = 123e-4;
 ** daz.y = -12345e-6;
 ** 
 ** std::vector<int>& counters = daz.n.data;
 ** \endcode
 ** \par Variations
 ** The standard case is to have a table backed by persistent file storage,
 ** which can be initially empty. Under some conditions, especially for tests
 ** - the DataTable can be created without filename
 ** - it can be created from a CSVData, which is a `std::vector` of CSV-strings
 ** - it can be [rendered into CSV strings](\ref #renderCSV)
 ** - a (new) storage file name can be [given later](\ref saveAs)
 ** @see DataCSV_test
 **
 */


#ifndef LIB_STAT_DATA_H
#define LIB_STAT_DATA_H


#include "lib/error.hpp"
#include "lib/nocopy.hpp"
#include "lib/stat/csv.hpp"
#include "lib/file.hpp"
#include "lib/format-string.hpp"
#include "lib/util.hpp"

#include <type_traits>
#include <utility>
#include <fstream>
#include <vector>
#include <string>
#include <limits>
#include <deque>


namespace lib {
namespace stat{
  
  namespace error = lumiera::error;
  
  using std::move;
  using std::tuple;
  using std::vector;
  using std::string;
  using util::isnil;
  using util::unConst;
  using util::_Fmt;
  using util::min;
  
  
  /**
   * Descriptor and Accessor for a data column within a DataTable table.
   * A column couples the header-ID (written into and verified against the
   * CSV header line) with the sequence of all values stored in this column.
   * The last element of #data is treated as the _current value_ and can be
   * read or assigned directly through the column object.
   * @tparam VAL type of values contained within this column;
   *             this type must be _default constructible_ and _copyable._
   */
  template<typename VAL>
  struct Column
    : util::MoveOnly
    {
      string header;
      vector<VAL> data;
      
      using ValueType = VAL;
      
      
      /** @param headerID name of this column, as used in the CSV header line */
      Column (string headerID)
        : header{std::move (headerID)}   // parameter is a by-value sink: move instead of copying again
        , data{}
        { }
      
      
      /**
       * Access the current value, which is the last element in #data.
       * @throws error::State when this column does not hold any data yet
       */
      VAL&
      get()
        {
          if (isnil (data))
              throw error::State{"No rows in DataTable yet"};
          return data.back();
        }
      
      /** implicit conversion: use the column in place of its current value */
      operator VAL&()
        {
          return get();
        }
      
      /** read-only access to the current value; strips constness to reuse get() */
      operator VAL const&()  const
        {
          return unConst(this)->get();
        }
      
      /**
       * Assign to the current value.
       * @return reference to the current value after assignment
       * @throws error::State when this column does not hold any data yet
       */
      template<typename X>
      VAL& operator= (X&& newVal)
        {
          return get() = std::forward<X> (newVal);
        }
    };
  
  
  /******************************************************************************************//**
   * Table with data values, stored persistently as CSV file.
   * Each row within the table represents a data record, holding a sequence
   * of values. Values are statically typed per column, i.e. one column may hold
   * strings, while the next column holds doubles. For actual usage it is thus necessary
   * to define the column layout, through a sequence of [column Descriptors](\ref lib::stat::Column).
   * 
   * # Usage
   * Actually those Column objects serve as descriptors, but also as accessors — and they hold
   * the actual data storage for each column, which is a `std::vector<VAL>` of value type `VAL`.
   * There is always a _current record_ — corresponding to the actual data value and the newest
   * data row. For persistent storage, the sequence of rows is _reversed,_ so the newest data
   * appears at the top of the CSV file.
   * @tparam TAB a struct comprised of several Column objects, which hold the data and
   *         provide access to values of this specific column. Moreover, this type _must define_
   *         a function `allColumns()` to return a tuple with references to these column fields;
   *         the order of fields within this tuple also defines the order of columns
   *         within the table and persistent CSV storage.
   */
  template<class TAB>
  class DataTable
      : public TAB
      , util::MoveOnly
    {
      fs::path filename_;
      
    public:
      /**
       * Create a table backed by the given CSV file.
       * The file name is passed through `fs::consolidated()`, and the
       * contents of an already existing file are loaded immediately.
       * @param csvFile storage location; may be omitted (defaults to empty)
       */
      DataTable(fs::path csvFile ="")
        : filename_(fs::consolidated (csvFile))
        {
          this->loadData();
        }
      
      /**
       * Create a table without storage file, populated from CSV lines.
       * @param csv header line followed by data rows, handled by #appendFrom
       */
      DataTable (CSVData const& csv)
        : filename_()
        {
          this->appendFrom (csv);
        }
      
      
      /* === Data Access === */
      
      /** number of columns: size of the tuple returned by `TAB::allColumns()` */
      static constexpr size_t columnCnt = std::tuple_size<decltype(std::declval<TAB>().allColumns())>::value;
      
      /** @return `true` when the table does not hold any complete row */
      bool
      empty()  const
        {
          return this->size() == 0;
        }
      
      /**
       * Number of rows in this table.
       * @return the smallest number of data points found in any column;
       *         zero for a table without columns.
       */
      size_t
      size()  const
        {
          if (columnCnt == 0)
            return 0;
          
          size_t shortest = std::numeric_limits<size_t>::max();
          forAllColumns ([&shortest](auto& column)
                            {
                              size_t const len = column.data.size();
                              if (len < shortest)
                                shortest = len;
                            });
          return shortest;
        }
      
      /**
       * Render the complete table into CSV lines.
       * @return CSVData where the first entry is the header line, followed by
       *         one line per row in table order (i.e. the newest row comes last).
       */
      CSVData
      renderCSV()  const
        {
          size_t const rowCnt = size();   // size() scans all columns: evaluate only once
          CSVData csv{{}};
          csv.reserve (rowCnt+1);
          auto header = generateHeaderSpec();
          using std::swap;
          swap (csv[0], header);
          for (size_t row=0; row < rowCnt; ++row)   // size_t index: no 32bit truncation
            csv.emplace_back (formatCSVRow (row));
          return csv;
        }
      
      
      /* === Manipulation === */
      
      /**
       * Append a new row: every column is resized to hold one element
       * more than the current row count, as reported by size().
       */
      void
      newRow()
        {
          size_t const extended = size() + 1;
          forAllColumns ([extended](auto& column)
                            {
                              column.data.resize (extended);
                            });
        }
      
      /**
       * Append a new row as copy of the current (last) row.
       * On an empty table, this is the same as newRow().
       */
      void
      dupRow()
        {
          if (empty())
            {
              newRow();
              return;
            }
          forAllColumns ([](auto& column)
                            {
                              column.data.emplace_back (column.data.back());
                            });
        }
      
      /** Discard the last element from every column; no effect on an empty table. */
      void
      dropLastRow()
        {
          if (empty())
            return;
          forAllColumns ([](auto& column)
                            {
                              if (not column.data.empty())
                                column.data.pop_back();
                            });
        }
      
      /**
       * Pass a capacity request to the storage of every column.
       * @param expectedCapacity number of rows to reserve storage for
       */
      void
      reserve (size_t expectedCapacity)
        {
          forAllColumns ([expectedCapacity](auto& column)
                            {
                              column.data.reserve (expectedCapacity);
                            });
        }
      
      /** Discard all data rows from all columns. */
      void
      clear()
        {
          forAllColumns ([](auto& column)
                            {
                              column.data.clear();
                            });
        }
      
      /**
       * Append rows given as CSV lines to this table.
       * The first line is verified as header line against the column layout;
       * all further non-empty lines are parsed and appended in the given order.
       * @param csv CSV lines; nothing happens when empty
       */
      void
      appendFrom (CSVData const& csv)
        {
          if (isnil (csv))
            return;
          
          verifyHeaderSpec (csv[0]);
          size_t const lineCnt = csv.size();
          for (size_t idx=1; idx < lineCnt; ++idx)
            {
              auto const& line = csv[idx];
              if (isnil (line))
                continue;   // skip empty lines
              appendRowFromCSV (line);
            }
        }
      
      
      /** @param lineLimit number of rows to retain, back from the newest */
      void
      save (size_t lineLimit =std::numeric_limits<size_t>::max()
           ,bool backupOld =false)
        {
          if (filename_.empty())
            throw error::Logic{"Unable to save DataFile without filename given."};
          
          fs::path newFilename{filename_};
          newFilename += ".tmp";
          
          std::ofstream csvFile{newFilename, std::ios_base::out | std::ios_base::trunc};
          if (not csvFile.good())
            throw error::State{_Fmt{"Unable to create CSV output file %s"}
                                   % newFilename};
          saveData (csvFile, lineLimit);
          
          if (backupOld)
            {
              fs::path oldFile{filename_};
              oldFile += ".bak";
              if (fs::exists (filename_))
                  fs::rename (filename_, oldFile);
            }
          fs::rename (newFilename, filename_);
          filename_ = fs::consolidated(filename_);
        }                // lock onto absolute path
      
      
      /**
       * Attach this table to a new storage file and save the data there.
       * @param newStorage file to create; must not exist yet, and its
       *        parent directory (if any is given) must exist
       * @param lineLimit number of rows to retain, back from the newest
       * @throws error::Invalid when the target exists already
       *         or would be placed into a nonexistent directory
       */
      void
      saveAs (fs::path newStorage
             ,size_t lineLimit =std::numeric_limits<size_t>::max())
        {
          newStorage = fs::consolidated (newStorage);
          if (fs::exists(newStorage))
            throw error::Invalid{_Fmt{"Storing DataFile rejected: target %s exists already"}
                                     % newStorage};
          
          auto const targetDir = newStorage.parent_path();
          if (not targetDir.empty() and not fs::exists (targetDir))
            throw error::Invalid{_Fmt{"DataFile(%s) placed into nonexistent directory %s"}
                                     % newStorage.filename() % targetDir};
          
          filename_ = newStorage;
          save (lineLimit);
        }
      
      
    private: /* === Implementation === */
      
      /**
       * Apply a generic Lambda to all columns, in the order given by `allColumns()`.
       * @remark callable from const functions; constness is stripped
       *         in order to invoke the (non-const) `allColumns()`.
       */
      template<class OP>
      void
      forAllColumns (OP&& doIt)  const
        {
          auto& self = *unConst(this);
          lib::meta::forEach (self.allColumns(), std::forward<OP> (doIt));
        }
      
      void
      loadData()
        {
          if (not (filename_.parent_path().empty()
                   or fs::exists(filename_.parent_path())))
            throw error::Invalid{_Fmt{"DataFile(%s) placed into nonexistent directory %s"}
                                     % filename_.filename() % filename_.parent_path()};
          if (not fs::exists(filename_))
            return; // leave the table empty
          
          std::ifstream csvFile{filename_};
          if (not csvFile.good())
            throw error::Config{_Fmt{"unable to read CSV data file %s"} % filename_};
          
          std::deque<string> rawLines;
          for (string line; std::getline(csvFile, line); )
            rawLines.emplace_back (move(line));
          
          if (rawLines.size() < 1) return;
          verifyHeaderSpec (rawLines[0]);
          
          // we know the number of rows now...
          reserve (rawLines.size() - 1);
          
          // storage in file is backwards, with newest data on top
          for (size_t row = rawLines.size()-1; 0<row; --row)
            if (not isnil(rawLines[row]))
              appendRowFromCSV (rawLines[row]);
        }
      
      
      /**
       * Write header line and data rows into the given stream.
       * Rows are written newest first; at most `lineLimit` rows are written,
       * so that older rows beyond this limit are discarded.
       * @param csvFile output stream to write into
       * @param lineLimit maximum number of rows to store
       */
      void
      saveData (std::ofstream& csvFile, size_t lineLimit)
        {
          csvFile << generateHeaderSpec() << "\n";
          
          size_t const rowCnt = size();
          if (rowCnt == 0)
            return;
          
          // index of the oldest row still to be written
          size_t const oldestRetained = lineLimit < rowCnt? rowCnt - lineLimit : 0;
          for (size_t row = rowCnt; row > oldestRetained; --row)
            csvFile << formatCSVRow (row-1) << "\n";
        }
      
      
      /**
       * Check the header line of CSV data against the column layout of this table.
       * The fields of the header line are compared one by one, in the order
       * given by `allColumns()`, against the `header` of the corresponding column.
       * @param headerLine first line of the CSV data; taken by value,
       *        so the parser operates on a local copy
       * @throws error::Invalid on the first field not matching the expected column header
       * @note additional fields beyond the last column are not inspected here.
       * @note NOTE(review): a header line with fewer fields than columns leads to
       *       dereferencing an exhausted parser; presumably CsvParser raises an
       *       error in that case -- confirm against lib/stat/csv.hpp
       */
      void
      verifyHeaderSpec (string headerLine)
        {
          CsvParser header{headerLine};
          forAllColumns(
                  [&](auto& col)
                    {
                      // current header field must match this column's name
                      if (*header != col.header)
                        throw error::Invalid{_Fmt{"Header mismatch in CSV file %s. "
                                                  "Expecting column(%s) but found \"%s\""}
                                                 % filename_ % col.header % *header};
                      ++header; // advance to the field for the next column
                    });
        }
      
      /** @return CSV line built from the header-IDs of all columns, in column order */
      CSVLine
      generateHeaderSpec()  const
        {
          CSVLine headerLine;
          forAllColumns ([&headerLine](auto& column)
                            {
                              headerLine += column.header;
                            });
          return headerLine;
        }
      
      
      /**
       * Parse one line of CSV and append its fields as new row to the table.
       * A new row is added first; then each column in turn picks up the next
       * field, which is converted through `parseAs` into the column's value type.
       * @param line the CSV text of one record; taken by value,
       *        so the parser operates on a local copy
       * @throws error::Invalid when the line holds fewer or more fields than columns
       * @note on any failure, the row added by this call is discarded again
       *       before the exception propagates, so no half-filled row stays behind.
       */
      void
      appendRowFromCSV (string line)
        {
          newRow();
          try
            {
              CsvParser csv(line);
              forAllColumns(
                      [&](auto& col)
                        {
                          if (not csv)
                            {
                              if (csv.isParseFail())
                                csv.fail();  // presumably raises the parse error -- see CsvParser
                              else
                                throw error::Invalid{_Fmt{"Insufficient data; only %d fields, %d expected. Line:%s"}
                                                         % csv.getParsedFieldCnt() % columnCnt % line};
                            }
                          
                          // `typename` is mandatory for this dependent type before C++20
                          using Value = typename std::remove_reference_t<decltype(col)>::ValueType;
                          col.get() = parseAs<Value>(*csv);
                          ++csv;
                        });
              if (csv)
                throw error::Invalid{_Fmt{"Excess data fields in CSV. Expect %d fields. Line:%s"}
                                         % columnCnt % line};
            }
          catch(...)
            {
              dropLastRow();  // roll back the incomplete row
              throw;
            }
        }
      
      
      /**
       * Render a single data row as CSV line.
       * @param rownum index of the row, where 0 denotes the oldest row
       * @return CSV line holding the value of each column at the given row
       * @throws error::Logic when the table is empty or the index is out of range
       */
      CSVLine
      formatCSVRow (size_t rownum)  const
        {
          size_t const rowCnt = this->size();
          if (rowCnt == 0)
            throw error::Logic{"Attempt to access data from empty DataTable."};
          if (rowCnt <= rownum)
            throw error::Logic{_Fmt{"Attempt to access row #%d beyond range [0..%d]."}
                                   % rownum % (rowCnt-1)};
          
          CSVLine rendered;
          forAllColumns ([&rendered, rownum](auto& column)
                            {
                              rendered += column.data.at (rownum);
                            });
          return rendered;
        }
    };
  
}} // namespace lib::stat
#endif /*LIB_STAT_DATA_H*/
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
+								/*
-												Library: integrate into the Lumiera code base

- reformat in Lumieara-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								  DATA.hpp  -  read and write a table with CSV data
-												Copyright: clarify and simplify the file headers

 * Lumiera source code always was copyrighted by individual contributors
 * there is no entity "Lumiera.org" which holds any copyrights
 * Lumiera source code is provided under the GPL Version 2+

== Explanations ==
Lumiera as a whole is distributed under Copyleft, GNU General Public License Version 2 or above.
For this to become legally effective, the ''File COPYING in the root directory is sufficient.''

The licensing header in each file is not strictly necessary, yet considered good practice;
attaching a licence notice increases the likeliness that this information is retained
in case someone extracts individual code files. However, it is not by the presence of some
text, that legally binding licensing terms become effective; rather the fact matters that a
given piece of code was provably copyrighted and published under a license. Even reformatting
the code, renaming some variables or deleting parts of the code will not alter this legal
situation, but rather creates a derivative work, which is likewise covered by the GPL!

The most relevant information in the file header is the notice regarding the
time of the first individual copyright claim. By virtue of this initial copyright,
the first author is entitled to choose the terms of licensing. All further
modifications are permitted and covered by the License. The specific wording
or format of the copyright header is not legally relevant, as long as the
intention to publish under the GPL remains clear. The extended wording was
based on a recommendation by the FSF. It can be shortened, because the full terms
of the license are provided alongside the distribution, in the file COPYING.

											
										
										
											2024-11-17 23:42:55 +01:00
+								   Copyright (C)
 ,            Hermann Vosseler <Ichthyostega@web.de>
-												Library: integrate into the Lumiera code base

- reformat in Lumieara-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
-												Copyright: clarify and simplify the file headers

 * Lumiera source code always was copyrighted by individual contributors
 * there is no entity "Lumiera.org" which holds any copyrights
 * Lumiera source code is provided under the GPL Version 2+

== Explanations ==
Lumiera as a whole is distributed under Copyleft, GNU General Public License Version 2 or above.
For this to become legally effective, the ''File COPYING in the root directory is sufficient.''

The licensing header in each file is not strictly necessary, yet considered good practice;
attaching a licence notice increases the likeliness that this information is retained
in case someone extracts individual code files. However, it is not by the presence of some
text, that legally binding licensing terms become effective; rather the fact matters that a
given piece of code was provably copyrighted and published under a license. Even reformatting
the code, renaming some variables or deleting parts of the code will not alter this legal
situation, but rather creates a derivative work, which is likewise covered by the GPL!

The most relevant information in the file header is the notice regarding the
time of the first individual copyright claim. By virtue of this initial copyright,
the first author is entitled to choose the terms of licensing. All further
modifications are permitted and covered by the License. The specific wording
or format of the copyright header is not legally relevant, as long as the
intention to publish under the GPL remains clear. The extended wording was
based on a recommendation by the FSF. It can be shortened, because the full terms
of the license are provided alongside the distribution, in the file COPYING.

											
										
										
											2024-11-17 23:42:55 +01:00
+								  **Lumiera** is free software; you can redistribute it and/or modify it
 								  under the terms of the GNU General Public License as published by the
 								  Free Software Foundation; either version 2 of the License, or (at your
 								  option) any later version. See the file COPYING for further details.
-												Library: integrate into the Lumiera code base

- reformat in Lumieara-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
 								*/
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
 								/** @file data.hpp
-												Library: complete coverage of CSV data table including storage

also encompasses some coverage for the simplistic CSV format
implemented as storage backend for this data table

											
										
										
											2024-03-14 23:44:39 +01:00
+								 ** Manage a table with data records, stored persistently as CSV.
-												Library: integrate into the Lumiera code base

- reformat in Lumieara-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								 ** In the context of observations, configuration, calibration and QA, a series
 								 ** of measurement data taken over time is often evaluated statistically, to distill
 								 ** typical averages, variances and trends. Short of using a database, a modest
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
+								 ** amount of numeric data can be maintained in CSV files, which also allows for
 								 ** further manual evaluation within a spreadsheet or statistics application.
-												Library: integrate into the Lumiera code base

- reformat in Lumieara-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								 ** The CSV format as such can be quite elaborate, yet for the purpose of
 								 ** saving and later reading back some values generated by the application
 								 ** itself, supporting a limited format flavour is sufficient:
 								 ** - first line is a header line and used to verify the storage format
 								 ** - one record per line, embedded line breaks prohibited
 								 ** - fields separated by comma, semicolon tolerated
 								 ** - fields are trimmed and may be empty
 								 ** - a field may be double quoted
 								 ** - only quoted fields may contain whitespace or comma
 								 ** - no escaping of quotes, i.e. no quotes within quotes
 								 **
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
+								 ** As a fundamental building block, this header provides a data table template
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								 ** with flexible column configuration to hold arbitrary, explicitly typed values.
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
+								 ** This solution is statically typed and does not carry any runtime type information;
 								 ** the actual data table object is then defined and accessed by means of _accessor_
 								 ** components for each column of data. A tuple of _current values_ corresponding to
 								 ** the most recent row of data can be accessed directly through these sub-components.
-												Library: integrate into the Lumiera code base

- reformat in Lumieara-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								 **
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								 ** # Usage
-												Scheduler-test: settle definition of specific test setup and data

After a lot of further tinkering, seemingly arriving at a
somewhat satisfactory solution for the layout and arrangement of
test definitions and especially the table for measurement series.

While the complete setup remains fragile indeed, and complexity is more
hidden than reduced — the pragmatic compromise established yesterday
at least allows to reduce the amount of boilerplate in the test or
measurement setup to make the actual specifics stand out clearly.

----

As an aside, the usage of the `DataFile` type imported from Yoshimi-test
recently was re-shaped more towards a generic handling of tabular data with
CSV storage option; thus renaming the type now into `DataTable`.
Persistent storage is now just one option, while another usage pattern
compounds observation data into table rows, which are then directly
rendered into a CSV string, e.g. for visualisation as Gnuplot graph.

											
										
										
											2024-04-07 23:52:56 +02:00
+								 ** Create an actual instantiation of the DataTable template, passing a structure
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								 ** with util::Column descriptors. You may then directly access the values of the
 								 ** _actual column_ or save/load from a persistent CSV file.
 								 ** @note mandatory to define a method `allColumns()`
 								 ** \code
 								 ** struct Storage
-												Library: integrate into the Lumiera code base

- reformat in Lumieara-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								 **   {
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								 **     Column<string> name{"theName"};
 								 **     Column<int>    n{"counter"};
 								 **     Column<double> x{"X value"};
 								 **     Column<double> y{"Y value"};
 								 **
-												capture and store individual timings as time series

Note: work-in-progress...
TODO: derive the expense factor and delta

											
										
										
											2021-09-19 17:31:54 +02:00
+								 **     auto allColumns(){ return std::tie(name,n,x,y); }
-												Library: integrate into the Lumiera code base

- reformat in Lumieara-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								 **   };
 								 **
-												Scheduler-test: settle definition of specific test setup and data

After a lot of further tinkering, seemingly arriving at a
somewhat satisfactory solution for the layout and arrangement of
test definitions and especially the table for measurement series.

While the complete setup remains fragile indeed, and complexity is more
hidden than reduced — the pragmatic compromise established yesterday
at least allows to reduce the amount of boilerplate in the test or
measurement setup to make the actual specifics stand out clearly.

----

As an aside, the usage of the `DataFile` type imported from Yoshimi-test
recently was re-shaped more towards a generic handling of tabular data with
CSV storage option; thus renaming the type now into `DataTable`.
Persistent storage is now just one option, while another usage pattern
compounds observation data into table rows, which are then directly
rendered into a CSV string, e.g. for visualisation as Gnuplot graph.

											
										
										
											2024-04-07 23:52:56 +02:00
+								 ** using Dataz = lib::stat::DataTable<Storage>;
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								 **
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								 ** Dataz daz("filename.csv");
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								 **
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								 ** daz.x = 123e-4;
 								 ** daz.y = -12345e-6;
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								 **
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								 ** std::vector<int>& counters = daz.n.data;
 								 ** \endcode
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								 ** \par Variations
 								 ** The standard case is to have a table backed by persistent file storage,
 								 ** which can be initially empty. Under some conditions, especially for tests
-												Scheduler-test: settle definition of specific test setup and data

After a lot of further tinkering, seemingly arriving at a
somewhat satisfactory solution for the layout and arrangement of
test definitions and especially the table for measurement series.

While the complete setup remains fragile indeed, and complexity is more
hidden than reduced — the pragmatic compromise established yesterday
at least allows to reduce the amount of boilerplate in the test or
measurement setup to make the actual specifics stand out clearly.

----

As an aside, the usage of the `DataFile` type imported from Yoshimi-test
recently was re-shaped more towards a generic handling of tabular data with
CSV storage option; thus renaming the type now into `DataTable`.
Persistent storage is now just one option, while another usage pattern
compounds observation data into table rows, which are then directly
rendered into a CSV string, e.g. for visualisation as Gnuplot graph.

											
										
										
											2024-04-07 23:52:56 +02:00
+								 ** - the DataTable can be created without filename
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								 ** - it can be created from a CSVData, which is a `std::vector` of CSV-strings
 								 ** - it can be [rendered into CSV strings](\ref #renderCSV)
 								 ** - a (new) storage file name can be [given later](\ref saveAs)
-												Library: extend the DataFile to allow using it without storage

...seems obvious and does not compromise the simplistic design...
...we do check the file path anyway, just need to add saveAs()...

											
										
										
											2024-03-13 18:57:48 +01:00
+								 ** @see DataCSV_test
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								 **
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
+								 */
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								#ifndef LIB_STAT_DATA_H
 								#define LIB_STAT_DATA_H
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								#include "lib/error.hpp"
 								#include "lib/nocopy.hpp"
 								#include "lib/stat/csv.hpp"
-												Clean-up: get rid of `boost::filesystem`

Since C++17 we can use the std::filesystem instead (and we ''do use it'' indeed)
- relocate the `/lib/file.hpp` header
- adapt the self-discovery of the executable to using std::filesystem

Furthermore, some research regarding XVideo and Video Output

											
										
										
											2025-04-27 23:54:21 +02:00
+								#include "lib/file.hpp"
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								#include "lib/format-string.hpp"
 								#include "lib/util.hpp"
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
-												integrate CSV handling into the new data table type

											
										
										
											2021-09-17 15:01:28 +02:00
+								#include <type_traits>
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
+								#include <utility>
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								#include <fstream>
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
+								#include <vector>
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								#include <string>
-												integrate CSV handling into the new data table type

											
										
										
											2021-09-17 15:01:28 +02:00
+								#include <limits>
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								#include <deque>
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								namespace lib {
 								namespace stat{
 								  namespace error = lumiera::error;
 								  using std::move;
 								  using std::tuple;
 								  using std::vector;
 								  using std::string;
 								  using util::isnil;
 								  using util::unConst;
 								  using util::_Fmt;
 								  using util::min;
 								  /**
-												Scheduler-test: settle definition of specific test setup and data

After a lot of further tinkering, seemingly arriving at a
somewhat satisfactory solution for the layout and arrangement of
test definitions and especially the table for measurement series.

While the complete setup remains fragile indeed, and complexity is more
hidden than reduced — the pragmatic compromise established yesterday
at least allows to reduce the amount of boilerplate in the test or
measurement setup to make the actual specifics stand out clearly.

----

As an aside, the usage of the `DataFile` type imported from Yoshimi-test
recently was re-shaped more towards a generic handling of tabular data with
CSV storage option; thus renaming the type now into `DataTable`.
Persistent storage is now just one option, while another usage pattern
compounds observation data into table rows, which are then directly
rendered into a CSV string, e.g. for visualisation as Gnuplot graph.

											
										
										
											2024-04-07 23:52:56 +02:00
+								   * Descriptor and Accessor for a data column within a DataTable.
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								   * @tparam VAL type of values contained within this column;
 								   *             this type must be _default constructible_ and _copyable._
 								   */
 								  template<typename VAL>
 								  struct Column
-												Scheduler-test: rework `ParameterRange` tool for data visualisation

Rework the existing tool to capture the measurement series
into the newly integrated CSV-based data storage, allowing
to turn the results into a Gnuplot-visualisation.

											
										
										
											2024-04-04 00:44:11 +02:00
+								    : util::MoveOnly
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								    {
 								      string header;
 								      vector<VAL> data;
 								      using ValueType = VAL;
 								      Column (string headerID)
-												parse a simplified variant of CSV

rationale: the purpose is to read back our own values,
yet it should be reasonably standard, to allow investigating
and tweaking values with a spreadsheet

 - first line is a header line and used to verify the number of columns
 - one record per line, embedded line breaks prohibited
 - fields separated by comma, semicolon tolerated
 - fields are trimmed and may be empty
 - a field may be double quoted
 - only quoted fields may contain whitespace or comma
 - no escaping of quotes, i.e. no quotes within quotes

											
										
										
											2021-09-16 23:54:11 +02:00
+								        : header{headerID}
 								        , data{}
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								        { }
 								      /**
 								       * Access the value this column holds in the most recent row.
 								       * @return reference to the last element of the #data vector
 								       * @throw error::State if #data is found to be empty (`isnil`)
 								       */
 								      VAL&
 								      get()
 								        {
 								          if (not isnil (data))
 								            return data.back();
 								          throw error::State{"No rows in DataTable yet"};
 								        }
 								      /** implicit conversion to the value type: yields the same reference as get() */
 								      operator VAL&()
 								        {
 								          return this->get();
 								        }
 								      /** read-only conversion: delegates to the non-const get() through `unConst(this)` */
 								      operator VAL const&()  const
 								        {
 								          auto* self = unConst (this);
 								          return self->get();
 								        }
 								      /**
 								       * Assign a new value to the element yielded by get().
 								       * @param newVal any value assignable to `VAL`; passed on with perfect forwarding
 								       * @return the result of that assignment, as reference to `VAL`
 								       * @note get() throws error::State when the column holds no data
 								       */
 								      template<typename X>
 								      VAL&
 								      operator= (X&& newVal)
 								        {
 								          VAL& current = get();
 								          return current = std::forward<X> (newVal);
 								        }
 								    };
 								  /******************************************************************************************//**
 								   * Table with data values, stored persistently as CSV file.
 								   * Each row within the table represents a data record, holding a sequence
 								   * of values. Values are statically typed per column, i.e. one column may hold
 								   * strings, while the next column holds doubles. For actual usage it is thus necessary
 								   * to define the column layout, through a sequence of [column Descriptors](\ref lib::stat::Column).
 								   *
 								   * # Usage
 								   * Actually those Column objects serve as descriptors, but also as accessors — and they hold
 								   * the actual data storage for each column, which is a `std::vector<VAL>` of value type `VAL`.
 								   * There is always a _current record_ — corresponding to the actual data value and the newest
 								   * data row. For persistent storage, the sequence of rows is _reversed,_ so the newest data
 								   * appears at the top of the CSV file.
 								   * @tparam TAB a struct comprised of several Column objects, which hold the data and
 								   *         provide access to values of this specific column. Moreover, this type _must define_
 								   *         a function `allColumns()` to return a tuple with references to these column fields;
 								   *         the order of fields within this tuple also defines the order of columns
 								   *         within the table and persistent CSV storage.
 								   */
 								  template<class TAB>
-												Scheduler-test: settle definition of specific test setup and data

After a lot of further tinkering, seemingly arriving at a
somewhat satisfactory solution for the layout and arrangement of
test definitions and especially the table for measurement series.

While the complete setup remains fragile indeed, and complexity is more
hidden than reduced — the pragmatic compromise established yesterday
at least allows to reduce the amount of boilerplate in the test or
measurement setup to make the actual specifics stand out clearly.

----

As an aside, the usage of the `DataFile` type imported from Yoshimi-test
recently was re-shaped more towards a generic handling of tabular data with
CSV storage option; thus renaming the type now into `DataTable`.
Persistent storage is now just one option, while another usage pattern
compounds observation data into table rows, which are then directly
rendered into a CSV string, e.g. for visualisation as Gnuplot graph.

											
										
										
											2024-04-07 23:52:56 +02:00
+								  class DataTable
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								      : public TAB
-												Scheduler-test: rework `ParameterRange` tool for data visualisation

Rework the existing tool to capture the measurement series
into the newly integrated CSV-based data storage, allowing
to turn the results into a Gnuplot-visualisation.

											
										
										
											2024-04-04 00:44:11 +02:00
+								      , util::MoveOnly
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								    {
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								      fs::path filename_;
 								    public:
-												Scheduler-test: settle definition of specific test setup and data

After a lot of further tinkering, seemingly arriving at a
somewhat satisfactory solution for the layout and arrangement of
test definitions and especially the table for measurement series.

While the complete setup remains fragile indeed, and complexity is more
hidden than reduced — the pragmatic compromise established yesterday
at least allows to reduce the amount of boilerplate in the test or
measurement setup to make the actual specifics stand out clearly.

----

As an aside, the usage of the `DataFile` type imported from Yoshimi-test
recently was re-shaped more towards a generic handling of tabular data with
CSV storage option; thus renaming the type now into `DataTable`.
Persistent storage is now just one option, while another usage pattern
compounds observation data into table rows, which are then directly
rendered into a CSV string, e.g. for visualisation as Gnuplot graph.

											
										
										
											2024-04-07 23:52:56 +02:00
+								      DataTable(fs::path csvFile ="")
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								        : filename_{fs::consolidated (csvFile)}
 								        {
 								          loadData();
 								        }
-												Scheduler-test: settle definition of specific test setup and data

After a lot of further tinkering, seemingly arriving at a
somewhat satisfactory solution for the layout and arrangement of
test definitions and especially the table for measurement series.

While the complete setup remains fragile indeed, and complexity is more
hidden than reduced — the pragmatic compromise established yesterday
at least allows to reduce the amount of boilerplate in the test or
measurement setup to make the actual specifics stand out clearly.

----

As an aside, the usage of the `DataFile` type imported from Yoshimi-test
recently was re-shaped more towards a generic handling of tabular data with
CSV storage option; thus renaming the type now into `DataTable`.
Persistent storage is now just one option, while another usage pattern
compounds observation data into table rows, which are then directly
rendered into a CSV string, e.g. for visualisation as Gnuplot graph.

											
										
										
											2024-04-07 23:52:56 +02:00
+								      DataTable (CSVData const& csv)
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								        : filename_{}
 								        {
 								          appendFrom (csv);
 								        }
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
 								      /* === Data Access === */
 								      /** number of columns: the size of the tuple returned by `TAB::allColumns()`, determined at compile time */
 								      static constexpr size_t columnCnt = std::tuple_size_v<decltype(std::declval<TAB>().allColumns())>;
 								      /** @return `true` when size() yields zero */
 								      bool
 								      empty()  const
 								        {
 								          return this->size() == 0;
 								        }
 								      size_t
 								      size()  const
 								        {
 								          if (0 == columnCnt) return 0;
 								          size_t rowCnt = std::numeric_limits<size_t>::max();
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								          forAllColumns(
 								                    [&](auto& col)
 								                      {
 								                        rowCnt = min (rowCnt, col.data.size());
 								                      }); // the smallest number of data points found in any column
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								          return rowCnt;
 								        }
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								      CSVData
 								      renderCSV()  const
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								        {
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								          CSVData csv{{}};
 								          csv.reserve (size()+1);
 								          auto header = generateHeaderSpec();
-												Library: handle chaining of iterator-pipelines

This involves some quite tricky changes in the way types are composed to form an iterator-pipeline.
Some wrappers are added as adaptors or for additional safety-checks, and to provide a builder-API.
Unfortunately, when building a new `IterExplorer` iterator pipeline from an existing pipeline naively,
composing all those types will add several unnecessary intermediary wrapper-layers.
Worse even, the handling of `BaseAdapter` prevents the new tuple-zipping iterator
actually to pass-through any `expandChildren()` call.

These issues are a consequence of using templated types, instead of fixed types with an interface;
we can not just determine if some wrapper is present — unless the wrapper itself ''helps by exposing a tag.''
Even while I must admit that the whole packaging and adaptation machinery of `IterExplorer`
looks dangerously complex already, using dedicated type tags for this single purpose
seems like a tenable solution.

											
										
										
											2024-11-24 19:53:07 +01:00
+								          using std::swap;
 								          swap (csv[0], header);
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								          for (uint i=0; i < size(); ++i)
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								            csv.emplace_back (formatCSVRow(i));
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								          return csv;
 								        }
 								      /* === Manipulation === */
 								      void
 								      newRow()
 								        {
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								            forAllColumns(
 								                    [siz = size()+1]
 								                    (auto& col)
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                      {
-												Library: cover row handling of data table

...this uncovered one inconsistency: when directly adding values
into one of the embedded data vectors, the inconsistent size
was allowed to persist even when adding / removing lines.

This is in contradiction to the behavior for the CSV dump,
which uses index positions from the front of all vectors uniformly.

Thus changed the behaviour of adding a new row, so that it now
caps all vectors to a common size

also added function to clear the table

											
										
										
											2024-03-13 19:47:43 +01:00
+								                        col.data.resize (siz);
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                      });
 								        }
 								      void
 								      dupRow()
 								        {
 								          if (empty())
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								            newRow();
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								          else
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								            forAllColumns(
 								                    [](auto& col)
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                      {
 								                        col.data.emplace_back (col.data.back());
 								                      });
 								        }
 								      void
 								      dropLastRow()
-												implement fitting the platform model by linear regression

 * triggered by --calibrate
 * normalise away any known expense factors, but use them as weight
 * calculate simple linear regression from statistic data

											
										
										
											2021-09-25 03:39:21 +02:00
+								        {
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								          if (not empty())
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								            forAllColumns(
 								                    [](auto& col)
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                      {
 								                        size_t siz = col.data.size();
 								                        col.data.resize (siz>0? siz-1 : 0);
 								                      });
-												implement fitting the platform model by linear regression

 * triggered by --calibrate
 * normalise away any known expense factors, but use them as weight
 * calculate simple linear regression from statistic data

											
										
										
											2021-09-25 03:39:21 +02:00
+								        }
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
 								      void
 								      reserve (size_t expectedCapacity)
 								        {
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								            forAllColumns(
 								                    [=](auto& col)
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                      {
 								                        col.data.reserve(expectedCapacity);
 								                      });
 								        }
-												Library: cover row handling of data table

...this uncovered one inconsistency: when directly adding values
into one of the embedded data vectors, the inconsistent size
was allowed to persist even when adding / removing lines.

This is in contradiction to the behavior for the CSV dump,
which uses index positions from the front of all vectors uniformly.

Thus changed the behaviour of adding a new row, so that it now
caps all vectors to a common size

also added function to clear the table

											
										
										
											2024-03-13 19:47:43 +01:00
 								      void
 								      clear()
 								        {
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								            forAllColumns(
 								                    [](auto& col)
-												Library: cover row handling of data table

...this uncovered one inconsistency: when directly adding values
into one of the embedded data vectors, the inconsistent size
was allowed to persist even when adding / removing lines.

This is in contradiction to the behavior for the CSV dump,
which uses index positions from the front of all vectors uniformly.

Thus changed the behaviour of adding a new row, so that it now
caps all vectors to a common size

also added function to clear the table

											
										
										
											2024-03-13 19:47:43 +01:00
+								                      {
 								                        col.data.clear();
 								                      });
 								        }
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								      void
 								      appendFrom (CSVData const& csv)
 								        {
 								          // Append the rows held in the given CSVData to this table.
 								          // Nil input is silently ignored. Entry #0 is taken as header line
 								          // and checked through verifyHeaderSpec(), which throws error::Invalid
 								          // on a column mismatch; no row has been added at that point.
 								          if (isnil (csv)) return;
 								          verifyHeaderSpec (csv[0]);
 								          // all further entries are data rows; nil entries are skipped
 								          for (size_t row=1; row<csv.size(); ++row)
 								            if (not isnil (csv[row]))
 								              appendRowFromCSV (csv[row]);
 								        }
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
 								      /** @param lineLimit number of rows to retain, back from the newest */
 								      void
 								      save (size_t lineLimit =std::numeric_limits<size_t>::max()
 								           ,bool backupOld =false)
 								        {
-												Library: extend the DataFile to allow using it without storage

...seems obvious and does not compromise the simplistic design...
...we do check the file path anyway, just need to add saveAs()...

											
										
										
											2024-03-13 18:57:48 +01:00
+								          if (filename_.empty())
 								            throw error::Logic{"Unable to save DataFile without filename given."};
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								          fs::path newFilename{filename_};
 								          newFilename += ".tmp";
 								          std::ofstream csvFile{newFilename, std::ios_base::out | std::ios_base::trunc};
 								          if (not csvFile.good())
 								            throw error::State{_Fmt{"Unable to create CSV output file %s"}
 								                                   % newFilename};
 								          saveData (csvFile, lineLimit);
 								          if (backupOld)
 								            {
 								              fs::path oldFile{filename_};
 								              oldFile += ".bak";
 								              if (fs::exists (filename_))
 								                  fs::rename (filename_, oldFile);
 								            }
 								          fs::rename (newFilename, filename_);
 								          filename_ = fs::consolidated(filename_);
 								        }                // lock onto absolute path
-												Library: extend the DataFile to allow using it without storage

...seems obvious and does not compromise the simplistic design...
...we do check the file path anyway, just need to add saveAs()...

											
										
										
											2024-03-13 18:57:48 +01:00
+								      void
 								      saveAs (fs::path newStorage
 								             ,size_t lineLimit =std::numeric_limits<size_t>::max())
 								        {
 								          // Store the table under a new file name and switch this object to that name.
 								          //  - newStorage : target path, passed through fs::consolidated() before any check
 								          //  - lineLimit  : handed on unaltered to save()
 								          // Throws error::Invalid when the target exists already, or when the
 								          // target's parent path is non-empty yet does not exist.
 								          newStorage = fs::consolidated (newStorage);
 								          if (fs::exists(newStorage))
 								            throw error::Invalid{_Fmt{"Storing DataFile rejected: target %s exists already"}
 								                                     % newStorage};
 								          // an empty parent path is accepted without an existence check
 								          if (not (newStorage.parent_path().empty()
 								                   or fs::exists(newStorage.parent_path())))
 								            throw error::Invalid{_Fmt{"DataFile(%s) placed into nonexistent directory %s"}
 								                                     % newStorage.filename() % newStorage.parent_path()};
 								          // NOTE: filename_ is reassigned before save() runs,
 								          //       so it keeps the new value even if save() throws
 								          filename_ = newStorage;
 								          save (lineLimit);
 								        }
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
 								    private: /* === Implementation === */
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								      /** apply a generic Lambda to all columns
 								       *  @param doIt functor, forwarded together with the result of `allColumns()`
 								       *              to `lib::meta::forEach`
 								       *  @note declared `const`, yet `allColumns()` is reached through `unConst(this)`;
 								       *        functors passed in by the manipulation functions modify the column data
 								       *        (e.g. newRow() resizes `col.data`)
 								       */
 								      template<class OP>
 								      void
 								      forAllColumns (OP&& doIt)  const
 								        {
 								          lib::meta::forEach (unConst(this)->allColumns()
 								                             ,std::forward<OP> (doIt));
 								        }
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								      void
 								      loadData()
 								        {
 								          if (not (filename_.parent_path().empty()
 								                   or fs::exists(filename_.parent_path())))
 								            throw error::Invalid{_Fmt{"DataFile(%s) placed into nonexistent directory %s"}
 								                                     % filename_.filename() % filename_.parent_path()};
 								          if (not fs::exists(filename_))
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								            return; // leave the table empty
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
 								          std::ifstream csvFile{filename_};
 								          if (not csvFile.good())
 								            throw error::Config{_Fmt{"unable to read CSV data file %s"} % filename_};
 								          std::deque<string> rawLines;
 								          for (string line; std::getline(csvFile, line); )
 								            rawLines.emplace_back (move(line));
 								          if (rawLines.size() < 1) return;
 								          verifyHeaderSpec (rawLines[0]);
 								          // we know the number of rows now...
 								          reserve (rawLines.size() - 1);
 								          // storage in file is backwards, with newest data on top
 								          for (size_t row = rawLines.size()-1; 0<row; --row)
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								            if (not isnil(rawLines[row]))
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								              appendRowFromCSV (rawLines[row]);
 								        }
 								      void
 								      saveData (std::ofstream& csvFile, size_t lineLimit)
 								        {
 								          csvFile << generateHeaderSpec() << "\n";
 								          if (empty())
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								            return;
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								          lineLimit = size() > lineLimit? size()-lineLimit : 0;
 								          // store newest data first, possibly discard old data
 								          for (size_t row = size(); lineLimit < row; --row)
-												complete implementation of CSV backed data table

...mostly routine after solving the tricky design challenge

- for usage, instantiate the template DataFile with a Storage record
- object is created with filename, and immediately slurps in existing data
- data storage is optimised for readability (not speed); newest value at top

Note: some kind of testcase is "hidden" in this changeset only;
next changeset will remove research-experiment.hpp

											
										
										
											2021-09-17 17:57:55 +02:00
+								            csvFile << formatCSVRow(row-1) << "\n";
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								        }
 								      void
 								      verifyHeaderSpec (string headerLine)
 								        {
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								          CsvParser header{headerLine};
 								          forAllColumns(
 								                  [&](auto& col)
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                    {
 								                      if (*header != col.header)
 								                        throw error::Invalid{_Fmt{"Header mismatch in CSV file %s. "
 								                                                  "Expecting column(%s) but found \"%s\""}
 								                                                 % filename_ % col.header % *header};
 								                      ++header;
 								                    });
 								        }
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								      CSVLine
 								      generateHeaderSpec()  const
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								        {
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								          CSVLine csv;
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								          forAllColumns(
 								                  [&](auto& col)
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                    {
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								                      csv += col.header;
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                    });
 								          return csv;
 								        }
 								      void
 								      appendRowFromCSV (string line)
 								        {
 								          newRow();
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								          CsvParser csv(line);
 								          forAllColumns(
 								                  [&](auto& col)
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                    {
 								                      if (not csv)
-												Library: some first thoughts regarding random number generation

Relying on random numbers for verification and measurements is known to be problematic.
At some point we are bound to control the seed values -- and in the actual
application usage we want to record sequence seeding in the event log.

Some initial thoughts regarding this intricate topic.
 * a low-ceremony drop-in replacement for rand() is required
 * we want the ability to pick-up and control each and every usage eventually
 * however, some usages explicitly require true randomness
 * the ability to use separate streams of random-number generation is desirable

											
										
										
											2024-03-11 22:47:29 +01:00
+								                        {
 								                          if (csv.isParseFail())
 								                            csv.fail();
 								                          else
 								                            throw error::Invalid{_Fmt{"Insufficient data; only %d fields, %d expected. Line:%s"}
 								                                                     % csv.getParsedFieldCnt() % columnCnt % line};
 								                        }
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
-												Upgrade: down with typename!!

Yet another chainsaw massacre.

One of the most obnoxious annoyances with C++ metaprogramming
is the need to insert `typename` and `template` qualifiers into
most definitions, to help the compiler to cope with the syntax,
which is not context-free.

The recent standard adds several clarifications, so that most
of these qualifiers are redundant now, at least at places where
it is unambiguously clear that only a type can be given.

GCC already supports most of these relaxing rules
(Clang unfortunately lags way behind with support of newer language features...)

											
										
										
											2025-07-05 20:08:18 +02:00
+								                      using Value = std::remove_reference<decltype(col)>::type::ValueType;
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                      col.get() = parseAs<Value>(*csv);
 								                      ++csv;
 								                    });
 								          if (csv)
 								            throw error::Invalid{_Fmt{"Excess data fields in CSV. Expect %d fields. Line:%s"}
 								                                     % columnCnt % line};
 								        }
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								      CSVLine
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								      formatCSVRow (size_t rownum)  const
 								        {
 								          if (this->empty())
 								            throw error::Logic{"Attempt to access data from empty DataTable."};
 								          if (rownum >= this->size())
 								            throw error::Logic{_Fmt{"Attempt to access row #%d beyond range [0..%d]."}
 								                                   % rownum % (size()-1)};
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								          CSVLine csvLine;
-												Library: rearrange support for CSV notation

- `forElse` belongs to the metaprogramming utils

- have a CSVLine, which is a string with custom appending mechanism

- this in turn allows CSVData to accept arbitrary sized tuples,
  by rendering them into CSVLine

											
										
										
											2024-04-01 22:33:55 +02:00
+								          forAllColumns(
 								                  [&](auto& col)
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                    {
-												Library: add some mutual integration between DataFile and CSVData

...both are related to CSV, and it is conceivable
to create inline CSVData in a test case to populate a DataFile

											
										
										
											2024-04-02 21:18:23 +02:00
+								                      csvLine += col.data.at(rownum);
-												Library: integrate into the Lumiera code base

- reformat in Lumiera-GNU style
- use the Lumiera exceptions
- use Lumiera format-string frontend
- use lib/util

NOTE: I am the original author of the code introduced here,
and thus I can re-license it under GPL 2+

											
										
										
											2024-03-11 01:52:49 +01:00
+								                    });
 								          return csvLine;
 								        }
 								    };
 								}} // namespace lib::stat
 								#endif /*LIB_STAT_DATA_H*/