LUMIERA.clone/src/steam/engine/proc-node.cpp
Ichthyostega 7998c8d724 Library: need support for specification parsing
Unfortunately, there are some common syntactic structures, which can not easily be dissected by regular expressions alone, since they entail nested subexpressions. While it is possible to get beyond those fundamental limitations with some trickery, doing so remains precisely that, ''trickery.''

After fighting some inner conflicts, since ''I do know how to write a parser'' —
in the end I have brought myself to just do it.

And indeed, as you might expect, I have looked into existing library solutions,
and I would not like to have any one of them as part of the project.
 * I do not want a ''parser engine'' or ''parser generator''
 * I want the directness of recursive-descent, but combined with Regular Expressions as terminals
 * I want to see the structure of the used grammar at the definition site of the custom parser function
 * I want deep integration of ''model bindings'' into the parse process, i.e. binding-λ
 * I do not want to write model-dissecting or pattern-matching code after the parse
 * I do not want to expose ''Monads'' as an interface, since they tend to spread unhealthy structure to surrounding code
 * I do not want to leak technicalities of the parse mechanics into the using code
 * I do not want to impose hard to remember specific conventions onto the user

Thus I've set the following aims:
 * The usage should require only a single header include (ideally header-only)
 * The entrance point should be a small number of DSL-starter functions
 * The parser shall be implemented by recursive-descent, using the parser-combinator technique
 * But I want that wrapped into a DSL, to be able to control what is (not) provided or exposed.
 * I want a stateful, applicative logic, since parsing, by its very nature, is stateful!
 * I want complete compile-time typing, visible to the optimiser, without a virtual »Parser« interface

And last but not least, ''I do not want to create a ticket, since I do not know if those goals can be achieved...''
2025-01-17 18:40:44 +01:00

268 lines
8 KiB
C++
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

/*
ProcNode - Implementation of render node processing
Copyright (C)
2024, Hermann Vosseler <Ichthyostega@web.de>
  **Lumiera** is free software; you can redistribute it and/or modify it
  under the terms of the GNU General Public License as published by the
  Free Software Foundation; either version 2 of the License, or (at your
  option) any later version. See the file COPYING for further details.
* *****************************************************************/
/** @file proc-node.cpp
** Translation unit to hold the actual implementation of node processing operations.
**
** @todo WIP-WIP-WIP 6/2024 not clear yet what goes here and what goes into turnout-system.cpp
*/
#include "steam/engine/proc-id.hpp"
#include "steam/engine/proc-node.hpp"
#include "lib/iter-explorer.hpp"
#include "lib/format-string.hpp"
#include "lib/format-util.hpp"
#include "lib/regex.hpp"
#include "lib/util.hpp"
#include <boost/functional/hash.hpp> /////////////////////////////////////////////////////TICKET #1391 is boost-hash the proper tool for this task?
#include <unordered_set>
#include <set>
namespace steam {
namespace engine {
using lib::explore;
using util::_Fmt;
using util::isnil;
using util::unConst;
using util::contains;
using boost::hash_combine;
namespace {// Details: parsing, registration and symbol table for node spec data...

  /** registry holding the ProcID records handed out by ProcID::describe() */
  std::unordered_set<ProcID> procRegistry;

  /** symbol table: owns the strings which registered ProcID entries refer to */
  std::unordered_set<string> symbRegistry;

  /**
   * Intern the given symbol into the symbol table and redirect the view
   * to the string stored there; an equal entry already present is reused.
   */
  inline void
  dedupSymbol (StrView& symbol)
  {
    symbol = *symbRegistry.emplace (symbol).first;
  }

} // (END) Details...
Port::~Port() = default;   ///< @remark VTables for the Port-Turnout hierarchy emitted from \ref proc-node.cpp
/**
 * Retrieve the registry entry describing the given node symbol and port spec.
 * The port spec is split at its first opening parenthesis: the text before
 * becomes the port qualifier, the remainder (parenthesis included) the argument lists.
 * @remark this is the only public access point to ProcID entries,
 *         which are automatically deduplicated and managed in a common registry
 *         and retained until end of the Lumiera process (never deleted).
 * @throws err::Invalid when the port spec contains no opening parenthesis
 */
ProcID&
ProcID::describe (StrView nodeSymb, StrView portSpec)
{
  REQUIRE (not isnil (nodeSymb));
  REQUIRE (not isnil (portSpec));
  REQUIRE (not contains (nodeSymb, ' '));

  auto argStart = portSpec.find('(');
  if (argStart == string::npos)
    throw err::Invalid{_Fmt{"Spec for processing operation must contain at least one argument list. "
                            "Node:%s Spec:%s"}
                           % nodeSymb % portSpec
                      };

  auto qualifier = portSpec.substr(0,argStart);
  auto arguments = portSpec.substr(argStart);
  auto inserted = procRegistry.insert (ProcID{nodeSymb, qualifier, arguments});
  ProcID& entry{unConst (*inserted.first)};
  if (not inserted.second)
    return entry;                        // equivalent record was registered before

  // new record placed into the registry:
  // re-link its views to the strings held in the symbol table
  dedupSymbol (entry.nodeName_);
  dedupSymbol (entry.argLists_);
  if (not isnil(entry.portQual_))
    dedupSymbol (entry.portQual_);
  return entry;
}
/** @internal stores the three given views as-is; deduplication happens in ProcID::describe() */
ProcID::ProcID (StrView nodeSymb, StrView portQual, StrView argLists)
  : nodeName_(nodeSymb)
  , portQual_(portQual)
  , argLists_(argLists)
  { }
/**
 * Compute the registry hash from the distinguishing data of a ProcID:
 * node name, then the port qualifier (only when present), then the argument lists.
 * @remark intended to be picked up by ADL, and should be usable
 *         both with `std::hash` and `<boost/functional/hash.hpp>`.
 */
HashVal
hash_value (ProcID const& procID)
{
  HashVal seed = boost::hash_value (procID.nodeName_);         ////////////////////////////////////////////TICKET #1391 : which technology to use for processing-ID hashes -> cache keys?
  bool const hasQualifier = not isnil(procID.portQual_);
  if (hasQualifier)
    hash_combine (seed, procID.portQual_);                     ////////////////////////////////////////////TICKET #1391 : should use lib/hash-combine.hpp (stable, but not portable!)
  hash_combine (seed, procID.argLists_);
  return seed;
}
/** @return the node symbol immediately followed by the (possibly empty) qualifier suffix */
string
ProcID::genProcName()
{
  return genNodeSymbol() + genQualifier();
}
/** @return the complete node name, the (possibly empty) qualifier suffix and the argument lists, concatenated */
string
ProcID::genProcSpec()
{
  return string{nodeName_}
       + genQualifier()
       + string{argLists_};
}
/** @return a copy of the complete node name as stored in this ProcID */
string
ProcID::genNodeName()
{
  string fullName{nodeName_};
  return fullName;
}
/** @return the part of the node name following the first `:`, or the complete name if there is none */
string
ProcID::genNodeSymbol()
{
  auto separator = nodeName_.find(':');
  if (separator == string::npos)
    return string{nodeName_};
  return string{nodeName_.substr(separator+1)};
}
/** @return the part of the node name preceding the first `:`, or an empty string if there is none */
string
ProcID::genNodeDomain()
{
  auto separator = nodeName_.find(':');
  if (separator == string::npos)
    return string{};
  return string{nodeName_.substr(0,separator)};
}
/** @return the port qualifier prefixed with a dot, or an empty string when no qualifier is set */
string
ProcID::genQualifier()
{
  if (isnil(portQual_))
    return string{};
  return '.' + string{portQual_};
}
namespace { // Helper to access ProcID recursively

  /** @return the ProcID attached to the first port of the given node (which must have ports) */
  ProcID&
  procID (ProcNode& node)
  {
    REQUIRE (not isnil(watch(node).ports()));
    auto&& firstPort = watch(node).ports().front();
    return firstPort.procID;
  }
}
/**
 * Render this node's name together with an abbreviated description of its inputs.
 * With exactly one lead, the immediate predecessor's node name is shown after a
 * `◁—` marker, followed by the source spec; otherwise the source spec follows directly.
 */
string
ProcID::genNodeSpec (Leads& leads)
{
  string spec{nodeName_};
  if (1 == leads.size())
    { // single chain....
      ProcNode& predecessor{leads.front().get()};
      ProcID& predecessorID = procID(predecessor);
      spec += "◁—";
      spec += predecessorID.genNodeName();        // show immediate predecessor
      spec += predecessorID.genSrcSpec(leads);    // and behind that recursively the source(s)
    }
  else
    spec += genSrcSpec(leads);
  return spec;
}
/**
 * Render the source nodes reachable through the given leads.
 * @return the marker `-◎` when there are no leads; otherwise the joined
 *         node names of all source nodes found behind the leads, enclosed in `┉┉{`...`}`
 */
string
ProcID::genSrcSpec (Leads& leads)
{
  if (isnil(leads))
    return string{"-◎"};                                                               // no leads => starting point itself is a source node

  return "┉┉{"
       + util::join(
           explore(leads)
             .expandAll([](ProcNode& node){ return explore(watch(node).leads()); })    // depth-first expand all predecessors
             .filter   ([](ProcNode& node){ return watch(node).isSrc(); })             // but retain only leafs (≙ source nodes)
             .transform([](ProcNode& node){ return procID(node).nodeName_;})           // render the node-symbol of each src
             .deduplicate())                                                           // sort and deduplicate
       + "}";
}
/**
 * @return symbolic string starting with the node name, followed by an abbreviated
 *         predecessor spec, as generated by ProcID::genNodeSpec() for the first port
 * @remark connectivity information is abbreviated and foremost
 *         indicates the data source(s)
 */
string
ProcNodeDiagnostic::getNodeSpec()
{
  REQUIRE (not isnil(ports()));
  auto&& firstPort = ports().front();
  return firstPort.procID.genNodeSpec (leads());
}
/**
 * Hash-key designating this node.
 * @warning placeholder: the body consists solely of the UNIMPLEMENTED marker.
 * @todo not clear yet if this has to include predecessor info
 */
HashVal
ProcNodeDiagnostic::getNodeHash()
{
UNIMPLEMENTED ("calculate an unique hash-key to designate this node");
}
/**
 * @param portIdx index of the port within this node's port collection
 * @return symbolic string with format `NodeSymb[.portQualifier](inType[/#][,inType[/#]])(outType[/#][,outType[/#]][ >N])`,
 *         or util::FAILURE_INDICATOR when the index is beyond the available ports
 * @remark information presented here is passed-through from builder Level-3, based on semantic markup present there
 */
string
ProcNodeDiagnostic::getPortSpec (uint portIdx)
{
  auto& ports{n_.wiring_.ports};
  if (portIdx < ports.size())
    return ports[portIdx].procID.genProcSpec();
  return util::FAILURE_INDICATOR;
}
/**
 * Hash-key identifying the port at the given index.
 * @param portIdx index of the port in question (not evaluated yet)
 * @warning placeholder: the body consists solely of the UNIMPLEMENTED marker.
 */
HashVal
ProcNodeDiagnostic::getPortHash (uint portIdx)
{
UNIMPLEMENTED ("calculate an unique, stable and reproducible hash-key to identify the Turnout");
}
/**
 * Source ports this port is connected to.
 * @warning placeholder: the body consists solely of the UNIMPLEMENTED marker.
 */
lib::Several<PortRef>
PortDiagnostic::srcPorts()
{
UNIMPLEMENTED ("intrude into the Turnout and find out about source connectivity");
}
/**
 * @return the symbolic string representing this processing port,
 *         as [generated from its ProcID](\ref ProcID::genProcSpec())
 */
string
PortDiagnostic::getProcSpec()
{
  auto& portID = p_.procID;
  return portID.genProcSpec();
}
/**
 * Hash-key identifying this processing port.
 * @return as [calculated by Node-identification](\ref ProcID)
 * @warning placeholder: the body consists solely of the UNIMPLEMENTED marker.
 */
HashVal
PortDiagnostic::getProcHash()
{
UNIMPLEMENTED ("calculate an unique, stable and reproducible hash-key to identify the Turnout");
}
}} // namespace steam::engine