LUMIERA.clone/src/steam/engine/proc-node.cpp
Ichthyostega ead494e465 Invocation: Argument-spec evaluation sufficiently complete for now
Some additional tests to challenge the parser, which seems to work well.
Without extended analysis into the usage of those node specifications,
it is pointless to expand further on its capabilities. For now, it is
sufficient to have a foundation for hash-computation in place.

__Note__: found a nifty way to give lib::Several an easy toString rendering,
without cranking up the header inclusion load.
2025-02-02 17:22:16 +01:00

408 lines
13 KiB
C++
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

/*
ProcNode - Implementation of render node processing
Copyright (C)
2024, Hermann Vosseler <Ichthyostega@web.de>
  **Lumiera** is free software; you can redistribute it and/or modify it
  under the terms of the GNU General Public License as published by the
  Free Software Foundation; either version 2 of the License, or (at your
  option) any later version. See the file COPYING for further details.
* *****************************************************************/
/** @file proc-node.cpp
** Translation unit to hold the actual implementation of node processing operations.
**
** @todo WIP-WIP-WIP 6/2024 not clear yet what goes here and what goes into turnout-system.cpp
*/
#include "steam/engine/proc-id.hpp"
#include "steam/engine/proc-node.hpp"
#include "lib/several-builder.hpp"
#include "lib/iter-explorer.hpp"
#include "lib/format-string.hpp"
#include "lib/format-util.hpp"
#include "lib/parse.hpp"
#include "lib/util.hpp"
#include <boost/functional/hash.hpp> /////////////////////////////////////////////////////TICKET #1391 is boost-hash the proper tool for this task?
#include <unordered_set>
#include <set>
namespace steam {
namespace engine {
using lib::explore;
using util::_Fmt;
using util::isnil;
using util::unConst;
using util::contains;
using boost::hash_combine;
namespace {// Details: parsing, registration and symbol table for node spec data...
std::unordered_set<ProcID> procRegistry;
std::unordered_set<string> symbRegistry;
/** deduplicate and re-link to the entry in the symbol table */
void inline
dedupSymbol (StrView& symbol)
{
auto res = symbRegistry.emplace (symbol);
symbol = *res.first;
}
/* ===== Parse nested spec ===== */
using util::parse::accept;
using util::parse::accept_bracket;
using util::parse::accept_repeated;
using util::parse::expectResult;
using lib::meta::NullType;
using std::regex_match;
using std::regex;
const regex SPEC_CONTENT{R"_([^,\\\(\)\[\]{}<>"]+)_", regex::optimize};
const regex NON_QUOTE {R"_([^"\\]+)_" , regex::optimize};
const regex ESCAPE {R"_(\\.)_" , regex::optimize};
const regex COMMA {R"_(,)_" , regex::optimize};
const regex D_QUOTE {R"_(")_" , regex::optimize};
auto quoted = accept_repeated(accept(NON_QUOTE).alt(ESCAPE));
auto quote = accept_bracket(D_QUOTE,D_QUOTE, quoted);
template<char OPE, char CLO>
auto&
syntaxBracketed()
{
string esc{"\\"};
regex OPENING{esc+OPE};
regex CLOSING{esc+CLO};
regex NON_PAREN{R"_([^\\)_"+esc+OPE+esc+CLO+"]+"};
static auto paren = expectResult<NullType>();
auto parenContent = accept_repeated(accept(NON_PAREN)
.alt(ESCAPE)
.alt(quote)
.alt(paren));
paren = accept_bracket(OPENING,CLOSING, parenContent).bind([](auto){ return NullType{}; });
return paren;
}
auto specTermSyntax = accept_repeated(accept(SPEC_CONTENT)
.alt(ESCAPE)
.alt(quote)
.alt(syntaxBracketed<'(',')'>())
.alt(syntaxBracketed<'<','>'>())
.alt(syntaxBracketed<'[',']'>())
.alt(syntaxBracketed<'{','}'>())
)
.bindMatch();
const regex REPEAT_SPEC {R"_(^(.+)\s*/(\d+)\s*$)_", regex::optimize};
/**
* Helper to expand an abbreviated repetition of arguments.
* Implemented as custom-processing layer for IterExplorer,
* by adapting the »State Core« interface
* @remark Repetition is indicated by a trailing "/NUM"
*/
template<class IT>
struct RepetitionExpander
: lib::IterStateCore<IT>
{
using Core = lib::IterStateCore<IT>;
mutable uint repeat_{0};
mutable std::smatch mat_;
StrView
yield() const
{
if (not repeat_)
{ // check if the next string ends with repetition marker /NUM
if (not regex_match (*Core::srcIter(), mat_, REPEAT_SPEC))
return *Core::srcIter(); // no repetition -> pass through
// setup repetition by extracting the repetition count
repeat_ = boost::lexical_cast<uint>(mat_.str(2));
}
return StrView(& *mat_[1].first, mat_[1].length());
} // several repetitions created from same source
void
iterNext()
{ // hold iteration until all repetitions were delivered
if (repeat_)
--repeat_;
if (not repeat_)
++ Core::srcIter();
}
using Core::Core;
};
/** Argument-Spec processing pipeline;
* possibly expands repetition abbreviation,
* collects all argument strings into a lib::Several
*/
lib::Several<const string>
evaluateArgSeq (std::vector<string>& parsedArgTerms)
{
auto several = lib::makeSeveral<const string>();
lib::explore (parsedArgTerms)
.processingLayer<RepetitionExpander>()
.foreach([&](StrView s){ several.emplace<string>(s); });
return several.build();
}
auto
emptyArgSeq()
{
return lib::Several<const string>();
}
} // (END) Details...
Port::~Port() { } ///< @remark VTables for the Port-Turnout hierarchy emitted from \ref proc-node.cpp
/**
* @remark this is the only public access point to ProcID entries,
* which are automatically deduplicated and managed in a common registry
* and retained until end of the Lumiera process (never deleted).
*/
ProcID&
ProcID::describe (StrView nodeSymb, StrView portSpec)
{
REQUIRE (not isnil (nodeSymb));
REQUIRE (not isnil (portSpec));
REQUIRE (not contains (nodeSymb, ' '));
auto p = portSpec.find('(');
if (p == string::npos)
throw err::Invalid{_Fmt{"Spec for processing operation must contain at least one argument list. "
"Node:%s Spec:%s"}
% nodeSymb % portSpec
};
auto res = procRegistry.insert (ProcID{nodeSymb, portSpec.substr(0,p), portSpec.substr(p)});
ProcID& entry{unConst (*res.first)};
if (res.second)
{// new record placed into the registry
dedupSymbol (entry.nodeName_);
dedupSymbol (entry.argLists_);
if (not isnil(entry.portQual_))
dedupSymbol (entry.portQual_);
}
return entry;
}
/** @internal */
ProcID::ProcID (StrView nodeSymb, StrView portQual, StrView argLists)
: nodeName_{nodeSymb}
, portQual_{portQual}
, argLists_{argLists}
{ }
/**
* generate registry hash value based on the distinct data in ProcID.
* This function is intended to be picked up by ADL, and should be usable
* both with `std::hash` and `<boost/functional/hash.hpp>`.
*/
HashVal
hash_value (ProcID const& procID)
{
HashVal hash = boost::hash_value (procID.nodeName_); ///////////////////////////////////////////////////TICKET #1391 : which technology to use for processing-ID hashes -> cache keys?
if (not isnil(procID.portQual_))
hash_combine (hash, procID.portQual_); ////////////////////////////////////////////////////////TICKET #1391 : should use lib/hash-combine.hpp (stable, but not portable!)
hash_combine (hash, procID.argLists_);
return hash;
}
string
ProcID::genProcName()
{
std::ostringstream buffer;
buffer << genNodeSymbol()
<< genQualifier();
return buffer.str();
}
string
ProcID::genProcSpec()
{
std::ostringstream buffer;
buffer << nodeName_
<< genQualifier()
<< argLists_;
return buffer.str();
}
string
ProcID::genNodeName()
{
return string{nodeName_};
}
string
ProcID::genNodeSymbol()
{
auto p = nodeName_.find(':');
return p == string::npos? string{nodeName_}
: string{nodeName_.substr(p+1)};
}
string
ProcID::genNodeDomain()
{
auto p = nodeName_.find(':');
return p == string::npos? string{}
: string{nodeName_.substr(0,p)};
}
string
ProcID::genQualifier()
{
std::ostringstream buffer;
if (not isnil(portQual_))
buffer << '.' << portQual_;
return buffer.str();
}
namespace { // Helper to access ProcID recursively
ProcID&
procID (ProcNode& node)
{
REQUIRE (not isnil(watch(node).ports()));
return watch(node).ports().front().procID;
}
}
string
ProcID::genNodeSpec (Leads& leads)
{
std::ostringstream buffer;
buffer << nodeName_;
if (1 != leads.size())
buffer << genSrcSpec(leads);
else
{ // single chain....
ProcNode& p{leads.front().get()};
buffer << "◁—"
<< procID(p).genNodeName() // show immediate predecessor
<< procID(p).genSrcSpec(leads); // and behind that recursively the source(s)
}
return buffer.str();
}
string
ProcID::genSrcSpec (Leads& leads)
{
return isnil(leads)? string{"-◎"} // no leads => starting point itself is a source node
: "┉┉{"
+ util::join(
explore(leads)
.expandAll([](ProcNode& n){ return explore(watch(n).leads()); }) // depth-first expand all predecessors
.filter ([](ProcNode& n){ return watch(n).isSrc(); }) // but retain only leafs (≙ source nodes)
.transform([](ProcNode& n){ return procID(n).nodeName_;}) // render the node-symbol of each src
.deduplicate()) // sort and deduplicate
+ "}";
}
/** parse and dissect the argument specification */
ProcID::ArgModel
ProcID::genArgModel()
{
auto argListSyntax = accept_bracket(accept_repeated(0,MAX_NODE_ARG, COMMA, specTermSyntax));
auto argSpecSyntax = accept(argListSyntax)
.opt(argListSyntax)
.bind([](auto model) -> ProcID::ArgModel
{
auto [list1,list2] = model;
if (list2)
return {evaluateArgSeq(list1), evaluateArgSeq(*list2)};
else
return {emptyArgSeq(), evaluateArgSeq(list1)};
});
argSpecSyntax.parse (argLists_);
if (not argSpecSyntax.success())
throw err::Invalid{_Fmt{"Unable to parse argument list. "
"Node:%s Spec:%s"}
% genProcName() % argLists_
};
return argSpecSyntax.extractResult();
}
/**
* @return symbolic string with format `NodeSymb--<predecessorSpec>`
* @remark connectivity information is abbreviated and foremost
* indicates the data source(s)
*/
string
ProcNodeDiagnostic::getNodeSpec()
{
REQUIRE (not isnil(ports()));
return ports().front().procID.genNodeSpec (leads());
}
HashVal
ProcNodeDiagnostic::getNodeHash() ///< @todo not clear yet if this has to include predecessor info
{
UNIMPLEMENTED ("calculate an unique hash-key to designate this node");
}
/**
* @return symbolic string with format `NodeSymb[.portQualifier](inType[/#][,inType[/#]])(outType[/#][,outType[/#]][ >N])`
* @remark information presented here is passed-through from builder Level-3, based on semantic markup present there
*/
string
ProcNodeDiagnostic::getPortSpec (uint portIdx)
{
auto& p{n_.wiring_.ports};
return portIdx < p.size()? p[portIdx].procID.genProcSpec()
: util::FAILURE_INDICATOR;
}
HashVal
ProcNodeDiagnostic::getPortHash (uint portIdx)
{
UNIMPLEMENTED ("calculate an unique, stable and reproducible hash-key to identify the Turnout");
}
lib::Several<PortRef>
PortDiagnostic::srcPorts()
{
UNIMPLEMENTED ("intrude into the Turnout and find out about source connectivity");
}
/**
* @return the symbolic string representing this processing port,
* as [provided by Node-identification](\ref ProcID::genProcSpec())
*/
string
PortDiagnostic::getProcSpec()
{
return p_.procID.genProcSpec();
}
HashVal
PortDiagnostic::getProcHash() ///< @return as [calculated by Node-identification](\ref ProcID)
{
UNIMPLEMENTED ("calculate an unique, stable and reproducible hash-key to identify the Turnout");
}
}} // namespace steam::engine