LUMIERA.clone/src/lib/util.hpp
Ichthyostega 58ffbac7f3 Library: implement logic-interpretation
- the basic interpretation of Action-tokens is already in place
 - add the interpretation of conditional and looping constructs
 - this includes helpers for
   * reset to another Action-token index
   * recursive interpretation of the next token
   * handling of nested loop evaluation context

In order to make this implementation compile, also the skeleton
of the Map-string-string data binding must be completed, including
a draft how to handle nested keys in a simple map
2024-03-25 03:30:16 +01:00

499 lines
13 KiB
C++

/*
UTIL.hpp - collection of small helper functions used "everywhere"
Copyright (C) Lumiera.org
2008, Hermann Vosseler <Ichthyostega@web.de>
This program is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public License as
published by the Free Software Foundation; either version 2 of
the License, or (at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
*/
/** @file lib/util.hpp
** Tiny helper functions and shortcuts to be used _everywhere_
** Consider this header to be effectively included in almost every translation unit.
** @remark The motivation of using these helpers is conciseness and uniformity of expression.
** There are several extensions and not-so-frequently used supplements packaged into
** separate headers.
** @warning be sure to understand the ramifications of including _anything_ here...
** @see util-coll.hpp
** @see util-foreach.hpp
** @see util-quant.hpp
*/
#ifndef LIB_UTIL_H
#define LIB_UTIL_H
#include "include/limits.hpp"
#include "lib/hash-standard.hpp"
#include <string>
namespace std {// forward declarations to avoid pervasive includes
template<typename T>
class allocator;
template<typename K, typename CMP, class ALLO>
class set;
template<typename IT, typename V>
IT find (IT, IT, V const&);
template<typename IT, typename V>
IT remove (IT, IT, V const&);
}
const char* cStr (std::string const&);
namespace util {
using std::string;
using CStr = const char*;
template <class NUM>
inline int constexpr
sgn (NUM n)
{
return (n==0)? 0 :((n<0)? -1:+1 );
}
template <class N1, class N2>
inline N1 constexpr
min (N1 n1, N2 n2)
{
return n2 < n1? N1(n2) : n1;
}
template <class N1, class N2>
inline N1 constexpr
max (N1 n1, N2 n2)
{
return n1 < n2? N1(n2) : n1;
}
/** cut a numeric value to be >=0 */
template <typename NUM>
inline NUM constexpr
noneg (NUM val)
{
return (0<val? val : 0);
}
/** force a numeric to be within bounds, inclusively */
template <typename NUM, typename NB>
inline NUM constexpr
limited (NB lowerBound, NUM val, NB upperBound)
{
return min ( max (val, lowerBound)
, upperBound);
}
template <typename NUM, typename NB>
inline bool constexpr
isLimited (NB lowerBound, NUM val, NB upperBound)
{
return lowerBound <= val
and val <= upperBound;
}
/** positive integral number from textual representation
* @return always a number, 0 in case of unparseable text,
* limited to 0 <= num <= LUMIERA_MAX_ORDINAL_NUMBER */
inline uint
uNum (CStr charPtr)
{
if (!charPtr) return 0;
int parsedNumber (std::atoi (charPtr));
return limited (0, parsedNumber, LUMIERA_MAX_ORDINAL_NUMBER);
}
inline int
sNum (CStr charPtr)
{
if (!charPtr) return 0;
int parsedNumber (std::atoi (charPtr));
return limited (-LUMIERA_MAX_ORDINAL_NUMBER, parsedNumber, LUMIERA_MAX_ORDINAL_NUMBER);
}
template<class OBJ>
inline uint
uNum (OBJ const& spec)
{
return uNum (cStr(spec));
}
template<class OBJ>
inline int
sNum (OBJ const& spec)
{
return sNum (cStr(spec));
}
/* ======== generic empty check ========= */
/** a family of util functions providing a "no value whatsoever" test.
Works on strings and all STL containers, includes NULL test for pointers */
template <class CONT>
inline bool
isnil (const CONT& container)
{
return container.empty();
}
template <class CONT>
inline bool
isnil (const CONT* pContainer)
{
return !pContainer or pContainer->empty();
}
template <class CONT>
inline bool
isnil (CONT* pContainer)
{
return !pContainer or pContainer->empty();
}
inline bool
isnil (CStr charPtr)
{
return !charPtr or !(*charPtr);
}
/** check if string starts with a given prefix */
inline bool
startsWith (string const& str, string const& prefix)
{
return 0 == str.rfind (prefix, 0);
}
inline bool
startsWith (string const& str, CStr prefix)
{
return 0 == str.rfind (prefix, 0);
}
/** check if string ends with the given suffix */
inline bool
endsWith (string const& str, string const& suffix)
{
size_t l = suffix.length();
if (l > str.length()) return false;
size_t pos = str.length() - l;
return pos == str.find (suffix, pos);
}
inline bool
endsWith (string const& str, CStr suffix)
{
return endsWith (str, string(suffix));
}
inline void
removePrefix (string& str, string const& prefix)
{
if (not startsWith (str,prefix)) return;
str = str.substr (prefix.length());
}
inline void
removeSuffix (string& str, string const& suffix)
{
if (not endsWith (str,suffix)) return;
str.resize(str.length() - suffix.length());
}
/** shortcut for containment test on a map */
template <typename MAP>
inline bool
contains (MAP& map, typename MAP::key_type const& key)
{
return map.find(key) != map.end();
}
/** shortcut for set value containment test */
template <typename T, class CMP, class ALO>
inline bool
contains (std::set<T,CMP,ALO> const& set, T const& val)
{
return set.end() != set.find (val);
}
/** shortcut for string value containment test */
template <typename T>
inline bool
contains (std::string const& str, const T& val)
{
return str.find (val) != std::string::npos;
}
/** shortcut for brute-force containment test
* in any sequential container */
template <typename SEQ>
inline bool
contains (SEQ const& cont, typename SEQ::const_reference val)
{
typename SEQ::const_iterator begin = cont.begin();
typename SEQ::const_iterator end = cont.end();
return end != std::find(begin,end, val);
}
/** use (and exhaust) a »Lumiera Forward Iterator« for linear search */
template <class IT>
inline bool
linearSearch (IT iter, typename IT::value_type const& val)
{
IT end{};
return end != std::find (std::move (iter), end, val);
}
/** fetch value from a Map, or return a default if not found */
template <typename MAP>
inline typename MAP::mapped_type
getValue_or_default (MAP& map, typename MAP::key_type const& key
, typename MAP::mapped_type defaultVal)
{
typename MAP::const_iterator pos = map.find (key);
if (pos != map.end())
return pos->second;
else
return defaultVal;
}
/** expose a reference to a map entry, with fall-back to some default object
* @note exposing a const reference; especially the default needs to reside
* somewhere at a safe storage location.
* @see lib::NullValue
*/
template <typename MAP>
inline typename MAP::mapped_type const &
access_or_default (MAP& map, typename MAP::key_type const& key
, typename MAP::mapped_type const& refDefault)
{
typename MAP::const_iterator pos = map.find (key);
if (pos != map.end())
return pos->second;
else
return refDefault;
}
/** shortcut for removing all copies of an Element
* in any sequential collection */
template <typename SEQ>
inline typename SEQ::iterator
removeall (SEQ& coll, typename SEQ::value_type const& val)
{
typename SEQ::iterator collEnd = coll.end();
return coll.erase (std::remove (coll.begin(), collEnd, val),
collEnd
);
}
/** remove all elements fulfilling a given predicate
* from a (sorted) set.
* @return true if anything has been removed. */
template<class SET, typename FUN>
bool remove_if (SET& set, FUN test)
{
typedef typename SET::iterator Itor;
bool found = false;
Itor end = set.end();
Itor begin = set.begin();
Itor pos = begin;
while (pos!=end)
{
if (not test(*pos))
++pos;
else
{
found = true;
if (pos==begin)
{
set.erase(pos);
pos = begin = set.begin();
}
else
{
set.erase(pos--);
++pos;
}
end = set.end();
} }
return found;
}
/** shortcut to save some typing when having to define
* const and non-const variants of member functions
*/
template<class OBJ>
inline OBJ*
unConst (const OBJ* o)
{
return const_cast<OBJ*> (o);
}
template<class OBJ>
inline OBJ&
unConst (OBJ const& ro)
{
return const_cast<OBJ&> (ro);
}
/** compare plain object identity,
* bypassing any custom comparison operators.
*/
template<class A, class B>
inline bool
isSameObject (A const& a, B const& b)
{
return static_cast<const void*> (std::addressof(a))
== static_cast<const void*> (std::addressof(b));
}
/** extract address but strip any type info */
template<class X>
inline const void*
getAddr (X& x)
{
return static_cast<const void*> (std::addressof(x));
}
template<class X>
inline const void*
getAddr (X* x)
{
return static_cast<const void*> (x);
}
/** the addressable memory »slot« — platform dependent */
template<typename X>
inline size_t
slotNr (X const& x)
{
return reinterpret_cast<size_t> (std::addressof(x)) / sizeof(size_t);
}
template<typename X>
inline size_t
slotNr (X const* x)
{
return reinterpret_cast<size_t> (x) / sizeof(size_t);;
}
/** determine heuristically if two objects
* are located „close to each other“ in memory.
* @remark can be used to find out about heap vs. stack allocation
*/
template<typename A, typename B>
inline bool
isCloseBy (A&& a, B&& b, size_t consideredNearby =50)
{
size_t loc1 = slotNr (std::forward<A> (a));
size_t loc2 = slotNr (std::forward<B> (b));
size_t dist = loc2 > loc1? loc2-loc1:loc1-loc2;
return dist < consideredNearby;
}
/** produce an identifier based on the given string.
* remove non-standard-chars, reduce sequences of punctuation
* and whitespace to single underscores. The sanitised string
* will start with an alphanumeric character.
*
* @par Example Conversions
\verbatim
"Word" --> "Word"
"a Sentence" --> "a_Sentence"
"trailing Withespace \t \n" --> "trailing_Withespace"
"with a lot \nof Whitespace" --> "with_a_lot_of_Whitespace"
"@with\".\'much ($punctuation)[]!" --> "@with.much_($punctuation)"
"§&Ω%€ leading garbage" --> "leading_garbage"
"mixed Ω garbage" --> "mixed_garbage"
"Bääääh!!" --> "Bh"
\endverbatim
* @see \ref UtilSanitizedIdentifier_test
* @see \ref lib::meta::sanitisedSymbol()
*/
string sanitise (string const& org);
/** remove leading and trailing whitespace
* @return a trimmed copy (default locale)
*/
string trim (string const& org);
/** interpret text representation of a boolean value.
* @remarks this function detects the relevant token rather strict....
* - yields `true` for the tokens "true", "True", "TRUE", "yes", "Yes", "YES", "1", "+"
* - yields `false` for the tokens "false", "False", "FALSE", "no", "No, "NO", "0", "-"
* - leading and trailing whitespace is ignored
* @throws lumiera::error::Invalid for any other text content
*/
bool boolVal (string const&);
/** check the given text if it can be interpreted as affirmative answer (bool `true`).
* @remarks this function just fishes for the known `true` tokens and interprets
* all other content as `false`, including empty strings. Never throws.
*/
bool isYes (string const&) noexcept;
/** check if the given text is empty or can be interpreted as rejection (bool `false`)-
* @remarks this function fishes for the known `false` tokens;
* any other non-empty content counts as _not no._
*/
bool isNo (string const&) noexcept;
} // namespace util
/* === some common macro definitions === */
/** suppress "warning: unused variable" on vars, which are
* introduced into a scope because of some sideeffect, i.e. Locking
*/
#define SIDEEFFECT __attribute__ ((unused));
/** this macro wraps its parameter into a cstring literal */
#define STRINGIFY(TOKEN) __STRNGFY(TOKEN)
#define __STRNGFY(TOKEN) #TOKEN
/** shortcut for subclass test, intended for assertions only.
* @note it is considered bad style to use such in non-assertion code,
* and we probably will enforce this design rule in future. */
#define INSTANCEOF(CLASS, EXPR) (dynamic_cast<const CLASS*> (EXPR))
/** the inevitable MAX macro, sometimes still necessary in template code */
#ifndef MAX // this is present to make this definition play nice with GLib
#define MAX(A,B) ((A < B) ? (B) : (A))
#endif
#endif /*UTIL_HPP_*/