/* _____ __ _____________ _______ ______ ___________ / \| | \____ \__ \\_ __ \/ ___// __ \_ __ \ | Y Y \ | / |_> > __ \| | \/\___ \\ ___/| | \/ |__|_| /____/| __(____ /__| /____ >\___ >__| \/ |__| \/ \/ \/ Copyright (C) 2022 Ingo Berg Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: * Redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer. * Redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include "muParserBase.h" #include "muParserTemplateMagic.h" //--- Standard includes ------------------------------------------------------------------------ #include #include #include #include #include #include #include #include #include #ifdef MUP_USE_OPENMP #include #endif #if defined(_MSC_VER) #pragma warning(push) #pragma warning(disable : 26812) #endif using namespace std; /** \file \brief This file contains the basic implementation of the muparser engine. 
*/

namespace mu
{
    // Locale used by the parser. It is a static member, so it is shared by all ParserBase
    // objects. It starts out as the classic locale extended by a change_dec_sep facet
    // that uses '.' as decimal separator.
    std::locale ParserBase::s_locale = std::locale(std::locale::classic(), new change_dec_sep('.'));

    // Debug switches, both disabled by default.
    // NOTE(review): presumably they enable dumping of the command code / the parser stacks;
    // the code reading them is not part of this section - confirm.
    bool ParserBase::g_DbgDumpCmdCode = false;
    bool ParserBase::g_DbgDumpStack = false;

    //------------------------------------------------------------------------------
    /** \brief Identifiers for built in binary operators.

        When defining custom binary operators with #DefineOprt(...) make sure not to choose
        names conflicting with these definitions.

        The table is terminated by a null entry. DefineOprt() reads the entries
        0 .. cmENDIF-1 of this table.
        NOTE(review): the order of the entries presumably has to match the order of the
        command code enumeration - confirm before inserting or reordering entries.
    */
    const char_type* ParserBase::c_DefaultOprt[] =
    {
        _T("<="), _T(">="), _T("!="),
        _T("=="), _T("<"), _T(">"),
        _T("+"), _T("-"), _T("*"),
        _T("/"), _T("^"), _T("&&"),
        _T("||"), _T("="), _T("("),
        _T(")"), _T("?"), _T(":"), 0
    };

    // Upper bound for the thread id checked by ParseCmdCodeBulk(); the same value is used
    // there to divide the stack buffer into per-thread sections.
    const int ParserBase::s_MaxNumOpenMPThreads = 16;

    //------------------------------------------------------------------------------
    /** \brief Default constructor.

        Puts the parser into string parsing mode (the parse function pointer is set to
        ParseString), default-initializes all definition maps, character sets and buffers,
        enables the built in operators and creates the token reader via InitTokenReader().
        No expression is set by the constructor.
    */
    ParserBase::ParserBase()
        : m_pParseFormula(&ParserBase::ParseString)
        , m_vRPN()
        , m_vStringBuf()
        , m_pTokenReader()
        , m_FunDef()
        , m_PostOprtDef()
        , m_InfixOprtDef()
        , m_OprtDef()
        , m_ConstDef()
        , m_StrVarDef()
        , m_VarDef()
        , m_bBuiltInOp(true)
        , m_sNameChars()
        , m_sOprtChars()
        , m_sInfixOprtChars()
        , m_vStackBuffer()
        , m_nFinalResultIdx(0)
    {
        InitTokenReader();
    }

    //---------------------------------------------------------------------------
    /** \brief Copy constructor.

        The parser can be safely copy constructed but the bytecode is reset during
        copy construction.
*/
    ParserBase::ParserBase(const ParserBase& a_Parser)
        : m_pParseFormula(&ParserBase::ParseString)
        , m_vRPN()
        , m_vStringBuf()
        , m_pTokenReader()
        , m_FunDef()
        , m_PostOprtDef()
        , m_InfixOprtDef()
        , m_OprtDef()
        , m_ConstDef()
        , m_StrVarDef()
        , m_VarDef()
        , m_bBuiltInOp(true)
        , m_sNameChars()
        , m_sOprtChars()
        , m_sInfixOprtChars()
    {
        // m_vStackBuffer and m_nFinalResultIdx are not part of the initializer list;
        // both are copied from a_Parser by Assign().
        // Assign() calls ReInit() which dereferences m_pTokenReader, therefore a token
        // reader has to exist before Assign() is called.
        m_pTokenReader.reset(new token_reader_type(this));
        Assign(a_Parser);
    }

    //---------------------------------------------------------------------------
    /** \brief Destructor. The body is empty; members release their resources themselves. */
    ParserBase::~ParserBase()
    {}

    //---------------------------------------------------------------------------
    /** \brief Assignment operator.

        Implemented by calling Assign(a_Parser). Self assignment is suppressed
        (the check is done inside Assign()).

        \param a_Parser Object to copy to this.
        \return *this
    */
    ParserBase& ParserBase::operator=(const ParserBase& a_Parser)
    {
        Assign(a_Parser);
        return *this;
    }

    //---------------------------------------------------------------------------
    /** \brief Copy state of a parser object to this.

        Replaces the variable, constant, function and operator definitions of this parser
        with those of a_Parser. Copies the string buffers, the stack buffer, the index of
        the final result and the character sets. The token reader is replaced by a clone
        of the source's token reader that is bound to this parser. The bytecode is not
        copied; the parse function is reset to string parse mode.

        \param a_Parser the source object.
    */
    void ParserBase::Assign(const ParserBase& a_Parser)
    {
        // Nothing to do on self assignment
        if (&a_Parser == this)
            return;

        // Don't copy bytecode instead cause the parser to create new bytecode
        // by resetting the parse function.
        ReInit();

        m_ConstDef = a_Parser.m_ConstDef;         // Copy user defined constants
        m_VarDef = a_Parser.m_VarDef;             // Copy user defined variables
        m_bBuiltInOp = a_Parser.m_bBuiltInOp;
        m_vStringBuf = a_Parser.m_vStringBuf;     // assigned after ReInit() cleared it
        m_vStackBuffer = a_Parser.m_vStackBuffer;
        m_nFinalResultIdx = a_Parser.m_nFinalResultIdx;
        m_StrVarDef = a_Parser.m_StrVarDef;
        m_vStringVarBuf = a_Parser.m_vStringVarBuf;

        // The clone receives "this" so that it refers to this parser, not to a_Parser
        m_pTokenReader.reset(a_Parser.m_pTokenReader->Clone(this));

        // Copy function and operator callbacks
        m_FunDef = a_Parser.m_FunDef;             // Copy function definitions
        m_PostOprtDef = a_Parser.m_PostOprtDef;   // post value unary operators
        m_InfixOprtDef = a_Parser.m_InfixOprtDef; // unary operators for infix notation
        m_OprtDef = a_Parser.m_OprtDef;           // binary operators

        m_sNameChars = a_Parser.m_sNameChars;
        m_sOprtChars = a_Parser.m_sOprtChars;
        m_sInfixOprtChars = a_Parser.m_sInfixOprtChars;
    }

    //---------------------------------------------------------------------------
    /** \brief Set the decimal separator.
        \param cDecSep Decimal separator as a character value.
        \sa SetThousandsSep

        By default muparser uses the "C" locale. The decimal separator of this
        locale is overwritten by the one provided here. The thousands separator
        currently stored in s_locale is kept. The change is applied to the static
        member s_locale.
    */
    void ParserBase::SetDecSep(char_type cDecSep)
    {
        // Read the current thousands separator so it can be carried over into the new facet
        char_type cThousandsSep = std::use_facet< change_dec_sep >(s_locale).thousands_sep();
        s_locale = std::locale(std::locale("C"), new change_dec_sep(cDecSep, cThousandsSep));
    }

    //---------------------------------------------------------------------------
    /** \brief Sets the thousands separator.
        \param cThousandsSep The thousands separator as a character
        \sa SetDecSep

        By default muparser uses the "C" locale. The thousands separator of this
        locale is overwritten by the one provided here.
*/
    void ParserBase::SetThousandsSep(char_type cThousandsSep)
    {
        // Read the current decimal separator so it can be carried over into the new facet
        char_type cDecSep = std::use_facet< change_dec_sep >(s_locale).decimal_point();
        s_locale = std::locale(std::locale("C"), new change_dec_sep(cDecSep, cThousandsSep));
    }

    //---------------------------------------------------------------------------
    /** \brief Resets the locale.

        The default locale used "." as decimal separator, no thousands separator and
        "," as function argument separator.
    */
    void ParserBase::ResetLocale()
    {
        s_locale = std::locale(std::locale("C"), new change_dec_sep('.'));
        SetArgSep(',');
    }

    //---------------------------------------------------------------------------
    /** \brief Initialize the token reader.

        Creates a new token reader object bound to this parser. A previously held
        token reader is released by the reset.

        \post m_pTokenReader.get()!=0
    */
    void ParserBase::InitTokenReader()
    {
        m_pTokenReader.reset(new token_reader_type(this));
    }

    //---------------------------------------------------------------------------
    /** \brief Reset parser to string parsing mode and clear internal buffers.

        Sets the parse function to ParseString, clears the string buffer and the
        bytecode and resets the token reader.

        \pre m_pTokenReader must hold a token reader (it is dereferenced here).
    */
    void ParserBase::ReInit() const
    {
        // NOTE(review): members are modified from a const member function, so they are
        // presumably declared mutable in the class definition - confirm in the header.
        m_pParseFormula = &ParserBase::ParseString;
        m_vStringBuf.clear();
        m_vRPN.clear();
        m_pTokenReader->ReInit();
    }

    /** \brief Hook called with the expression and a start/end position.

        This implementation is intentionally empty and ignores all of its arguments.
        NOTE(review): presumably meant to be overridden by derived parsers - confirm.
    */
    void ParserBase::OnDetectVar(string_type* /*pExpr*/, int& /*nStart*/, int& /*nEnd*/)
    {}

    /** \brief Returns a const reference to the bytecode of the current expression.

        The reference refers to the internal bytecode object of this parser; copy it
        if it has to be kept.
    */
    const ParserByteCode& ParserBase::GetByteCode() const
    {
        // If a variable factory is defined the bytecode may contain references to implicitely
        // created variables.
        // (check currently disabled:)
        //		if (m_pTokenReader->HasVarCreator())
        //			Error(ecBYTECODE_IMPORT_EXPORT_DISABLED);

        return m_vRPN;
    }

    /** \brief Restore a previously saved bytecode.
        \param a_ByteCode The bytecode to take over.

        Besides the bytecode itself the expression string and the string buffer stored
        in the bytecode are restored. Afterwards the parser is in command code parsing
        mode, i.e. the expression is not parsed from the string again.
    */
    void ParserBase::SetByteCode(const ParserByteCode& a_ByteCode)
    {
        // If a variable factory is defined the bytecode may contain references to dynamically
        // created variables.
        // (check currently disabled:)
        //		if (m_pTokenReader->HasVarCreator())
        //			Error(ecBYTECODE_IMPORT_EXPORT_DISABLED);

        m_vRPN = a_ByteCode;

        // restore expression environment
        string_type expr;
        std::tie(expr, m_vStringBuf) = a_ByteCode.RestoreEnvironment();
        m_pTokenReader->SetFormula(expr);

        // Evaluate directly from the bytecode from now on
        m_pParseFormula = &ParserBase::ParseCmdCode;
    }

    /** \brief Returns the version of muparser.
        \param eInfo A flag indicating whether the full version info should be
                     returned or not.

        Format is as follows: "MAJOR.MINOR (COMPILER_FLAGS)" The COMPILER_FLAGS
        are returned only if eInfo==pviFULL. In that case the bracket contains the
        version date, the pointer size in bits, DEBUG or RELEASE, the character set
        (UNICODE, MBCS or ASCII) and OPENMP if MUP_USE_OPENMP is defined.
    */
    string_type ParserBase::GetVersion(EParserVersionInfo eInfo) const
    {
        stringstream_type ss;

        ss << ParserVersion;

        if (eInfo == pviFULL)
        {
            ss << _T(" (") << ParserVersionDate;
            // sizeof(void*) * 8 yields the pointer width in bits
            ss << std::dec << _T("; ") << sizeof(void*) * 8 << _T("BIT");

#ifdef _DEBUG
            ss << _T("; DEBUG");
#else
            ss << _T("; RELEASE");
#endif

#ifdef _UNICODE
            ss << _T("; UNICODE");
#else
#ifdef _MBCS
            ss << _T("; MBCS");
#else
            ss << _T("; ASCII");
#endif
#endif

#ifdef MUP_USE_OPENMP
            ss << _T("; OPENMP");
#endif

            ss << _T(")");
        }

        return ss.str();
    }

    //---------------------------------------------------------------------------
    /** \brief Add a value parsing function.
        \param a_pCallback The value identification callback; forwarded to the token reader.

        When parsing an expression muParser tries to detect values in the expression
        string using different valident callbacks. Thus it's possible to parse
        for hex values, binary values and floating point values.
    */
    void ParserBase::AddValIdent(identfun_type a_pCallback)
    {
        m_pTokenReader->AddValIdent(a_pCallback);
    }

    //---------------------------------------------------------------------------
    /** \brief Set a function that can create variable pointer for unknown expression variables.
        \param a_pFactory A pointer to the variable factory.
        \param pUserData A user defined context pointer.
*/
    void ParserBase::SetVarFactory(facfun_type a_pFactory, void* pUserData)
    {
        // The factory is stored in the token reader, not in the parser itself
        m_pTokenReader->SetVarCreator(a_pFactory, pUserData);
    }

    //---------------------------------------------------------------------------
    /** \brief Add a function or operator callback to the parser.
        \param a_strName   Name of the function or operator.
        \param a_Callback  The callback object to store.
        \param a_Storage   The map receiving the callback. It is compared by address with
                           the parser's own maps in order to select the conflict checks.
        \param a_szCharSet The characters allowed in a_strName.

        Raises ecINVALID_FUN_PTR if the callback is not valid, ecNAME_CONFLICT if the name
        is already used in another definition map and the errors of CheckOprt() if the
        name is not valid. An existing entry with the same name in a_Storage is
        overwritten.

        \post The parser is reset to string parsing mode (ReInit() is called).
    */
    void ParserBase::AddCallback(
        const string_type& a_strName,
        const ParserCallback& a_Callback,
        funmap_type& a_Storage,
        const char_type* a_szCharSet)
    {
        if (!a_Callback.IsValid())
            Error(ecINVALID_FUN_PTR);

        const funmap_type* pFunMap = &a_Storage;

        // Check for conflicting operator or function names
        if (pFunMap != &m_FunDef && m_FunDef.find(a_strName) != m_FunDef.end())
            Error(ecNAME_CONFLICT, -1, a_strName);

        if (pFunMap != &m_PostOprtDef && m_PostOprtDef.find(a_strName) != m_PostOprtDef.end())
            Error(ecNAME_CONFLICT, -1, a_strName);

        // The two checks below are skipped when storing into the infix or the binary
        // operator map: an infix operator and a binary operator may share a name.
        if (pFunMap != &m_InfixOprtDef && pFunMap != &m_OprtDef && m_InfixOprtDef.find(a_strName) != m_InfixOprtDef.end())
            Error(ecNAME_CONFLICT, -1, a_strName);

        if (pFunMap != &m_InfixOprtDef && pFunMap != &m_OprtDef && m_OprtDef.find(a_strName) != m_OprtDef.end())
            Error(ecNAME_CONFLICT, -1, a_strName);

        CheckOprt(a_strName, a_Callback, a_szCharSet);
        a_Storage[a_strName] = a_Callback;
        ReInit();
    }

    //---------------------------------------------------------------------------
    /** \brief Check if a name contains invalid characters.
        \param a_sName     The name to check.
        \param a_Callback  The callback the name belongs to; its code selects the error.
        \param a_szCharSet The characters allowed in the name.

        A name is rejected if it is empty, if it contains a character that is not part
        of a_szCharSet or if it starts with a digit.

        \throw ParserException if the name contains invalid characters. The error is
               ecINVALID_POSTFIX_IDENT for postfix operators, ecINVALID_INFIX_IDENT for
               infix operators and ecINVALID_NAME for everything else.
    */
    void ParserBase::CheckOprt(const string_type& a_sName,
        const ParserCallback& a_Callback,
        const string_type& a_szCharSet) const
    {
        if (!a_sName.length() ||
            (a_sName.find_first_not_of(a_szCharSet) != string_type::npos) ||
            (a_sName[0] >= '0' && a_sName[0] <= '9'))
        {
            switch (a_Callback.GetCode())
            {
            case cmOPRT_POSTFIX: Error(ecINVALID_POSTFIX_IDENT, -1, a_sName); break;
            case cmOPRT_INFIX:   Error(ecINVALID_INFIX_IDENT, -1, a_sName); break;
            default:             Error(ecINVALID_NAME, -1, a_sName);
            }
        }
    }

    /** \brief Check if a name contains invalid characters.
\throw ParserException if the name contains invalid characters. */ void ParserBase::CheckName(const string_type& a_sName, const string_type& a_szCharSet) const { if (!a_sName.length() || (a_sName.find_first_not_of(a_szCharSet) != string_type::npos) || (a_sName[0] >= '0' && a_sName[0] <= '9')) { Error(ecINVALID_NAME); } } /** \brief Set the formula. \param a_strFormula Formula as string_type \throw ParserException in case of syntax errors. Triggers first time calculation thus the creation of the bytecode and scanning of used variables. */ void ParserBase::SetExpr(const string_type& a_sExpr) { // Check locale compatibility if (m_pTokenReader->GetArgSep() == std::use_facet >(s_locale).decimal_point()) Error(ecLOCALE); // Check maximum allowed expression length. An arbitrary value small enough so i can debug expressions sent to me if (a_sExpr.length() >= MaxLenExpression) Error(ecEXPRESSION_TOO_LONG, 0, a_sExpr); m_pTokenReader->SetFormula(a_sExpr + _T(" ")); ReInit(); } //--------------------------------------------------------------------------- /** \brief Get the default symbols used for the built in operators. \sa c_DefaultOprt */ const char_type** ParserBase::GetOprtDef() const { return (const char_type**)(&c_DefaultOprt[0]); } //--------------------------------------------------------------------------- /** \brief Define the set of valid characters to be used in names of functions, variables, constants. */ void ParserBase::DefineNameChars(const char_type* a_szCharset) { m_sNameChars = a_szCharset; } //--------------------------------------------------------------------------- /** \brief Define the set of valid characters to be used in names of binary operators and postfix operators. */ void ParserBase::DefineOprtChars(const char_type* a_szCharset) { m_sOprtChars = a_szCharset; } //--------------------------------------------------------------------------- /** \brief Define the set of valid characters to be used in names of infix operators. 
*/ void ParserBase::DefineInfixOprtChars(const char_type* a_szCharset) { m_sInfixOprtChars = a_szCharset; } //--------------------------------------------------------------------------- /** \brief Virtual function that defines the characters allowed in name identifiers. \sa #ValidOprtChars, #ValidPrefixOprtChars */ const char_type* ParserBase::ValidNameChars() const { MUP_ASSERT(m_sNameChars.size()); return m_sNameChars.c_str(); } //--------------------------------------------------------------------------- /** \brief Virtual function that defines the characters allowed in operator definitions. \sa #ValidNameChars, #ValidPrefixOprtChars */ const char_type* ParserBase::ValidOprtChars() const { MUP_ASSERT(m_sOprtChars.size()); return m_sOprtChars.c_str(); } //--------------------------------------------------------------------------- /** \brief Virtual function that defines the characters allowed in infix operator definitions. \sa #ValidNameChars, #ValidOprtChars */ const char_type* ParserBase::ValidInfixOprtChars() const { MUP_ASSERT(m_sInfixOprtChars.size()); return m_sInfixOprtChars.c_str(); } //--------------------------------------------------------------------------- /** \brief Add a user defined operator. \post Will reset the Parser to string parsing mode. */ void ParserBase::DefinePostfixOprt(const string_type& a_sName, fun_type1 a_pFun, bool a_bAllowOpt) { if (a_sName.length() > MaxLenIdentifier) Error(ecIDENTIFIER_TOO_LONG); AddCallback(a_sName, ParserCallback(a_pFun, a_bAllowOpt, prPOSTFIX, cmOPRT_POSTFIX), m_PostOprtDef, ValidOprtChars()); } //--------------------------------------------------------------------------- /** \brief Initialize user defined functions. Calls the virtual functions InitFun(), InitConst() and InitOprt(). */ void ParserBase::Init() { InitCharSets(); InitFun(); InitConst(); InitOprt(); } //--------------------------------------------------------------------------- /** \brief Add a user defined operator. 
\post Will reset the Parser to string parsing mode. \param [in] a_sName operator Identifier \param [in] a_pFun Operator callback function \param [in] a_iPrec Operator Precedence (default=prSIGN) \param [in] a_bAllowOpt True if operator is volatile (default=false) \sa EPrec */ void ParserBase::DefineInfixOprt(const string_type& a_sName, fun_type1 a_pFun, int a_iPrec, bool a_bAllowOpt) { if (a_sName.length() > MaxLenIdentifier) Error(ecIDENTIFIER_TOO_LONG); AddCallback(a_sName, ParserCallback(a_pFun, a_bAllowOpt, a_iPrec, cmOPRT_INFIX), m_InfixOprtDef, ValidInfixOprtChars()); } //--------------------------------------------------------------------------- /** \brief Define a binary operator. \param [in] a_sName The identifier of the operator. \param [in] a_pFun Pointer to the callback function. \param [in] a_iPrec Precedence of the operator. \param [in] a_eAssociativity The associativity of the operator. \param [in] a_bAllowOpt If this is true the operator may be optimized away. Adds a new Binary operator the the parser instance. */ void ParserBase::DefineOprt(const string_type& a_sName, fun_type2 a_pFun, unsigned a_iPrec, EOprtAssociativity a_eAssociativity, bool a_bAllowOpt) { if (a_sName.length() > MaxLenIdentifier) Error(ecIDENTIFIER_TOO_LONG); // Check for conflicts with built in operator names for (int i = 0; m_bBuiltInOp && i < cmENDIF; ++i) { if (a_sName == string_type(c_DefaultOprt[i])) { Error(ecBUILTIN_OVERLOAD, -1, a_sName); } } AddCallback(a_sName, ParserCallback(a_pFun, a_bAllowOpt, a_iPrec, a_eAssociativity), m_OprtDef, ValidOprtChars()); } //--------------------------------------------------------------------------- /** \brief Define a new string constant. \param [in] a_strName The name of the constant. \param [in] a_strVal the value of the constant. 
*/ void ParserBase::DefineStrConst(const string_type& a_strName, const string_type& a_strVal) { // Test if a constant with that names already exists if (m_StrVarDef.find(a_strName) != m_StrVarDef.end()) Error(ecNAME_CONFLICT); CheckName(a_strName, ValidNameChars()); m_vStringVarBuf.push_back(a_strVal); // Store variable string in internal buffer m_StrVarDef[a_strName] = m_vStringVarBuf.size() - 1; // bind buffer index to variable name ReInit(); } //--------------------------------------------------------------------------- /** \brief Add a user defined variable. \param [in] a_sName the variable name \param [in] a_pVar A pointer to the variable value. \post Will reset the Parser to string parsing mode. \throw ParserException in case the name contains invalid signs or a_pVar is nullptr. */ void ParserBase::DefineVar(const string_type& a_sName, value_type* a_pVar) { if (a_pVar == 0) Error(ecINVALID_VAR_PTR); if (a_sName.length() > MaxLenIdentifier) Error(ecIDENTIFIER_TOO_LONG); // Test if a constant with that names already exists if (m_ConstDef.find(a_sName) != m_ConstDef.end()) Error(ecNAME_CONFLICT); CheckName(a_sName, ValidNameChars()); m_VarDef[a_sName] = a_pVar; ReInit(); } //--------------------------------------------------------------------------- /** \brief Add a user defined constant. \param [in] a_sName The name of the constant. \param [in] a_fVal the value of the constant. \post Will reset the Parser to string parsing mode. \throw ParserException in case the name contains invalid signs. */ void ParserBase::DefineConst(const string_type& a_sName, value_type a_fVal) { if (a_sName.length() > MaxLenIdentifier) Error(ecIDENTIFIER_TOO_LONG); CheckName(a_sName, ValidNameChars()); m_ConstDef[a_sName] = a_fVal; ReInit(); } //--------------------------------------------------------------------------- /** \brief Get operator priority. 
\param a_Tok The token whose precedence is requested.
        \return Fixed values for the built in tokens; the priority stored in the token
                for user defined infix and binary operators.
        \throw ParserException (ecINTERNAL_ERROR) if the code of a_Tok is none of the
               codes handled here.
    */
    int ParserBase::GetOprtPrecedence(const token_type& a_Tok) const
    {
        switch (a_Tok.GetCode())
        {
            // built in operators
        case cmEND:      return -5;
        case cmARG_SEP:  return -4;
        case cmASSIGN:   return -1;
        case cmELSE:
        case cmIF:       return 0;
        case cmLAND:     return prLAND;
        case cmLOR:      return prLOR;
        case cmLT:
        case cmGT:
        case cmLE:
        case cmGE:
        case cmNEQ:
        case cmEQ:       return prCMP;
        case cmADD:
        case cmSUB:      return prADD_SUB;
        case cmMUL:
        case cmDIV:      return prMUL_DIV;
        case cmPOW:      return prPOW;

            // user defined infix and binary operators
        case cmOPRT_INFIX:
        case cmOPRT_BIN: return a_Tok.GetPri();
        default:
            throw exception_type(ecINTERNAL_ERROR, 5, _T(""));
        }
    }

    //---------------------------------------------------------------------------
    /** \brief Get operator associativity.
        \param a_Tok The token whose associativity is requested.
        \return oaLEFT for the built in assignment, logic, comparison and arithmetic
                operators, oaRIGHT for the power operator, the associativity stored in
                the token for user defined binary operators and oaNONE for all other
                tokens. This function does not throw for unknown codes.
    */
    EOprtAssociativity ParserBase::GetOprtAssociativity(const token_type& a_Tok) const
    {
        switch (a_Tok.GetCode())
        {
        case cmASSIGN:
        case cmLAND:
        case cmLOR:
        case cmLT:
        case cmGT:
        case cmLE:
        case cmGE:
        case cmNEQ:
        case cmEQ:
        case cmADD:
        case cmSUB:
        case cmMUL:
        case cmDIV:      return oaLEFT;
        case cmPOW:      return oaRIGHT;
        case cmOPRT_BIN: return a_Tok.GetAssociativity();
        default:         return oaNONE;
        }
    }

    //---------------------------------------------------------------------------
    /** \brief Return a map containing the used variables only.

        Creates the bytecode with undefined variables being ignored in order to let the
        token reader collect the variables of the expression. The parser stays in string
        parse mode afterwards. Exceptions raised while creating the bytecode are passed
        on to the caller after the parser state has been restored.
    */
    const varmap_type& ParserBase::GetUsedVar() const
    {
        try
        {
            m_pTokenReader->IgnoreUndefVar(true);
            CreateRPN(); // try to create bytecode, but don't use it for any further calculations since it
                         // may contain references to nonexisting variables.
            m_pParseFormula = &ParserBase::ParseString;
            m_pTokenReader->IgnoreUndefVar(false);
        }
        catch (exception_type& /*e*/)
        {
            // Make sure to stay in string parse mode, don't call ReInit()
            // because it deletes the array with the used variables
            m_pParseFormula = &ParserBase::ParseString;
            m_pTokenReader->IgnoreUndefVar(false);
            throw;
        }

        return m_pTokenReader->GetUsedVar();
    }

    //---------------------------------------------------------------------------
    /** \brief Return a map containing all variables defined in the parser.
        \return Reference to the internal variable map (#m_VarDef).
    */
    const varmap_type& ParserBase::GetVar() const
    {
        return m_VarDef;
    }

    //---------------------------------------------------------------------------
    /** \brief Return a map containing all parser constants.
        \return Reference to the internal constant map (#m_ConstDef).
    */
    const valmap_type& ParserBase::GetConst() const
    {
        return m_ConstDef;
    }

    //---------------------------------------------------------------------------
    /** \brief Return prototypes of all parser functions.
        \return #m_FunDef
        \sa FunProt

        The return type is a map of the public type #funmap_type containing the prototype
        definitions for all numerical parser functions. String functions are not part of
        this map. The Prototype definition is encapsulated in objects of the class FunProt
        one per parser function each associated with function names via a map construct.
    */
    const funmap_type& ParserBase::GetFunDef() const
    {
        return m_FunDef;
    }

    //---------------------------------------------------------------------------
    /** \brief Retrieve the formula.
        \return The expression as stored in the token reader.
    */
    const string_type& ParserBase::GetExpr() const
    {
        return m_pTokenReader->GetExpr();
    }

    //---------------------------------------------------------------------------
    /** \brief Execute a function that takes a single string argument.
        \param a_FunTok Function token.
\param a_vArg The arguments of the function. The last element has to be the string
                      token; the elements in front of it are read as values.
        \return A token holding a dummy value that represents the function result.
        \throw exception_type with ecSTRING_EXPECTED if the last argument is not a string
               token and with ecVAL_EXPECTED if reading the arguments raises a ParserError.

        No function is called here. The arguments are only checked and an entry for
        the string function is added to the bytecode.
    */
    ParserBase::token_type ParserBase::ApplyStrFunc(
        const token_type& a_FunTok,
        const std::vector& a_vArg) const
    {
        if (a_vArg.back().GetCode() != cmSTRING)
            Error(ecSTRING_EXPECTED, m_pTokenReader->GetPos(), a_FunTok.GetAsString());

        token_type valTok;
        generic_callable_type pFunc = a_FunTok.GetFuncAddr();
        MUP_ASSERT(pFunc);

        try
        {
            // Check function arguments; write dummy value into valtok to represent the result.
            // The values returned by GetAsString() / GetVal() are discarded; the calls are
            // made for the sake of the errors they may raise.
            // NOTE(review): an error raised by the default branch is presumably caught by the
            // handler below as well and reported as ecVAL_EXPECTED - confirm.
            switch (a_FunTok.GetArgCount())
            {
            case 0: valTok.SetVal(1); a_vArg[0].GetAsString();  break;
            case 1: valTok.SetVal(1); a_vArg[1].GetAsString();  a_vArg[0].GetVal();  break;
            case 2: valTok.SetVal(1); a_vArg[2].GetAsString();  a_vArg[1].GetVal();  a_vArg[0].GetVal();  break;
            case 3: valTok.SetVal(1); a_vArg[3].GetAsString();  a_vArg[2].GetVal();  a_vArg[1].GetVal();  a_vArg[0].GetVal();  break;
            case 4: valTok.SetVal(1); a_vArg[4].GetAsString();  a_vArg[3].GetVal();  a_vArg[2].GetVal();  a_vArg[1].GetVal();  a_vArg[0].GetVal();  break;
            case 5: valTok.SetVal(1); a_vArg[5].GetAsString();  a_vArg[4].GetVal();  a_vArg[3].GetVal();  a_vArg[2].GetVal();  a_vArg[1].GetVal();  a_vArg[0].GetVal();  break;
            default: Error(ecINTERNAL_ERROR);
            }
        }
        catch (ParserError&)
        {
            Error(ecVAL_EXPECTED, m_pTokenReader->GetPos(), a_FunTok.GetAsString());
        }

        // string functions won't be optimized
        m_vRPN.AddStrFun(pFunc, a_FunTok.GetArgCount(), a_vArg.back().GetIdx());

        // Push dummy value representing the function result to the stack
        return valTok;
    }

    //---------------------------------------------------------------------------
    /** \brief Apply a function token.
        \param a_stOpt The operator stack; the function token is taken from its top.
        \param a_stVal The value stack; the arguments are taken from it.
        \param a_iArgCount Number of Arguments actually gathered used only for multiarg functions.
        \post The result is pushed to the value stack
        \post The function token is removed from the stack
        \throw exception_type if Argument count does not match function requirements.
*/ void ParserBase::ApplyFunc(std::stack& a_stOpt, std::stack& a_stVal, int a_iArgCount) const { MUP_ASSERT(m_pTokenReader.get()); // Operator stack empty or does not contain tokens with callback functions if (a_stOpt.empty() || a_stOpt.top().GetFuncAddr() == 0) return; token_type funTok = a_stOpt.top(); a_stOpt.pop(); MUP_ASSERT(funTok.GetFuncAddr() != nullptr); // Binary operators must rely on their internal operator number // since counting of operators relies on commas for function arguments // binary operators do not have commas in their expression int iArgCount = (funTok.GetCode() == cmOPRT_BIN) ? funTok.GetArgCount() : a_iArgCount; // determine how many parameters the function needs. To remember iArgCount includes the // string parameter whilst GetArgCount() counts only numeric parameters. int iArgRequired = funTok.GetArgCount() + ((funTok.GetType() == tpSTR) ? 1 : 0); // That's the number of numerical parameters int iArgNumerical = iArgCount - ((funTok.GetType() == tpSTR) ? 1 : 0); if (funTok.GetCode() == cmFUNC_STR && iArgCount - iArgNumerical > 1) Error(ecINTERNAL_ERROR); if (funTok.GetArgCount() >= 0 && iArgCount > iArgRequired) Error(ecTOO_MANY_PARAMS, m_pTokenReader->GetPos() - 1, funTok.GetAsString()); if (funTok.GetCode() != cmOPRT_BIN && iArgCount < iArgRequired) Error(ecTOO_FEW_PARAMS, m_pTokenReader->GetPos() - 1, funTok.GetAsString()); if (funTok.GetCode() == cmFUNC_STR && iArgCount > iArgRequired) Error(ecTOO_MANY_PARAMS, m_pTokenReader->GetPos() - 1, funTok.GetAsString()); // Collect the numeric function arguments from the value stack and store them // in a vector std::vector stArg; for (int i = 0; i < iArgNumerical; ++i) { if (a_stVal.empty()) Error(ecINTERNAL_ERROR, m_pTokenReader->GetPos(), funTok.GetAsString()); stArg.push_back(a_stVal.top()); a_stVal.pop(); if (stArg.back().GetType() == tpSTR && funTok.GetType() != tpSTR) Error(ecVAL_EXPECTED, m_pTokenReader->GetPos(), funTok.GetAsString()); } switch (funTok.GetCode()) { case cmFUNC_STR: 
if (a_stVal.empty()) Error(ecINTERNAL_ERROR, m_pTokenReader->GetPos(), funTok.GetAsString()); stArg.push_back(a_stVal.top()); a_stVal.pop(); if (stArg.back().GetType() == tpSTR && funTok.GetType() != tpSTR) Error(ecVAL_EXPECTED, m_pTokenReader->GetPos(), funTok.GetAsString()); ApplyStrFunc(funTok, stArg); break; case cmFUNC_BULK: m_vRPN.AddBulkFun(funTok.GetFuncAddr(), (int)stArg.size()); break; case cmOPRT_BIN: case cmOPRT_POSTFIX: case cmOPRT_INFIX: case cmFUNC: if (funTok.GetArgCount() == -1 && iArgCount == 0) Error(ecTOO_FEW_PARAMS, m_pTokenReader->GetPos(), funTok.GetAsString()); m_vRPN.AddFun(funTok.GetFuncAddr(), (funTok.GetArgCount() == -1) ? -iArgNumerical : iArgNumerical, funTok.IsOptimizable()); break; default: break; } // Push dummy value representing the function result to the stack token_type token; token.SetVal(1); a_stVal.push(token); } //--------------------------------------------------------------------------- void ParserBase::ApplyIfElse(std::stack& a_stOpt, std::stack& a_stVal) const { // Check if there is an if Else clause to be calculated while (a_stOpt.size() && a_stOpt.top().GetCode() == cmELSE) { MUP_ASSERT(!a_stOpt.empty()) token_type opElse = a_stOpt.top(); a_stOpt.pop(); // Take the value associated with the else branch from the value stack MUP_ASSERT(!a_stVal.empty()); token_type vVal2 = a_stVal.top(); if (vVal2.GetType() != tpDBL) Error(ecUNEXPECTED_STR, m_pTokenReader->GetPos()); a_stVal.pop(); // it then else is a ternary operator Pop all three values from the value s // tack and just return the right value MUP_ASSERT(!a_stVal.empty()); token_type vVal1 = a_stVal.top(); if (vVal1.GetType() != tpDBL) Error(ecUNEXPECTED_STR, m_pTokenReader->GetPos()); a_stVal.pop(); MUP_ASSERT(!a_stVal.empty()); token_type vExpr = a_stVal.top(); a_stVal.pop(); a_stVal.push((vExpr.GetVal() != 0) ? 
vVal1 : vVal2); token_type opIf = a_stOpt.top(); a_stOpt.pop(); MUP_ASSERT(opElse.GetCode() == cmELSE); if (opIf.GetCode() != cmIF) Error(ecMISPLACED_COLON, m_pTokenReader->GetPos()); m_vRPN.AddIfElse(cmENDIF); } // while pending if-else-clause found } //--------------------------------------------------------------------------- /** \brief Performs the necessary steps to write code for the execution of binary operators into the bytecode. */ void ParserBase::ApplyBinOprt(std::stack& a_stOpt, std::stack& a_stVal) const { // is it a user defined binary operator? if (a_stOpt.top().GetCode() == cmOPRT_BIN) { ApplyFunc(a_stOpt, a_stVal, 2); } else { if (a_stVal.size() < 2) Error(ecINTERNAL_ERROR, m_pTokenReader->GetPos(), _T("ApplyBinOprt: not enough values in value stack!")); token_type valTok1 = a_stVal.top(); a_stVal.pop(); token_type valTok2 = a_stVal.top(); a_stVal.pop(); token_type optTok = a_stOpt.top(); a_stOpt.pop(); token_type resTok; if (valTok1.GetType() != valTok2.GetType() || (valTok1.GetType() == tpSTR && valTok2.GetType() == tpSTR)) Error(ecOPRT_TYPE_CONFLICT, m_pTokenReader->GetPos(), optTok.GetAsString()); if (optTok.GetCode() == cmASSIGN) { if (valTok2.GetCode() != cmVAR) Error(ecUNEXPECTED_OPERATOR, -1, _T("=")); m_vRPN.AddAssignOp(valTok2.GetVar()); } else m_vRPN.AddOp(optTok.GetCode()); resTok.SetVal(1); a_stVal.push(resTok); } } //--------------------------------------------------------------------------- /** \brief Apply a binary operator. 
\param stOpt The operator stack
        \param stVal The value stack

        Applies the operators on top of the operator stack one after the other until the
        stack is empty or its top is an opening bracket (cmBO) or an if token (cmIF).
        Infix operators are applied via ApplyFunc(), other operators via ApplyBinOprt()
        and else tokens via ApplyIfElse(). Any other token raises ecINTERNAL_ERROR.
    */
    void ParserBase::ApplyRemainingOprt(std::stack& stOpt, std::stack& stVal) const
    {
        while (stOpt.size() &&
            stOpt.top().GetCode() != cmBO &&
            stOpt.top().GetCode() != cmIF)
        {
            token_type tok = stOpt.top();
            switch (tok.GetCode())
            {
            case cmOPRT_INFIX:
            case cmOPRT_BIN:
            case cmLE:
            case cmGE:
            case cmNEQ:
            case cmEQ:
            case cmLT:
            case cmGT:
            case cmADD:
            case cmSUB:
            case cmMUL:
            case cmDIV:
            case cmPOW:
            case cmLAND:
            case cmLOR:
            case cmASSIGN:
                // Infix operators take a single argument and are applied like functions
                if (stOpt.top().GetCode() == cmOPRT_INFIX)
                    ApplyFunc(stOpt, stVal, 1);
                else
                    ApplyBinOprt(stOpt, stVal);
                break;

            case cmELSE:
                ApplyIfElse(stOpt, stVal);
                break;

            default:
                Error(ecINTERNAL_ERROR);
            }
        }
    }

    //---------------------------------------------------------------------------
    /** \brief Parse the command code.
        \sa ParseString(...)

        Command code contains precalculated stack positions of the values and the
        associated operators. The Stack is filled beginning from index one the
        value at index zero is not used at all.

        Implemented by calling ParseCmdCodeBulk() with offset 0 and thread id 0.
    */
    value_type ParserBase::ParseCmdCode() const
    {
        return ParseCmdCodeBulk(0, 0);
    }

    /** \brief Evaluate the first token of the bytecode.
        \return The value resulting from the first bytecode token.
        \throw ParserError with ecINTERNAL_ERROR if the command of the token is none of
               the commands handled here.

        Only the token returned by m_vRPN.GetBase() is read, no value stack is used.
        NOTE(review): presumably used for expressions whose bytecode consists of a
        single token only - confirm at the call site.
    */
    value_type ParserBase::ParseCmdCodeShort() const
    {
        const SToken *const tok = m_vRPN.GetBase();
        value_type buf;

        switch (tok->Cmd)
        {
        case cmVAL:
            return tok->Val.data2;

        case cmVAR:
            return *tok->Val.ptr;

        case cmVARMUL:
            return *tok->Val.ptr * tok->Val.data + tok->Val.data2;

        case cmVARPOW2:
            buf = *(tok->Val.ptr);
            return buf * buf;

        case cmVARPOW3:
            buf = *(tok->Val.ptr);
            return buf * buf * buf;

        case cmVARPOW4:
            buf = *(tok->Val.ptr);
            return buf * buf * buf * buf;

        // numerical function without any argument
        case cmFUNC:
            return tok->Fun.cb.call_fun<0>();

        // String function without a numerical argument
        case cmFUNC_STR:
            return tok->Fun.cb.call_strfun<1>(m_vStringBuf[0].c_str());

        default:
            throw ParserError(ecINTERNAL_ERROR);
        }
    }

    //---------------------------------------------------------------------------
    /** \brief Evaluate the RPN.
\param nOffset The offset added to variable addresses (for bulk mode) \param nThreadID OpenMP Thread id of the calling thread */ value_type ParserBase::ParseCmdCodeBulk(int nOffset, int nThreadID) const { assert(nThreadID <= s_MaxNumOpenMPThreads); // Note: The check for nOffset==0 and nThreadID here is not necessary but // brings a minor performance gain when not in bulk mode. value_type *stack = ((nOffset == 0) && (nThreadID == 0)) ? &m_vStackBuffer[0] : &m_vStackBuffer[nThreadID * (m_vStackBuffer.size() / s_MaxNumOpenMPThreads)]; value_type buf; int sidx(0); for (const SToken* pTok = m_vRPN.GetBase(); pTok->Cmd != cmEND; ++pTok) { switch (pTok->Cmd) { // built in binary operators case cmLE: --sidx; stack[sidx] = stack[sidx] <= stack[sidx + 1]; continue; case cmGE: --sidx; stack[sidx] = stack[sidx] >= stack[sidx + 1]; continue; case cmNEQ: --sidx; stack[sidx] = stack[sidx] != stack[sidx + 1]; continue; case cmEQ: --sidx; stack[sidx] = stack[sidx] == stack[sidx + 1]; continue; case cmLT: --sidx; stack[sidx] = stack[sidx] < stack[sidx + 1]; continue; case cmGT: --sidx; stack[sidx] = stack[sidx] > stack[sidx + 1]; continue; case cmADD: --sidx; stack[sidx] += stack[1 + sidx]; continue; case cmSUB: --sidx; stack[sidx] -= stack[1 + sidx]; continue; case cmMUL: --sidx; stack[sidx] *= stack[1 + sidx]; continue; case cmDIV: --sidx; stack[sidx] /= stack[1 + sidx]; continue; case cmPOW: --sidx; stack[sidx] = MathImpl::Pow(stack[sidx], stack[1 + sidx]); continue; case cmLAND: --sidx; stack[sidx] = stack[sidx] && stack[sidx + 1]; continue; case cmLOR: --sidx; stack[sidx] = stack[sidx] || stack[sidx + 1]; continue; case cmASSIGN: // Bugfix for Bulkmode: // for details see: // https://groups.google.com/forum/embed/?place=forum/muparser-dev&showsearch=true&showpopout=true&showtabs=false&parenturl=http://muparser.beltoforion.de/mup_forum.html&afterlogin&pli=1#!topic/muparser-dev/szgatgoHTws --sidx; stack[sidx] = *(pTok->Oprt.ptr + nOffset) = stack[sidx + 1]; continue; // original 
code: //--sidx; Stack[sidx] = *pTok->Oprt.ptr = Stack[sidx+1]; continue; case cmIF: if (stack[sidx--] == 0) { MUP_ASSERT(sidx >= 0); pTok += pTok->Oprt.offset; } continue; case cmELSE: pTok += pTok->Oprt.offset; continue; case cmENDIF: continue; // value and variable tokens case cmVAR: stack[++sidx] = *(pTok->Val.ptr + nOffset); continue; case cmVAL: stack[++sidx] = pTok->Val.data2; continue; case cmVARPOW2: buf = *(pTok->Val.ptr + nOffset); stack[++sidx] = buf * buf; continue; case cmVARPOW3: buf = *(pTok->Val.ptr + nOffset); stack[++sidx] = buf * buf * buf; continue; case cmVARPOW4: buf = *(pTok->Val.ptr + nOffset); stack[++sidx] = buf * buf * buf * buf; continue; case cmVARMUL: stack[++sidx] = *(pTok->Val.ptr + nOffset) * pTok->Val.data + pTok->Val.data2; continue; // Next is treatment of numeric functions case cmFUNC: { int iArgCount = pTok->Fun.argc; // switch according to argument count switch (iArgCount) { case 0: sidx += 1; stack[sidx] = pTok->Fun.cb.call_fun<0 >(); continue; case 1: stack[sidx] = pTok->Fun.cb.call_fun<1 >(stack[sidx]); continue; case 2: sidx -= 1; stack[sidx] = pTok->Fun.cb.call_fun<2 >(stack[sidx], stack[sidx + 1]); continue; case 3: sidx -= 2; stack[sidx] = pTok->Fun.cb.call_fun<3 >(stack[sidx], stack[sidx + 1], stack[sidx + 2]); continue; case 4: sidx -= 3; stack[sidx] = pTok->Fun.cb.call_fun<4 >(stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3]); continue; case 5: sidx -= 4; stack[sidx] = pTok->Fun.cb.call_fun<5 >(stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4]); continue; case 6: sidx -= 5; stack[sidx] = pTok->Fun.cb.call_fun<6 >(stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5]); continue; case 7: sidx -= 6; stack[sidx] = pTok->Fun.cb.call_fun<7 >(stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5], stack[sidx + 6]); continue; case 8: sidx -= 7; stack[sidx] = pTok->Fun.cb.call_fun<8 >(stack[sidx], 
stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5], stack[sidx + 6], stack[sidx + 7]); continue; case 9: sidx -= 8; stack[sidx] = pTok->Fun.cb.call_fun<9 >(stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5], stack[sidx + 6], stack[sidx + 7], stack[sidx + 8]); continue; case 10:sidx -= 9; stack[sidx] = pTok->Fun.cb.call_fun<10>(stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5], stack[sidx + 6], stack[sidx + 7], stack[sidx + 8], stack[sidx + 9]); continue; default: // function with variable arguments store the number as a negative value if (iArgCount > 0) Error(ecINTERNAL_ERROR, -1); sidx -= -iArgCount - 1; // From oss-fuzz. Happend when Multiarg functions and if-then-else are used incorrectly. // Expressions where this was observed: // sum(0?1,2,3,4,5:6) -> fixed // avg(0>3?4:(""),0^3?4:("")) // // The final result normally lieas at position 1. If sixd is smaller there is something wrong. 
if (sidx <= 0) Error(ecINTERNAL_ERROR, -1); // stack[sidx] = pTok->Fun.cb.call_multfun(&stack[sidx], -iArgCount); continue; } } // Next is treatment of string functions case cmFUNC_STR: { sidx -= pTok->Fun.argc - 1; // The index of the string argument in the string table int iIdxStack = pTok->Fun.idx; if (iIdxStack < 0 || iIdxStack >= (int)m_vStringBuf.size()) Error(ecINTERNAL_ERROR, m_pTokenReader->GetPos()); switch (pTok->Fun.argc) // switch according to argument count { case 0: stack[sidx] = pTok->Fun.cb.call_strfun<1>(m_vStringBuf[iIdxStack].c_str()); continue; case 1: stack[sidx] = pTok->Fun.cb.call_strfun<2>(m_vStringBuf[iIdxStack].c_str(), stack[sidx]); continue; case 2: stack[sidx] = pTok->Fun.cb.call_strfun<3>(m_vStringBuf[iIdxStack].c_str(), stack[sidx], stack[sidx + 1]); continue; case 3: stack[sidx] = pTok->Fun.cb.call_strfun<4>(m_vStringBuf[iIdxStack].c_str(), stack[sidx], stack[sidx + 1], stack[sidx + 2]); continue; case 4: stack[sidx] = pTok->Fun.cb.call_strfun<5>(m_vStringBuf[iIdxStack].c_str(), stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3]); continue; case 5: stack[sidx] = pTok->Fun.cb.call_strfun<6>(m_vStringBuf[iIdxStack].c_str(), stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4]); continue; } continue; } case cmFUNC_BULK: { int iArgCount = pTok->Fun.argc; // switch according to argument count switch (iArgCount) { case 0: sidx += 1; stack[sidx] = pTok->Fun.cb.call_bulkfun<0 >(nOffset, nThreadID); continue; case 1: stack[sidx] = pTok->Fun.cb.call_bulkfun<1 >(nOffset, nThreadID, stack[sidx]); continue; case 2: sidx -= 1; stack[sidx] = pTok->Fun.cb.call_bulkfun<2 >(nOffset, nThreadID, stack[sidx], stack[sidx + 1]); continue; case 3: sidx -= 2; stack[sidx] = pTok->Fun.cb.call_bulkfun<3 >(nOffset, nThreadID, stack[sidx], stack[sidx + 1], stack[sidx + 2]); continue; case 4: sidx -= 3; stack[sidx] = pTok->Fun.cb.call_bulkfun<4 >(nOffset, nThreadID, stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 
3]); continue; case 5: sidx -= 4; stack[sidx] = pTok->Fun.cb.call_bulkfun<5 >(nOffset, nThreadID, stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4]); continue; case 6: sidx -= 5; stack[sidx] = pTok->Fun.cb.call_bulkfun<6 >(nOffset, nThreadID, stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5]); continue; case 7: sidx -= 6; stack[sidx] = pTok->Fun.cb.call_bulkfun<7 >(nOffset, nThreadID, stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5], stack[sidx + 6]); continue; case 8: sidx -= 7; stack[sidx] = pTok->Fun.cb.call_bulkfun<8 >(nOffset, nThreadID, stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5], stack[sidx + 6], stack[sidx + 7]); continue; case 9: sidx -= 8; stack[sidx] = pTok->Fun.cb.call_bulkfun<9 >(nOffset, nThreadID, stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5], stack[sidx + 6], stack[sidx + 7], stack[sidx + 8]); continue; case 10:sidx -= 9; stack[sidx] = pTok->Fun.cb.call_bulkfun<10>(nOffset, nThreadID, stack[sidx], stack[sidx + 1], stack[sidx + 2], stack[sidx + 3], stack[sidx + 4], stack[sidx + 5], stack[sidx + 6], stack[sidx + 7], stack[sidx + 8], stack[sidx + 9]); continue; default: throw exception_type(ecINTERNAL_ERROR, 2, _T("")); } } default: throw exception_type(ecINTERNAL_ERROR, 3, _T("")); } // switch CmdCode } // for all bytecode tokens return stack[m_nFinalResultIdx]; } //--------------------------------------------------------------------------- void ParserBase::CreateRPN() const { if (!m_pTokenReader->GetExpr().length()) Error(ecUNEXPECTED_EOF, 0); std::stack stOpt, stVal; std::stack stArgCount; token_type opta, opt; // for storing operators token_type val, tval; // for storing value int ifElseCounter = 0; ReInit(); // The outermost counter counts the number of separated items // such as in "a=10,b=20,c=c+a" stArgCount.push(1); 
for (;;) { opt = m_pTokenReader->ReadNextToken(); switch (opt.GetCode()) { // // Next three are different kind of value entries // case cmSTRING: if (stOpt.empty()) Error(ecSTR_RESULT, m_pTokenReader->GetPos(), opt.GetAsString()); opt.SetIdx((int)m_vStringBuf.size()); // Assign buffer index to token stVal.push(opt); m_vStringBuf.push_back(opt.GetAsString()); // Store string in internal buffer break; case cmVAR: stVal.push(opt); m_vRPN.AddVar(static_cast(opt.GetVar())); break; case cmVAL: stVal.push(opt); m_vRPN.AddVal(opt.GetVal()); break; case cmELSE: if (stArgCount.empty()) Error(ecMISPLACED_COLON, m_pTokenReader->GetPos()); if (stArgCount.top() > 1) Error(ecUNEXPECTED_ARG_SEP, m_pTokenReader->GetPos()); stArgCount.pop(); ifElseCounter--; if (ifElseCounter < 0) Error(ecMISPLACED_COLON, m_pTokenReader->GetPos()); ApplyRemainingOprt(stOpt, stVal); m_vRPN.AddIfElse(cmELSE); stOpt.push(opt); break; case cmARG_SEP: if (!stOpt.empty() && stOpt.top().GetCode() == cmIF) Error(ecUNEXPECTED_ARG_SEP, m_pTokenReader->GetPos()); if (stArgCount.empty()) Error(ecUNEXPECTED_ARG_SEP, m_pTokenReader->GetPos()); ++stArgCount.top(); // Falls through. // intentional (no break!) case cmEND: ApplyRemainingOprt(stOpt, stVal); break; case cmBC: { // The argument count for parameterless functions is zero // by default an opening bracket sets parameter count to 1 // in preparation of arguments to come. If the last token // was an opening bracket we know better... 
if (opta.GetCode() == cmBO) --stArgCount.top(); ApplyRemainingOprt(stOpt, stVal); // Check if the bracket content has been evaluated completely if (stOpt.size() && stOpt.top().GetCode() == cmBO) { // if opt is ")" and opta is "(" the bracket has been evaluated, now its time to check // if there is either a function or a sign pending // neither the opening nor the closing bracket will be pushed back to // the operator stack // Check if a function is standing in front of the opening bracket, // if yes evaluate it afterwards check for infix operators MUP_ASSERT(stArgCount.size()); int iArgCount = stArgCount.top(); stArgCount.pop(); stOpt.pop(); // Take opening bracket from stack if (iArgCount > 1 && (stOpt.size() == 0 || (stOpt.top().GetCode() != cmFUNC && stOpt.top().GetCode() != cmFUNC_BULK && stOpt.top().GetCode() != cmFUNC_STR))) Error(ecUNEXPECTED_ARG, m_pTokenReader->GetPos()); // The opening bracket was popped from the stack now check if there // was a function before this bracket if (stOpt.size() && stOpt.top().GetCode() != cmOPRT_INFIX && stOpt.top().GetCode() != cmOPRT_BIN && stOpt.top().GetFuncAddr() != 0) { ApplyFunc(stOpt, stVal, iArgCount); } } } // if bracket content is evaluated break; // // Next are the binary operator entries // case cmIF: ifElseCounter++; stArgCount.push(1); // Falls through. // intentional (no break!) case cmLAND: case cmLOR: case cmLT: case cmGT: case cmLE: case cmGE: case cmNEQ: case cmEQ: case cmADD: case cmSUB: case cmMUL: case cmDIV: case cmPOW: case cmASSIGN: case cmOPRT_BIN: // A binary operator (user defined or built in) has been found. 
while ( stOpt.size() && stOpt.top().GetCode() != cmBO && stOpt.top().GetCode() != cmELSE && stOpt.top().GetCode() != cmIF) { int nPrec1 = GetOprtPrecedence(stOpt.top()), nPrec2 = GetOprtPrecedence(opt); if (stOpt.top().GetCode() == opt.GetCode()) { // Deal with operator associativity EOprtAssociativity eOprtAsct = GetOprtAssociativity(opt); if ((eOprtAsct == oaRIGHT && (nPrec1 <= nPrec2)) || (eOprtAsct == oaLEFT && (nPrec1 < nPrec2))) { break; } } else if (nPrec1 < nPrec2) { // In case the operators are not equal the precedence decides alone... break; } if (stOpt.top().GetCode() == cmOPRT_INFIX) ApplyFunc(stOpt, stVal, 1); else ApplyBinOprt(stOpt, stVal); } // while ( ... ) if (opt.GetCode() == cmIF) m_vRPN.AddIfElse(opt.GetCode()); // The operator can't be evaluated right now, push back to the operator stack stOpt.push(opt); break; // // Last section contains functions and operators implicitly mapped to functions // case cmBO: stArgCount.push(1); stOpt.push(opt); break; case cmOPRT_INFIX: case cmFUNC: case cmFUNC_BULK: case cmFUNC_STR: stOpt.push(opt); break; case cmOPRT_POSTFIX: stOpt.push(opt); ApplyFunc(stOpt, stVal, 1); // this is the postfix operator break; default: Error(ecINTERNAL_ERROR, 3); } // end of switch operator-token opta = opt; if (opt.GetCode() == cmEND) { m_vRPN.Finalize(); break; } if (ParserBase::g_DbgDumpStack) { StackDump(stVal, stOpt); m_vRPN.AsciiDump(); } // if (ParserBase::g_DbgDumpCmdCode) //m_vRPN.AsciiDump(); } // while (true) if (ParserBase::g_DbgDumpCmdCode) m_vRPN.AsciiDump(); if (ifElseCounter > 0) Error(ecMISSING_ELSE_CLAUSE); // get the last value (= final result) from the stack MUP_ASSERT(stArgCount.size() == 1); m_nFinalResultIdx = stArgCount.top(); if (m_nFinalResultIdx == 0) Error(ecINTERNAL_ERROR, 9); if (stVal.size() == 0) Error(ecEMPTY_EXPRESSION); // 2020-09-17; fix for https://oss-fuzz.com/testcase-detail/5758791700971520 // I don't need the value stack any more. 
Destructively check if all values in the value // stack represent floating point values while (stVal.size()) { if (stVal.top().GetType() != tpDBL) Error(ecSTR_RESULT); stVal.pop(); } m_vStackBuffer.resize(m_vRPN.GetMaxStackSize() * s_MaxNumOpenMPThreads); } //--------------------------------------------------------------------------- /** \brief One of the two main parse functions. \sa ParseCmdCode(...) Parse expression from input string. Perform syntax checking and create bytecode. After parsing the string and creating the bytecode the function pointer #m_pParseFormula will be changed to the second parse routine the uses bytecode instead of string parsing. */ value_type ParserBase::ParseString() const { try { CreateRPN(); if (m_vRPN.GetSize() == 2) { m_vRPN.StoreEnvironment(m_pTokenReader->GetExpr(), m_vStringBuf); m_pParseFormula = &ParserBase::ParseCmdCodeShort; m_vStackBuffer[1] = (this->*m_pParseFormula)(); return m_vStackBuffer[1]; } else { m_vRPN.StoreEnvironment(m_pTokenReader->GetExpr(), m_vStringBuf); m_pParseFormula = &ParserBase::ParseCmdCode; return (this->*m_pParseFormula)(); } } catch (ParserError& exc) { exc.SetFormula(m_pTokenReader->GetExpr()); throw; } } //--------------------------------------------------------------------------- /** \brief Create an error containing the parse error position. This function will create an Parser Exception object containing the error text and its position. \param a_iErrc [in] The error code of type #EErrorCodes. \param a_iPos [in] The position where the error was detected. \param a_strTok [in] The token string representation associated with the error. \throw ParserException always throws that's the only purpose of this function. 
*/ void ParserBase::Error(EErrorCodes a_iErrc, int a_iPos, const string_type& a_sTok) const { throw exception_type(a_iErrc, a_sTok, m_pTokenReader->GetExpr(), a_iPos); } //------------------------------------------------------------------------------ /** \brief Clear all user defined variables. \throw nothrow Resets the parser to string parsing mode by calling #ReInit. */ void ParserBase::ClearVar() { m_VarDef.clear(); ReInit(); } //------------------------------------------------------------------------------ /** \brief Remove a variable from internal storage. \throw nothrow Removes a variable if it exists. If the Variable does not exist nothing will be done. */ void ParserBase::RemoveVar(const string_type& a_strVarName) { varmap_type::iterator item = m_VarDef.find(a_strVarName); if (item != m_VarDef.end()) { m_VarDef.erase(item); ReInit(); } } //------------------------------------------------------------------------------ /** \brief Clear all functions. \post Resets the parser to string parsing mode. \throw nothrow */ void ParserBase::ClearFun() { m_FunDef.clear(); ReInit(); } //------------------------------------------------------------------------------ /** \brief Clear all user defined constants. Both numeric and string constants will be removed from the internal storage. \post Resets the parser to string parsing mode. \throw nothrow */ void ParserBase::ClearConst() { m_ConstDef.clear(); m_StrVarDef.clear(); ReInit(); } //------------------------------------------------------------------------------ /** \brief Clear all user defined postfix operators. \post Resets the parser to string parsing mode. \throw nothrow */ void ParserBase::ClearPostfixOprt() { m_PostOprtDef.clear(); ReInit(); } //------------------------------------------------------------------------------ /** \brief Clear all user defined binary operators. \post Resets the parser to string parsing mode. 
\throw nothrow */ void ParserBase::ClearOprt() { m_OprtDef.clear(); ReInit(); } //------------------------------------------------------------------------------ /** \brief Clear the user defined Prefix operators. \post Resets the parser to string parser mode. \throw nothrow */ void ParserBase::ClearInfixOprt() { m_InfixOprtDef.clear(); ReInit(); } //------------------------------------------------------------------------------ /** \brief Enable or disable the formula optimization feature. \post Resets the parser to string parser mode. \throw nothrow */ void ParserBase::EnableOptimizer(bool a_bIsOn) { m_vRPN.EnableOptimizer(a_bIsOn); ReInit(); } //--------------------------------------------------------------------------- /** \brief Enable the dumping of bytecode and stack content on the console. \param bDumpCmd Flag to enable dumping of the current bytecode to the console. \param bDumpStack Flag to enable dumping of the stack content is written to the console. This function is for debug purposes only! */ void ParserBase::EnableDebugDump(bool bDumpCmd, bool bDumpStack) { ParserBase::g_DbgDumpCmdCode = bDumpCmd; ParserBase::g_DbgDumpStack = bDumpStack; } //------------------------------------------------------------------------------ /** \brief Enable or disable the built in binary operators. \throw nothrow \sa m_bBuiltInOp, ReInit() If you disable the built in binary operators there will be no binary operators defined. Thus you must add them manually one by one. It is not possible to disable built in operators selectively. This function will Reinitialize the parser by calling ReInit(). */ void ParserBase::EnableBuiltInOprt(bool a_bIsOn) { m_bBuiltInOp = a_bIsOn; ReInit(); } //------------------------------------------------------------------------------ /** \brief Query status of built in variables. \return #m_bBuiltInOp; true if built in operators are enabled. 
\throw nothrow */ bool ParserBase::HasBuiltInOprt() const { return m_bBuiltInOp; } //------------------------------------------------------------------------------ /** \brief Get the argument separator character. */ char_type ParserBase::GetArgSep() const { return m_pTokenReader->GetArgSep(); } //------------------------------------------------------------------------------ /** \brief Set argument separator. \param cArgSep the argument separator character. */ void ParserBase::SetArgSep(char_type cArgSep) { m_pTokenReader->SetArgSep(cArgSep); } //------------------------------------------------------------------------------ /** \brief Dump stack content. This function is used for debugging only. */ void ParserBase::StackDump(const std::stack& a_stVal, const std::stack& a_stOprt) const { std::stack stOprt(a_stOprt); std::stack stVal(a_stVal); mu::console() << _T("\nValue stack:\n"); while (!stVal.empty()) { token_type val = stVal.top(); stVal.pop(); if (val.GetType() == tpSTR) mu::console() << _T(" \"") << val.GetAsString() << _T("\" "); else mu::console() << _T(" ") << val.GetVal() << _T(" "); } mu::console() << "\nOperator stack:\n"; while (!stOprt.empty()) { if (stOprt.top().GetCode() <= cmASSIGN) { mu::console() << _T("OPRT_INTRNL \"") << ParserBase::c_DefaultOprt[stOprt.top().GetCode()] << _T("\" \n"); } else { switch (stOprt.top().GetCode()) { case cmVAR: mu::console() << _T("VAR\n"); break; case cmVAL: mu::console() << _T("VAL\n"); break; case cmFUNC: mu::console() << _T("FUNC \"") << stOprt.top().GetAsString() << _T("\"\n"); break; case cmFUNC_BULK: mu::console() << _T("FUNC_BULK \"") << stOprt.top().GetAsString() << _T("\"\n"); break; case cmOPRT_INFIX: mu::console() << _T("OPRT_INFIX \"") << stOprt.top().GetAsString() << _T("\"\n"); break; case cmOPRT_BIN: mu::console() << _T("OPRT_BIN \"") << stOprt.top().GetAsString() << _T("\"\n"); break; case cmFUNC_STR: mu::console() << _T("FUNC_STR\n"); break; case cmEND: mu::console() << _T("END\n"); break; case 
cmUNKNOWN: mu::console() << _T("UNKNOWN\n"); break; case cmBO: mu::console() << _T("BRACKET \"(\"\n"); break; case cmBC: mu::console() << _T("BRACKET \")\"\n"); break; case cmIF: mu::console() << _T("IF\n"); break; case cmELSE: mu::console() << _T("ELSE\n"); break; case cmENDIF: mu::console() << _T("ENDIF\n"); break; default: mu::console() << stOprt.top().GetCode() << _T(" "); break; } } stOprt.pop(); } mu::console() << dec << endl; } /** \brief Calculate the result. A note on const correctness: I consider it important that Calc is a const function. Due to caching operations Calc changes only the state of internal variables with one exception m_UsedVar this is reset during string parsing and accessible from the outside. Instead of making Calc non const GetUsedVar is non const because it explicitly calls Eval() forcing this update. \pre A formula must be set. \pre Variables must have been set (if needed) \sa #m_pParseFormula \return The evaluation result \throw ParseException if no Formula is set or in case of any other error related to the formula. */ value_type ParserBase::Eval() const { return (this->*m_pParseFormula)(); } //------------------------------------------------------------------------------ /** \brief Evaluate an expression containing comma separated subexpressions \param [out] nStackSize The total number of results available \return Pointer to the array containing all expression results This member function can be used to retrieve all results of an expression made up of multiple comma separated subexpressions (i.e. "x+y,sin(x),cos(y)") */ value_type* ParserBase::Eval(int& nStackSize) const { if (m_vRPN.GetSize() > 0) { ParseCmdCode(); } else { ParseString(); } nStackSize = m_nFinalResultIdx; // (for historic reasons the stack starts at position 1) return &m_vStackBuffer[1]; } //--------------------------------------------------------------------------- /** \brief Return the number of results on the calculation stack. 
If the expression contains comma separated subexpressions (i.e. "sin(y), x+y")
		there may be more than one return value. This function returns the number of
		available results, which is the value of m_nFinalResultIdx.
	*/
	int ParserBase::GetNumResults() const
	{
		return m_nFinalResultIdx;
	}

	//---------------------------------------------------------------------------
	/** \brief Evaluate the expression once for every index of a bulk run.
		\param [out] results Array receiving the results; entries 0 to nBulkSize-1 are written.
		\param nBulkSize Number of evaluations to perform.

		The bytecode is recreated by a call to CreateRPN() first. Evaluation number i
		then calls ParseCmdCodeBulk with i as offset. When MUP_USE_OPENMP is defined the
		evaluations are distributed over at most s_MaxNumOpenMPThreads OpenMP threads and
		each call receives the id of the thread executing it; otherwise the evaluations
		run one after another with thread id 0.
	*/
	void ParserBase::Eval(value_type* results, int nBulkSize)
	{
		CreateRPN();

		int i = 0;

#ifdef MUP_USE_OPENMP
		// Uncomment the following define to record which thread processed which index.
		//#define DEBUG_OMP_STUFF
#ifdef DEBUG_OMP_STUFF
		int* pThread = new int[nBulkSize];
		int* pIdx = new int[nBulkSize];
#endif

		// Never use more threads than the stack buffer has segments for.
		int nMaxThreads = std::min(omp_get_max_threads(), s_MaxNumOpenMPThreads);
		int nThreadID = 0;

#ifdef DEBUG_OMP_STUFF
		int ct = 0;
#endif
		omp_set_num_threads(nMaxThreads);

		// At least one iteration per chunk, even if there are more threads than iterations.
		const int chunkSize = std::max(nBulkSize/nMaxThreads, 1);
#pragma omp parallel for schedule(static, chunkSize) private(nThreadID)
		for (i = 0; i < nBulkSize; ++i)
		{
			nThreadID = omp_get_thread_num();
			results[i] = ParseCmdCodeBulk(i, nThreadID);

#ifdef DEBUG_OMP_STUFF
#pragma omp critical
			{
				pThread[ct] = nThreadID;
				pIdx[ct] = i;
				ct++;
			}
#endif
		}

#ifdef DEBUG_OMP_STUFF
		// Write the recorded index/thread pairs to a file in the working directory.
		FILE* pFile = fopen("bulk_dbg.txt", "w");
		for (i = 0; i < nBulkSize; ++i)
		{
			fprintf(pFile, "idx: %d thread: %d \n", pIdx[i], pThread[i]);
		}

		delete[] pIdx;
		delete[] pThread;

		fclose(pFile);
#endif

#else
		for (i = 0; i < nBulkSize; ++i)
		{
			results[i] = ParseCmdCodeBulk(i, 0);
		}
#endif
	}
} // namespace mu

#if defined(_MSC_VER)
	#pragma warning(pop)
#endif