4544 lines
133 KiB
C++
4544 lines
133 KiB
C++
/*
|
|
* Cppcheck - A tool for static C/C++ code analysis
|
|
* Copyright (C) 2007-2009 Daniel Marjamäki and Cppcheck team.
|
|
*
|
|
* This program is free software: you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
|
|
//---------------------------------------------------------------------------
|
|
#include "tokenize.h"
|
|
#include "token.h"
|
|
#include "filelister.h"
|
|
#include "mathlib.h"
|
|
#include "settings.h"
|
|
#include "errorlogger.h"
|
|
#include "check.h"
|
|
|
|
#include <locale>
|
|
#include <fstream>
|
|
#include <string>
|
|
#include <cstring>
|
|
#include <iostream>
|
|
#include <sstream>
|
|
#include <list>
|
|
#include <cassert>
|
|
#include <algorithm>
|
|
#include <cctype>
|
|
#include <stack>
|
|
#include <stdexcept> // for std::runtime_error
|
|
|
|
//---------------------------------------------------------------------------
|
|
|
|
Tokenizer::Tokenizer()
|
|
: _settings(0), _errorLogger(0)
|
|
{
|
|
_tokens = 0;
|
|
_tokensBack = 0;
|
|
}
|
|
|
|
Tokenizer::Tokenizer(const Settings *settings, ErrorLogger *errorLogger)
|
|
: _settings(settings), _errorLogger(errorLogger)
|
|
{
|
|
_tokens = 0;
|
|
_tokensBack = 0;
|
|
}
|
|
|
|
Tokenizer::~Tokenizer()
|
|
{
|
|
deallocateTokens();
|
|
}
|
|
|
|
//---------------------------------------------------------------------------
|
|
|
|
// Helper functions..
|
|
|
|
|
|
//---------------------------------------------------------------------------
|
|
|
|
const Token *Tokenizer::tokens() const
|
|
{
|
|
return _tokens;
|
|
}
|
|
|
|
|
|
const std::vector<std::string> *Tokenizer::getFiles() const
|
|
{
|
|
return &_files;
|
|
}
|
|
|
|
//---------------------------------------------------------------------------
|
|
|
|
//---------------------------------------------------------------------------
|
|
// addtoken
|
|
// add a token. Used by 'Tokenizer'
|
|
//---------------------------------------------------------------------------
|
|
|
|
void Tokenizer::addtoken(const char str[], const unsigned int lineno, const unsigned int fileno)
|
|
{
|
|
if (str[0] == 0)
|
|
return;
|
|
|
|
// Replace hexadecimal value with decimal
|
|
std::ostringstream str2;
|
|
if (strncmp(str, "0x", 2) == 0)
|
|
{
|
|
str2 << std::strtoul(str + 2, NULL, 16);
|
|
}
|
|
else
|
|
{
|
|
str2 << str;
|
|
}
|
|
|
|
if (_tokensBack)
|
|
{
|
|
_tokensBack->insertToken(str2.str().c_str());
|
|
_tokensBack = _tokensBack->next();
|
|
}
|
|
else
|
|
{
|
|
_tokens = new Token;
|
|
_tokensBack = _tokens;
|
|
_tokensBack->str(str2.str());
|
|
}
|
|
|
|
_tokensBack->linenr(lineno);
|
|
_tokensBack->fileIndex(fileno);
|
|
}
|
|
//---------------------------------------------------------------------------
|
|
|
|
//---------------------------------------------------------------------------
|
|
// SizeOfType - gives the size of a type
|
|
//---------------------------------------------------------------------------
|
|
|
|
|
|
|
|
unsigned int Tokenizer::sizeOfType(const Token *type) const
|
|
{
|
|
if (!type || !type->strAt(0))
|
|
return 0;
|
|
|
|
if (type->str()[0] == '"')
|
|
return static_cast<unsigned int>(Token::getStrLength(type) + 1);
|
|
|
|
std::map<std::string, unsigned int>::const_iterator it = _typeSize.find(type->strAt(0));
|
|
if (it == _typeSize.end())
|
|
return 0;
|
|
|
|
return it->second;
|
|
}
|
|
//---------------------------------------------------------------------------
|
|
|
|
//---------------------------------------------------------------------------
|
|
// InsertTokens - Copy and insert tokens
|
|
//---------------------------------------------------------------------------
|
|
|
|
void Tokenizer::insertTokens(Token *dest, const Token *src, unsigned int n)
|
|
{
|
|
while (n > 0)
|
|
{
|
|
dest->insertToken(src->str().c_str());
|
|
dest = dest->next();
|
|
dest->fileIndex(src->fileIndex());
|
|
dest->linenr(src->linenr());
|
|
dest->varId(src->varId());
|
|
src = src->next();
|
|
--n;
|
|
}
|
|
}
|
|
//---------------------------------------------------------------------------
|
|
|
|
//---------------------------------------------------------------------------
|
|
// Tokenize - tokenizes a given file.
|
|
//---------------------------------------------------------------------------
|
|
|
|
void Tokenizer::createTokens(std::istream &code)
|
|
{
|
|
// line number in parsed code
|
|
unsigned int lineno = 1;
|
|
|
|
// The current token being parsed
|
|
std::string CurrentToken;
|
|
|
|
// lineNumbers holds line numbers for files in fileIndexes
|
|
// every time an include file is complitely parsed, last item in the vector
|
|
// is removed and lineno is set to point to that value.
|
|
std::vector<unsigned int> lineNumbers;
|
|
|
|
// fileIndexes holds index for _files vector about currently parsed files
|
|
// every time an include file is complitely parsed, last item in the vector
|
|
// is removed and FileIndex is set to point to that value.
|
|
std::vector<unsigned int> fileIndexes;
|
|
|
|
// FileIndex. What file in the _files vector is read now?
|
|
unsigned int FileIndex = 0;
|
|
|
|
// Read one byte at a time from code and create tokens
|
|
for (char ch = (char)code.get(); code.good(); ch = (char)code.get())
|
|
{
|
|
// We are not handling UTF and stuff like that. Code is supposed to plain simple text.
|
|
if (ch < 0)
|
|
continue;
|
|
|
|
// char/string..
|
|
if (ch == '\'' || ch == '\"')
|
|
{
|
|
std::string line;
|
|
|
|
// read char
|
|
bool special = false;
|
|
char c = ch;
|
|
do
|
|
{
|
|
// Append token..
|
|
line += c;
|
|
|
|
if (c == '\n')
|
|
++lineno;
|
|
|
|
// Special sequence '\.'
|
|
if (special)
|
|
special = false;
|
|
else
|
|
special = (c == '\\');
|
|
|
|
// Get next character
|
|
c = (char)code.get();
|
|
}
|
|
while (code.good() && (special || c != ch));
|
|
line += ch;
|
|
|
|
// Handle #file "file.h"
|
|
if (CurrentToken == "#file")
|
|
{
|
|
// Extract the filename
|
|
line = line.substr(1, line.length() - 2);
|
|
|
|
// Has this file been tokenized already?
|
|
++lineno;
|
|
bool foundOurfile = false;
|
|
fileIndexes.push_back(FileIndex);
|
|
for (unsigned int i = 0; i < _files.size(); i++)
|
|
{
|
|
if (FileLister::sameFileName(_files[i].c_str(), line.c_str()))
|
|
{
|
|
// Use this index
|
|
foundOurfile = true;
|
|
FileIndex = i;
|
|
}
|
|
}
|
|
|
|
if (!foundOurfile)
|
|
{
|
|
// The "_files" vector remembers what files have been tokenized..
|
|
_files.push_back(FileLister::simplifyPath(line.c_str()));
|
|
FileIndex = static_cast<unsigned int>(_files.size() - 1);
|
|
}
|
|
|
|
lineNumbers.push_back(lineno);
|
|
lineno = 0;
|
|
}
|
|
else
|
|
{
|
|
// Add previous token
|
|
addtoken(CurrentToken.c_str(), lineno, FileIndex);
|
|
|
|
// Add content of the string
|
|
addtoken(line.c_str(), lineno, FileIndex);
|
|
}
|
|
|
|
CurrentToken.clear();
|
|
|
|
continue;
|
|
}
|
|
|
|
if (strchr("+-*/%&|^?!=<>[](){};:,.~\n ", ch))
|
|
{
|
|
if (ch == '.' &&
|
|
CurrentToken.length() > 0 &&
|
|
std::isdigit(CurrentToken[0]))
|
|
{
|
|
// Don't separate doubles "5.4"
|
|
}
|
|
else if (strchr("+-", ch) &&
|
|
CurrentToken.length() > 0 &&
|
|
std::isdigit(CurrentToken[0]) &&
|
|
CurrentToken[CurrentToken.length()-1] == 'e')
|
|
{
|
|
// Don't separate doubles "4.2e+10"
|
|
}
|
|
else
|
|
{
|
|
if (CurrentToken == "#file")
|
|
{
|
|
// Handle this where strings are handled
|
|
continue;
|
|
}
|
|
else if (CurrentToken == "#endfile")
|
|
{
|
|
if (lineNumbers.empty() || fileIndexes.empty())
|
|
{
|
|
std::cerr << "####### Preprocessor bug! #######\n";
|
|
std::exit(0);
|
|
}
|
|
|
|
lineno = lineNumbers.back();
|
|
lineNumbers.pop_back();
|
|
FileIndex = fileIndexes.back();
|
|
fileIndexes.pop_back();
|
|
CurrentToken.clear();
|
|
continue;
|
|
}
|
|
|
|
// If token contains # characters, split it up
|
|
std::string temp;
|
|
for (std::string::size_type i = 0; i < CurrentToken.length(); ++i)
|
|
{
|
|
if (CurrentToken[i] == '#' && CurrentToken.length() + 1 > i && CurrentToken[i+1] == '#')
|
|
{
|
|
addtoken(temp.c_str(), lineno, FileIndex);
|
|
temp.clear();
|
|
addtoken("##", lineno, FileIndex);
|
|
++i;
|
|
}
|
|
else
|
|
temp += CurrentToken[i];
|
|
}
|
|
|
|
addtoken(temp.c_str(), lineno, FileIndex);
|
|
CurrentToken.clear();
|
|
|
|
if (ch == '\n')
|
|
{
|
|
++lineno;
|
|
continue;
|
|
}
|
|
else if (ch == ' ')
|
|
{
|
|
continue;
|
|
}
|
|
|
|
CurrentToken += ch;
|
|
// Add "++", "--" or ">>" token
|
|
if ((ch == '+' || ch == '-' || ch == '>') && (code.peek() == ch))
|
|
CurrentToken += (char)code.get();
|
|
addtoken(CurrentToken.c_str(), lineno, FileIndex);
|
|
CurrentToken.clear();
|
|
continue;
|
|
}
|
|
}
|
|
|
|
CurrentToken += ch;
|
|
}
|
|
addtoken(CurrentToken.c_str(), lineno, FileIndex);
|
|
|
|
}
|
|
|
|
void Tokenizer::simplifyTypedef()
|
|
{
|
|
std::string className;
|
|
int classLevel = 0;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "class %any%"))
|
|
{
|
|
className = tok->next()->str();
|
|
classLevel = 0;
|
|
continue;
|
|
}
|
|
else if (tok->str() == "}")
|
|
{
|
|
--classLevel;
|
|
if (classLevel < 0)
|
|
className = "";
|
|
|
|
continue;
|
|
}
|
|
else if (tok->str() == "{")
|
|
{
|
|
++classLevel;
|
|
continue;
|
|
}
|
|
else if (tok->str() != "typedef")
|
|
continue;
|
|
|
|
const char *type1 = 0;
|
|
const char *type2 = 0;
|
|
const char *typeName = 0;
|
|
bool pointer = false;
|
|
|
|
if (Token::Match(tok->next(), "%type% %type% ;") ||
|
|
Token::Match(tok->next(), "%type% %type% *| %type% ;"))
|
|
{
|
|
if (tok->tokAt(3)->str() == ";")
|
|
{
|
|
type1 = tok->strAt(1);
|
|
type2 = 0;
|
|
typeName = tok->strAt(2);
|
|
tok = tok->tokAt(3);
|
|
}
|
|
else
|
|
{
|
|
pointer = (tok->tokAt(3)->str() == "*");
|
|
|
|
type1 = tok->strAt(1);
|
|
type2 = tok->strAt(2);
|
|
|
|
if (pointer)
|
|
{
|
|
typeName = tok->strAt(4);
|
|
tok = tok->tokAt(5);
|
|
}
|
|
else
|
|
{
|
|
typeName = tok->strAt(3);
|
|
tok = tok->tokAt(4);
|
|
|
|
}
|
|
}
|
|
|
|
const std::string pattern = className + " :: " + typeName;
|
|
int level = 0;
|
|
bool inScope = true;
|
|
|
|
bool exitThisScope = false;
|
|
int exitScope = 0;
|
|
bool simplifyType = false;
|
|
for (Token *tok2 = tok; tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "}")
|
|
{
|
|
--level;
|
|
if (level < 0)
|
|
inScope = false;
|
|
|
|
if (exitThisScope)
|
|
{
|
|
if (level < exitScope)
|
|
exitThisScope = false;
|
|
}
|
|
}
|
|
else if (tok2->str() == "{")
|
|
++level;
|
|
else if (Token::Match(tok2, pattern.c_str()))
|
|
{
|
|
tok2->deleteNext();
|
|
tok2->deleteNext();
|
|
simplifyType = true;
|
|
}
|
|
else if (inScope && !exitThisScope && tok2->str() == typeName)
|
|
{
|
|
if (Token::Match(tok2->tokAt(-2), "!!typedef") &&
|
|
Token::Match(tok2->tokAt(-3), "!!typedef"))
|
|
{
|
|
simplifyType = true;
|
|
}
|
|
else
|
|
{
|
|
// Typedef with the same name.
|
|
exitThisScope = true;
|
|
exitScope = level;
|
|
}
|
|
}
|
|
|
|
if (simplifyType)
|
|
{
|
|
tok2->str(type1);
|
|
if (type2)
|
|
{
|
|
tok2->insertToken(type2);
|
|
tok2 = tok2->next();
|
|
}
|
|
if (pointer)
|
|
{
|
|
tok2->insertToken("*");
|
|
tok2 = tok2->next();
|
|
}
|
|
|
|
simplifyType = false;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
bool Tokenizer::tokenize(std::istream &code, const char FileName[])
|
|
{
|
|
// The "_files" vector remembers what files have been tokenized..
|
|
_files.push_back(FileLister::simplifyPath(FileName));
|
|
|
|
createTokens(code);
|
|
|
|
if (!createLinks())
|
|
{
|
|
// Source has syntax errors, can't proceed
|
|
return false;
|
|
}
|
|
|
|
simplifyDoWhileAddBraces();
|
|
simplifyIfAddBraces();
|
|
|
|
// Combine "- %num%" ..
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "[(+-*/=,] - %num%") && tok->strAt(2)[0] != '-')
|
|
{
|
|
tok->next()->str(std::string("-") + tok->strAt(2));
|
|
tok->next()->deleteNext();
|
|
}
|
|
|
|
if (Token::Match(tok, "return - %num%") && tok->strAt(2)[0] != '-')
|
|
{
|
|
tok->next()->str(std::string("-") + tok->strAt(2));
|
|
tok->next()->deleteNext();
|
|
}
|
|
}
|
|
|
|
// Combine tokens..
|
|
for (Token *tok = _tokens; tok && tok->next(); tok = tok->next())
|
|
{
|
|
static const char * const combineWithNext[][3] =
|
|
{
|
|
{ "<", "<", "<<" },
|
|
|
|
{ "&", "&", "&&" },
|
|
{ "|", "|", "||" },
|
|
|
|
{ "+", "=", "+=" },
|
|
{ "-", "=", "-=" },
|
|
{ "*", "=", "*=" },
|
|
{ "/", "=", "/=" },
|
|
{ "&", "=", "&=" },
|
|
{ "|", "=", "|=" },
|
|
|
|
{ "=", "=", "==" },
|
|
{ "!", "=", "!=" },
|
|
{ "<", "=", "<=" },
|
|
{ ">", "=", ">=" },
|
|
|
|
{ ":", ":", "::" },
|
|
{ "-", ">", "." }, // Replace "->" with "."
|
|
|
|
{ "private", ":", "private:" },
|
|
{ "protected", ":", "protected:" },
|
|
{ "public", ":", "public:" },
|
|
{ "__published", ":", "__published:" }
|
|
};
|
|
|
|
for (unsigned ui = 0; ui < sizeof(combineWithNext) / sizeof(combineWithNext[0]); ui++)
|
|
{
|
|
if (tok->str() == combineWithNext[ui][0] && tok->next()->str() == combineWithNext[ui][1])
|
|
{
|
|
tok->str(combineWithNext[ui][2]);
|
|
tok->deleteNext();
|
|
}
|
|
}
|
|
}
|
|
|
|
// typedef..
|
|
simplifyTypedef();
|
|
|
|
// Remove __asm..
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok->next(), "__asm|_asm|asm {") &&
|
|
tok->tokAt(2)->link() &&
|
|
tok->tokAt(2)->link()->next())
|
|
{
|
|
Token::eraseTokens(tok, tok->tokAt(2)->link()->next());
|
|
}
|
|
}
|
|
|
|
// Remove "volatile" and "mutable"
|
|
while (_tokens && (_tokens->str() == "volatile" || _tokens->str() == "mutable"))
|
|
{
|
|
_tokens->deleteThis();
|
|
}
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
while (tok->next() && (tok->next()->str() == "volatile" || tok->next()->str() == "mutable"))
|
|
{
|
|
tok->deleteNext();
|
|
}
|
|
}
|
|
|
|
// replace "unsigned i" with "unsigned int i"
|
|
unsignedint();
|
|
|
|
// Use "<" comparison instead of ">"
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "[;(] %any% >|>= %any% [);]"))
|
|
{
|
|
const std::string op1(tok->strAt(1));
|
|
tok->next()->str(tok->strAt(3));
|
|
tok->tokAt(3)->str(op1);
|
|
if (tok->tokAt(2)->str() == ">")
|
|
tok->tokAt(2)->str("<");
|
|
else
|
|
tok->tokAt(2)->str("<=");
|
|
}
|
|
}
|
|
|
|
/**
|
|
* @todo simplify "for"
|
|
* - move out start-statement "for (a;b;c);" => "{ a; for(;b;c); }"
|
|
* - try to change "for" loop to a "while" loop instead
|
|
*/
|
|
|
|
// Split up variable declarations.
|
|
simplifyVarDecl();
|
|
|
|
// Handle templates..
|
|
simplifyTemplates();
|
|
|
|
// Simplify the operator "?:"
|
|
simplifyConditionOperator();
|
|
|
|
// remove exception specifications..
|
|
removeExceptionSpecifications(_tokens);
|
|
|
|
setVarId();
|
|
|
|
return true;
|
|
}
|
|
//---------------------------------------------------------------------------
|
|
|
|
/**
|
|
* is the token pointing at a template parameters block..
|
|
* < int , 3 > => yes
|
|
* \param tok start token that must point at "<"
|
|
* \return true if the tokens look like template parameters
|
|
*/
|
|
static bool templateParameters(const Token *tok)
|
|
{
|
|
if (!tok)
|
|
return false;
|
|
if (tok->str() != "<")
|
|
return false;
|
|
tok = tok->next();
|
|
|
|
while (tok)
|
|
{
|
|
// num/type ..
|
|
if (!tok->isNumber() && !tok->isName())
|
|
return false;
|
|
tok = tok->next();
|
|
|
|
// optional "*"
|
|
if (tok->str() == "*")
|
|
tok = tok->next();
|
|
|
|
// ,/>
|
|
if (tok->str() == ">")
|
|
return true;
|
|
if (tok->str() != ",")
|
|
break;
|
|
tok = tok->next();
|
|
}
|
|
return false;
|
|
}
|
|
|
|
|
|
/**
|
|
* Remove "template < ..." they can cause false positives because they are not expanded
|
|
*/
|
|
static void removeTemplates(Token *tok)
|
|
{
|
|
for (; tok; tok = tok->next())
|
|
{
|
|
if (! Token::simpleMatch(tok, "template <"))
|
|
continue;
|
|
|
|
for (const Token *tok2 = tok->next(); tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "{")
|
|
{
|
|
tok2 = tok2->link();
|
|
tok2 = tok2 ? tok2->next() : 0;
|
|
Token::eraseTokens(tok, tok2);
|
|
tok->str(";");
|
|
break;
|
|
}
|
|
if (tok2->str() == "(")
|
|
{
|
|
tok2 = tok2->link();
|
|
if (!tok2)
|
|
break;
|
|
}
|
|
if (tok2->str() == ";")
|
|
{
|
|
Token::eraseTokens(tok, tok2->next());
|
|
tok->str(";");
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void Tokenizer::simplifyTemplates()
|
|
{
|
|
// Remove "typename" unless used in template arguments..
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "typename")
|
|
tok->deleteThis();
|
|
|
|
if (Token::simpleMatch(tok, "template <"))
|
|
{
|
|
while (tok && tok->str() != ">")
|
|
tok = tok->next();
|
|
if (!tok)
|
|
break;
|
|
}
|
|
}
|
|
|
|
std::set<std::string> expandedtemplates;
|
|
|
|
// Locate specialized templates..
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() != "template")
|
|
continue;
|
|
if (!Token::simpleMatch(tok->next(), "< >"))
|
|
continue;
|
|
|
|
// what kind of template is this?
|
|
Token *tok2 = tok->tokAt(3);
|
|
while (tok2 && (tok2->isName() || tok2->str() == "*"))
|
|
tok2 = tok2->next();
|
|
|
|
if (!templateParameters(tok2))
|
|
continue;
|
|
|
|
// unknown template.. bail out
|
|
if (!tok2->previous()->isName())
|
|
continue;
|
|
|
|
tok2 = tok2->previous();
|
|
std::string s;
|
|
{
|
|
std::ostringstream ostr;
|
|
const Token *tok3 = tok2;
|
|
for (tok3 = tok2; tok3 && tok3->str() != ">"; tok3 = tok3->next())
|
|
{
|
|
if (tok3 != tok2)
|
|
ostr << " ";
|
|
ostr << tok3->str();
|
|
}
|
|
if (!Token::Match(tok3, "> ("))
|
|
continue;
|
|
s = ostr.str();
|
|
}
|
|
|
|
// save search pattern..
|
|
const std::string pattern(s + " > (");
|
|
|
|
// remove spaces to create new name
|
|
while (s.find(" ") != std::string::npos)
|
|
s.erase(s.find(" "), 1);
|
|
const std::string name(s + ">");
|
|
expandedtemplates.insert(name);
|
|
|
|
// Rename template..
|
|
Token::eraseTokens(tok2, Token::findmatch(tok2, "("));
|
|
tok2->str(name);
|
|
|
|
// delete the "template < >"
|
|
tok->deleteThis();
|
|
tok->deleteThis();
|
|
tok->deleteThis();
|
|
|
|
// Use this special template in the code..
|
|
while (0 != (tok2 = const_cast<Token *>(Token::findmatch(tok2, pattern.c_str()))))
|
|
{
|
|
Token::eraseTokens(tok2, Token::findmatch(tok2, "("));
|
|
tok2->str(name);
|
|
}
|
|
}
|
|
|
|
// Locate templates..
|
|
std::list<Token *> templates;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::simpleMatch(tok, "template <"))
|
|
{
|
|
for (const Token *tok2 = tok; tok2; tok2 = tok2->next())
|
|
{
|
|
// Just a declaration => ignore this
|
|
if (tok2->str() == ";")
|
|
break;
|
|
|
|
// Implementation => add to "templates"
|
|
if (tok2->str() == "{")
|
|
{
|
|
templates.push_back(tok);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
if (templates.empty())
|
|
{
|
|
removeTemplates(_tokens);
|
|
return;
|
|
}
|
|
|
|
// Locate possible instantiations of templates..
|
|
std::list<Token *> used;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
// template definition.. skip it
|
|
if (Token::simpleMatch(tok, "template <"))
|
|
{
|
|
for (; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "{" || tok->str() == "(")
|
|
{
|
|
tok = tok->link();
|
|
if (!tok)
|
|
break;
|
|
if (tok->str() == "}")
|
|
break;
|
|
}
|
|
else if (tok->str() == ";")
|
|
{
|
|
break;
|
|
}
|
|
}
|
|
if (!tok)
|
|
break;
|
|
}
|
|
else if (Token::Match(tok->previous(), "[{};=] %var% <") ||
|
|
Token::Match(tok->tokAt(-2), "[,:] private|protected|public %var% <"))
|
|
{
|
|
if (templateParameters(tok->next()))
|
|
used.push_back(tok);
|
|
}
|
|
}
|
|
if (used.empty())
|
|
{
|
|
removeTemplates(_tokens);
|
|
return;
|
|
}
|
|
|
|
|
|
|
|
|
|
// Template arguments with default values
|
|
for (std::list<Token *>::iterator iter1 = templates.begin(); iter1 != templates.end(); ++iter1)
|
|
{
|
|
std::list<Token *> eq;
|
|
unsigned int templatepar = 1;
|
|
std::string classname;
|
|
for (Token *tok = *iter1; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == ">")
|
|
{
|
|
if (Token::Match(tok, "> class %var%"))
|
|
classname = tok->strAt(2);
|
|
break;
|
|
}
|
|
|
|
if (tok->str() == ",")
|
|
++templatepar;
|
|
|
|
else if (tok->str() == "=")
|
|
eq.push_back(tok);
|
|
}
|
|
if (eq.empty() || classname.empty())
|
|
continue;
|
|
|
|
for (std::list<Token *>::iterator iter2 = used.begin(); iter2 != used.end(); ++iter2)
|
|
{
|
|
Token *tok = *iter2;
|
|
|
|
if (!Token::Match(tok, (classname + " < %any%").c_str()))
|
|
continue;
|
|
|
|
// count the parameters..
|
|
unsigned int usedpar = 1;
|
|
for (tok = tok->tokAt(3); tok; tok = tok->tokAt(2))
|
|
{
|
|
if (tok->str() == ">")
|
|
break;
|
|
|
|
if (tok->str() == ",")
|
|
++usedpar;
|
|
|
|
else
|
|
break;
|
|
}
|
|
if (tok && tok->str() == ">")
|
|
{
|
|
tok = tok->previous();
|
|
std::list<Token *>::const_iterator it = eq.begin();
|
|
for (unsigned int i = (templatepar - eq.size()); it != eq.end() && i < usedpar; ++i)
|
|
++it;
|
|
while (it != eq.end())
|
|
{
|
|
tok->insertToken(",");
|
|
tok = tok->next();
|
|
tok->insertToken((*it)->strAt(1));
|
|
tok = tok->next();
|
|
++it;
|
|
}
|
|
}
|
|
}
|
|
|
|
for (std::list<Token *>::iterator it = eq.begin(); it != eq.end(); ++it)
|
|
{
|
|
(*it)->deleteThis();
|
|
(*it)->deleteThis();
|
|
}
|
|
}
|
|
|
|
|
|
// expand templates
|
|
bool done = false;
|
|
while (!done)
|
|
{
|
|
done = true;
|
|
for (std::list<Token *>::iterator iter1 = templates.begin(); iter1 != templates.end(); ++iter1)
|
|
{
|
|
Token *tok = *iter1;
|
|
|
|
std::vector<std::string> type;
|
|
for (tok = tok->tokAt(2); tok && tok->str() != ">"; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "%var% ,|>"))
|
|
type.push_back(tok->str());
|
|
}
|
|
|
|
// bail out if the end of the file was reached
|
|
if (!tok)
|
|
break;
|
|
|
|
// if this is a template function, get the position of the function name
|
|
unsigned int pos = 0;
|
|
if (Token::Match(tok, "> %type% *| %var% ("))
|
|
pos = 2;
|
|
else if (Token::Match(tok, "> %type% %type% *| %var% ("))
|
|
pos = 3;
|
|
if (pos > 0 && tok->tokAt(pos)->str() == "*")
|
|
++pos;
|
|
|
|
// name of template function/class..
|
|
const std::string name(tok->strAt(pos > 0 ? pos : 2));
|
|
|
|
const bool isfunc(pos > 0);
|
|
|
|
// locate template usage..
|
|
|
|
std::string s(name + " <");
|
|
for (unsigned int i = 0; i < type.size(); ++i)
|
|
{
|
|
if (i > 0)
|
|
s += ",";
|
|
s += " %any% ";
|
|
}
|
|
const std::string pattern(s + "> ");
|
|
|
|
std::string::size_type sz1 = used.size();
|
|
unsigned int recursiveCount = 0;
|
|
|
|
for (std::list<Token *>::iterator iter2 = used.begin(); iter2 != used.end(); ++iter2)
|
|
{
|
|
// If the size of "used" has changed, simplify calculations
|
|
if (sz1 != used.size())
|
|
{
|
|
sz1 = used.size();
|
|
simplifyCalculations();
|
|
recursiveCount++;
|
|
if (recursiveCount > 100)
|
|
{
|
|
// bail out..
|
|
break;
|
|
}
|
|
}
|
|
|
|
Token *tok2 = *iter2;
|
|
|
|
if (tok2->str() != name)
|
|
continue;
|
|
|
|
if (Token::Match(tok2->previous(), "[;{}=]") &&
|
|
!Token::Match(tok2, (pattern + (isfunc ? "(" : "%var%")).c_str()))
|
|
continue;
|
|
|
|
// New type..
|
|
std::vector<std::string> types2;
|
|
s = "";
|
|
for (const Token *tok3 = tok2->tokAt(2); tok3->str() != ">"; tok3 = tok3->next())
|
|
{
|
|
if (tok3->str() != ",")
|
|
types2.push_back(tok3->str());
|
|
s += tok3->str();
|
|
}
|
|
const std::string type2(s);
|
|
|
|
// New classname/funcname..
|
|
const std::string name2(name + "<" + type2 + ">");
|
|
|
|
if (expandedtemplates.find(name2) == expandedtemplates.end())
|
|
{
|
|
expandedtemplates.insert(name2);
|
|
// Copy template..
|
|
int _indentlevel = 0;
|
|
int _parlevel = 0;
|
|
for (const Token *tok3 = _tokens; tok3; tok3 = tok3->next())
|
|
{
|
|
if (tok3->str() == "{")
|
|
++_indentlevel;
|
|
else if (tok3->str() == "}")
|
|
--_indentlevel;
|
|
else if (tok3->str() == "(")
|
|
++_parlevel;
|
|
else if (tok3->str() == ")")
|
|
--_parlevel;
|
|
|
|
// Start of template..
|
|
if (tok3 == tok)
|
|
{
|
|
tok3 = tok3->next();
|
|
}
|
|
|
|
// member function implemented outside class definition
|
|
else if (_indentlevel == 0 && _parlevel == 0 && Token::Match(tok3, (pattern + " :: %var% (").c_str()))
|
|
{
|
|
addtoken(name2.c_str(), tok3->linenr(), tok3->fileIndex());
|
|
while (tok3->str() != "::")
|
|
tok3 = tok3->next();
|
|
}
|
|
|
|
// not part of template.. go on to next token
|
|
else
|
|
continue;
|
|
|
|
int indentlevel = 0;
|
|
std::stack<Token *> braces; // holds "{" tokens
|
|
std::stack<Token *> brackets; // holds "(" tokens
|
|
|
|
for (; tok3; tok3 = tok3->next())
|
|
{
|
|
if (tok3->str() == "{")
|
|
++indentlevel;
|
|
|
|
else if (tok3->str() == "}")
|
|
{
|
|
if (indentlevel <= 1)
|
|
{
|
|
// there is a bug if indentlevel is 0
|
|
// the "}" token should only be added if indentlevel is 1 but I add it always intentionally
|
|
// if indentlevel ever becomes 0, cppcheck will write:
|
|
// ### Error: Invalid number of character {
|
|
addtoken("}", tok3->linenr(), tok3->fileIndex());
|
|
Token::createMutualLinks(braces.top(), _tokensBack);
|
|
braces.pop();
|
|
break;
|
|
}
|
|
--indentlevel;
|
|
}
|
|
|
|
|
|
if (tok3->isName())
|
|
{
|
|
// search for this token in the type vector
|
|
unsigned int itype = 0;
|
|
while (itype < type.size() && type[itype] != tok3->str())
|
|
++itype;
|
|
|
|
// replace type with given type..
|
|
if (itype < type.size())
|
|
{
|
|
addtoken(types2[itype].c_str(), tok3->linenr(), tok3->fileIndex());
|
|
continue;
|
|
}
|
|
}
|
|
|
|
// replace name..
|
|
if (Token::Match(tok3, (name + " !!<").c_str()))
|
|
{
|
|
addtoken(name2.c_str(), tok3->linenr(), tok3->fileIndex());
|
|
continue;
|
|
}
|
|
|
|
// copy
|
|
addtoken(tok3->str().c_str(), tok3->linenr(), tok3->fileIndex());
|
|
if (Token::Match(tok3, "%type% <"))
|
|
{
|
|
if (!Token::Match(tok3, (name + " <").c_str()))
|
|
done = false;
|
|
used.push_back(_tokensBack);
|
|
}
|
|
|
|
// link() newly tokens manually
|
|
if (tok3->str() == "{")
|
|
{
|
|
braces.push(_tokensBack);
|
|
}
|
|
else if (tok3->str() == "}")
|
|
{
|
|
assert(braces.empty() == false);
|
|
Token::createMutualLinks(braces.top(), _tokensBack);
|
|
braces.pop();
|
|
}
|
|
else if (tok3->str() == "(")
|
|
{
|
|
brackets.push(_tokensBack);
|
|
}
|
|
else if (tok3->str() == ")")
|
|
{
|
|
assert(brackets.empty() == false);
|
|
Token::createMutualLinks(brackets.top(), _tokensBack);
|
|
brackets.pop();
|
|
}
|
|
|
|
}
|
|
|
|
assert(braces.empty());
|
|
assert(brackets.empty());
|
|
}
|
|
}
|
|
|
|
// Replace all these template usages..
|
|
s = name + " < " + type2 + " >";
|
|
for (std::string::size_type pos = s.find(","); pos != std::string::npos; pos = s.find(",", pos + 2))
|
|
{
|
|
s.insert(pos + 1, " ");
|
|
s.insert(pos, " ");
|
|
}
|
|
for (Token *tok4 = tok2; tok4; tok4 = tok4->next())
|
|
{
|
|
if (Token::simpleMatch(tok4, s.c_str()))
|
|
{
|
|
tok4->str(name2);
|
|
while (tok4->next()->str() != ">")
|
|
tok4->deleteNext();
|
|
tok4->deleteNext();
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
removeTemplates(_tokens);
|
|
}
|
|
//---------------------------------------------------------------------------
|
|
|
|
void Tokenizer::updateClassList()
|
|
{
|
|
const char pattern_class[] = "class %var% [{:]";
|
|
_classInfoList.clear();
|
|
|
|
// Locate class
|
|
const Token *tok1 = tokens();
|
|
while ((tok1 = Token::findmatch(tok1, pattern_class)) != 0)
|
|
{
|
|
const char *className;
|
|
className = tok1->strAt(1);
|
|
tok1 = tok1->next();
|
|
|
|
ClassInfo::MemberType memberType = ClassInfo::PRIVATE;
|
|
int indentlevel = 0;
|
|
for (const Token *tok = tok1; tok; tok = tok->next())
|
|
{
|
|
// Indentation
|
|
if (tok->str() == "{")
|
|
{
|
|
++indentlevel;
|
|
continue;
|
|
}
|
|
|
|
else if (tok->str() == "}")
|
|
{
|
|
--indentlevel;
|
|
if (indentlevel <= 0)
|
|
break;
|
|
|
|
continue;
|
|
}
|
|
|
|
// Parse class contents (indentlevel == 1)..
|
|
if (indentlevel == 1)
|
|
{
|
|
if (tok->str() == "private:")
|
|
memberType = ClassInfo::PRIVATE;
|
|
else if (tok->str() == "protected:")
|
|
memberType = ClassInfo::PROTECTED;
|
|
else if (tok->str() == "public:")
|
|
memberType = ClassInfo::PUBLIC;
|
|
|
|
else if (Token::Match(tok, "typedef %type% ("))
|
|
tok = tok->tokAt(2);
|
|
|
|
else if (Token::Match(tok, "[:,] %var% ("))
|
|
tok = tok->tokAt(2);
|
|
|
|
else if (Token::Match(tok, "%var% ("))
|
|
{
|
|
// member function
|
|
ClassInfo::MemberFunctionInfo func;
|
|
func._declaration = tok;
|
|
func._name = tok->str();
|
|
func._type = memberType;
|
|
|
|
_classInfoList[className]._memberFunctions.push_back(func);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
void Tokenizer::setVarId()
|
|
{
|
|
// Clear all variable ids
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
tok->varId(0);
|
|
|
|
// Set variable ids..
|
|
unsigned int _varId = 0;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok != _tokens && !Token::Match(tok, "[,;{}(] %type%"))
|
|
continue;
|
|
|
|
if (Token::Match(tok, "[,;{}(] %type%"))
|
|
tok = tok->next();
|
|
|
|
if (Token::Match(tok, "class|struct %type% :|{|;"))
|
|
continue;
|
|
|
|
if (Token::Match(tok, "else|return|typedef|delete|sizeof"))
|
|
continue;
|
|
|
|
if (Token::Match(tok, "const|static|extern|public:|private:|protected:"))
|
|
tok = tok->next();
|
|
|
|
while (Token::Match(tok, "%var% ::"))
|
|
tok = tok->tokAt(2);
|
|
|
|
// Skip template arguments..
|
|
if (Token::Match(tok, "%type% <"))
|
|
{
|
|
Token *tok2 = tok->tokAt(2);
|
|
|
|
while (Token::Match(tok2, "%var% ::"))
|
|
tok2 = tok2->tokAt(2);
|
|
|
|
while (tok2 && (tok2->isName() || tok2->isNumber() || tok2->str() == "*" || tok2->str() == ","))
|
|
tok2 = tok2->next();
|
|
|
|
if (Token::Match(tok2, "> %var%"))
|
|
tok = tok2;
|
|
else if (Token::Match(tok2, "> ::|*|& %var%"))
|
|
tok = tok2->next();
|
|
else
|
|
continue; // Not code that I understand / not a variable declaration
|
|
}
|
|
|
|
// Determine name of declared variable..
|
|
const char *varname = 0;
|
|
Token *tok2 = tok->tokAt(1);
|
|
while (tok2)
|
|
{
|
|
if (tok2->isName())
|
|
varname = tok2->strAt(0);
|
|
else if (tok2->str() != "*" && tok2->str() != "&")
|
|
break;
|
|
tok2 = tok2->next();
|
|
}
|
|
|
|
// End of tokens reached..
|
|
if (!tok2)
|
|
break;
|
|
|
|
// Is it a function?
|
|
if (tok2->str() == "(")
|
|
{
|
|
// Search for function declaration, e.g. void f();
|
|
if (Token::simpleMatch(tok2->next(), ") ;"))
|
|
continue;
|
|
|
|
// Search for function declaration, e.g. void f( int c );
|
|
if (Token::Match(tok2->next(), "%num%") ||
|
|
Token::Match(tok2->next(), "%bool%") ||
|
|
tok2->next()->str()[0] == '"' ||
|
|
tok2->next()->varId() != 0)
|
|
{
|
|
// This is not a function
|
|
}
|
|
else
|
|
{
|
|
continue;
|
|
}
|
|
}
|
|
|
|
// Variable declaration found => Set variable ids
|
|
if (Token::Match(tok2, "[,();[=]") && varname)
|
|
{
|
|
++_varId;
|
|
int indentlevel = 0;
|
|
int parlevel = 0;
|
|
bool dot = false;
|
|
bool funcDeclaration = false;
|
|
for (tok2 = tok->next(); tok2; tok2 = tok2->next())
|
|
{
|
|
if (!dot && tok2->str() == varname && !Token::Match(tok2->previous(), "struct|union"))
|
|
tok2->varId(_varId);
|
|
else if (tok2->str() == "{")
|
|
++indentlevel;
|
|
else if (tok2->str() == "}")
|
|
{
|
|
--indentlevel;
|
|
if (indentlevel < 0)
|
|
break;
|
|
|
|
// We have reached the end of a loop: "for( int i;;) { }"
|
|
if (funcDeclaration && indentlevel <= 0)
|
|
break;
|
|
}
|
|
else if (tok2->str() == "(")
|
|
++parlevel;
|
|
else if (tok2->str() == ")")
|
|
{
|
|
// Is this a function parameter or a variable declared in for example a for loop?
|
|
if (parlevel == 0 && indentlevel == 0 && Token::Match(tok2, ") const| {"))
|
|
funcDeclaration = true;
|
|
else
|
|
--parlevel;
|
|
}
|
|
else if (parlevel < 0 && tok2->str() == ";")
|
|
break;
|
|
dot = bool(tok2->str() == ".");
|
|
}
|
|
}
|
|
}
|
|
|
|
// Struct/Class members
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
// str.clear is a variable
|
|
// str.clear() is a member function
|
|
if (tok->varId() != 0 &&
|
|
Token::Match(tok->next(), ". %var% !!(") &&
|
|
tok->tokAt(2)->varId() == 0)
|
|
{
|
|
++_varId;
|
|
|
|
const std::string pattern(std::string("%varid% . ") + tok->strAt(2));
|
|
for (Token *tok2 = tok; tok2; tok2 = tok2->next())
|
|
{
|
|
if (Token::Match(tok2, pattern.c_str(), tok->varId()))
|
|
tok2->tokAt(2)->varId(_varId);
|
|
}
|
|
}
|
|
}
|
|
|
|
// Member functions in this source
|
|
std::list<Token *> allMemberFunctions;
|
|
{
|
|
const std::string funcpattern("%var% :: %var% (");
|
|
for (Token *tok2 = _tokens; tok2; tok2 = tok2->next())
|
|
{
|
|
// Found a class function..
|
|
if (Token::Match(tok2, funcpattern.c_str()))
|
|
{
|
|
allMemberFunctions.push_back(tok2);
|
|
}
|
|
}
|
|
}
|
|
|
|
// class members..
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "class %var% {"))
|
|
{
|
|
const std::string &classname(tok->next()->str());
|
|
|
|
|
|
// What member variables are there in this class?
|
|
std::map<std::string, unsigned int> varlist;
|
|
{
|
|
unsigned int indentlevel = 0;
|
|
for (const Token *tok2 = tok; tok2; tok2 = tok2->next())
|
|
{
|
|
// Indentation..
|
|
if (tok2->str() == "{")
|
|
++indentlevel;
|
|
else if (tok2->str() == "}")
|
|
{
|
|
if (indentlevel <= 1)
|
|
break;
|
|
--indentlevel;
|
|
}
|
|
|
|
// Found a member variable..
|
|
else if (indentlevel == 1 && tok2->varId() > 0)
|
|
varlist[tok2->str()] = tok2->varId();
|
|
}
|
|
}
|
|
|
|
// Are there any member variables in this class?
|
|
if (varlist.empty())
|
|
continue;
|
|
|
|
|
|
// Member functions for this class..
|
|
std::list<Token *> funclist;
|
|
{
|
|
const std::string funcpattern(classname + " :: %var% (");
|
|
for (std::list<Token *>::iterator func = allMemberFunctions.begin(); func != allMemberFunctions.end(); ++func)
|
|
{
|
|
Token *tok2 = *func;
|
|
|
|
// Found a class function..
|
|
if (Token::Match(tok2, funcpattern.c_str()))
|
|
{
|
|
// Goto the end paranthesis..
|
|
tok2 = tok2->tokAt(3)->link();
|
|
if (!tok2)
|
|
break;
|
|
|
|
// If this is a function implementation.. add it to funclist
|
|
if (Token::Match(tok2, ") const|volatile| {"))
|
|
funclist.push_back(tok2);
|
|
}
|
|
}
|
|
}
|
|
|
|
// Are there any member functions for this class?
|
|
if (funclist.empty())
|
|
continue;
|
|
|
|
// Update the variable ids..
|
|
// Parse each function..
|
|
for (std::list<Token *>::iterator func = funclist.begin(); func != funclist.end(); ++func)
|
|
{
|
|
unsigned int indentlevel = 0;
|
|
for (Token *tok2 = *func; tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "{")
|
|
++indentlevel;
|
|
else if (tok2->str() == "}")
|
|
{
|
|
if (indentlevel <= 1)
|
|
break;
|
|
--indentlevel;
|
|
}
|
|
else if (indentlevel > 0 &&
|
|
tok2->varId() == 0 &&
|
|
varlist.find(tok2->str()) != varlist.end())
|
|
{
|
|
tok2->varId(varlist[tok2->str()]);
|
|
}
|
|
}
|
|
}
|
|
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
//---------------------------------------------------------------------------
|
|
// Simplify token list
|
|
//---------------------------------------------------------------------------
|
|
|
|
void Tokenizer::simplifyNamespaces()
|
|
{
|
|
for (Token *token = _tokens; token; token = token->next())
|
|
{
|
|
while (token && token->str() == "namespace" &&
|
|
(!token->previous() || token->previous()->str() != "using"))
|
|
{
|
|
// Token is namespace and there is no "using" before it.
|
|
Token *start = token;
|
|
Token *tok = token->tokAt(2);
|
|
if (!tok)
|
|
return;
|
|
|
|
tok = tok->link();
|
|
if (tok && tok->str() == "}")
|
|
{
|
|
tok = tok->previous();
|
|
tok->deleteNext();
|
|
start->deleteNext();
|
|
start->deleteNext();
|
|
if (start->previous())
|
|
{
|
|
token = start->next();
|
|
start = start->previous();
|
|
start->deleteNext();
|
|
}
|
|
else
|
|
{
|
|
// First token in the list, don't delete
|
|
// as _tokens is attached to it.
|
|
start->deleteThis();
|
|
}
|
|
}
|
|
else
|
|
{
|
|
return;
|
|
}
|
|
}
|
|
|
|
if (!token)
|
|
break;
|
|
}
|
|
}
|
|
|
|
bool Tokenizer::createLinks()
|
|
{
|
|
std::list<Token*> links;
|
|
std::list<Token*> links2;
|
|
std::list<Token*> links3;
|
|
for (Token *token = _tokens; token; token = token->next())
|
|
{
|
|
if (token->link())
|
|
{
|
|
token->link(0);
|
|
}
|
|
|
|
if (token->str() == "{")
|
|
{
|
|
links.push_back(token);
|
|
}
|
|
else if (token->str() == "}")
|
|
{
|
|
if (links.size() == 0)
|
|
{
|
|
// Error, { and } don't match.
|
|
syntaxError(token, '{');
|
|
return false;
|
|
}
|
|
|
|
Token::createMutualLinks(links.back(), token);
|
|
links.pop_back();
|
|
}
|
|
else if (token->str() == "(")
|
|
{
|
|
links2.push_back(token);
|
|
}
|
|
else if (token->str() == ")")
|
|
{
|
|
if (links2.size() == 0)
|
|
{
|
|
// Error, ( and ) don't match.
|
|
syntaxError(token, '(');
|
|
return false;
|
|
}
|
|
|
|
Token::createMutualLinks(links2.back(), token);
|
|
links2.pop_back();
|
|
}
|
|
else if (token->str() == "[")
|
|
{
|
|
links3.push_back(token);
|
|
}
|
|
else if (token->str() == "]")
|
|
{
|
|
if (links3.size() == 0)
|
|
{
|
|
// Error, [ and ] don't match.
|
|
syntaxError(token, '[');
|
|
return false;
|
|
}
|
|
|
|
Token::createMutualLinks(links3.back(), token);
|
|
links3.pop_back();
|
|
}
|
|
}
|
|
|
|
if (links.size() > 0)
|
|
{
|
|
// Error, { and } don't match.
|
|
syntaxError(_tokens, '{');
|
|
return false;
|
|
}
|
|
|
|
if (links2.size() > 0)
|
|
{
|
|
// Error, ( and ) don't match.
|
|
syntaxError(_tokens, '(');
|
|
return false;
|
|
}
|
|
|
|
if (links3.size() > 0)
|
|
{
|
|
// Error, [ and ] don't match.
|
|
syntaxError(_tokens, '[');
|
|
return false;
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
void Tokenizer::simplifySizeof()
|
|
{
|
|
// Fill the map _typeSize..
|
|
_typeSize.clear();
|
|
_typeSize["char"] = sizeof(char);
|
|
_typeSize["short"] = sizeof(short);
|
|
_typeSize["int"] = sizeof(int);
|
|
_typeSize["long"] = sizeof(long);
|
|
_typeSize["float"] = sizeof(float);
|
|
_typeSize["double"] = sizeof(double);
|
|
_typeSize["*"] = sizeof(void *);
|
|
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "class|struct %var%"))
|
|
{
|
|
_typeSize[tok->strAt(1)] = 100;
|
|
}
|
|
}
|
|
|
|
// Locate variable declarations and calculate the size
|
|
std::map<unsigned int, std::string> sizeOfVar;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->varId() != 0 && sizeOfVar.find(tok->varId()) == sizeOfVar.end())
|
|
{
|
|
const unsigned int varId = tok->varId();
|
|
if (Token::Match(tok->tokAt(-3), "[;{}(,] %type% * %var% [;,)]") ||
|
|
Token::Match(tok->tokAt(-4), "[;{}(,] const %type% * %var% [;),]") ||
|
|
Token::Match(tok->tokAt(-2), "[;{}(,] %type% %var% [;),]") ||
|
|
Token::Match(tok->tokAt(-3), "[;{}(,] const %type% %var% [;),]"))
|
|
{
|
|
const unsigned int size = sizeOfType(tok->previous());
|
|
if (size == 0)
|
|
{
|
|
continue;
|
|
}
|
|
|
|
sizeOfVar[varId] = MathLib::toString<long>(size);
|
|
}
|
|
|
|
else if (Token::Match(tok->tokAt(-1), "%type% %var% [ %num% ] [;=]") ||
|
|
Token::Match(tok->tokAt(-2), "%type% * %var% [ %num% ] [;=]"))
|
|
{
|
|
unsigned int size = sizeOfType(tok->tokAt(-1));
|
|
if (size == 0)
|
|
continue;
|
|
|
|
sizeOfVar[varId] = MathLib::toString<long>(size * MathLib::toLongNumber(tok->strAt(2)));
|
|
}
|
|
|
|
else if (Token::Match(tok->tokAt(-1), "%type% %var% [ %num% ] [,)]") ||
|
|
Token::Match(tok->tokAt(-2), "%type% * %var% [ %num% ] [,)]"))
|
|
{
|
|
Token tempTok;
|
|
tempTok.str("*");
|
|
sizeOfVar[varId] = MathLib::toString<long>(sizeOfType(&tempTok));
|
|
}
|
|
|
|
else if (Token::Match(tok->tokAt(-1), "%type% %var% [ ] = %str% ;"))
|
|
{
|
|
unsigned int size = sizeOfType(tok->tokAt(4));
|
|
if (size == 0)
|
|
continue;
|
|
|
|
sizeOfVar[varId] = MathLib::toString<long>(size);
|
|
}
|
|
}
|
|
}
|
|
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() != "sizeof")
|
|
continue;
|
|
|
|
// sizeof "text"
|
|
if (Token::Match(tok->next(), "%str%"))
|
|
{
|
|
tok->deleteThis();
|
|
std::ostringstream ostr;
|
|
ostr << (Token::getStrLength(tok) + 1);
|
|
tok->str(ostr.str());
|
|
continue;
|
|
}
|
|
|
|
// sizeof ("text")
|
|
if (Token::Match(tok->next(), "( %str% )"))
|
|
{
|
|
tok->deleteThis();
|
|
tok->deleteThis();
|
|
tok->deleteNext();
|
|
std::ostringstream ostr;
|
|
ostr << (Token::getStrLength(tok) + 1);
|
|
tok->str(ostr.str());
|
|
continue;
|
|
}
|
|
|
|
// sizeof int -> sizeof( int )
|
|
if (tok->strAt(1) != std::string("("))
|
|
{
|
|
// Add parenthesis around the sizeof
|
|
for (Token *tempToken = tok->next(); tempToken; tempToken = tempToken->next())
|
|
{
|
|
if (Token::Match(tempToken, "%var%"))
|
|
{
|
|
while (tempToken->next()->str() == "[")
|
|
{
|
|
tempToken = tempToken->next()->link();
|
|
}
|
|
|
|
if (tempToken->next()->str() == ".")
|
|
{
|
|
// We are checking a class or struct, search next varname
|
|
tempToken = tempToken->tokAt(1);
|
|
continue;
|
|
}
|
|
else if (Token::simpleMatch(tempToken->next(), "- >"))
|
|
{
|
|
// We are checking a class or struct, search next varname
|
|
tempToken = tempToken->tokAt(2);
|
|
continue;
|
|
}
|
|
else if (Token::Match(tempToken->next(), "++|--"))
|
|
{
|
|
// We have variable++ or variable--, there should be
|
|
// nothing after this
|
|
tempToken = tempToken->tokAt(2);
|
|
}
|
|
|
|
// Ok, we should be clean. Add ) after tempToken
|
|
tok->insertToken("(");
|
|
tempToken->insertToken(")");
|
|
Token::createMutualLinks(tok->next(), tempToken->next());
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
// sizeof(type *) => sizeof(*)
|
|
if (Token::Match(tok->next(), "( %type% *)"))
|
|
{
|
|
tok->next()->deleteNext();
|
|
continue;
|
|
}
|
|
|
|
if (Token::Match(tok->next(), "( * )"))
|
|
{
|
|
tok->str(MathLib::toString<long>(sizeOfType(tok->tokAt(2))));
|
|
Token::eraseTokens(tok, tok->tokAt(4));
|
|
}
|
|
|
|
// sizeof( a )
|
|
else if (Token::Match(tok->next(), "( %var% )") && tok->tokAt(2)->varId() != 0)
|
|
{
|
|
if (sizeOfVar.find(tok->tokAt(2)->varId()) != sizeOfVar.end())
|
|
{
|
|
tok->deleteThis();
|
|
tok->deleteThis();
|
|
tok->deleteNext();
|
|
tok->str(sizeOfVar[tok->varId()]);
|
|
}
|
|
else
|
|
{
|
|
// don't try to replace size of variable if variable has
|
|
// similar name with type (#329)
|
|
}
|
|
}
|
|
|
|
else if (Token::Match(tok, "sizeof ( %type% )"))
|
|
{
|
|
unsigned int size = sizeOfType(tok->tokAt(2));
|
|
if (size > 0)
|
|
{
|
|
tok->str(MathLib::toString<long>(size));
|
|
Token::eraseTokens(tok, tok->tokAt(4));
|
|
}
|
|
}
|
|
|
|
else if (Token::Match(tok, "sizeof ( * %var% )") || Token::Match(tok, "sizeof ( %var% [ %num% ] )"))
|
|
{
|
|
// Some default value..
|
|
unsigned int sz = 0;
|
|
|
|
unsigned int varid = tok->tokAt((tok->tokAt(2)->str() == "*") ? 3 : 2)->varId();
|
|
if (varid != 0)
|
|
{
|
|
// Try to locate variable declaration..
|
|
const Token *decltok = Token::findmatch(_tokens, "%varid%", varid);
|
|
if (Token::Match(decltok->previous(), "%type% %var% ["))
|
|
{
|
|
sz = sizeOfType(decltok->previous());
|
|
}
|
|
else if (Token::Match(decltok->previous(), "* %var% ["))
|
|
{
|
|
sz = sizeOfType(decltok->previous());
|
|
}
|
|
else if (Token::Match(decltok->tokAt(-2), "%type% * %var%"))
|
|
{
|
|
sz = sizeOfType(decltok->tokAt(-2));
|
|
}
|
|
}
|
|
|
|
if (sz > 0)
|
|
{
|
|
tok->str(MathLib::toString<long>(sz));
|
|
Token::eraseTokens(tok, tok->next()->link()->next());
|
|
}
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
void Tokenizer::simplifyTokenList()
|
|
{
|
|
simplifyNamespaces();
|
|
|
|
simplifyGoto();
|
|
|
|
// Combine wide strings
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
while (tok->str() == "L" && tok->next() && tok->next()->str()[0] == '"')
|
|
{
|
|
// Combine 'L "string"'
|
|
tok->str(tok->next()->str());
|
|
tok->deleteNext();
|
|
}
|
|
}
|
|
|
|
// Combine strings
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str()[0] != '"')
|
|
continue;
|
|
|
|
tok->str(simplifyString(tok->str()));
|
|
while (tok->next() && tok->next()->str()[0] == '"')
|
|
{
|
|
tok->next()->str(simplifyString(tok->next()->str()));
|
|
|
|
// Two strings after each other, combine them
|
|
tok->concatStr(tok->next()->str());
|
|
tok->deleteNext();
|
|
}
|
|
}
|
|
|
|
// Convert e.g. atol("0") into 0
|
|
simplifyMathFunctions();
|
|
|
|
// Remove unwanted keywords
|
|
static const char * const unwantedWords[] = { "unsigned", "unlikely", "likely" };
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
for (unsigned ui = 0; ui < sizeof(unwantedWords) / sizeof(unwantedWords[0]) && tok->next(); ui++)
|
|
{
|
|
if (tok->next()->str() == unwantedWords[ui])
|
|
{
|
|
tok->deleteNext();
|
|
break;
|
|
}
|
|
}
|
|
if (Token::simpleMatch(tok->next(), "__builtin_expect ("))
|
|
{
|
|
unsigned int parlevel = 0;
|
|
for (Token *tok2 = tok->next(); tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "(")
|
|
++parlevel;
|
|
else if (tok2->str() == ")")
|
|
{
|
|
if (parlevel <= 1)
|
|
break;
|
|
--parlevel;
|
|
}
|
|
if (parlevel == 1 && tok2->str() == ",")
|
|
{
|
|
if (Token::Match(tok2, ", %num% )"))
|
|
{
|
|
tok->deleteNext();
|
|
Token::eraseTokens(tok2->previous(), tok2->tokAt(2));
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// Convert + + into + and + - into -
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
while (tok->next())
|
|
{
|
|
if (tok->str() == "+")
|
|
{
|
|
if (tok->next()->str() == "+")
|
|
{
|
|
tok->deleteNext();
|
|
continue;
|
|
}
|
|
else if (tok->next()->str() == "-")
|
|
{
|
|
tok->str("-");
|
|
tok->deleteNext();
|
|
continue;
|
|
}
|
|
}
|
|
else if (tok->str() == "-")
|
|
{
|
|
if (tok->next()->str() == "-")
|
|
{
|
|
tok->str("+");
|
|
tok->deleteNext();
|
|
continue;
|
|
}
|
|
else if (tok->next()->str() == "+")
|
|
{
|
|
tok->deleteNext();
|
|
continue;
|
|
}
|
|
}
|
|
|
|
break;
|
|
}
|
|
}
|
|
|
|
// 0[a] -> a[0]
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "%num% [ %var% ]"))
|
|
{
|
|
const std::string temp = tok->str();
|
|
tok->str(tok->tokAt(2)->str());
|
|
tok->tokAt(2)->str(temp);
|
|
}
|
|
}
|
|
|
|
simplifySizeof();
|
|
|
|
// change array to pointer..
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "%type% %var% [ ] [,;=]"))
|
|
{
|
|
Token::eraseTokens(tok->next(), tok->tokAt(4));
|
|
tok->insertToken("*");
|
|
}
|
|
}
|
|
|
|
// Replace constants..
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "const %type% %var% = %num% ;"))
|
|
{
|
|
unsigned int varId = tok->tokAt(2)->varId();
|
|
if (varId == 0)
|
|
{
|
|
tok = tok->tokAt(5);
|
|
continue;
|
|
}
|
|
|
|
const char *num = tok->strAt(4);
|
|
int indent = 1;
|
|
for (Token *tok2 = tok->tokAt(6); tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "{")
|
|
{
|
|
++indent;
|
|
}
|
|
else if (tok2->str() == "}")
|
|
{
|
|
--indent;
|
|
if (indent == 0)
|
|
break;
|
|
}
|
|
|
|
// Compare constants, but don't touch members of other structures
|
|
else if (tok2->varId() == varId)
|
|
{
|
|
tok2->str(num);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
simplifyLogicalOperators();
|
|
simplifyCasts();
|
|
|
|
// Simplify simple calculations..
|
|
while (simplifyCalculations())
|
|
;
|
|
|
|
// Replace "*(str + num)" => "str[num]"
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (! strchr(";{}(=<>", tok->str()[0]))
|
|
continue;
|
|
|
|
Token *next = tok->next();
|
|
if (! next)
|
|
break;
|
|
|
|
if (Token::Match(next, "* ( %var% + %num% )"))
|
|
{
|
|
const char *str[4] = {"var", "[", "num", "]"};
|
|
str[0] = tok->strAt(3);
|
|
str[2] = tok->strAt(5);
|
|
|
|
for (int i = 0; i < 4; i++)
|
|
{
|
|
tok = tok->next();
|
|
tok->str(str[i]);
|
|
}
|
|
|
|
tok->deleteNext();
|
|
tok->deleteNext();
|
|
}
|
|
}
|
|
|
|
// Simplify variable declarations
|
|
simplifyVarDecl();
|
|
|
|
// Replace NULL with 0..
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "NULL" || tok->str() == "'\\0'")
|
|
{
|
|
tok->str("0");
|
|
}
|
|
else if (tok->isNumber() &&
|
|
MathLib::isInt(tok->str()) &&
|
|
MathLib::toLongNumber(tok->str()) == 0)
|
|
{
|
|
tok->str("0");
|
|
}
|
|
}
|
|
|
|
// Replace pointer casts of 0.. "(char *)0" => "0"
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok->next(), "( %type% * ) 0") ||
|
|
Token::Match(tok->next(), "( %type% %type% * ) 0"))
|
|
{
|
|
Token::eraseTokens(tok, tok->next()->link()->next());
|
|
}
|
|
}
|
|
|
|
simplifyFunctionParameters();
|
|
|
|
elseif();
|
|
simplifyRedundantParanthesis();
|
|
simplifyIfNot();
|
|
simplifyIfNotNull();
|
|
simplifyIfAssign();
|
|
|
|
simplifyNestedStrcat();
|
|
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "case %any% : %var%"))
|
|
tok->tokAt(2)->insertToken(";");
|
|
if (Token::Match(tok, "default : %var%"))
|
|
tok->next()->insertToken(";");
|
|
}
|
|
|
|
// In case variable declarations have been updated...
|
|
setVarId();
|
|
|
|
bool modified = true;
|
|
while (modified)
|
|
{
|
|
modified = false;
|
|
modified |= simplifyConditions();
|
|
modified |= simplifyFunctionReturn();
|
|
modified |= simplifyKnownVariables();
|
|
modified |= removeReduntantConditions();
|
|
modified |= simplifyRedundantParanthesis();
|
|
modified |= simplifyQuestionMark();
|
|
modified |= simplifyCalculations();
|
|
}
|
|
|
|
// Remove redundant parantheses in return..
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
while (Token::simpleMatch(tok, "return ("))
|
|
{
|
|
Token *tok2 = tok->next()->link();
|
|
if (Token::simpleMatch(tok2, ") ;"))
|
|
{
|
|
tok->deleteNext();
|
|
tok2->deleteThis();
|
|
}
|
|
else
|
|
{
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
simplifyComma();
|
|
if (_settings && _settings->_debug)
|
|
{
|
|
_tokens->printOut();
|
|
}
|
|
}
|
|
//---------------------------------------------------------------------------
|
|
|
|
bool Tokenizer::removeReduntantConditions()
|
|
{
|
|
bool ret = false;
|
|
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() != "if")
|
|
continue;
|
|
|
|
if (!Token::Match(tok->tokAt(1), "( %bool% ) {"))
|
|
continue;
|
|
|
|
// Find matching else
|
|
const Token *elseTag = 0;
|
|
|
|
// Find the closing "}"
|
|
elseTag = tok->tokAt(4)->link()->next();
|
|
|
|
bool boolValue = false;
|
|
if (tok->tokAt(2)->str() == "true")
|
|
boolValue = true;
|
|
|
|
// Handle if with else
|
|
if (elseTag && elseTag->str() == "else")
|
|
{
|
|
if (Token::simpleMatch(elseTag->next(), "if ("))
|
|
{
|
|
// Handle "else if"
|
|
if (boolValue == false)
|
|
{
|
|
// Convert "if( false ) {aaa;} else if() {bbb;}" => "if() {bbb;}"
|
|
Token::eraseTokens(tok, elseTag->tokAt(2));
|
|
ret = true;
|
|
}
|
|
else
|
|
{
|
|
// Keep first if, remove every else if and else after it
|
|
const Token *lastTagInIf = elseTag->tokAt(2);
|
|
while (lastTagInIf)
|
|
{
|
|
if (lastTagInIf->str() == "(")
|
|
{
|
|
lastTagInIf = lastTagInIf->link()->next();
|
|
}
|
|
|
|
lastTagInIf = lastTagInIf->link()->next();
|
|
if (!Token::simpleMatch(lastTagInIf, "else"))
|
|
break;
|
|
|
|
lastTagInIf = lastTagInIf->next();
|
|
if (lastTagInIf->str() == "if")
|
|
lastTagInIf = lastTagInIf->next();
|
|
}
|
|
|
|
Token::eraseTokens(elseTag->previous(), lastTagInIf);
|
|
ret = true;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// Handle else
|
|
if (boolValue == false)
|
|
{
|
|
// Convert "if( false ) {aaa;} else {bbb;}" => "{bbb;}" or ";{bbb;}"
|
|
if (tok->previous())
|
|
tok = tok->previous();
|
|
else
|
|
tok->str(";");
|
|
|
|
Token::eraseTokens(tok, elseTag->tokAt(1));
|
|
}
|
|
else
|
|
{
|
|
if (elseTag->tokAt(1)->str() == "{")
|
|
{
|
|
// Convert "if( true ) {aaa;} else {bbb;}" => "{aaa;}"
|
|
const Token *end = elseTag->tokAt(1)->link();
|
|
|
|
// Remove the "else { aaa; }"
|
|
Token::eraseTokens(elseTag->previous(), end->tokAt(1));
|
|
}
|
|
|
|
// Remove "if( true )"
|
|
if (tok->previous())
|
|
tok = tok->previous();
|
|
else
|
|
tok->str(";");
|
|
|
|
Token::eraseTokens(tok, tok->tokAt(5));
|
|
}
|
|
|
|
ret = true;
|
|
}
|
|
}
|
|
|
|
// Handle if without else
|
|
else
|
|
{
|
|
if (boolValue == false)
|
|
{
|
|
// Remove if and its content
|
|
if (tok->previous())
|
|
tok = tok->previous();
|
|
else
|
|
tok->str(";");
|
|
|
|
Token::eraseTokens(tok, elseTag);
|
|
}
|
|
else
|
|
{
|
|
// convert "if( true ) {aaa;}" => "{aaa;}"
|
|
if (tok->previous())
|
|
tok = tok->previous();
|
|
else
|
|
tok->str(";");
|
|
|
|
Token::eraseTokens(tok, tok->tokAt(5));
|
|
}
|
|
|
|
ret = true;
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
void Tokenizer::simplifyIfAddBraces()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok ? tok->next() : NULL)
|
|
{
|
|
if (Token::Match(tok, "if|for|while ("))
|
|
{
|
|
// don't add "{}" around ";" in "do {} while();" (#609)
|
|
const Token *prev = tok->previous();
|
|
if (Token::simpleMatch(prev, "} while") &&
|
|
prev->link() &&
|
|
prev->link()->previous() &&
|
|
prev->link()->previous()->str() == "do")
|
|
{
|
|
continue;
|
|
}
|
|
|
|
// Goto the ending ')'
|
|
tok = tok->next()->link();
|
|
|
|
// ')' should be followed by '{'
|
|
if (!tok || Token::simpleMatch(tok, ") {"))
|
|
continue;
|
|
}
|
|
|
|
else if (tok->str() == "else")
|
|
{
|
|
// An else followed by an if or brace don't need to be processed further
|
|
if (Token::Match(tok, "else if|{"))
|
|
continue;
|
|
}
|
|
|
|
else
|
|
{
|
|
continue;
|
|
}
|
|
|
|
// If there is no code after he if(), abort
|
|
if (!tok->next())
|
|
return;
|
|
|
|
|
|
// insert open brace..
|
|
tok->insertToken("{");
|
|
tok = tok->next();
|
|
Token *tempToken = tok;
|
|
|
|
// insert close brace..
|
|
// In most cases it would work to just search for the next ';' and insert a closing brace after it.
|
|
// But here are special cases..
|
|
// * if (cond) for (;;) break;
|
|
// * if (cond1) if (cond2) { }
|
|
int parlevel = 0;
|
|
int indentlevel = 0;
|
|
while ((tempToken = tempToken->next()) != NULL)
|
|
{
|
|
if (tempToken->str() == "{")
|
|
++indentlevel;
|
|
|
|
else if (tempToken->str() == "}")
|
|
{
|
|
--indentlevel;
|
|
if (indentlevel == 0 && parlevel == 0)
|
|
break;
|
|
}
|
|
|
|
else if (tempToken->str() == "(")
|
|
++parlevel;
|
|
|
|
else if (tempToken->str() == ")")
|
|
--parlevel;
|
|
|
|
else if (indentlevel == 0 && parlevel == 0 && tempToken->str() == ";")
|
|
break;
|
|
}
|
|
|
|
if (tempToken)
|
|
{
|
|
tempToken->insertToken("}");
|
|
Token::createMutualLinks(tok, tempToken->next());
|
|
}
|
|
}
|
|
}
|
|
|
|
void Tokenizer::simplifyDoWhileAddBraces()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = (tok ? tok->next() : NULL))
|
|
{
|
|
if (! Token::Match(tok, "do !!{"))
|
|
{
|
|
continue;
|
|
}
|
|
|
|
Token *tok1 = tok; // token with "do"
|
|
Token *tok2 = NULL; // token with "while"
|
|
Token *tok3 = tok;
|
|
|
|
// skip loop body
|
|
while (tok3)
|
|
{
|
|
if (tok3->str() == "while")
|
|
{
|
|
tok2 = tok3;
|
|
break;
|
|
}
|
|
|
|
tok3 = tok3->next();
|
|
}
|
|
|
|
if (tok2)
|
|
{
|
|
// insert "{" after "do"
|
|
tok1->insertToken("{");
|
|
|
|
// insert "}" before "while"
|
|
tok2->previous()->insertToken("}");
|
|
|
|
Token::createMutualLinks(tok1->next(), tok2->previous());
|
|
}
|
|
}
|
|
}
|
|
|
|
void Tokenizer::simplifyConditionOperator()
|
|
{
|
|
int parlevel = 0;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "(")
|
|
++parlevel;
|
|
else if (tok->str() == ")")
|
|
--parlevel;
|
|
else if (parlevel == 0 && Token::Match(tok, "; %var% = %var% ? %var% : %var% ;"))
|
|
{
|
|
const std::string var(tok->strAt(1));
|
|
const std::string condition(tok->strAt(3));
|
|
const std::string value1(tok->strAt(5));
|
|
const std::string value2(tok->strAt(7));
|
|
|
|
Token::eraseTokens(tok, tok->tokAt(9));
|
|
|
|
std::string str("if ( " + condition + " ) { " + var + " = " + value1 + " ; } else { " + var + " = " + value2 + " ; }");
|
|
std::string::size_type pos1 = 0;
|
|
while (pos1 != std::string::npos)
|
|
{
|
|
std::string::size_type pos2 = str.find(" ", pos1);
|
|
if (pos2 == std::string::npos)
|
|
{
|
|
tok->insertToken(str.substr(pos1).c_str());
|
|
pos1 = pos2;
|
|
}
|
|
else
|
|
{
|
|
tok->insertToken(str.substr(pos1, pos2 - pos1).c_str());
|
|
pos1 = pos2 + 1;
|
|
}
|
|
tok = tok->next();
|
|
}
|
|
|
|
Token::createMutualLinks(tok->tokAt(-15), tok->tokAt(-13));
|
|
Token::createMutualLinks(tok->tokAt(-12), tok->tokAt(-7));
|
|
Token::createMutualLinks(tok->tokAt(-5), tok);
|
|
}
|
|
}
|
|
}
|
|
|
|
bool Tokenizer::simplifyConditions()
|
|
{
|
|
bool ret = false;
|
|
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "! %num%") || Token::Match(tok, "! %bool%"))
|
|
{
|
|
if (tok->next()->str() == "0" || tok->next()->str() == "false")
|
|
tok->str("true");
|
|
else
|
|
tok->str("false");
|
|
|
|
tok->deleteNext();
|
|
ret = true;
|
|
}
|
|
|
|
if (Token::simpleMatch(tok, "( true &&") ||
|
|
Token::simpleMatch(tok, "&& true &&") ||
|
|
Token::simpleMatch(tok->next(), "&& true )"))
|
|
{
|
|
Token::eraseTokens(tok, tok->tokAt(3));
|
|
ret = true;
|
|
}
|
|
|
|
else if (Token::simpleMatch(tok, "( false ||") ||
|
|
Token::simpleMatch(tok, "|| false ||") ||
|
|
Token::simpleMatch(tok->next(), "|| false )"))
|
|
{
|
|
Token::eraseTokens(tok, tok->tokAt(3));
|
|
ret = true;
|
|
}
|
|
|
|
// Change numeric constant in condition to "true" or "false"
|
|
if (Token::Match(tok, "if|while ( %num%") &&
|
|
(tok->tokAt(3)->str() == ")" || tok->tokAt(3)->str() == "||" || tok->tokAt(3)->str() == "&&"))
|
|
{
|
|
tok->tokAt(2)->str((tok->tokAt(2)->str() != "0") ? "true" : "false");
|
|
ret = true;
|
|
}
|
|
Token *tok2 = tok->tokAt(2);
|
|
if (tok2 &&
|
|
(tok->str() == "&&" || tok->str() == "||") &&
|
|
Token::Match(tok->next(), "%num%") &&
|
|
(tok2->str() == ")" || tok2->str() == "&&" || tok2->str() == "||"))
|
|
{
|
|
tok->next()->str((tok->next()->str() != "0") ? "true" : "false");
|
|
ret = true;
|
|
}
|
|
|
|
// Reduce "(%num% == %num%)" => "(true)"/"(false)"
|
|
const Token *tok4 = tok->tokAt(4);
|
|
if (! tok4)
|
|
break;
|
|
if ((tok->str() == "&&" || tok->str() == "||" || tok->str() == "(") &&
|
|
(Token::Match(tok->tokAt(1), "%num% %any% %num%") ||
|
|
Token::Match(tok->tokAt(1), "%bool% %any% %bool%")) &&
|
|
(tok4->str() == "&&" || tok4->str() == "||" || tok4->str() == ")" || tok4->str() == "?"))
|
|
{
|
|
std::string cmp = tok->strAt(2);
|
|
bool result = false;
|
|
if (Token::Match(tok->tokAt(1), "%num%"))
|
|
{
|
|
// Compare numbers
|
|
double op1 = (strstr(tok->strAt(1), "0x")) ? std::strtol(tok->strAt(1), 0, 16) : std::atof(tok->strAt(1));
|
|
double op2 = (strstr(tok->strAt(3), "0x")) ? std::strtol(tok->strAt(3), 0, 16) : std::atof(tok->strAt(3));
|
|
|
|
if (cmp == "==")
|
|
result = (op1 == op2);
|
|
else if (cmp == "!=")
|
|
result = (op1 != op2);
|
|
else if (cmp == ">=")
|
|
result = (op1 >= op2);
|
|
else if (cmp == ">")
|
|
result = (op1 > op2);
|
|
else if (cmp == "<=")
|
|
result = (op1 <= op2);
|
|
else if (cmp == "<")
|
|
result = (op1 < op2);
|
|
else
|
|
cmp = "";
|
|
}
|
|
else
|
|
{
|
|
// Compare boolean
|
|
bool op1 = (tok->strAt(1) == std::string("true"));
|
|
bool op2 = (tok->strAt(3) == std::string("true"));
|
|
|
|
if (cmp == "==")
|
|
result = (op1 == op2);
|
|
else if (cmp == "!=")
|
|
result = (op1 != op2);
|
|
else if (cmp == ">=")
|
|
result = (op1 >= op2);
|
|
else if (cmp == ">")
|
|
result = (op1 > op2);
|
|
else if (cmp == "<=")
|
|
result = (op1 <= op2);
|
|
else if (cmp == "<")
|
|
result = (op1 < op2);
|
|
else
|
|
cmp = "";
|
|
}
|
|
|
|
if (! cmp.empty())
|
|
{
|
|
tok = tok->next();
|
|
tok->deleteNext();
|
|
tok->deleteNext();
|
|
|
|
tok->str(result ? "true" : "false");
|
|
ret = true;
|
|
}
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
bool Tokenizer::simplifyQuestionMark()
|
|
{
|
|
bool ret = false;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() != "?")
|
|
continue;
|
|
|
|
if (!tok->tokAt(-2))
|
|
continue;
|
|
|
|
if (!Token::Match(tok->tokAt(-2), "[=,(]"))
|
|
continue;
|
|
|
|
if (!Token::Match(tok->previous(), "%bool%") &&
|
|
!Token::Match(tok->previous(), "%num%"))
|
|
continue;
|
|
|
|
// Find the ":" token..
|
|
Token *semicolon = 0;
|
|
{
|
|
unsigned int parlevel = 0;
|
|
for (Token *tok2 = tok; tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "(")
|
|
++parlevel;
|
|
else if (tok2->str() == ")")
|
|
{
|
|
if (parlevel == 0)
|
|
break;
|
|
--parlevel;
|
|
}
|
|
else if (parlevel == 0 && tok2->str() == ":")
|
|
{
|
|
semicolon = tok2;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
if (!semicolon || !semicolon->next())
|
|
continue;
|
|
|
|
if (tok->previous()->str() == "false" ||
|
|
tok->previous()->str() == "0")
|
|
{
|
|
// Use code after semicolon, remove code before it.
|
|
semicolon = semicolon->next();
|
|
tok = tok->tokAt(-2);
|
|
Token::eraseTokens(tok, semicolon);
|
|
|
|
tok = tok->next();
|
|
ret = true;
|
|
}
|
|
|
|
// The condition is true. Delete the operator after the ":"..
|
|
else
|
|
{
|
|
// delete the condition token and the "?"
|
|
tok = tok->tokAt(-2);
|
|
Token::eraseTokens(tok, tok->tokAt(3));
|
|
int ind = 0;
|
|
for (const Token *end = semicolon; end; end = end->next())
|
|
{
|
|
if (end->str() == ";")
|
|
{
|
|
Token::eraseTokens(semicolon->previous(), end->next());
|
|
ret = true;
|
|
break;
|
|
}
|
|
|
|
else if (end->str() == "(")
|
|
{
|
|
++ind;
|
|
}
|
|
|
|
else if (end->str() == ")")
|
|
{
|
|
--ind;
|
|
if (ind < 0)
|
|
{
|
|
Token::eraseTokens(semicolon->previous(), end);
|
|
ret = true;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
void Tokenizer::simplifyCasts()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
while (Token::Match(tok->next(), "( %type% *| ) *|&| %var%") ||
|
|
Token::Match(tok->next(), "( %type% %type% *| ) *|&| %var%"))
|
|
{
|
|
if (tok->isName() && tok->str() != "return")
|
|
break;
|
|
|
|
if (Token::simpleMatch(tok->previous(), "operator"))
|
|
break;
|
|
|
|
// Remove cast..
|
|
Token::eraseTokens(tok, tok->next()->link()->next());
|
|
|
|
if (tok->str() == ")" && tok->link()->previous())
|
|
{
|
|
// If there was another cast before this, go back
|
|
// there to check it also. e.g. "(int)(char)x"
|
|
tok = tok->link()->previous();
|
|
}
|
|
}
|
|
|
|
if (Token::Match(tok->next(), "dynamic_cast|reinterpret_cast|const_cast|static_cast <"))
|
|
{
|
|
Token *tok2 = tok->next();
|
|
unsigned int level = 0;
|
|
while (tok2)
|
|
{
|
|
if (tok2->str() == "<")
|
|
++level;
|
|
else if (tok2->str() == ">")
|
|
{
|
|
--level;
|
|
if (level == 0)
|
|
break;
|
|
}
|
|
tok2 = tok2->next();
|
|
}
|
|
|
|
if (Token::simpleMatch(tok2, "> ("))
|
|
{
|
|
Token *closeBracket = tok2->next()->link();
|
|
if (closeBracket)
|
|
{
|
|
Token::eraseTokens(tok, tok2->tokAt(2));
|
|
closeBracket->deleteThis();
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
void Tokenizer::simplifyFunctionParameters()
|
|
{
|
|
int indentlevel = 0;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "{")
|
|
++indentlevel;
|
|
|
|
else if (tok->str() == "}")
|
|
--indentlevel;
|
|
|
|
// Find the function e.g. foo( x ) or foo( x, y )
|
|
else if (indentlevel == 0 && Token::Match(tok, "%var% ( %var% [,)]"))
|
|
{
|
|
// We have found old style function, now we need to change it
|
|
|
|
// Get list of argument names
|
|
std::map<std::string, Token*> argumentNames;
|
|
bool bailOut = false;
|
|
for (tok = tok->tokAt(2); tok; tok = tok->tokAt(2))
|
|
{
|
|
if (!Token::Match(tok, "%var% [,)]"))
|
|
{
|
|
bailOut = true;
|
|
break;
|
|
}
|
|
|
|
if (argumentNames.find(tok->str()) != argumentNames.end())
|
|
{
|
|
// Invalid code, two arguments with the same name.
|
|
// TODO, print error perhaps?
|
|
bailOut = true;
|
|
break;
|
|
}
|
|
|
|
argumentNames[tok->str()] = tok;
|
|
if (tok->next()->str() == ")")
|
|
{
|
|
tok = tok->tokAt(2);
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (bailOut)
|
|
{
|
|
continue;
|
|
}
|
|
|
|
Token *start = tok;
|
|
while (tok && tok->str() != "{")
|
|
{
|
|
if (tok->str() == ";")
|
|
{
|
|
tok = tok->previous();
|
|
// Move tokens from start to tok into the place of
|
|
// argumentNames[tok->str()] and remove the ";"
|
|
|
|
if (argumentNames.find(tok->str()) == argumentNames.end())
|
|
{
|
|
bailOut = true;
|
|
break;
|
|
}
|
|
|
|
// Remove the following ";"
|
|
Token *temp = tok->tokAt(2);
|
|
tok->deleteNext();
|
|
|
|
// Replace "x" with "int x" or similar
|
|
Token::replace(argumentNames[tok->str()], start, tok);
|
|
argumentNames.erase(tok->str());
|
|
tok = temp;
|
|
start = tok;
|
|
}
|
|
else
|
|
{
|
|
tok = tok->next();
|
|
}
|
|
}
|
|
|
|
if (tok == NULL)
|
|
{
|
|
break;
|
|
}
|
|
|
|
if (bailOut)
|
|
{
|
|
continue;
|
|
}
|
|
|
|
++indentlevel;
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
bool Tokenizer::simplifyFunctionReturn()
|
|
{
|
|
bool ret = false;
|
|
int indentlevel = 0;
|
|
for (const Token *tok = tokens(); tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "{")
|
|
++indentlevel;
|
|
|
|
else if (tok->str() == "}")
|
|
--indentlevel;
|
|
|
|
else if (indentlevel == 0 && Token::Match(tok, "%var% ( ) { return %num% ; }"))
|
|
{
|
|
std::ostringstream pattern;
|
|
pattern << "[(=+-*/] " << tok->str() << " ( ) [;)+-*/]";
|
|
for (Token *tok2 = _tokens; tok2; tok2 = tok2->next())
|
|
{
|
|
if (Token::Match(tok2, pattern.str().c_str()))
|
|
{
|
|
tok2 = tok2->next();
|
|
tok2->str(tok->strAt(5));
|
|
tok2->deleteNext();
|
|
tok2->deleteNext();
|
|
ret = true;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
|
|
static void incdec(std::string &value, const std::string &op)
|
|
{
|
|
int ivalue = 0;
|
|
std::istringstream istr(value.c_str());
|
|
istr >> ivalue;
|
|
if (op == "++")
|
|
++ivalue;
|
|
else if (op == "--")
|
|
--ivalue;
|
|
std::ostringstream ostr;
|
|
ostr << ivalue;
|
|
value = ostr.str();
|
|
}
|
|
|
|
|
|
|
|
void Tokenizer::simplifyVarDecl()
|
|
{
|
|
// Split up variable declarations..
|
|
// "int a=4;" => "int a; a=4;"
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->previous() && !Token::Match(tok->previous(), "[{};)]"))
|
|
continue;
|
|
|
|
Token *type0 = tok;
|
|
if (!Token::Match(type0, "%type%"))
|
|
continue;
|
|
if (Token::Match(type0, "else|return"))
|
|
continue;
|
|
|
|
bool isconst = false;
|
|
bool isstatic = false;
|
|
Token *tok2 = type0;
|
|
unsigned int typelen = 1;
|
|
|
|
while (Token::Match(tok2, "%type% %type% *| *| %var%"))
|
|
{
|
|
if (tok2->str() == "const")
|
|
isconst = true;
|
|
|
|
else if (tok2->str() == "static")
|
|
isstatic = true;
|
|
|
|
tok2 = tok2->next();
|
|
++typelen;
|
|
}
|
|
|
|
// Don't split up const declaration..
|
|
if (isconst && Token::Match(tok2, "%type% %var% ="))
|
|
continue;
|
|
|
|
if (Token::Match(tok2, "%type% *| %var% ,|="))
|
|
{
|
|
const bool isPointer = (tok2->next()->str() == "*");
|
|
const Token *varName = tok2->tokAt((isPointer ? 2 : 1));
|
|
Token *endDeclaration = varName->next();
|
|
|
|
if (varName->str() != "operator")
|
|
{
|
|
tok2 = endDeclaration; // The ',' or '=' token
|
|
|
|
if (isstatic && tok2->str() == "=")
|
|
{
|
|
if (Token::Match(tok2->next(), "%num% ,"))
|
|
tok2 = tok2->tokAt(2);
|
|
else
|
|
tok2 = NULL;
|
|
}
|
|
}
|
|
else
|
|
tok2 = NULL;
|
|
}
|
|
|
|
else if (Token::Match(tok2, "%type% * * %var% ,|="))
|
|
{
|
|
if (tok2->tokAt(3)->str() != "operator")
|
|
tok2 = tok2->tokAt(4); // The ',' token
|
|
else
|
|
tok2 = NULL;
|
|
}
|
|
|
|
else if (Token::Match(tok2, "%type% * const %var% ,|="))
|
|
{
|
|
if (tok2->tokAt(3)->str() != "operator")
|
|
{
|
|
tok2 = tok2->tokAt(4); // The ',' token
|
|
}
|
|
else
|
|
{
|
|
tok2 = NULL;
|
|
}
|
|
}
|
|
|
|
else if (Token::Match(tok2, "%type% %var% [ %num% ] ,|=") ||
|
|
Token::Match(tok2, "%type% %var% [ %var% ] ,|="))
|
|
{
|
|
tok2 = tok2->tokAt(5); // The ',' token
|
|
|
|
if (tok2->str() == "=")
|
|
{
|
|
while (tok2 && tok2->str() != ",")
|
|
{
|
|
if (tok2->str() == "{")
|
|
tok2 = tok2->link();
|
|
|
|
tok2 = tok2->next();
|
|
|
|
if (tok2->str() == ";")
|
|
tok2 = NULL;
|
|
}
|
|
}
|
|
}
|
|
|
|
else if (Token::Match(tok2, "%type% * %var% [ %num% ] ,") ||
|
|
Token::Match(tok2, "%type% * %var% [ %var% ] ,"))
|
|
{
|
|
tok2 = tok2->tokAt(6); // The ',' token
|
|
}
|
|
|
|
else if (Token::Match(tok2, "std :: %type% <") || Token::Match(tok2, "%type% <"))
|
|
{
|
|
//
|
|
// Deal with templates and standart types
|
|
//
|
|
if (Token::simpleMatch(tok2, "std ::"))
|
|
{
|
|
typelen += 1;
|
|
tok2 = tok2->tokAt(2);
|
|
}
|
|
|
|
typelen += 2;
|
|
tok2 = tok2->tokAt(2);
|
|
size_t indentlevel = 1;
|
|
|
|
for (Token *tok3 = tok2; tok3; tok3 = tok3->next())
|
|
{
|
|
++typelen;
|
|
|
|
if (tok3->str() == "<")
|
|
{
|
|
++indentlevel;
|
|
}
|
|
else if (tok3->str() == ">")
|
|
{
|
|
--indentlevel;
|
|
if (indentlevel == 0)
|
|
{
|
|
tok2 = tok3->next();
|
|
break;
|
|
}
|
|
}
|
|
else if (tok3->str() == ";")
|
|
{
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (Token::Match(tok2, ":: %type%"))
|
|
{
|
|
typelen += 2;
|
|
tok2 = tok2->tokAt(2);
|
|
}
|
|
|
|
if (tok2->str() == "*" || tok2->str() == "&")
|
|
{
|
|
tok2 = tok2->next();
|
|
}
|
|
|
|
if (Token::Match(tok2, "%var% ,"))
|
|
{
|
|
tok2 = tok2->next(); // The ',' token
|
|
}
|
|
else
|
|
{
|
|
tok2 = NULL;
|
|
typelen = 0;
|
|
}
|
|
}
|
|
else
|
|
{
|
|
tok2 = NULL;
|
|
typelen = 0;
|
|
}
|
|
|
|
|
|
if (tok2)
|
|
{
|
|
if (tok2->str() == ",")
|
|
{
|
|
tok2->str(";");
|
|
insertTokens(tok2, type0, typelen);
|
|
}
|
|
|
|
else
|
|
{
|
|
Token *eq = tok2;
|
|
|
|
int parlevel = 0;
|
|
while (tok2)
|
|
{
|
|
if (Token::Match(tok2, "[{(<]"))
|
|
{
|
|
++parlevel;
|
|
}
|
|
|
|
else if (Token::Match(tok2, "[})>]"))
|
|
{
|
|
if (parlevel <= 0)
|
|
break;
|
|
--parlevel;
|
|
}
|
|
|
|
else if (parlevel == 0 && strchr(";,", tok2->str()[0]))
|
|
{
|
|
// "type var =" => "type var; var ="
|
|
Token *VarTok = type0->tokAt(typelen);
|
|
while (Token::Match(VarTok, "*|const"))
|
|
VarTok = VarTok->next();
|
|
insertTokens(eq, VarTok, 2);
|
|
eq->str(";");
|
|
|
|
// "= x, " => "= x; type "
|
|
if (tok2->str() == ",")
|
|
{
|
|
tok2->str(";");
|
|
insertTokens(tok2, type0, typelen);
|
|
}
|
|
break;
|
|
}
|
|
|
|
tok2 = tok2->next();
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
void Tokenizer::unsignedint()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (!Token::Match(tok, "unsigned|signed"))
|
|
continue;
|
|
|
|
if (Token::Match(tok->previous(), "%type% unsigned|signed %var% [;,=)]") &&
|
|
tok->previous()->isStandardType())
|
|
{
|
|
if (tok->str() == "signed")
|
|
{
|
|
// int signed a; -> int a;
|
|
tok = tok->previous();
|
|
tok->deleteNext();
|
|
}
|
|
else
|
|
{
|
|
// int unsigned a; -> unsigned int a;
|
|
std::string temp = tok->str();
|
|
tok->str(tok->previous()->str());
|
|
tok->previous()->str(temp);
|
|
}
|
|
|
|
continue;
|
|
}
|
|
|
|
// signed int a; -> int a;
|
|
if (Token::Match(tok, "signed %type% %var% [;,=)]"))
|
|
{
|
|
if (tok->next()->isStandardType())
|
|
{
|
|
tok->str(tok->next()->str());
|
|
tok->deleteNext();
|
|
continue;
|
|
}
|
|
}
|
|
|
|
// A variable declaration where the "int" is left out?
|
|
else if (!Token::Match(tok, "unsigned|signed %var% [;,=)]"))
|
|
continue;
|
|
|
|
// Previous token should either be a symbol or one of "{};(,"
|
|
if (tok->previous() &&
|
|
!tok->previous()->isName() &&
|
|
!Token::Match(tok->previous(), "[{};(,]"))
|
|
continue;
|
|
|
|
// next token should not be a standard type?
|
|
if (tok->next()->isStandardType())
|
|
{
|
|
if (tok->str() == "signed")
|
|
{
|
|
tok->str(tok->next()->str());
|
|
tok->deleteNext();
|
|
}
|
|
|
|
continue;
|
|
}
|
|
|
|
// The "int" is missing.. add it
|
|
if (tok->str() == "signed")
|
|
tok->str("int");
|
|
else
|
|
tok->insertToken("int");
|
|
}
|
|
}
|
|
|
|
|
|
void Tokenizer::simplifyIfAssign()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (!Token::Match(tok->next(), "if|while ( !| (| %var% =") &&
|
|
!Token::Match(tok->next(), "if|while ( !| (| %var% . %var% ="))
|
|
continue;
|
|
|
|
// simplifying a "while" condition ?
|
|
const bool iswhile(tok->next()->str() == "while");
|
|
|
|
// delete the "if"
|
|
tok->deleteNext();
|
|
|
|
// Remember if there is a "!" or not. And delete it if there are.
|
|
const bool isNot(tok->tokAt(2)->str() == "!");
|
|
if (isNot)
|
|
tok->next()->deleteNext();
|
|
|
|
// Delete paranthesis.. and remember how many there are with
|
|
// their links.
|
|
std::list<Token *> braces;
|
|
while (tok->next()->str() == "(")
|
|
{
|
|
braces.push_back(tok->next()->link());
|
|
tok->deleteNext();
|
|
}
|
|
|
|
// Skip the "%var% = ..."
|
|
Token *tok2;
|
|
unsigned int indentlevel = 0;
|
|
for (tok2 = tok->next(); tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "(")
|
|
++indentlevel;
|
|
else if (tok2->str() == ")")
|
|
{
|
|
if (indentlevel <= 0)
|
|
break;
|
|
--indentlevel;
|
|
}
|
|
}
|
|
|
|
// Insert "; if|while ( .."
|
|
tok2 = tok2->previous();
|
|
if (Token::simpleMatch(tok->tokAt(2), "."))
|
|
{
|
|
tok2->insertToken(tok->strAt(3));
|
|
tok2->insertToken(tok->strAt(2));
|
|
}
|
|
tok2->insertToken(tok->strAt(1));
|
|
|
|
while (! braces.empty())
|
|
{
|
|
tok2->insertToken("(");
|
|
Token::createMutualLinks(tok2->next(), braces.back());
|
|
braces.pop_back();
|
|
}
|
|
|
|
if (isNot)
|
|
tok2->next()->insertToken("!");
|
|
tok2->insertToken(iswhile ? "while" : "if");
|
|
tok2->insertToken(";");
|
|
|
|
// If it's a while loop.. insert the assignment in the loop
|
|
if (iswhile)
|
|
{
|
|
indentlevel = 0;
|
|
Token *tok3 = tok2;
|
|
for (tok3 = tok2; tok3; tok3 = tok3->next())
|
|
{
|
|
if (tok3->str() == "{")
|
|
++indentlevel;
|
|
else if (tok3->str() == "}")
|
|
{
|
|
if (indentlevel <= 1)
|
|
break;
|
|
--indentlevel;
|
|
}
|
|
}
|
|
|
|
if (tok3 && indentlevel == 1)
|
|
{
|
|
tok3 = tok3->previous();
|
|
for (tok2 = tok2->next(); tok2 && tok2 != tok; tok2 = tok2->previous())
|
|
{
|
|
tok3->insertToken(tok2->strAt(0));
|
|
|
|
Token *newTok = tok3->next();
|
|
newTok->fileIndex(tok2->fileIndex());
|
|
newTok->linenr(tok2->linenr());
|
|
|
|
// link() newly tokens manually
|
|
if (newTok->str() == ")")
|
|
{
|
|
braces.push_back(newTok);
|
|
}
|
|
else if (newTok->str() == "(")
|
|
{
|
|
Token::createMutualLinks(newTok, braces.back());
|
|
braces.pop_back();
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
|
|
void Tokenizer::simplifyIfNot()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "(" || tok->str() == "||" || tok->str() == "&&")
|
|
{
|
|
tok = tok->next();
|
|
while (tok && tok->str() == "(")
|
|
tok = tok->next();
|
|
|
|
if (!tok)
|
|
break;
|
|
|
|
if (Token::simpleMatch(tok, "0 == (") ||
|
|
Token::Match(tok, "0 == %var%"))
|
|
{
|
|
tok->deleteNext();
|
|
tok->str("!");
|
|
}
|
|
|
|
else if (Token::Match(tok, "%var% == 0"))
|
|
{
|
|
tok->deleteNext();
|
|
tok->next()->str(tok->str());
|
|
tok->str("!");
|
|
}
|
|
|
|
else if (Token::Match(tok, "%var% .|:: %var% == 0"))
|
|
{
|
|
tok = tok->previous();
|
|
tok->insertToken("!");
|
|
tok = tok->tokAt(4);
|
|
Token::eraseTokens(tok, tok->tokAt(3));
|
|
}
|
|
|
|
else if (Token::Match(tok, "* %var% == 0"))
|
|
{
|
|
tok = tok->previous();
|
|
tok->insertToken("!");
|
|
tok = tok->tokAt(3);
|
|
Token::eraseTokens(tok, tok->tokAt(3));
|
|
}
|
|
}
|
|
|
|
else if (tok->link() && Token::simpleMatch(tok, ") == 0"))
|
|
{
|
|
Token::eraseTokens(tok, tok->tokAt(3));
|
|
if (Token::Match(tok->link()->previous(), "%var%"))
|
|
{
|
|
// if( foo(x) == 0 )
|
|
tok->link()->previous()->insertToken(tok->link()->previous()->str().c_str());
|
|
tok->link()->previous()->previous()->str("!");
|
|
}
|
|
else
|
|
{
|
|
// if( (x) == 0 )
|
|
tok->link()->insertToken("(");
|
|
tok->link()->str("!");
|
|
Token *temp = tok->link();
|
|
Token::createMutualLinks(tok->link()->next(), tok);
|
|
temp->link(0);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
void Tokenizer::simplifyIfNotNull()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
Token *deleteFrom = NULL;
|
|
|
|
if (tok->str() == "(" || tok->str() == "||" || tok->str() == "&&")
|
|
{
|
|
tok = tok->next();
|
|
|
|
if (Token::simpleMatch(tok, "0 != (") ||
|
|
Token::Match(tok, "0 != %var%"))
|
|
{
|
|
deleteFrom = tok->previous();
|
|
}
|
|
|
|
else if (Token::Match(tok, "%var% != 0"))
|
|
{
|
|
deleteFrom = tok;
|
|
}
|
|
|
|
else if (Token::Match(tok, "%var% .|:: %var% != 0"))
|
|
{
|
|
tok = tok->tokAt(2);
|
|
deleteFrom = tok;
|
|
}
|
|
}
|
|
|
|
else if (tok->link() && Token::simpleMatch(tok, ") != 0"))
|
|
{
|
|
deleteFrom = tok;
|
|
}
|
|
|
|
if (deleteFrom)
|
|
{
|
|
Token::eraseTokens(deleteFrom, deleteFrom->tokAt(3));
|
|
tok = deleteFrom;
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
void Tokenizer::simplifyLogicalOperators()
|
|
{
|
|
// "if (not p)" => "if (!p)"
|
|
// "if (p and q)" => "if (p and q)"
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "if|while ( not %var%"))
|
|
{
|
|
tok->tokAt(2)->str("!");
|
|
}
|
|
else if (Token::Match(tok, "&& not %var%"))
|
|
{
|
|
tok->next()->str("!");
|
|
}
|
|
else if (Token::Match(tok, "|| not %var%"))
|
|
{
|
|
tok->next()->str("!");
|
|
}
|
|
// "%var%|) and %var%|("
|
|
else if (tok->str() == "and" &&
|
|
((Token::Match(tok->previous(), "%var%") || tok->previous()->str() == ")") ||
|
|
(Token::Match(tok->next(), "%var%") || tok->next()->str() == "(")))
|
|
{
|
|
tok->str("&&");
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
|
|
bool Tokenizer::simplifyKnownVariables()
|
|
{
|
|
bool ret = false;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
// Search for a block of code
|
|
if (! Token::Match(tok, ") const| {"))
|
|
continue;
|
|
|
|
// parse the block of code..
|
|
int indentlevel = 0;
|
|
for (Token *tok2 = tok; tok2; tok2 = tok2->next())
|
|
{
|
|
|
|
if (tok2->str() == "{")
|
|
++indentlevel;
|
|
|
|
else if (tok2->str() == "}")
|
|
{
|
|
--indentlevel;
|
|
if (indentlevel <= 0)
|
|
break;
|
|
}
|
|
|
|
else if (tok2->previous()->str() != "*" &&
|
|
(Token::Match(tok2, "%var% = %num% ;") ||
|
|
Token::Match(tok2, "%var% = %str% ;") ||
|
|
Token::Match(tok2, "%var% = %bool% ;") ||
|
|
Token::Match(tok2, "%var% = %var% ;")))
|
|
{
|
|
unsigned int varid = tok2->varId();
|
|
if (varid == 0)
|
|
continue;
|
|
|
|
const bool pointeralias(tok2->tokAt(2)->isName());
|
|
|
|
std::string value(tok2->strAt(2));
|
|
Token* bailOutFromLoop = 0;
|
|
int indentlevel3 = indentlevel; // indentlevel for tok3
|
|
for (Token *tok3 = tok2->next(); tok3; tok3 = tok3->next())
|
|
{
|
|
if (tok3->str() == "{")
|
|
{
|
|
++indentlevel3;
|
|
}
|
|
else if (tok3->str() == "}")
|
|
{
|
|
--indentlevel3;
|
|
if (indentlevel3 < indentlevel)
|
|
break;
|
|
}
|
|
|
|
if (pointeralias && Token::Match(tok3, ("!!= " + value).c_str()))
|
|
break;
|
|
|
|
// Stop if something like 'while (--var)' is found
|
|
if (tok3->str() == "while" || tok3->str() == "do")
|
|
{
|
|
const Token *endpar = tok3->next()->link();
|
|
bool bailout = false;
|
|
for (const Token *tok4 = tok3; tok4 && tok4 != endpar; tok4 = tok4->next())
|
|
{
|
|
if (Token::Match(tok4, "++|-- %varid%", varid) ||
|
|
Token::Match(tok4, "%varid% ++|--", varid))
|
|
{
|
|
bailout = true;
|
|
break;
|
|
}
|
|
}
|
|
if (bailout)
|
|
break;
|
|
}
|
|
|
|
if (bailOutFromLoop)
|
|
{
|
|
// This could be a loop, skip it, but only if it doesn't contain
|
|
// the variable we are checking for. If it contains the variable
|
|
// we will bail out.
|
|
if (tok3->varId() == varid)
|
|
{
|
|
// Continue
|
|
tok2 = bailOutFromLoop;
|
|
break;
|
|
}
|
|
else if (tok3 == bailOutFromLoop)
|
|
{
|
|
// We have skipped the loop
|
|
bailOutFromLoop = 0;
|
|
continue;
|
|
}
|
|
|
|
continue;
|
|
}
|
|
else if (tok3->str() == "{" && tok3->previous()->str() == ")")
|
|
{
|
|
// There is a possible loop after the assignment. Try to skip it.
|
|
bailOutFromLoop = tok3->link();
|
|
continue;
|
|
}
|
|
else if (tok3->str() == "}" && tok3->link() && tok3->link()->previous()->str() == ")")
|
|
{
|
|
// Assignment was in the middle of possible loop, bail out.
|
|
break;
|
|
}
|
|
|
|
// Variable is used somehow in a non-defined pattern => bail out
|
|
if (tok3->varId() == varid)
|
|
break;
|
|
|
|
// Using the variable in condition..
|
|
if (Token::Match(tok3, "(|!|==|!=|<|<=|>|>= %varid% )|==|!=|<|<=|>|>=", varid))
|
|
{
|
|
tok3 = tok3->next();
|
|
tok3->str(value);
|
|
ret = true;
|
|
}
|
|
|
|
// Variable is used in calculation..
|
|
if (Token::Match(tok3, "[=+-*/[] %varid% [?+-*/;]]", varid) ||
|
|
Token::Match(tok3, "[=+-*/[] %varid% <<", varid) ||
|
|
Token::Match(tok3, "<< %varid% [+-*/;]]", varid))
|
|
{
|
|
tok3 = tok3->next();
|
|
tok3->str(value);
|
|
ret = true;
|
|
}
|
|
|
|
if (Token::Match(tok3->next(), "%varid% ++|--", varid) && MathLib::isInt(value))
|
|
{
|
|
const std::string op(tok3->strAt(2));
|
|
if (Token::Match(tok3, "[{};] %any% %any% ;"))
|
|
{
|
|
Token::eraseTokens(tok3, tok3->tokAt(3));
|
|
}
|
|
else
|
|
{
|
|
tok3 = tok3->next();
|
|
tok3->str(value);
|
|
tok3->deleteNext();
|
|
}
|
|
incdec(value, op);
|
|
tok2->tokAt(2)->str(value);
|
|
ret = true;
|
|
}
|
|
|
|
if (Token::Match(tok3->next(), "++|-- %varid%", varid))
|
|
{
|
|
incdec(value, tok3->strAt(1));
|
|
tok2->tokAt(2)->str(value);
|
|
if (Token::Match(tok3, "[;{}] %any% %any% ;"))
|
|
{
|
|
Token::eraseTokens(tok3, tok3->tokAt(3));
|
|
}
|
|
else
|
|
{
|
|
tok3->deleteNext();
|
|
tok3->next()->str(value);
|
|
}
|
|
tok3 = tok3->next();
|
|
ret = true;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
|
|
void Tokenizer::elseif()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (!Token::simpleMatch(tok, "else if"))
|
|
continue;
|
|
int indent = 0;
|
|
for (Token *tok2 = tok; indent >= 0 && tok2; tok2 = tok2->next())
|
|
{
|
|
if (Token::Match(tok2, "(|{"))
|
|
++indent;
|
|
else if (Token::Match(tok2, ")|}"))
|
|
--indent;
|
|
|
|
if (indent == 0 && Token::Match(tok2, "}|;"))
|
|
{
|
|
if (tok2->next()->str() != "else")
|
|
{
|
|
tok->insertToken("{");
|
|
tok2->insertToken("}");
|
|
Token::createMutualLinks(tok->next(), tok2->next());
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
bool Tokenizer::simplifyRedundantParanthesis()
|
|
{
|
|
bool ret = false;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() != "(")
|
|
continue;
|
|
|
|
while (Token::simpleMatch(tok, "( (") &&
|
|
tok->link()->previous() == tok->next()->link())
|
|
{
|
|
// We have "(( *something* ))", remove the inner
|
|
// paranthesis
|
|
tok->deleteNext();
|
|
tok->link()->tokAt(-2)->deleteNext();
|
|
ret = true;
|
|
}
|
|
|
|
while (Token::Match(tok->previous(), "[;{] ( %var% (") &&
|
|
tok->link()->previous() == tok->tokAt(2)->link())
|
|
{
|
|
// We have "( func ( *something* ))", remove the outer
|
|
// paranthesis
|
|
tok->link()->deleteThis();
|
|
tok->deleteThis();
|
|
ret = true;
|
|
}
|
|
|
|
while (Token::Match(tok->previous(), "[;{] ( delete %var% ) ;"))
|
|
{
|
|
// We have "( delete var )", remove the outer
|
|
// paranthesis
|
|
tok->tokAt(3)->deleteThis();
|
|
tok->deleteThis();
|
|
ret = true;
|
|
}
|
|
|
|
while (Token::Match(tok->previous(), "[;{] ( delete [ ] %var% ) ;"))
|
|
{
|
|
// We have "( delete [] var )", remove the outer
|
|
// paranthesis
|
|
tok->tokAt(5)->deleteThis();
|
|
tok->deleteThis();
|
|
ret = true;
|
|
}
|
|
|
|
if (Token::Match(tok->previous(), "[(!*;}] ( %var% )") && tok->next()->varId() != 0)
|
|
{
|
|
// We have "( var )", remove the paranthesis
|
|
tok = tok->previous();
|
|
tok->deleteNext();
|
|
tok = tok->next();
|
|
tok->deleteNext();
|
|
ret = true;
|
|
continue;
|
|
}
|
|
|
|
if (Token::Match(tok, "( ( %bool% )") ||
|
|
Token::Match(tok, "( ( %num% )"))
|
|
{
|
|
tok->tokAt(2)->deleteNext();
|
|
tok->deleteNext();
|
|
ret = true;
|
|
}
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
bool Tokenizer::simplifyCalculations()
|
|
{
|
|
bool ret = false;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::simpleMatch(tok->next(), "* 1") || Token::simpleMatch(tok->next(), "1 *"))
|
|
{
|
|
Token::eraseTokens(tok, tok->tokAt(3));
|
|
ret = true;
|
|
}
|
|
|
|
// (1-2)
|
|
if (Token::Match(tok, "[[,(=<>+-*] %num% [+-*/] %num% [],);=<>+-*/]") ||
|
|
Token::Match(tok, "<< %num% [+-*/] %num% [],);=<>+-*/]") ||
|
|
Token::Match(tok, "[[,(=<>+-*] %num% [+-*/] %num% <<") ||
|
|
Token::Match(tok, "<< %num% [+-*/] %num% <<"))
|
|
{
|
|
tok = tok->next();
|
|
|
|
// Don't simplify "%num% / 0"
|
|
if (Token::simpleMatch(tok->next(), "/ 0"))
|
|
continue;
|
|
|
|
// + and - are calculated after *
|
|
if (Token::Match(tok->next(), "[+-]"))
|
|
{
|
|
if (tok->previous()->str() == "*")
|
|
continue;
|
|
if (Token::simpleMatch(tok->tokAt(3), "*"))
|
|
continue;
|
|
}
|
|
|
|
tok->str(MathLib::calculate(tok->str(), tok->tokAt(2)->str(), *(tok->strAt(1))));
|
|
|
|
Token::eraseTokens(tok, tok->tokAt(3));
|
|
|
|
// evaluate "2 + 2 - 2 - 2"
|
|
// as (((2 + 2) - 2) - 2) = 0
|
|
// instead of ((2 + 2) - (2 - 2)) = 4
|
|
if (Token::Match(tok->next(), "[+-*/]"))
|
|
{
|
|
tok = tok->tokAt(-2);
|
|
continue;
|
|
}
|
|
|
|
ret = true;
|
|
}
|
|
|
|
// Remove parantheses around number..
|
|
if (!tok->isName() && Token::Match(tok->next(), "( %num% )"))
|
|
{
|
|
tok->deleteNext();
|
|
tok = tok->next();
|
|
tok->deleteNext();
|
|
ret = true;
|
|
}
|
|
|
|
// Remove parantheses around variable..
|
|
// keep parantheses here: dynamic_cast<Fred *>(p);
|
|
// keep parantheses here: A operator * (int);
|
|
if (!tok->isName() && tok->str() != ">" && Token::Match(tok->next(), "( %var% ) [;),+-*/><]]") && !Token::simpleMatch(tok->previous(), "operator"))
|
|
{
|
|
tok->deleteNext();
|
|
tok = tok->next();
|
|
tok->deleteNext();
|
|
ret = true;
|
|
}
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
|
|
|
|
|
|
void Tokenizer::simplifyGoto()
|
|
{
|
|
std::list<Token *> gotos;
|
|
unsigned int indentlevel = 0;
|
|
Token *beginfunction = 0;
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "{")
|
|
{
|
|
if (beginfunction == 0 && indentlevel == 0 && tok->link())
|
|
tok = tok->link();
|
|
else
|
|
++indentlevel;
|
|
}
|
|
|
|
else if (tok->str() == "}")
|
|
{
|
|
if (indentlevel == 0)
|
|
break; // break out - it seems the code is wrong
|
|
--indentlevel;
|
|
if (indentlevel == 0)
|
|
{
|
|
gotos.clear();
|
|
beginfunction = 0;
|
|
}
|
|
}
|
|
|
|
else if (indentlevel == 0 && Token::Match(tok, ") const| {"))
|
|
{
|
|
gotos.clear();
|
|
beginfunction = tok;
|
|
}
|
|
|
|
else if (Token::Match(tok, "goto %var% ;"))
|
|
gotos.push_back(tok);
|
|
|
|
else if (indentlevel == 1 && Token::Match(tok->previous(), "[};] %var% :"))
|
|
{
|
|
// Is this label at the end..
|
|
bool end = false;
|
|
int lev = 0;
|
|
for (const Token *tok2 = tok->tokAt(2); tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "}")
|
|
{
|
|
--lev;
|
|
if (lev < 0)
|
|
{
|
|
end = true;
|
|
break;
|
|
}
|
|
}
|
|
else if (tok2->str() == "{")
|
|
{
|
|
++lev;
|
|
}
|
|
|
|
if (Token::Match(tok2, "%var% :"))
|
|
{
|
|
break;
|
|
}
|
|
}
|
|
if (!end)
|
|
continue;
|
|
|
|
const std::string name(tok->str());
|
|
|
|
tok->deleteThis();
|
|
tok->deleteThis();
|
|
|
|
// This label is at the end of the function.. replace all matching goto statements..
|
|
for (std::list<Token *>::iterator it = gotos.begin(); it != gotos.end(); ++it)
|
|
{
|
|
Token *token = *it;
|
|
if (token->next()->str() == name)
|
|
{
|
|
// Delete the "goto name;"
|
|
token = token->previous();
|
|
token->deleteNext();
|
|
token->deleteNext();
|
|
token->deleteNext();
|
|
|
|
// Insert the statements..
|
|
bool ret = false;
|
|
std::list<Token*> links;
|
|
std::list<Token*> links2;
|
|
std::list<Token*> links3;
|
|
int lev = 0;
|
|
for (const Token *tok2 = tok; tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "}")
|
|
{
|
|
--lev;
|
|
if (lev < 0)
|
|
break;
|
|
}
|
|
if (tok2->str() == "{")
|
|
{
|
|
++lev;
|
|
}
|
|
else if (tok2->str() == "return")
|
|
ret = true;
|
|
token->insertToken(tok2->str().c_str());
|
|
token = token->next();
|
|
if (token->str() == "(")
|
|
{
|
|
links.push_back(token);
|
|
}
|
|
else if (token->str() == ")")
|
|
{
|
|
if (links.size() == 0)
|
|
{
|
|
// This should never happen at this point
|
|
syntaxError(token, ')');
|
|
return;
|
|
}
|
|
|
|
Token::createMutualLinks(links.back(), token);
|
|
links.pop_back();
|
|
}
|
|
else if (token->str() == "{")
|
|
{
|
|
links2.push_back(token);
|
|
}
|
|
else if (token->str() == "}")
|
|
{
|
|
if (links2.size() == 0)
|
|
{
|
|
// This should never happen at this point
|
|
syntaxError(token, '}');
|
|
return;
|
|
}
|
|
|
|
Token::createMutualLinks(links2.back(), token);
|
|
links2.pop_back();
|
|
}
|
|
else if (token->str() == "[")
|
|
{
|
|
links3.push_back(token);
|
|
}
|
|
else if (token->str() == "]")
|
|
{
|
|
if (links3.size() == 0)
|
|
{
|
|
// This should never happen at this point
|
|
syntaxError(token, ']');
|
|
return;
|
|
}
|
|
|
|
Token::createMutualLinks(links3.back(), token);
|
|
links3.pop_back();
|
|
}
|
|
}
|
|
|
|
if (!ret)
|
|
{
|
|
token->insertToken("return");
|
|
token = token->next();
|
|
token->insertToken(";");
|
|
token = token->next();
|
|
}
|
|
}
|
|
}
|
|
|
|
gotos.clear();
|
|
tok = beginfunction;
|
|
indentlevel = 0;
|
|
continue;
|
|
}
|
|
}
|
|
}
|
|
|
|
void Tokenizer::simplifyNestedStrcat()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (! Token::Match(tok, "[;{}] strcat ( strcat ("))
|
|
{
|
|
continue;
|
|
}
|
|
|
|
// insert extracted function calls before first strcat call
|
|
Token *insertPos = tok;
|
|
|
|
// find inner strcat call
|
|
Token *tok2 = tok->tokAt(3);
|
|
while (Token::simpleMatch(tok2, "strcat ( strcat"))
|
|
{
|
|
tok2 = tok2->tokAt(2);
|
|
}
|
|
|
|
Token *end = tok2->next()->link()->next();
|
|
Token *endOfFirstArg = NULL;
|
|
std::stack<Token *> brackets;
|
|
unsigned int lineno = tok->next()->linenr();
|
|
|
|
// copy tokens to new place
|
|
for (Token *cur = tok2; cur != end; cur = cur->next())
|
|
{
|
|
insertPos->insertToken(cur->strAt(0));
|
|
insertPos = insertPos->next();
|
|
|
|
if (cur->str() == "," && endOfFirstArg == NULL)
|
|
{
|
|
endOfFirstArg = cur;
|
|
}
|
|
|
|
// preserve varId
|
|
if (cur->varId())
|
|
{
|
|
insertPos->varId(cur->varId());
|
|
}
|
|
|
|
// use line number of first strcat token for all new
|
|
// tokens
|
|
insertPos->linenr(lineno);
|
|
|
|
// linkify braces
|
|
if (insertPos->str() == "(")
|
|
{
|
|
brackets.push(insertPos);
|
|
}
|
|
else if (insertPos->str() == ")")
|
|
{
|
|
Token::createMutualLinks(brackets.top(), insertPos);
|
|
brackets.pop();
|
|
}
|
|
}
|
|
insertPos->insertToken(";");
|
|
|
|
// remove tokens at old place, but don't remove token with
|
|
// variable name (1st argument)
|
|
Token::eraseTokens(tok2->previous(), tok2->tokAt(2));
|
|
Token::eraseTokens(endOfFirstArg->previous(), end);
|
|
|
|
// skip just inserted tokens
|
|
tok = insertPos;
|
|
}
|
|
|
|
}
|
|
|
|
|
|
//---------------------------------------------------------------------------
|
|
// Helper functions for handling the tokens list
|
|
//---------------------------------------------------------------------------
|
|
|
|
|
|
|
|
//---------------------------------------------------------------------------
|
|
|
|
const Token *Tokenizer::getFunctionTokenByName(const char funcname[]) const
|
|
{
|
|
for (unsigned int i = 0; i < _functionList.size(); ++i)
|
|
{
|
|
if (_functionList[i]->str() == funcname)
|
|
{
|
|
return _functionList[i];
|
|
}
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
|
|
void Tokenizer::fillFunctionList()
|
|
{
|
|
_functionList.clear();
|
|
|
|
int indentlevel = 0;
|
|
for (const Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "{")
|
|
++indentlevel;
|
|
|
|
else if (tok->str() == "}")
|
|
--indentlevel;
|
|
|
|
if (indentlevel > 0)
|
|
{
|
|
continue;
|
|
}
|
|
|
|
if (Token::Match(tok, "%var% ("))
|
|
{
|
|
// Check if this is the first token of a function implementation..
|
|
for (const Token *tok2 = tok->tokAt(2); tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == ";")
|
|
{
|
|
tok = tok2;
|
|
break;
|
|
}
|
|
|
|
else if (tok2->str() == "{")
|
|
{
|
|
break;
|
|
}
|
|
|
|
else if (tok2->str() == ")")
|
|
{
|
|
if (Token::Match(tok2, ") const| {"))
|
|
{
|
|
_functionList.push_back(tok);
|
|
tok = tok2;
|
|
}
|
|
else
|
|
{
|
|
tok = tok2;
|
|
while (tok->next() && !strchr(";{", tok->strAt(1)[0]))
|
|
tok = tok->next();
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// If the _functionList functions with duplicate names, remove them
|
|
/** @todo handle when functions with the same name */
|
|
for (unsigned int func1 = 0; func1 < _functionList.size();)
|
|
{
|
|
bool hasDuplicates = false;
|
|
for (unsigned int func2 = func1 + 1; func2 < _functionList.size();)
|
|
{
|
|
if (_functionList[func1]->str() == _functionList[func2]->str())
|
|
{
|
|
hasDuplicates = true;
|
|
_functionList.erase(_functionList.begin() + func2);
|
|
}
|
|
else
|
|
{
|
|
++func2;
|
|
}
|
|
}
|
|
|
|
if (! hasDuplicates)
|
|
{
|
|
++func1;
|
|
}
|
|
else
|
|
{
|
|
_functionList.erase(_functionList.begin() + func1);
|
|
}
|
|
}
|
|
}
|
|
|
|
//---------------------------------------------------------------------------
|
|
|
|
// Deallocate lists..
|
|
void Tokenizer::deallocateTokens()
|
|
{
|
|
deleteTokens(_tokens);
|
|
_tokens = 0;
|
|
_tokensBack = 0;
|
|
_files.clear();
|
|
}
|
|
|
|
void Tokenizer::deleteTokens(Token *tok)
|
|
{
|
|
while (tok)
|
|
{
|
|
Token *next = tok->next();
|
|
delete tok;
|
|
tok = next;
|
|
}
|
|
}
|
|
|
|
//---------------------------------------------------------------------------
|
|
|
|
const char *Tokenizer::getParameterName(const Token *ftok, int par)
|
|
{
|
|
int _par = 1;
|
|
for (; ftok; ftok = ftok->next())
|
|
{
|
|
if (ftok->str() == ",")
|
|
++_par;
|
|
if (par == _par && Token::Match(ftok, "%var% [,)]"))
|
|
return ftok->str().c_str();
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
//---------------------------------------------------------------------------
|
|
|
|
std::string Tokenizer::fileLine(const Token *tok) const
|
|
{
|
|
std::ostringstream ostr;
|
|
ostr << "[" << _files.at(tok->fileIndex()) << ":" << tok->linenr() << "]";
|
|
return ostr.str();
|
|
}
|
|
|
|
std::string Tokenizer::file(const Token *tok) const
|
|
{
|
|
return _files.at(tok->fileIndex());
|
|
}
|
|
|
|
//---------------------------------------------------------------------------
|
|
|
|
const Token * Tokenizer::findClassFunction(const Token *tok, const char classname[], const char funcname[], int &indentlevel)
|
|
{
|
|
if (indentlevel < 0 || tok == NULL)
|
|
return NULL;
|
|
|
|
std::ostringstream classPattern;
|
|
classPattern << "class " << classname << " :|{";
|
|
|
|
std::ostringstream internalPattern;
|
|
internalPattern << funcname << " (";
|
|
|
|
std::ostringstream externalPattern;
|
|
externalPattern << classname << " :: " << funcname << " (";
|
|
|
|
for (; tok; tok = tok->next())
|
|
{
|
|
if (indentlevel == 0 && Token::Match(tok, classPattern.str().c_str()))
|
|
{
|
|
while (tok && tok->str() != "{")
|
|
tok = tok->next();
|
|
if (tok)
|
|
tok = tok->next();
|
|
if (! tok)
|
|
break;
|
|
indentlevel = 1;
|
|
}
|
|
|
|
if (tok->str() == "{")
|
|
{
|
|
// If indentlevel==0 don't go to indentlevel 1. Skip the block.
|
|
if (indentlevel > 0)
|
|
++indentlevel;
|
|
|
|
else
|
|
{
|
|
for (; tok; tok = tok->next())
|
|
{
|
|
if (tok->str() == "{")
|
|
++indentlevel;
|
|
else if (tok->str() == "}")
|
|
{
|
|
--indentlevel;
|
|
if (indentlevel <= 0)
|
|
break;
|
|
}
|
|
}
|
|
if (tok == NULL)
|
|
return NULL;
|
|
|
|
continue;
|
|
}
|
|
}
|
|
|
|
if (tok->str() == "}")
|
|
{
|
|
--indentlevel;
|
|
if (indentlevel < 0)
|
|
return NULL;
|
|
}
|
|
|
|
if (indentlevel == 1)
|
|
{
|
|
// Member function implemented in the class declaration?
|
|
if (tok->str() != "~" && Token::Match(tok->next(), internalPattern.str().c_str()))
|
|
{
|
|
const Token *tok2 = tok->next();
|
|
while (tok2 && tok2->str() != "{" && tok2->str() != ";")
|
|
tok2 = tok2->next();
|
|
if (tok2 && tok2->str() == "{")
|
|
return tok->next();
|
|
}
|
|
}
|
|
|
|
else if (indentlevel == 0 && Token::Match(tok, externalPattern.str().c_str()))
|
|
{
|
|
return tok;
|
|
}
|
|
}
|
|
|
|
// Not found
|
|
return NULL;
|
|
}
|
|
//---------------------------------------------------------------------------
|
|
// Error message for bad iterator usage..
|
|
|
|
void Tokenizer::syntaxError(const Token *tok, char c)
|
|
{
|
|
if (_settings && _settings->_debug)
|
|
{
|
|
_tokens->printOut();
|
|
}
|
|
|
|
if (!_errorLogger && tok)
|
|
{
|
|
std::ostringstream err;
|
|
err << "### Unlogged error at Tokenizer::syntaxError: Invalid number of character (" << c << ")";
|
|
if (_settings && _settings->_debug)
|
|
{
|
|
throw std::runtime_error(err.str());
|
|
}
|
|
else
|
|
{
|
|
std::cerr << err.str() << std::endl;
|
|
}
|
|
return;
|
|
}
|
|
|
|
std::list<ErrorLogger::ErrorMessage::FileLocation> locationList;
|
|
if (tok)
|
|
{
|
|
ErrorLogger::ErrorMessage::FileLocation loc;
|
|
loc.line = tok->linenr();
|
|
loc.file = file(tok);
|
|
locationList.push_back(loc);
|
|
}
|
|
|
|
const ErrorLogger::ErrorMessage errmsg(locationList,
|
|
"error",
|
|
std::string("Invalid number of character (") + c + "). Can't process file.",
|
|
"syntaxError");
|
|
|
|
if (_errorLogger)
|
|
_errorLogger->reportErr(errmsg);
|
|
else
|
|
Check::reportError(errmsg);
|
|
|
|
}
|
|
|
|
void Tokenizer::simplifyMathFunctions()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "atol ( %str% )"))
|
|
{
|
|
if (!MathLib::isInt(tok->tokAt(2)->strValue()))
|
|
{
|
|
// Ignore strings which we can't convert
|
|
continue;
|
|
}
|
|
|
|
if (tok->previous() &&
|
|
Token::simpleMatch(tok->previous()->previous(), "std ::"))
|
|
{
|
|
// Delete "std ::"
|
|
tok = tok->previous()->previous();
|
|
tok->deleteNext();
|
|
tok->deleteThis();
|
|
}
|
|
|
|
// Delete atol(
|
|
tok->deleteNext();
|
|
tok->deleteThis();
|
|
|
|
// Convert string into a number
|
|
tok->str(MathLib::toString(MathLib::toLongNumber(tok->strValue())));
|
|
|
|
// Delete remaining )
|
|
tok->deleteNext();
|
|
}
|
|
}
|
|
}
|
|
|
|
void Tokenizer::simplifyComma()
|
|
{
|
|
for (Token *tok = _tokens; tok; tok = tok->next())
|
|
{
|
|
if (Token::simpleMatch(tok, "for (") ||
|
|
Token::Match(tok, "=|enum {"))
|
|
{
|
|
tok = tok->next()->link();
|
|
if (!tok)
|
|
break;
|
|
|
|
continue;
|
|
}
|
|
|
|
// Skip unhandled template specifiers..
|
|
if (Token::Match(tok, "%var% <"))
|
|
{
|
|
// Todo.. use the link instead.
|
|
unsigned int parlevel = 0;
|
|
unsigned int comparelevel = 0;
|
|
for (Token *tok2 = tok; tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "<")
|
|
++comparelevel;
|
|
else if (tok2->str() == ">")
|
|
{
|
|
if (comparelevel <= 1)
|
|
{
|
|
tok = tok2;
|
|
break;
|
|
}
|
|
++comparelevel;
|
|
}
|
|
else if (tok2->str() == "(")
|
|
++parlevel;
|
|
else if (tok2->str() == ")")
|
|
{
|
|
if (parlevel == 0)
|
|
break;
|
|
--parlevel;
|
|
}
|
|
else if (Token::Match(tok2, "[;{}]"))
|
|
break;
|
|
}
|
|
}
|
|
|
|
// If token after the comma is a constant number, simplification is not required.
|
|
if (tok->str() != "," || Token::Match(tok->next(), "%num%"))
|
|
continue;
|
|
|
|
// We must not accept just any keyword, e.g. accepting int
|
|
// would cause function parameters to corrupt.
|
|
if (Token::Match(tok->next(), "delete"))
|
|
{
|
|
// Handle "delete a, delete b;"
|
|
tok->str(";");
|
|
}
|
|
|
|
if (tok->previous() && tok->previous()->previous())
|
|
{
|
|
if (Token::Match(tok->previous()->previous(), "delete") &&
|
|
tok->next()->varId() != 0)
|
|
{
|
|
// Handle "delete a, b;"
|
|
tok->str(";");
|
|
tok->insertToken("delete");
|
|
}
|
|
else
|
|
{
|
|
for (Token *tok2 = tok->previous(); tok2; tok2 = tok2->previous())
|
|
{
|
|
if (tok2->str() == "=")
|
|
{
|
|
// Handle "a = 0, b = 0;"
|
|
tok->str(";");
|
|
break;
|
|
}
|
|
else if (Token::Match(tok2, "delete %var%") ||
|
|
Token::Match(tok2, "delete [ ] %var%"))
|
|
{
|
|
// Handle "delete a, a = 0;"
|
|
tok->str(";");
|
|
break;
|
|
}
|
|
else if (Token::Match(tok2, "[;,{}()]"))
|
|
{
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
bool inReturn = false;
|
|
Token *startFrom = NULL; // next tokean after "; return"
|
|
Token *endAt = NULL; // first ";" token after "; return"
|
|
|
|
// find "; return" pattern before comma
|
|
for (Token *tok2 = tok; tok2; tok2 = tok2->previous())
|
|
{
|
|
if (Token::Match(tok2, "[;{}]"))
|
|
{
|
|
break;
|
|
|
|
}
|
|
else if (tok2->str() == "return" && Token::Match(tok2->previous(), "[;{}]"))
|
|
{
|
|
inReturn = true;
|
|
startFrom = tok2->next();
|
|
break;
|
|
}
|
|
}
|
|
|
|
// find token where return ends and also count commas
|
|
if (inReturn)
|
|
{
|
|
size_t commaCounter = 0;
|
|
size_t indentlevel = 0;
|
|
|
|
for (Token *tok2 = startFrom; tok2; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == ";")
|
|
{
|
|
endAt = tok2;
|
|
break;
|
|
|
|
}
|
|
else if (tok2->str() == "(")
|
|
{
|
|
++indentlevel;
|
|
|
|
}
|
|
else if (tok2->str() == ")")
|
|
{
|
|
--indentlevel;
|
|
|
|
}
|
|
else if (tok2->str() == "," && indentlevel == 0)
|
|
{
|
|
++commaCounter;
|
|
}
|
|
}
|
|
|
|
if (commaCounter)
|
|
{
|
|
indentlevel = 0;
|
|
|
|
// change tokens:
|
|
// "; return a ( ) , b ( ) , c ;"
|
|
// to
|
|
// "; return a ( ) ; b ( ) ; c ;"
|
|
for (Token *tok2 = startFrom; tok2 != endAt; tok2 = tok2->next())
|
|
{
|
|
if (tok2->str() == "(")
|
|
{
|
|
++indentlevel;
|
|
|
|
}
|
|
else if (tok2->str() == ")")
|
|
{
|
|
--indentlevel;
|
|
|
|
}
|
|
else if (tok2->str() == "," && indentlevel == 0)
|
|
{
|
|
tok2->str(";");
|
|
--commaCounter;
|
|
if (commaCounter == 0)
|
|
{
|
|
tok2->insertToken("return");
|
|
}
|
|
}
|
|
}
|
|
|
|
// delete old "return"
|
|
startFrom->previous()->deleteThis();
|
|
|
|
tok = endAt;
|
|
}
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
|
|
void Tokenizer::removeExceptionSpecifications(Token *tok) const
|
|
{
|
|
while (tok)
|
|
{
|
|
if (tok->str() == "{")
|
|
tok = tok->link();
|
|
|
|
else if (tok->str() == "}")
|
|
break;
|
|
|
|
else if (Token::Match(tok, ") throw ("))
|
|
{
|
|
while (tok->next() && !Token::Match(tok->next(), "[;{]"))
|
|
tok->deleteNext();
|
|
}
|
|
|
|
else if (Token::Match(tok, "class %type%"))
|
|
{
|
|
while (tok && !Token::Match(tok, "[;{]"))
|
|
tok = tok->next();
|
|
if (tok && tok->str() == "{")
|
|
{
|
|
removeExceptionSpecifications(tok->next());
|
|
tok = tok->link();
|
|
}
|
|
}
|
|
|
|
tok = tok ? tok->next() : 0;
|
|
}
|
|
}
|
|
|
|
|
|
|
|
bool Tokenizer::validate() const
|
|
{
|
|
std::stack<const Token *> linktok;
|
|
|
|
for (const Token *tok = tokens(); tok; tok = tok->next())
|
|
{
|
|
if (Token::Match(tok, "[{([]"))
|
|
{
|
|
assert(tok->link() != 0);
|
|
linktok.push(tok);
|
|
continue;
|
|
}
|
|
|
|
else if (Token::Match(tok, "[})]]"))
|
|
{
|
|
assert(tok->link() != 0);
|
|
assert(linktok.empty() == false);
|
|
assert(tok->link() == linktok.top());
|
|
assert(tok == tok->link()->link());
|
|
linktok.pop();
|
|
continue;
|
|
}
|
|
|
|
assert(tok->link() == 0);
|
|
}
|
|
|
|
assert(linktok.empty());
|
|
|
|
return true;
|
|
}
|
|
|
|
std::string Tokenizer::simplifyString(const std::string &source)
|
|
{
|
|
std::string str = source;
|
|
bool escaped = false;
|
|
for (std::string::size_type i = 0; i + 2 < str.size(); i++)
|
|
{
|
|
if (!escaped)
|
|
{
|
|
if (str[i] == '\\')
|
|
escaped = true;
|
|
|
|
continue;
|
|
}
|
|
|
|
if (str[i] == 'x')
|
|
{
|
|
// Hex value
|
|
if (str[i+1] == '0' && str[i+2] == '0')
|
|
str.replace(i, 3, "0");
|
|
else
|
|
{
|
|
// We will replace all other character as 'a'
|
|
// If that causes problems in the future, this can
|
|
// be improved. But for now, this should be OK.
|
|
int n = 1;
|
|
while (n < 2 && std::isxdigit(str[i+1+n]))
|
|
++n;
|
|
--i;
|
|
str.replace(i, 2 + n, "a");
|
|
}
|
|
}
|
|
else if (MathLib::isOctalDigit(str[i]))
|
|
{
|
|
if (MathLib::isOctalDigit(str[i+1]) &&
|
|
MathLib::isOctalDigit(str[i+2]))
|
|
{
|
|
if (str[i+1] == '0' && str[i+2] == '0')
|
|
str.replace(i, 3, "0");
|
|
else
|
|
{
|
|
// We will replace all other character as 'a'
|
|
// If that causes problems in the future, this can
|
|
// be improved. But for now, this should be OK.
|
|
--i;
|
|
str.replace(i, 4, "a");
|
|
}
|
|
}
|
|
}
|
|
|
|
escaped = false;
|
|
}
|
|
|
|
return str;
|
|
}
|
|
|
|
void Tokenizer::getErrorMessages()
|
|
{
|
|
syntaxError(0, ' ');
|
|
}
|