mirror of https://github.com/swig/swig
1434 lines
48 KiB
C++
1434 lines
48 KiB
C++
/* -----------------------------------------------------------------------------
|
|
* This file is part of SWIG, which is licensed as a whole under version 3
|
|
* (or any later version) of the GNU General Public License. Some additional
|
|
* terms also apply to certain portions of SWIG. The full details of the SWIG
|
|
* license and copyrights can be found in the LICENSE and COPYRIGHT files
|
|
* included with the SWIG source code as distributed by the SWIG developers
|
|
* and at http://www.swig.org/legal.html.
|
|
*
|
|
* doxyparser.cxx
|
|
* ----------------------------------------------------------------------------- */
|
|
|
|
#include "doxyparser.h"
|
|
#include "doxycommands.h"
|
|
#include "swig.h"
|
|
#include "swigwarn.h"
|
|
|
|
#include <iostream>
|
|
#include <algorithm>
|
|
#include <vector>
|
|
|
|
using std::string;
|
|
using std::cout;
|
|
using std::endl;
|
|
|
|
// This constant defines the (only) characters valid inside a Doxygen "word".
|
|
// It includes some unusual ones because of the commands such as \f[, \f{, \f],
|
|
// \f} and \f$.
|
|
static const char *DOXYGEN_WORD_CHARS = "abcdefghijklmnopqrstuvwxyz" "ABCDEFGHIJKLMNOPQRSTUVWXYZ" "0123456789" "$[]{}";
|
|
|
|
// Define static class members
|
|
DoxygenParser::DoxyCommandsMap DoxygenParser::doxygenCommands;
|
|
std::set<std::string> DoxygenParser::doxygenSectionIndicators;
|
|
|
|
const int TOKENSPERLINE = 8; //change this to change the printing behaviour of the token list
|
|
const std::string END_HTML_TAG_MARK("/");
|
|
|
|
DoxygenParser::DoxygenParser(bool noisy) : noisy(noisy) {
|
|
fillTables();
|
|
}
|
|
|
|
DoxygenParser::~DoxygenParser() {
|
|
}
|
|
|
|
void DoxygenParser::fillTables() {
|
|
// run it only once
|
|
if (doxygenCommands.size())
|
|
return;
|
|
|
|
// fill in tables with data from doxycommands.h
|
|
for (int i = 0; i < simpleCommandsSize; i++)
|
|
doxygenCommands[simpleCommands[i]] = SIMPLECOMMAND;
|
|
|
|
for (int i = 0; i < commandWordsSize; i++)
|
|
doxygenCommands[commandWords[i]] = COMMANDWORD;
|
|
|
|
for (int i = 0; i < commandLinesSize; i++)
|
|
doxygenCommands[commandLines[i]] = COMMANDLINE;
|
|
|
|
for (int i = 0; i < commandParagraphSize; i++)
|
|
doxygenCommands[commandParagraph[i]] = COMMANDPARAGRAPH;
|
|
|
|
for (int i = 0; i < commandEndCommandsSize; i++)
|
|
doxygenCommands[commandEndCommands[i]] = COMMANDENDCOMMAND;
|
|
|
|
for (int i = 0; i < commandWordParagraphsSize; i++)
|
|
doxygenCommands[commandWordParagraphs[i]] = COMMANDWORDPARAGRAPH;
|
|
|
|
for (int i = 0; i < commandWordLinesSize; i++)
|
|
doxygenCommands[commandWordLines[i]] = COMMANDWORDLINE;
|
|
|
|
for (int i = 0; i < commandWordOWordOWordsSize; i++)
|
|
doxygenCommands[commandWordOWordOWords[i]] = COMMANDWORDOWORDWORD;
|
|
|
|
for (int i = 0; i < commandOWordsSize; i++)
|
|
doxygenCommands[commandOWords[i]] = COMMANDOWORD;
|
|
|
|
for (int i = 0; i < commandErrorThrowingsSize; i++)
|
|
doxygenCommands[commandErrorThrowings[i]] = COMMANDERRORTHROW;
|
|
|
|
for (int i = 0; i < commandUniquesSize; i++)
|
|
doxygenCommands[commandUniques[i]] = COMMANDUNIQUE;
|
|
|
|
for (int i = 0; i < commandHtmlSize; i++)
|
|
doxygenCommands[commandHtml[i]] = COMMAND_HTML;
|
|
|
|
for (int i = 0; i < commandHtmlEntitiesSize; i++)
|
|
doxygenCommands[commandHtmlEntities[i]] = COMMAND_HTML_ENTITY;
|
|
|
|
// fill section indicators command set
|
|
for (int i = 0; i < sectionIndicatorsSize; i++)
|
|
doxygenSectionIndicators.insert(sectionIndicators[i]);
|
|
}
|
|
|
|
std::string DoxygenParser::stringToLower(const std::string &stringToConvert) {
|
|
|
|
string result(stringToConvert.size(), ' ');
|
|
|
|
for (size_t i = 0; i < result.size(); i++) {
|
|
result[i] = tolower(stringToConvert[i]);
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
bool DoxygenParser::isSectionIndicator(const std::string &smallString) {
|
|
|
|
std::set<std::string>::iterator it = doxygenSectionIndicators.find(stringToLower(smallString));
|
|
|
|
return it != doxygenSectionIndicators.end();
|
|
}
|
|
|
|
void DoxygenParser::printTree(const DoxygenEntityList &rootList) {
|
|
DoxygenEntityList::const_iterator p = rootList.begin();
|
|
while (p != rootList.end()) {
|
|
(*p).printEntity(0);
|
|
p++;
|
|
}
|
|
}
|
|
|
|
DoxygenParser::DoxyCommandEnum DoxygenParser::commandBelongs(const std::string &theCommand) {
|
|
DoxyCommandsMapIt it = doxygenCommands.find(stringToLower(theCommand));
|
|
|
|
if (it != doxygenCommands.end()) {
|
|
return it->second;
|
|
}
|
|
// Check if this command is defined as an alias.
|
|
if (Getattr(m_node, ("feature:doxygen:alias:" + theCommand).c_str())) {
|
|
return COMMAND_ALIAS;
|
|
}
|
|
// Check if this command should be ignored.
|
|
if (String *const ignore = getIgnoreFeature(theCommand)) {
|
|
// Check that no value is specified for this feature ("1" is the implicit
|
|
// one given to it by SWIG itself), we may use the value in the future, but
|
|
// for now we only use the attributes.
|
|
if (Strcmp(ignore, "1") != 0) {
|
|
Swig_warning(WARN_PP_UNEXPECTED_TOKENS, m_fileName.c_str(), m_fileLineNo,
|
|
"Feature \"doxygen:ignore\" value ignored for Doxygen command \"%s\".\n", theCommand.c_str());
|
|
}
|
|
// Also ensure that the matching end command, if any, will be recognized.
|
|
const string endCommand = getIgnoreFeatureEndCommand(theCommand);
|
|
if (!endCommand.empty()) {
|
|
Setattr(m_node, ("feature:doxygen:ignore:" + endCommand).c_str(), NewString("1"));
|
|
}
|
|
|
|
return COMMAND_IGNORE;
|
|
}
|
|
|
|
return NONE;
|
|
}
|
|
|
|
std::string DoxygenParser::trim(const std::string &text) {
|
|
size_t start = text.find_first_not_of(" \t");
|
|
size_t end = text.find_last_not_of(" \t");
|
|
|
|
if (start == string::npos || start > end) {
|
|
return "";
|
|
}
|
|
return text.substr(start, end - start + 1);
|
|
}
|
|
|
|
bool DoxygenParser::isEndOfLine() {
|
|
if (m_tokenListIt == m_tokenList.end()) {
|
|
return false;
|
|
}
|
|
Token nextToken = *m_tokenListIt;
|
|
return nextToken.m_tokenType == END_LINE;
|
|
}
|
|
|
|
void DoxygenParser::skipWhitespaceTokens() {
|
|
if (m_tokenListIt == m_tokenList.end()) {
|
|
return;
|
|
}
|
|
|
|
while (m_tokenListIt != m_tokenList.end()
|
|
&& (m_tokenListIt->m_tokenType == END_LINE || trim(m_tokenListIt->m_tokenString).empty())) {
|
|
|
|
m_tokenListIt++;
|
|
}
|
|
}
|
|
|
|
std::string DoxygenParser::getNextToken() {
|
|
|
|
if (m_tokenListIt == m_tokenList.end()) {
|
|
return "";
|
|
}
|
|
|
|
if (m_tokenListIt->m_tokenType == PLAINSTRING) {
|
|
return (m_tokenListIt++)->m_tokenString;
|
|
}
|
|
|
|
return "";
|
|
}
|
|
|
|
std::string DoxygenParser::getNextWord() {
|
|
|
|
/* if (m_tokenListIt == m_tokenList.end()) {
|
|
return "";
|
|
}
|
|
*/
|
|
while (m_tokenListIt != m_tokenList.end()
|
|
&& (m_tokenListIt->m_tokenType == PLAINSTRING)) {
|
|
// handle quoted strings as words
|
|
string token = m_tokenListIt->m_tokenString;
|
|
if (token == "\"") {
|
|
|
|
string word = m_tokenListIt->m_tokenString;
|
|
m_tokenListIt++;
|
|
while (true) {
|
|
string nextWord = getNextToken();
|
|
if (nextWord.empty()) { // maybe report unterminated string error
|
|
return word;
|
|
}
|
|
word += nextWord;
|
|
if (nextWord == "\"") {
|
|
return word;
|
|
}
|
|
}
|
|
}
|
|
|
|
string tokenStr = trim(m_tokenListIt->m_tokenString);
|
|
m_tokenListIt++;
|
|
if (!tokenStr.empty()) {
|
|
return tokenStr;
|
|
}
|
|
}
|
|
|
|
return "";
|
|
}
|
|
|
|
DoxygenParser::TokenListCIt DoxygenParser::getOneLine(const TokenList &tokList) {
|
|
|
|
TokenListCIt endOfLineIt = m_tokenListIt;
|
|
|
|
while (endOfLineIt != tokList.end()) {
|
|
if (endOfLineIt->m_tokenType == END_LINE) {
|
|
return endOfLineIt;
|
|
}
|
|
endOfLineIt++;
|
|
}
|
|
|
|
return tokList.end();
|
|
}
|
|
|
|
std::string DoxygenParser::getStringTilCommand(const TokenList &tokList) {
|
|
|
|
if (m_tokenListIt == tokList.end()) {
|
|
return "";
|
|
}
|
|
|
|
string description;
|
|
|
|
while (m_tokenListIt->m_tokenType == PLAINSTRING) {
|
|
const Token ¤tToken = *m_tokenListIt++;
|
|
if (currentToken.m_tokenType == PLAINSTRING) {
|
|
description = description + currentToken.m_tokenString; // + " ";
|
|
}
|
|
}
|
|
return description;
|
|
}
|
|
|
|
std::string DoxygenParser::getStringTilEndCommand(const std::string &theCommand, const TokenList &tokList) {
|
|
|
|
if (m_tokenListIt == tokList.end()) {
|
|
return "";
|
|
}
|
|
|
|
string description;
|
|
while (m_tokenListIt != tokList.end()) {
|
|
|
|
if (m_tokenListIt->m_tokenType == PLAINSTRING) {
|
|
description += m_tokenListIt->m_tokenString;
|
|
} else if (m_tokenListIt->m_tokenType == END_LINE) {
|
|
description += "\n";
|
|
} else if (m_tokenListIt->m_tokenString == theCommand) {
|
|
m_tokenListIt++;
|
|
return description;
|
|
}
|
|
|
|
m_tokenListIt++;
|
|
}
|
|
|
|
printListError(WARN_DOXYGEN_COMMAND_EXPECTED, "Expected Doxygen command: " + theCommand + ".");
|
|
|
|
return description;
|
|
}
|
|
|
|
DoxygenParser::TokenListCIt DoxygenParser::getEndOfParagraph(const TokenList &tokList) {
|
|
|
|
TokenListCIt endOfParagraph = m_tokenListIt;
|
|
|
|
while (endOfParagraph != tokList.end()) {
|
|
// If \code or \verbatim is encountered within a paragraph, then
|
|
// go all the way to the end of that command, since the content
|
|
// could contain empty lines that would appear to be paragraph
|
|
// ends:
|
|
if (endOfParagraph->m_tokenType == COMMAND &&
|
|
(endOfParagraph->m_tokenString == "code" ||
|
|
endOfParagraph->m_tokenString == "verbatim")) {
|
|
const string theCommand = endOfParagraph->m_tokenString;
|
|
endOfParagraph = getEndCommand("end" + theCommand, tokList);
|
|
endOfParagraph++; // Move after the end command
|
|
return endOfParagraph;
|
|
}
|
|
if (endOfParagraph->m_tokenType == END_LINE) {
|
|
endOfParagraph++;
|
|
if (endOfParagraph != tokList.end()
|
|
&& endOfParagraph->m_tokenType == END_LINE) {
|
|
endOfParagraph++;
|
|
//cout << "ENCOUNTERED END OF PARA" << endl;
|
|
return endOfParagraph;
|
|
}
|
|
|
|
} else if (endOfParagraph->m_tokenType == COMMAND) {
|
|
|
|
if (isSectionIndicator(endOfParagraph->m_tokenString)) {
|
|
return endOfParagraph;
|
|
} else {
|
|
endOfParagraph++;
|
|
}
|
|
|
|
} else if (endOfParagraph->m_tokenType == PLAINSTRING) {
|
|
endOfParagraph++;
|
|
} else {
|
|
return tokList.end();
|
|
}
|
|
}
|
|
|
|
return tokList.end();
|
|
}
|
|
|
|
DoxygenParser::TokenListCIt DoxygenParser::getEndOfSection(const std::string &theCommand, const TokenList &tokList) {
|
|
|
|
TokenListCIt endOfParagraph = m_tokenListIt;
|
|
|
|
while (endOfParagraph != tokList.end()) {
|
|
if (endOfParagraph->m_tokenType == COMMAND) {
|
|
if (theCommand == endOfParagraph->m_tokenString)
|
|
return endOfParagraph;
|
|
else
|
|
endOfParagraph++;
|
|
} else if (endOfParagraph->m_tokenType == PLAINSTRING) {
|
|
endOfParagraph++;
|
|
} else if (endOfParagraph->m_tokenType == END_LINE) {
|
|
endOfParagraph++;
|
|
if (endOfParagraph->m_tokenType == END_LINE) {
|
|
endOfParagraph++;
|
|
return endOfParagraph;
|
|
}
|
|
}
|
|
}
|
|
return tokList.end();
|
|
}
|
|
|
|
DoxygenParser::TokenListCIt DoxygenParser::getEndCommand(const std::string &theCommand, const TokenList &tokList) {
|
|
|
|
TokenListCIt endOfCommand = m_tokenListIt;
|
|
|
|
while (endOfCommand != tokList.end()) {
|
|
endOfCommand++;
|
|
if ((*endOfCommand).m_tokenType == COMMAND) {
|
|
if (theCommand == (*endOfCommand).m_tokenString) {
|
|
return endOfCommand;
|
|
}
|
|
}
|
|
}
|
|
//End command not found
|
|
return tokList.end();
|
|
}
|
|
|
|
void DoxygenParser::skipEndOfLine() {
|
|
if (m_tokenListIt != m_tokenList.end()
|
|
&& m_tokenListIt->m_tokenType == END_LINE) {
|
|
m_tokenListIt++;
|
|
}
|
|
}
|
|
|
|
void DoxygenParser::addSimpleCommand(const std::string &theCommand, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
doxyList.push_back(DoxygenEntity(theCommand));
|
|
}
|
|
|
|
void DoxygenParser::addCommandWord(const std::string &theCommand, const TokenList &, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
if (isEndOfLine()) {
|
|
// handles cases when command is at the end of line (for example "\c\nreally"
|
|
skipWhitespaceTokens();
|
|
doxyList.push_back(DoxygenEntity("plainstd::endl"));
|
|
}
|
|
std::string name = getNextWord();
|
|
if (!name.empty()) {
|
|
DoxygenEntityList aNewList;
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", name));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
} else {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No word followed the command. Command ignored.");
|
|
}
|
|
}
|
|
|
|
void DoxygenParser::addCommandLine(const std::string &theCommand, const TokenList &tokList, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
TokenListCIt endOfLine = getOneLine(tokList);
|
|
DoxygenEntityList aNewList = parse(endOfLine, tokList);
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
skipEndOfLine();
|
|
}
|
|
|
|
void DoxygenParser::addCommandParagraph(const std::string &theCommand, const TokenList &tokList, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
TokenListCIt endOfParagraph = getEndOfParagraph(tokList);
|
|
DoxygenEntityList aNewList;
|
|
aNewList = parse(endOfParagraph, tokList);
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
|
|
void DoxygenParser::addCommandEndCommand(const std::string &theCommand, const TokenList &tokList, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
TokenListCIt endCommand = getEndCommand("end" + theCommand, tokList);
|
|
if (endCommand == tokList.end()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_EXPECTED, "Expected Doxygen command: end" + theCommand + ".");
|
|
return;
|
|
}
|
|
DoxygenEntityList aNewList;
|
|
aNewList = parse(endCommand, tokList);
|
|
m_tokenListIt++;
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
|
|
void DoxygenParser::addCommandWordParagraph(const std::string &theCommand, const TokenList &tokList, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
std::string name = getNextWord();
|
|
|
|
if (name.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No word followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
TokenListCIt endOfParagraph = getEndOfParagraph(tokList);
|
|
DoxygenEntityList aNewList;
|
|
aNewList = parse(endOfParagraph, tokList);
|
|
aNewList.push_front(DoxygenEntity("plainstd::string", name));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
|
|
void DoxygenParser::addCommandWordLine(const std::string &theCommand, const TokenList &tokList, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
std::string name = getNextWord();
|
|
if (name.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No word followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
|
|
TokenListCIt endOfLine = getOneLine(tokList);
|
|
DoxygenEntityList aNewList;
|
|
aNewList = parse(endOfLine, tokList);
|
|
aNewList.push_front(DoxygenEntity("plainstd::string", name));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
//else cout << "No line followed " << theCommand << " command. Not added" << endl;
|
|
}
|
|
|
|
void DoxygenParser::addCommandWordOWordOWord(const std::string &theCommand, const TokenList &, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
std::string name = getNextWord();
|
|
if (name.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No word followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
std::string headerfile = getNextWord();
|
|
std::string headername = getNextWord();
|
|
DoxygenEntityList aNewList;
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", name));
|
|
if (!headerfile.empty())
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", headerfile));
|
|
if (!headername.empty())
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", headername));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
|
|
void DoxygenParser::addCommandOWord(const std::string &theCommand, const TokenList &, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
std::string name = getNextWord();
|
|
DoxygenEntityList aNewList;
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", name));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
|
|
void DoxygenParser::addCommandErrorThrow(const std::string &theCommand, const TokenList &tokList, DoxygenEntityList &) {
|
|
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": Unexpectedly encountered this command.");
|
|
m_tokenListIt = getOneLine(tokList);
|
|
}
|
|
|
|
void DoxygenParser::addCommandHtml(const std::string &theCommand, const TokenList &, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
std::string htmlTagArgs = getNextToken();
|
|
doxyList.push_back(DoxygenEntity(theCommand, htmlTagArgs));
|
|
}
|
|
|
|
void DoxygenParser::addCommandHtmlEntity(const std::string &theCommand, const TokenList &, DoxygenEntityList &doxyList) {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
DoxygenEntityList aNewList;
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
|
|
void DoxygenParser::addCommandUnique(const std::string &theCommand, const TokenList &tokList, DoxygenEntityList &doxyList) {
|
|
|
|
static std::map<std::string, std::string> endCommands;
|
|
DoxygenEntityList aNewList;
|
|
if (theCommand == "arg" || theCommand == "li") {
|
|
TokenListCIt endOfSection = getEndOfSection(theCommand, tokList);
|
|
DoxygenEntityList aNewList;
|
|
aNewList = parse(endOfSection, tokList);
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \xrefitem <key> "(heading)" "(std::list title)" {text}
|
|
else if (theCommand == "xrefitem") {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
std::string key = getNextWord();
|
|
if (key.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No key followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
std::string heading = getNextWord();
|
|
if (key.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No heading followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
std::string title = getNextWord();
|
|
if (title.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No title followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
TokenListCIt endOfParagraph = getEndOfParagraph(tokList);
|
|
aNewList = parse(endOfParagraph, tokList);
|
|
aNewList.push_front(DoxygenEntity("plainstd::string", title));
|
|
aNewList.push_front(DoxygenEntity("plainstd::string", heading));
|
|
aNewList.push_front(DoxygenEntity("plainstd::string", key));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \ingroup (<groupname> [<groupname> <groupname>])
|
|
else if (theCommand == "ingroup") {
|
|
std::string name = getNextWord();
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", name));
|
|
name = getNextWord();
|
|
if (!name.empty())
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", name));
|
|
name = getNextWord();
|
|
if (!name.empty())
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", name));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \par [(paragraph title)] { paragraph }
|
|
else if (theCommand == "par") {
|
|
TokenListCIt endOfLine = getOneLine(tokList);
|
|
aNewList = parse(endOfLine, tokList);
|
|
DoxygenEntityList aNewList2;
|
|
TokenListCIt endOfParagraph = getEndOfParagraph(tokList);
|
|
aNewList2 = parse(endOfParagraph, tokList);
|
|
aNewList.splice(aNewList.end(), aNewList2);
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \headerfile <header-file> [<header-name>]
|
|
else if (theCommand == "headerfile") {
|
|
DoxygenEntityList aNewList;
|
|
std::string name = getNextWord();
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", name));
|
|
name = getNextWord();
|
|
if (!name.empty())
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", name));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \overload [(function declaration)]
|
|
else if (theCommand == "overload") {
|
|
TokenListCIt endOfLine = getOneLine(tokList);
|
|
if (endOfLine != m_tokenListIt) {
|
|
DoxygenEntityList aNewList;
|
|
aNewList = parse(endOfLine, tokList);
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
} else
|
|
doxyList.push_back(DoxygenEntity(theCommand));
|
|
}
|
|
// \weakgroup <name> [(title)]
|
|
else if (theCommand == "weakgroup") {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
std::string name = getNextWord();
|
|
if (name.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No word followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
DoxygenEntityList aNewList;
|
|
TokenListCIt endOfLine = getOneLine(tokList);
|
|
if (endOfLine != m_tokenListIt) {
|
|
aNewList = parse(endOfLine, tokList);
|
|
}
|
|
aNewList.push_front(DoxygenEntity("plainstd::string", name));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \ref <name> ["(text)"]
|
|
else if (theCommand == "ref") {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
std::string name = getNextWord();
|
|
if (name.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No key followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
DoxygenEntityList aNewList;
|
|
aNewList.push_front(DoxygenEntity("plainstd::string", name));
|
|
// TokenListCIt endOfLine = getOneLine(tokList);
|
|
// if (endOfLine != m_tokenListIt) {
|
|
// aNewList = parse(endOfLine, tokList);
|
|
//}
|
|
TokenListCIt tmpIt = m_tokenListIt;
|
|
std::string refTitle = getNextWord();
|
|
// If title is following the ref tag, it must be quoted. Otherwise
|
|
// doxy puts link on ref id.
|
|
if (refTitle.size() > 1 && refTitle[0] == '"') {
|
|
// remove quotes
|
|
refTitle = refTitle.substr(1, refTitle.size() - 2);
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", refTitle));
|
|
} else {
|
|
// no quoted string is following, so we have to restore iterator
|
|
m_tokenListIt = tmpIt;
|
|
}
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \subpage <name> ["(text)"]
|
|
else if (theCommand == "subpage") {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
std::string name = getNextWord();
|
|
if (name.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No name followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
std::string text = getNextWord();
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", name));
|
|
if (!text.empty())
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", text));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \code ... \endcode
|
|
// \verbatim ... \endverbatim
|
|
// \dot dotcode \enddot
|
|
// \msc msccode \endmsc
|
|
// \f[ ... \f]
|
|
// \f{ ... \f}
|
|
// \f{env}{ ... \f}
|
|
// \f$ ... \f$
|
|
else if (theCommand == "code" || theCommand == "verbatim"
|
|
|| theCommand == "dot" || theCommand == "msc" || theCommand == "f[" || theCommand == "f{" || theCommand == "f$") {
|
|
if (!endCommands.size()) {
|
|
// fill in static table of end commands
|
|
endCommands["f["] = "f]";
|
|
endCommands["f{"] = "f}";
|
|
endCommands["f$"] = "f$";
|
|
}
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
std::string endCommand;
|
|
std::map<std::string, std::string>::iterator it;
|
|
it = endCommands.find(theCommand);
|
|
if (it != endCommands.end())
|
|
endCommand = it->second;
|
|
else
|
|
endCommand = "end" + theCommand;
|
|
|
|
std::string content = getStringTilEndCommand(endCommand, tokList);
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", content));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \dotfile <file> ["caption"]
|
|
// \mscfile <file> ["caption"]
|
|
else if (theCommand == "dotfile" || theCommand == "mscfile") {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
std::string file = getNextWord();
|
|
if (file.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No file followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
std::string caption = getNextWord();
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", file));
|
|
if (!caption.empty())
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", caption));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \image <format> <file> ["caption"] [<sizeindication>=<size>]
|
|
else if (theCommand == "image") {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
std::string format = getNextWord();
|
|
if (format.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No format followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
std::string file = getNextWord();
|
|
if (file.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No name followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
std::string caption = getNextWord();
|
|
std::string size = getNextWord();
|
|
|
|
DoxygenEntityList aNewList;
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", format));
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", file));
|
|
if (!caption.empty())
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", caption));
|
|
if (!size.empty())
|
|
aNewList.push_back(DoxygenEntity("plainstd::string", size));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
// \addtogroup <name> [(title)]
|
|
else if (theCommand == "addtogroup") {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
std::string name = getNextWord();
|
|
if (name.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": There should be at least one word following the command. Command ignored.");
|
|
return;
|
|
}
|
|
DoxygenEntityList aNewList;
|
|
TokenListCIt endOfLine = getOneLine(tokList);
|
|
if (endOfLine != m_tokenListIt) {
|
|
aNewList = parse(endOfLine, tokList);
|
|
}
|
|
aNewList.push_front(DoxygenEntity("plainstd::string", name));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
skipEndOfLine();
|
|
}
|
|
// \if <cond> [\else ...] [\elseif <cond> ...] \endif
|
|
else if (theCommand == "if" || theCommand == "ifnot" || theCommand == "else" || theCommand == "elseif") {
|
|
if (noisy)
|
|
cout << "Parsing " << theCommand << endl;
|
|
|
|
std::string cond;
|
|
bool skipEndif = false; // if true then we skip endif after parsing block of code
|
|
bool needsCond = (theCommand == "if" || theCommand == "ifnot" || theCommand == "elseif");
|
|
if (needsCond) {
|
|
cond = getNextWord();
|
|
if (cond.empty()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_ERROR, "Error parsing Doxygen command " + theCommand + ": No word followed the command. Command ignored.");
|
|
return;
|
|
}
|
|
}
|
|
|
|
int nestedCounter = 1;
|
|
TokenListCIt endCommand = tokList.end();
|
|
|
|
// go through the commands and find closing endif or else or elseif
|
|
for (TokenListCIt it = m_tokenListIt; it != tokList.end(); it++) {
|
|
if (it->m_tokenType == COMMAND) {
|
|
if (it->m_tokenString == "if" || it->m_tokenString == "ifnot")
|
|
nestedCounter++;
|
|
else if (it->m_tokenString == "endif")
|
|
nestedCounter--;
|
|
if (nestedCounter == 1 && (it->m_tokenString == "else" || it->m_tokenString == "elseif")) { // else found
|
|
endCommand = it;
|
|
break;
|
|
}
|
|
if (nestedCounter == 0) { // endif found
|
|
endCommand = it;
|
|
skipEndif = true;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
if (endCommand == tokList.end()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_EXPECTED, "Expected Doxygen command: endif.");
|
|
return;
|
|
}
|
|
|
|
DoxygenEntityList aNewList;
|
|
aNewList = parse(endCommand, tokList);
|
|
if (skipEndif)
|
|
m_tokenListIt++;
|
|
if (needsCond)
|
|
aNewList.push_front(DoxygenEntity("plainstd::string", cond));
|
|
doxyList.push_back(DoxygenEntity(theCommand, aNewList));
|
|
}
|
|
}
|
|
|
|
void DoxygenParser::aliasCommand(const std::string &theCommand, const TokenList &/* tokList */ , DoxygenEntityList &doxyList) {
|
|
String *const alias = Getattr(m_node, ("feature:doxygen:alias:" + theCommand).c_str());
|
|
if (!alias)
|
|
return;
|
|
|
|
doxyList.push_back(DoxygenEntity("plainstd::string", Char(alias)));
|
|
}
|
|
|
|
String *DoxygenParser::getIgnoreFeature(const std::string &theCommand, const char *argument) const {
|
|
string feature_name = "feature:doxygen:ignore:" + theCommand;
|
|
if (argument) {
|
|
feature_name += ':';
|
|
feature_name += argument;
|
|
}
|
|
|
|
return Getattr(m_node, feature_name.c_str());
|
|
}
|
|
|
|
string DoxygenParser::getIgnoreFeatureEndCommand(const std::string &theCommand) const {
|
|
// We may be dealing either with a simple command or with the starting command
|
|
// of a block, as indicated by the value of "range" starting with "end".
|
|
string endCommand;
|
|
if (String *const range = getIgnoreFeature(theCommand, "range")) {
|
|
const char *const p = Char(range);
|
|
if (strncmp(p, "end", 3) == 0) {
|
|
if (p[3] == ':') {
|
|
// Normally the end command name follows after the colon.
|
|
endCommand = p + 4;
|
|
} else if (p[3] == '\0') {
|
|
// But it may be omitted in which case the default Doxygen convention of
|
|
// using "something"/"endsomething" is used.
|
|
endCommand = "end" + theCommand;
|
|
}
|
|
}
|
|
}
|
|
|
|
return endCommand;
|
|
}
|
|
|
|
void DoxygenParser::ignoreCommand(const std::string &theCommand, const TokenList &tokList, DoxygenEntityList &doxyList) {
|
|
const string endCommand = getIgnoreFeatureEndCommand(theCommand);
|
|
if (!endCommand.empty()) {
|
|
TokenListCIt itEnd = getEndCommand(endCommand, tokList);
|
|
if (itEnd == tokList.end()) {
|
|
printListError(WARN_DOXYGEN_COMMAND_EXPECTED, "Expected Doxygen command: " + endCommand + ".");
|
|
return;
|
|
}
|
|
// If we ignore the command, also ignore any whitespace preceding it as we
|
|
// want to avoid having lines consisting of whitespace only or trailing
|
|
// whitespace in general (at least Python, with its pep8 tool, really
|
|
// doesn't like it).
|
|
if (!doxyList.empty()) {
|
|
DoxygenEntityList::iterator i = doxyList.end();
|
|
--i;
|
|
if (i->typeOfEntity == "plainstd::string" && i->data.find_first_not_of(" \t") == std::string::npos) {
|
|
doxyList.erase(i);
|
|
}
|
|
}
|
|
// Determine what to do with the part of the comment between the start and
|
|
// end commands: by default, we simply throw it away, but "contents"
|
|
// attribute may be used to change this.
|
|
if (String *const contents = getIgnoreFeature(theCommand, "contents")) {
|
|
// Currently only "parse" is supported but we may need to add "copy" to
|
|
// handle custom tags which contain text that is supposed to be copied
|
|
// verbatim in the future.
|
|
if (Strcmp(contents, "parse") == 0) {
|
|
DoxygenEntityList aNewList = parse(itEnd, tokList);
|
|
doxyList.splice(doxyList.end(), aNewList);
|
|
} else {
|
|
Swig_error(m_fileName.c_str(), m_fileLineNo, "Invalid \"doxygen:ignore\" feature \"contents\" attribute \"%s\".\n", Char(contents));
|
|
return;
|
|
}
|
|
}
|
|
|
|
m_tokenListIt = itEnd;
|
|
m_tokenListIt++;
|
|
} else if (String *const range = getIgnoreFeature(theCommand, "range")) {
|
|
// Currently we only support "line" but, in principle, we should also
|
|
// support "word" and "paragraph" for consistency with the built-in Doxygen
|
|
// commands which can have either of these three ranges (which are indicated
|
|
// using <word-arg>, (line-arg) and {para-arg} respectively in Doxygen
|
|
// documentation).
|
|
if (Strcmp(range, "line") == 0) {
|
|
// Consume everything until the end of line.
|
|
m_tokenListIt = getOneLine(tokList);
|
|
skipEndOfLine();
|
|
} else {
|
|
Swig_error(m_fileName.c_str(), m_fileLineNo, "Invalid \"doxygen:ignore\" feature \"range\" attribute \"%s\".\n", Char(range));
|
|
return;
|
|
}
|
|
}
|
|
}
|
|
|
|
void DoxygenParser::addCommand(const std::string &commandString, const TokenList &tokList, DoxygenEntityList &doxyList) {
|
|
|
|
string theCommand = stringToLower(commandString);
|
|
|
|
if (theCommand == "plainstd::string") {
|
|
string nextPhrase = getStringTilCommand(tokList);
|
|
if (noisy)
|
|
cout << "Parsing plain std::string :" << nextPhrase << endl;
|
|
doxyList.push_back(DoxygenEntity("plainstd::string", nextPhrase));
|
|
return;
|
|
}
|
|
|
|
switch (commandBelongs(commandString)) {
|
|
case SIMPLECOMMAND:
|
|
addSimpleCommand(theCommand, doxyList);
|
|
break;
|
|
case COMMANDWORD:
|
|
addCommandWord(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMANDLINE:
|
|
addCommandLine(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMANDPARAGRAPH:
|
|
addCommandParagraph(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMANDENDCOMMAND:
|
|
addCommandEndCommand(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMANDWORDPARAGRAPH:
|
|
addCommandWordParagraph(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMANDWORDLINE:
|
|
addCommandWordLine(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMANDWORDOWORDWORD:
|
|
addCommandWordOWordOWord(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMANDOWORD:
|
|
addCommandOWord(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMANDERRORTHROW:
|
|
addCommandErrorThrow(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMANDUNIQUE:
|
|
addCommandUnique(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMAND_HTML:
|
|
addCommandHtml(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMAND_HTML_ENTITY:
|
|
addCommandHtmlEntity(theCommand, tokList, doxyList);
|
|
break;
|
|
case COMMAND_ALIAS:
|
|
aliasCommand(commandString, tokList, doxyList);
|
|
break;
|
|
case COMMAND_IGNORE:
|
|
ignoreCommand(commandString, tokList, doxyList);
|
|
break;
|
|
case NONE:
|
|
case END_LINE:
|
|
case PARAGRAPH_END:
|
|
case PLAINSTRING:
|
|
case COMMAND:
|
|
// TODO: Ensure that these values either are correctly ignored here or can't happen.
|
|
break;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* This method converts TokenList to DoxygenEntryList.
|
|
*/
|
|
DoxygenEntityList DoxygenParser::parse(TokenListCIt endParsingIndex, const TokenList &tokList, bool root) {
|
|
// if we are root, than any strings should be added as 'partofdescription', else as 'plainstd::string'
|
|
std::string currPlainstringCommandType = root ? "partofdescription" : "plainstd::string";
|
|
DoxygenEntityList aNewList;
|
|
|
|
while (m_tokenListIt != endParsingIndex) {
|
|
|
|
Token currToken = *m_tokenListIt;
|
|
|
|
if (noisy)
|
|
cout << "Parsing for phrase starting in:" << currToken.toString() << endl;
|
|
|
|
if (currToken.m_tokenType == END_LINE) {
|
|
aNewList.push_back(DoxygenEntity("plainstd::endl"));
|
|
m_tokenListIt++;
|
|
} else if (currToken.m_tokenType == COMMAND) {
|
|
m_tokenListIt++;
|
|
addCommand(currToken.m_tokenString, tokList, aNewList);
|
|
} else if (currToken.m_tokenType == PLAINSTRING) {
|
|
addCommand(currPlainstringCommandType, tokList, aNewList);
|
|
}
|
|
|
|
if (endParsingIndex != tokList.end() && m_tokenListIt == tokList.end()) {
|
|
// this could happen if we can't reach the original endParsingIndex
|
|
printListError(WARN_DOXYGEN_UNEXPECTED_END_OF_COMMENT, "Unexpected end of Doxygen comment encountered.");
|
|
break;
|
|
}
|
|
}
|
|
return aNewList;
|
|
}
|
|
|
|
DoxygenEntityList DoxygenParser::createTree(Node *node, String *documentation) {
|
|
m_node = node;
|
|
|
|
tokenizeDoxygenComment(Char(documentation), Char(Getfile(documentation)), Getline(documentation));
|
|
|
|
if (noisy) {
|
|
cout << "---TOKEN LIST---" << endl;
|
|
printList();
|
|
}
|
|
|
|
DoxygenEntityList rootList = parse(m_tokenList.end(), m_tokenList, true);
|
|
|
|
if (noisy) {
|
|
cout << "PARSED LIST" << endl;
|
|
printTree(rootList);
|
|
}
|
|
return rootList;
|
|
}
|
|
|
|
/*
|
|
* Splits 'text' on 'separator' chars. Separator chars are not part of the
|
|
* strings.
|
|
*/
|
|
DoxygenParser::StringVector DoxygenParser::split(const std::string &text, char separator) {
|
|
StringVector lines;
|
|
size_t prevPos = 0, pos = 0;
|
|
|
|
while (pos < string::npos) {
|
|
pos = text.find(separator, prevPos);
|
|
lines.push_back(text.substr(prevPos, pos - prevPos));
|
|
prevPos = pos + 1;
|
|
}
|
|
|
|
return lines;
|
|
}
|
|
|
|
/*
|
|
* Returns true, if 'c' is one of doxygen comment block start
|
|
* characters: *, /, or !
|
|
*/
|
|
bool DoxygenParser::isStartOfDoxyCommentChar(char c) {
|
|
return (strchr("*/!", c) != NULL);
|
|
}
|
|
|
|
/*
|
|
* Adds token with Doxygen command to token list, but only if command is one of
|
|
* Doxygen commands. In that case true is returned. If the command is not
|
|
* recognized as a doxygen command, it is ignored and false is returned.
|
|
*/
|
|
bool DoxygenParser::addDoxyCommand(DoxygenParser::TokenList &tokList, const std::string &cmd) {
|
|
if (commandBelongs(cmd) != NONE) {
|
|
tokList.push_back(Token(COMMAND, cmd));
|
|
return true;
|
|
} else {
|
|
// This function is called for the special Doxygen commands, but also for
|
|
// HTML commands (or anything that looks like them, actually) and entities.
|
|
// We don't recognize all of those, so just ignore them and pass them
|
|
// through, but warn about unknown Doxygen commands as ignoring them will
|
|
// often result in wrong output being generated.
|
|
const char ch = *cmd.begin();
|
|
if (ch != '<' && ch != '&') {
|
|
// Before calling printListError() we must ensure that m_tokenListIt used
|
|
// by it is valid.
|
|
const TokenListCIt itSave = m_tokenListIt;
|
|
m_tokenListIt = m_tokenList.end();
|
|
|
|
printListError(WARN_DOXYGEN_UNKNOWN_COMMAND, "Unknown Doxygen command: " + cmd + ".");
|
|
|
|
m_tokenListIt = itSave;
|
|
}
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* This method copies comment text to output as it is - no processing is
|
|
* done, Doxygen commands are ignored. It is used for commands \verbatim,
|
|
* \htmlonly, \f$, \f[, and \f{.
|
|
*/
|
|
size_t DoxygenParser::processVerbatimText(size_t pos, const std::string &line) {
|
|
if (line[pos] == '\\' || line[pos] == '@') { // check for end commands
|
|
|
|
pos++;
|
|
size_t endOfWordPos = line.find_first_not_of(DOXYGEN_WORD_CHARS, pos);
|
|
string cmd = line.substr(pos, endOfWordPos - pos);
|
|
|
|
if (cmd == CMD_END_HTML_ONLY || cmd == CMD_END_VERBATIM || cmd == CMD_END_LATEX_1 || cmd == CMD_END_LATEX_2 || cmd == CMD_END_LATEX_3) {
|
|
|
|
m_isVerbatimText = false;
|
|
addDoxyCommand(m_tokenList, cmd);
|
|
|
|
} else {
|
|
|
|
m_tokenList.push_back(Token(PLAINSTRING,
|
|
// include '\' or '@'
|
|
line.substr(pos - 1, endOfWordPos - pos + 1)));
|
|
}
|
|
|
|
pos = endOfWordPos;
|
|
|
|
} else {
|
|
|
|
// whitespaces are stored as plain strings
|
|
size_t startOfPossibleEndCmd = line.find_first_of("\\@", pos);
|
|
m_tokenList.push_back(Token(PLAINSTRING, line.substr(pos, startOfPossibleEndCmd - pos)));
|
|
pos = startOfPossibleEndCmd;
|
|
}
|
|
|
|
return pos;
|
|
}
|
|
|
|
/*
|
|
* Processes doxy commands for escaped characters: \$ \@ \\ \& \~ \< \> \# \% \" \. \::
|
|
* Handling this separately supports documentation text like \@someText.
|
|
*/
|
|
bool DoxygenParser::processEscapedChars(size_t &pos, const std::string &line) {
|
|
if ((pos + 1) < line.size()) {
|
|
|
|
// \ and @ with trailing whitespace or quoted get to output as plain string
|
|
string whitespaces = " '\t\n";
|
|
if (whitespaces.find(line[pos + 1]) != string::npos) {
|
|
m_tokenList.push_back(Token(PLAINSTRING, line.substr(pos, 1)));
|
|
pos++;
|
|
return true;
|
|
}
|
|
// these chars can be escaped for doxygen
|
|
string escapedChars = "$@\\&~<>#%\".";
|
|
if (escapedChars.find(line[pos + 1]) != string::npos) {
|
|
|
|
addDoxyCommand(m_tokenList, line.substr(pos + 1, 1));
|
|
pos += 2;
|
|
return true;
|
|
|
|
} else if ((pos + 2) < line.size() && line[pos + 1] == ':' && line[pos + 2] == ':') {
|
|
|
|
// add command \:: - handling this separately supports documentation
|
|
// text like \::someText
|
|
addDoxyCommand(m_tokenList, line.substr(pos + 1, 2));
|
|
pos += 3;
|
|
return true;
|
|
}
|
|
}
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* Processes word doxygen commands, like \arg, \c, \b, \return, ...
|
|
*/
|
|
void DoxygenParser::processWordCommands(size_t &pos, const std::string &line) {
|
|
pos++;
|
|
size_t endOfWordPos = line.find_first_not_of(DOXYGEN_WORD_CHARS, pos);
|
|
|
|
string cmd = line.substr(pos, endOfWordPos - pos);
|
|
addDoxyCommand(m_tokenList, cmd);
|
|
|
|
if (cmd == CMD_HTML_ONLY || cmd == CMD_VERBATIM || cmd == CMD_LATEX_1 || cmd == CMD_LATEX_2 || cmd == CMD_LATEX_3) {
|
|
|
|
m_isVerbatimText = true;
|
|
|
|
} else {
|
|
// skip any possible spaces after command, because some commands have parameters,
|
|
// and spaces between command and parameter must be ignored.
|
|
if (endOfWordPos != string::npos) {
|
|
endOfWordPos = line.find_first_not_of(" \t", endOfWordPos);
|
|
}
|
|
}
|
|
pos = endOfWordPos;
|
|
}
|
|
|
|
void DoxygenParser::processHtmlTags(size_t &pos, const std::string &line) {
|
|
bool isEndHtmlTag = false;
|
|
pos++;
|
|
if (line.size() > pos && line[pos] == '/') {
|
|
isEndHtmlTag = true;
|
|
pos++;
|
|
}
|
|
|
|
size_t endHtmlPos = line.find_first_of("\t >", pos);
|
|
|
|
string cmd = line.substr(pos, endHtmlPos - pos);
|
|
pos = endHtmlPos;
|
|
|
|
// prepend '<' to distinguish HTML tags from doxygen commands
|
|
if (!cmd.empty() && addDoxyCommand(m_tokenList, '<' + cmd)) {
|
|
// it is a valid HTML command
|
|
if (line[pos] != '>') {
|
|
// it should be HTML tag with args,
|
|
// for example <A ...>, <IMG ...>, ...
|
|
if (isEndHtmlTag) {
|
|
m_tokenListIt = m_tokenList.end();
|
|
printListError(WARN_DOXYGEN_HTML_ERROR, "Doxygen HTML error for tag " + cmd + ": Illegal end HTML tag without '>' found.");
|
|
}
|
|
|
|
endHtmlPos = line.find(">", pos);
|
|
if (endHtmlPos == string::npos) {
|
|
m_tokenListIt = m_tokenList.end();
|
|
printListError(WARN_DOXYGEN_HTML_ERROR, "Doxygen HTML error for tag " + cmd + ": HTML tag without '>' found.");
|
|
}
|
|
// add args of HTML command, like link URL, image URL, ...
|
|
m_tokenList.push_back(Token(PLAINSTRING, line.substr(pos, endHtmlPos - pos)));
|
|
pos = endHtmlPos;
|
|
} else {
|
|
if (isEndHtmlTag) {
|
|
m_tokenList.push_back(Token(PLAINSTRING, END_HTML_TAG_MARK));
|
|
} else {
|
|
// it is a simple tag, so push empty string
|
|
m_tokenList.push_back(Token(PLAINSTRING, ""));
|
|
}
|
|
}
|
|
|
|
if (pos != string::npos) {
|
|
pos++; // skip '>'
|
|
}
|
|
} else {
|
|
// the command is not HTML supported by Doxygen, < and > will be
|
|
// replaced by HTML entities < and > respectively,
|
|
addDoxyCommand(m_tokenList, "<");
|
|
m_tokenList.push_back(Token(PLAINSTRING, cmd));
|
|
}
|
|
}
|
|
|
|
void DoxygenParser::processHtmlEntities(size_t &pos, const std::string &line) {
|
|
size_t endOfWordPos = line.find_first_not_of("abcdefghijklmnopqrstuvwxyz", pos + 1);
|
|
|
|
if (endOfWordPos != string::npos) {
|
|
|
|
if (line[endOfWordPos] == ';' && (endOfWordPos - pos) > 1) {
|
|
// if entity is not recognized by Doxygen (not in the list of
|
|
// commands) nothing is added (here and in Doxygen).
|
|
addDoxyCommand(m_tokenList, line.substr(pos, endOfWordPos - pos));
|
|
endOfWordPos++; // skip ';'
|
|
} else {
|
|
// it is not an entity - add entity for ampersand and the rest of string
|
|
addDoxyCommand(m_tokenList, "&");
|
|
m_tokenList.push_back(Token(PLAINSTRING, line.substr(pos + 1, endOfWordPos - pos - 1)));
|
|
}
|
|
}
|
|
pos = endOfWordPos;
|
|
}
|
|
|
|
/*
|
|
* This method processes normal comment, which has to be tokenized.
|
|
*/
|
|
size_t DoxygenParser::processNormalComment(size_t pos, const std::string &line) {
|
|
switch (line[pos]) {
|
|
case '\\':
|
|
case '@':
|
|
if (processEscapedChars(pos, line)) {
|
|
break;
|
|
}
|
|
// handle word commands \arg, \c, \return, ... and \f[, \f$, ... commands
|
|
processWordCommands(pos, line);
|
|
break;
|
|
|
|
case ' ': // whitespace
|
|
case '\t':
|
|
{
|
|
// whitespaces are stored as plain strings
|
|
size_t startOfNextWordPos = line.find_first_not_of(" \t", pos + 1);
|
|
m_tokenList.push_back(Token(PLAINSTRING, line.substr(pos, startOfNextWordPos - pos)));
|
|
pos = startOfNextWordPos;
|
|
}
|
|
break;
|
|
|
|
case '<':
|
|
processHtmlTags(pos, line);
|
|
break;
|
|
case '>': // this char is detected here only when it is not part of HTML tag
|
|
addDoxyCommand(m_tokenList, ">");
|
|
pos++;
|
|
break;
|
|
case '&':
|
|
processHtmlEntities(pos, line);
|
|
break;
|
|
case '"':
|
|
m_isInQuotedString = true;
|
|
m_tokenList.push_back(Token(PLAINSTRING, "\""));
|
|
pos++;
|
|
break;
|
|
default:
|
|
m_tokenListIt = m_tokenList.end();
|
|
printListError(WARN_DOXYGEN_UNKNOWN_CHARACTER, std::string("Unknown special character in Doxygen comment: ") + line[pos] + ".");
|
|
}
|
|
|
|
return pos;
|
|
}
|
|
|
|
/*
|
|
* This is the main method, which tokenizes Doxygen comment to words and
|
|
* doxygen commands.
|
|
*/
|
|
void DoxygenParser::tokenizeDoxygenComment(const std::string &doxygenComment, const std::string &fileName, int fileLine) {
|
|
m_isVerbatimText = false;
|
|
m_isInQuotedString = false;
|
|
m_tokenList.clear();
|
|
m_fileLineNo = fileLine;
|
|
m_fileName = fileName;
|
|
|
|
StringVector lines = split(doxygenComment, '\n');
|
|
|
|
// remove trailing spaces, because they cause additional new line at the end
|
|
// comment, which is wrong, because these spaces are space preceding
|
|
// end of comment : ' */'
|
|
if (!doxygenComment.empty() && doxygenComment[doxygenComment.size() - 1] == ' ') {
|
|
|
|
string lastLine = lines[lines.size() - 1];
|
|
|
|
if (trim(lastLine).empty()) {
|
|
lines.pop_back(); // remove trailing empty line
|
|
}
|
|
}
|
|
|
|
for (StringVectorCIt it = lines.begin(); it != lines.end(); it++) {
|
|
const string &line = *it;
|
|
size_t pos = line.find_first_not_of(" \t");
|
|
|
|
if (pos == string::npos) {
|
|
m_tokenList.push_back(Token(END_LINE, "\n"));
|
|
continue;
|
|
}
|
|
// skip sequences of '*', '/', and '!' of any length
|
|
bool isStartOfCommentLineCharFound = false;
|
|
while (pos < line.size() && isStartOfDoxyCommentChar(line[pos])) {
|
|
pos++;
|
|
isStartOfCommentLineCharFound = true;
|
|
}
|
|
|
|
if (pos == line.size()) {
|
|
m_tokenList.push_back(Token(END_LINE, "\n"));
|
|
continue;
|
|
}
|
|
// if 'isStartOfCommentLineCharFound' then preserve leading spaces, so
|
|
// ' * comment' gets translated to ' * comment', not ' * comment'
|
|
// This is important to keep formatting for comments translated to Python.
|
|
if (isStartOfCommentLineCharFound && line[pos] == ' ') {
|
|
pos++; // points to char after ' * '
|
|
if (pos == line.size()) {
|
|
m_tokenList.push_back(Token(END_LINE, "\n"));
|
|
continue;
|
|
}
|
|
}
|
|
// line[pos] may be ' \t' or start of word, it there was no '*', '/' or '!'
|
|
// at beginning of the line. Make sure it points to start of the first word
|
|
// in the line.
|
|
if (isStartOfCommentLineCharFound) {
|
|
size_t firstWordPos = line.find_first_not_of(" \t", pos);
|
|
if (firstWordPos == string::npos) {
|
|
m_tokenList.push_back(Token(END_LINE, "\n"));
|
|
continue;
|
|
}
|
|
|
|
if (firstWordPos > pos) {
|
|
m_tokenList.push_back(Token(PLAINSTRING, line.substr(pos, firstWordPos - pos)));
|
|
pos = firstWordPos;
|
|
}
|
|
} else {
|
|
m_tokenList.push_back(Token(PLAINSTRING, line.substr(0, pos)));
|
|
}
|
|
|
|
while (pos != string::npos) {
|
|
// find the end of the word
|
|
size_t doxyCmdOrHtmlTagPos = line.find_first_of("\\@<>&\" \t", pos);
|
|
if (doxyCmdOrHtmlTagPos != pos) {
|
|
// plain text found
|
|
// if the last char is punctuation, make it a separate word, otherwise
|
|
// it may be included with word also when not appropriate, for example:
|
|
// colors are \b red, green, and blue --> colors are <b>red,</b> green, and blue
|
|
// instead of (comma not bold):
|
|
// colors are \b red, green, and blue --> colors are <b>red</b>, green, and blue
|
|
// In Python it looks even worse:
|
|
// colors are \b red, green, and blue --> colors are 'red,' green, and blue
|
|
string text = line.substr(pos, doxyCmdOrHtmlTagPos - pos);
|
|
string punctuations(".,:");
|
|
size_t textSize = text.size();
|
|
|
|
if (!text.empty()
|
|
&& punctuations.find(text[text.size() - 1]) != string::npos &&
|
|
// but do not break ellipsis (...)
|
|
!(textSize > 1 && text[textSize - 2] == '.')) {
|
|
m_tokenList.push_back(Token(PLAINSTRING, text.substr(0, text.size() - 1)));
|
|
m_tokenList.push_back(Token(PLAINSTRING, text.substr(text.size() - 1)));
|
|
} else {
|
|
m_tokenList.push_back(Token(PLAINSTRING, text));
|
|
}
|
|
}
|
|
|
|
pos = doxyCmdOrHtmlTagPos;
|
|
if (pos != string::npos) {
|
|
if (m_isVerbatimText) {
|
|
pos = processVerbatimText(pos, line);
|
|
|
|
} else if (m_isInQuotedString) {
|
|
|
|
if (line[pos] == '"') {
|
|
m_isInQuotedString = false;
|
|
}
|
|
m_tokenList.push_back(Token(PLAINSTRING, line.substr(pos, 1)));
|
|
pos++;
|
|
|
|
} else {
|
|
pos = processNormalComment(pos, line);
|
|
}
|
|
}
|
|
}
|
|
m_tokenList.push_back(Token(END_LINE, "\n")); // add when pos == npos - end of line
|
|
}
|
|
|
|
m_tokenListIt = m_tokenList.begin();
|
|
}
|
|
|
|
void DoxygenParser::printList() {
|
|
|
|
int tokNo = 0;
|
|
for (TokenListCIt it = m_tokenList.begin(); it != m_tokenList.end(); it++, tokNo++) {
|
|
|
|
cout << it->toString() << " ";
|
|
|
|
if ((tokNo % TOKENSPERLINE) == 0) {
|
|
cout << endl;
|
|
}
|
|
}
|
|
}
|
|
|
|
void DoxygenParser::printListError(int warningType, const std::string &message) {
|
|
int curLine = m_fileLineNo;
|
|
for (TokenListCIt it = m_tokenList.begin(); it != m_tokenListIt; it++) {
|
|
if (it->m_tokenType == END_LINE) {
|
|
curLine++;
|
|
}
|
|
}
|
|
|
|
Swig_warning(warningType, m_fileName.c_str(), curLine, "%s\n", message.c_str());
|
|
}
|