kde-extraapps/kdevelop/languages/cpp/parser/rpp/pp-scanner.cpp

318 lines
7.2 KiB
C++
Raw Normal View History

/*
Copyright 2005 Roberto Raggi <roberto@kdevelop.org>
Copyright 2006 Hamish Rodda <rodda@kde.org>
Permission to use, copy, modify, distribute, and sell this software and its
documentation for any purpose is hereby granted without fee, provided that
the above copyright notice appear in all copies and that both that
copyright notice and this permission notice appear in supporting
documentation.
The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
KDEVELOP TEAM BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
*/
#include "pp-scanner.h"
#include "chartools.h"
#include <language/duchain/indexedstring.h>
#include <util/kdevvarlengtharray.h>
using namespace rpp;
void pp_skip_blanks::operator()(Stream& input, Stream& output)
{
while (!input.atEnd()) {
if (input == '\\') {
++input;
if (input != '\n') {
--input;
return;
} else {
++input;
continue;
}
}
if (input == '\n' || !isSpace(input.current()))
return;
output << input;
++input;
}
}
void pp_skip_whitespaces::operator()(Stream& input, Stream& output)
{
while (!input.atEnd()) {
if (!isSpace(input.current()))
return;
output << input;
++input;
}
}
void pp_skip_comment_or_divop::operator()(Stream& input, Stream& output, bool outputText)
{
enum {
MAYBE_BEGIN,
BEGIN,
MAYBE_END,
END,
IN_COMMENT,
IN_CXX_COMMENT
} state (MAYBE_BEGIN);
while (!input.atEnd()) {
switch (state) {
case MAYBE_BEGIN:
if (input != '/')
return;
state = BEGIN;
break;
case BEGIN:
if (input == '*')
state = IN_COMMENT;
else if (input == '/')
state = IN_CXX_COMMENT;
else
return;
break;
case IN_COMMENT:
if (input == '*')
state = MAYBE_END;
break;
case IN_CXX_COMMENT:
if (input == '\n')
return;
break;
case MAYBE_END:
if (input == '/')
state = END;
else if (input != '*')
state = IN_COMMENT;
break;
case END:
return;
}
if (input == '\\' && input.peek() == indexFromCharacter('\n')) {
++input;
++input;
output << ' ';
output.mark(input.inputPosition());
} else if (outputText) {
output << input;
++input;
} else if (input == '\n') {
output << '\n';
++input;
output.mark(input.inputPosition());
} else {
output << ' ';
++input;
}
}
}
uint pp_skip_identifier::operator()(Stream& input, bool multiline)
{
KDevVarLengthArray<char, 100> identifier;
KDevelop::IndexedString::RunningHash hash;
while (!input.atEnd()) {
if(!isCharacter(input.current())) {
//Do a more complex merge, where also tokenized identifiers can be merged
KDevelop::IndexedString ret;
if(!identifier.isEmpty())
ret = KDevelop::IndexedString(identifier.constData(), identifier.size(), hash.hash);
while (!input.atEnd()) {
uint current = input.current();
if (isCharacter(current) && !isValidMacroIdentifierToken(characterFromIndex(current)))
break;
if(ret.isEmpty())
ret = KDevelop::IndexedString::fromIndex(current); //The most common fast path
else ///@todo Be better to build up a complete buffer and then append it all, so we don't get he intermediate strings into the repository
ret = KDevelop::IndexedString(ret.byteArray() + KDevelop::IndexedString::fromIndex(input.current()).byteArray());
++input;
if(multiline && input == '\\' && input.peekNextCharacter() == '\n'){
++input;
++input;
}
}
return ret.index();
}
//Collect characters and connect them to an IndexedString
if (isCharacter(input.current()) && !isValidMacroIdentifierToken(characterFromIndex(input.current())))
break;
char c = characterFromIndex(input);
hash.append(c);
identifier.append(c);
++input;
}
return KDevelop::IndexedString(identifier.constData(), identifier.size(), hash.hash).index();
}
void pp_skip_number::operator()(Stream& input, Stream& output)
{
while (!input.atEnd()) {
if (isCharacter(input.current()) && !isValidMacroIdentifierToken(characterFromIndex(input.current())))
return;
output << input;
++input;
}
}
void pp_skip_string_literal::operator()(Stream& input, Stream& output)
{
enum {
BEGIN,
IN_STRING,
QUOTE,
END
} state (BEGIN);
while (!input.atEnd()) {
switch (state) {
case BEGIN:
if (input != '\"')
return;
state = IN_STRING;
break;
case IN_STRING:
// Q_ASSERT(input != '\n');
if (input == '\"')
state = END;
else if (input == '\\')
state = QUOTE;
break;
case QUOTE:
state = IN_STRING;
break;
case END:
return;
}
output << input;
++input;
}
}
void pp_skip_char_literal::operator()(Stream& input, Stream& output)
{
enum {
BEGIN,
IN_STRING,
QUOTE,
END
} state (BEGIN);
int inner_count = 0;
while (!input.atEnd()) {
if (state == END)
break;
switch (state) {
case BEGIN:
if (input != '\'')
return;
state = IN_STRING;
break;
case IN_STRING:
if(input == '\n' || inner_count > 3)
return; //Probably this isn't a string literal. Example: "#warning What's up"
if (input == '\'')
state = END;
else if (input == '\\')
state = QUOTE;
break;
++inner_count;
case QUOTE:
state = IN_STRING;
break;
default:
Q_ASSERT(0);
break;
}
output << input;
++input;
}
}
///@todo Can this deal with comments? like /*(*/
void pp_skip_argument::operator()(Stream& input, Stream& output)
{
int depth = 0;
while (!input.atEnd()) {
if (!depth && (input == ')' || input == ',')) {
return;
} else if (input == '(') {
++depth;
} else if (input == ')') {
--depth;
} else if (input == '\"') {
skip_string_literal(input, output);
continue;
} else if (input == '\'') {
skip_char_literal (input, output);
continue;
} else if (input == '/') {
skip_comment_or_divop (input, output, true);
continue;
} else if (isLetter(input.current()) || input == '_') {
Anchor inputPosition = input.inputPosition();
output.appendString(inputPosition, KDevelop::IndexedString::fromIndex(skip_identifier(input)));
continue;
} else if (isNumber(input.current())) {
output.mark(input.inputPosition());
skip_number(input, output);
continue;
}
output << input;
++input;
}
return;
}