/* Copyright 2005 Roberto Raggi Copyright 2006 Hamish Rodda Permission to use, copy, modify, distribute, and sell this software and its documentation for any purpose is hereby granted without fee, provided that the above copyright notice appear in all copies and that both that copyright notice and this permission notice appear in supporting documentation. The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software. THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE KDEVELOP TEAM BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ #include "pp-scanner.h" #include "chartools.h" #include "../indexedstring.h" #include "../kdevvarlengtharray.h" using namespace rpp; void pp_skip_blanks::operator()(Stream& input, Stream& output) { while (!input.atEnd()) { if (input == '\\') { ++input; if (input != '\n') { --input; return; } else { ++input; continue; } } if (input == '\n' || !isSpace(input.current())) return; output << input; ++input; } } void pp_skip_whitespaces::operator()(Stream& input, Stream& output) { while (!input.atEnd()) { if (!isSpace(input.current())) return; output << input; ++input; } } void pp_skip_comment_or_divop::operator()(Stream& input, Stream& output, bool outputText) { enum { MAYBE_BEGIN, BEGIN, MAYBE_END, END, IN_COMMENT, IN_CXX_COMMENT } state (MAYBE_BEGIN); while (!input.atEnd()) { switch (state) { case MAYBE_BEGIN: if (input != '/') return; state = BEGIN; break; case BEGIN: if (input == '*') state = IN_COMMENT; else if (input == '/') state = IN_CXX_COMMENT; else return; break; case IN_COMMENT: if (input == '*') state = MAYBE_END; break; case IN_CXX_COMMENT: if (input == '\n') return; break; case MAYBE_END: if (input == '/') state = END; else if (input != '*') state = IN_COMMENT; break; case END: return; } if (outputText) { output << input; ++input; } else if (input == '\n') { output << '\n'; ++input; output.mark(input.inputPosition()); } else { output << ' '; ++input; } } } uint pp_skip_identifier::operator()(Stream& input) { KDevVarLengthArray identifier; IndexedString::RunningHash hash; while (!input.atEnd()) { if(!isCharacter(input.current())) { //Do a more complex merge, where also tokenized identifiers can be merged IndexedString ret; if(!identifier.isEmpty()) ret = IndexedString(identifier.constData(), identifier.size(), hash.hash); while (!input.atEnd()) { uint current = input.current(); if (!isLetterOrNumber(current) && input != '_' && isCharacter(current)) break; if(ret.isEmpty()) ret = IndexedString::fromIndex(current); //The most common fast path else ///@todo Be better to build up a complete buffer and then append it all, so we don't get he intermediate strings into the repository ret = IndexedString(ret.byteArray() + IndexedString::fromIndex(input.current()).byteArray()); ++input; } return ret.index(); } //Collect characters and connect them to an IndexedString if (!isLetterOrNumber(input.current()) && input != '_') break; char c = characterFromIndex(input); hash.append(c); identifier.append(c); ++input; } return IndexedString(identifier.constData(), identifier.size(), hash.hash).index(); } void pp_skip_number::operator()(Stream& input, Stream& output) { while (!input.atEnd()) { if (!isLetterOrNumber(input.current()) && input != '_') return; output << input; ++input; } } void pp_skip_string_literal::operator()(Stream& input, Stream& output) { enum { BEGIN, IN_STRING, QUOTE, END } state (BEGIN); while (!input.atEnd()) { switch (state) { case BEGIN: if (input != '\"') return; state = IN_STRING; break; case IN_STRING: // Q_ASSERT(input != '\n'); if (input == '\"') state = END; else if (input == '\\') state = QUOTE; break; case QUOTE: state = IN_STRING; break; case END: return; } output << input; ++input; } } void pp_skip_char_literal::operator()(Stream& input, Stream& output) { enum { BEGIN, IN_STRING, QUOTE, END } state (BEGIN); int inner_count = 0; while (!input.atEnd()) { if (state == END) break; switch (state) { case BEGIN: if (input != '\'') return; state = IN_STRING; break; case IN_STRING: if(input == '\n' || inner_count > 3) return; //Probably this isn't a string literal. Example: "#warning What's up" if (input == '\'') state = END; else if (input == '\\') state = QUOTE; ++inner_count; break; case QUOTE: state = IN_STRING; break; default: Q_ASSERT(0); break; } output << input; ++input; } } ///@todo Can this deal with comments? like /*(*/ void pp_skip_argument::operator()(Stream& input, Stream& output) { int depth = 0; while (!input.atEnd()) { if (!depth && (input == ')' || input == ',')) { return; } else if (input == '(') { ++depth; } else if (input == ')') { --depth; } else if (input == '\"') { skip_string_literal(input, output); continue; } else if (input == '\'') { skip_char_literal (input, output); continue; } else if (input == '/') { skip_comment_or_divop (input, output, true); continue; } else if (isLetter(input.current()) || input == '_') { Anchor inputPosition = input.inputPosition(); output.appendString(inputPosition, IndexedString::fromIndex(skip_identifier(input))); continue; } else if (isNumber(input.current())) { output.mark(input.inputPosition()); skip_number(input, output); continue; } output << input; ++input; } return; }