| // Copyright 2010 the V8 project authors. All rights reserved. |
| // Redistribution and use in source and binary forms, with or without |
| // modification, are permitted provided that the following conditions are |
| // met: |
| // |
| // * Redistributions of source code must retain the above copyright |
| // notice, this list of conditions and the following disclaimer. |
| // * Redistributions in binary form must reproduce the above |
| // copyright notice, this list of conditions and the following |
| // disclaimer in the documentation and/or other materials provided |
| // with the distribution. |
| // * Neither the name of Google Inc. nor the names of its |
| // contributors may be used to endorse or promote products derived |
| // from this software without specific prior written permission. |
| // |
| // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
| // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
| // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
| // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
| // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| |
| // Features shared by parsing and pre-parsing scanners. |
| |
| #ifndef V8_SCANNER_BASE_H_ |
| #define V8_SCANNER_BASE_H_ |
| |
| #include "token.h" |
| #include "unicode.h" |
| |
| namespace v8 { |
| namespace internal { |
| |
| class KeywordMatcher { |
| // Incrementally recognize keywords. |
| // |
| // Recognized keywords: |
| // break case catch const* continue debugger* default delete do else |
| // finally false for function if in instanceof native* new null |
| // return switch this throw true try typeof var void while with |
| // |
| // *: Actually "future reserved keywords". These are the only ones we |
| // recognized, the remaining are allowed as identifiers. |
| public: |
| KeywordMatcher() |
| : state_(INITIAL), |
| token_(Token::IDENTIFIER), |
| keyword_(NULL), |
| counter_(0), |
| keyword_token_(Token::ILLEGAL) {} |
| |
| Token::Value token() { return token_; } |
| |
| inline void AddChar(unibrow::uchar input) { |
| if (state_ != UNMATCHABLE) { |
| Step(input); |
| } |
| } |
| |
| void Fail() { |
| token_ = Token::IDENTIFIER; |
| state_ = UNMATCHABLE; |
| } |
| |
| private: |
| enum State { |
| UNMATCHABLE, |
| INITIAL, |
| KEYWORD_PREFIX, |
| KEYWORD_MATCHED, |
| C, |
| CA, |
| CO, |
| CON, |
| D, |
| DE, |
| F, |
| I, |
| IN, |
| N, |
| T, |
| TH, |
| TR, |
| V, |
| W |
| }; |
| |
| struct FirstState { |
| const char* keyword; |
| State state; |
| Token::Value token; |
| }; |
| |
| // Range of possible first characters of a keyword. |
| static const unsigned int kFirstCharRangeMin = 'b'; |
| static const unsigned int kFirstCharRangeMax = 'w'; |
| static const unsigned int kFirstCharRangeLength = |
| kFirstCharRangeMax - kFirstCharRangeMin + 1; |
| // State map for first keyword character range. |
| static FirstState first_states_[kFirstCharRangeLength]; |
| |
| // If input equals keyword's character at position, continue matching keyword |
| // from that position. |
| inline bool MatchKeywordStart(unibrow::uchar input, |
| const char* keyword, |
| int position, |
| Token::Value token_if_match) { |
| if (input == static_cast<unibrow::uchar>(keyword[position])) { |
| state_ = KEYWORD_PREFIX; |
| this->keyword_ = keyword; |
| this->counter_ = position + 1; |
| this->keyword_token_ = token_if_match; |
| return true; |
| } |
| return false; |
| } |
| |
| // If input equals match character, transition to new state and return true. |
| inline bool MatchState(unibrow::uchar input, char match, State new_state) { |
| if (input == static_cast<unibrow::uchar>(match)) { |
| state_ = new_state; |
| return true; |
| } |
| return false; |
| } |
| |
| inline bool MatchKeyword(unibrow::uchar input, |
| char match, |
| State new_state, |
| Token::Value keyword_token) { |
| if (input != static_cast<unibrow::uchar>(match)) { |
| return false; |
| } |
| state_ = new_state; |
| token_ = keyword_token; |
| return true; |
| } |
| |
| void Step(unibrow::uchar input); |
| |
| // Current state. |
| State state_; |
| // Token for currently added characters. |
| Token::Value token_; |
| |
| // Matching a specific keyword string (there is only one possible valid |
| // keyword with the current prefix). |
| const char* keyword_; |
| int counter_; |
| Token::Value keyword_token_; |
| }; |
| |
| |
| |
| |
| |
| |
| } } // namespace v8::internal |
| |
| #endif // V8_SCANNER_BASE_H_ |