// Copyright (C) 2015 The Android Open Source Project // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "tokenizer.h" namespace init { Tokenizer::Tokenizer(const std::string& data) : data_(data), eof_(false), pos_(0), tok_start_(0) { current_.type = TOK_START; if (data.size() > 0) { cur_char_ = data[0]; } else { eof_ = true; cur_char_ = '\0'; } } Tokenizer::~Tokenizer() {} const Tokenizer::Token& Tokenizer::current() { return current_; } bool Tokenizer::Next() { while (!eof_) { AdvWhiteSpace(); // Check for comments. if (cur_char_ == '#') { AdvChar(); // Skip rest of line while (!eof_ && cur_char_ != '\n') { AdvChar(); } } if (eof_) { break; } if (cur_char_ == '\0') { AdvChar(); } else if (cur_char_ == '\n') { current_.type = TOK_NEWLINE; current_.text.clear(); AdvChar(); return true; } else if (cur_char_ == '\\') { AdvChar(); // skip backslash // This is line continuation so // do not generated TOK_NEWLINE at // the next \n. AdvUntil('\n'); AdvChar(); // skip \n } else if (cur_char_ == '\"') { AdvChar(); StartText(); // Grab everything until the next quote. AdvUntil('\"'); EndText(); AdvChar(); // skip quote. return true; } else { StartText(); AdvText(); EndText(); return true; } } current_.type = TOK_END; current_.text.clear(); return false; } void Tokenizer::AdvChar() { pos_++; if (pos_ < data_.size()) { cur_char_ = data_[pos_]; } else { eof_ = true; cur_char_ = '\0'; } } void Tokenizer::AdvWhiteSpace() { while (cur_char_ == '\t' || cur_char_ == '\r' || cur_char_ == ' ') { AdvChar(); } } void Tokenizer::AdvUntil(char x) { while (!eof_ && cur_char_ != x) { AdvChar(); } } void Tokenizer::AdvText() { while (cur_char_ != '\t' && cur_char_ != '\r' && cur_char_ != '\0' && cur_char_ != ' ' && cur_char_ != '\n' && cur_char_ != '#') { AdvChar(); } } void Tokenizer::StartText() { current_.text.clear(); tok_start_ = pos_; current_.type = TOK_TEXT; } void Tokenizer::EndText() { if (pos_ != tok_start_) { current_.text.append(data_, tok_start_, pos_ - tok_start_); } } } // namespace init