init/parser/tokenizer.cpp - android-core - Git at Google

 // Copyright (C) 2015 The Android Open Source Project
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //      http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.

 #include "tokenizer.h"

 namespace init {

 Tokenizer::Tokenizer(const std::string& data)
     : data_(data), eof_(false), pos_(0), tok_start_(0) {
   current_.type = TOK_START;

   if (data.size() > 0) {
     cur_char_ = data[0];
   } else {
     eof_ = true;
     cur_char_ = '\0';
   }
 }

 Tokenizer::~Tokenizer() {}

 const Tokenizer::Token& Tokenizer::current() {
   return current_;
 }

 bool Tokenizer::Next() {
   while (!eof_) {
     AdvWhiteSpace();

     // Check for comments.
     if (cur_char_ == '#') {
       AdvChar();
       // Skip rest of line
       while (!eof_ && cur_char_ != '\n') {
         AdvChar();
       }
     }

     if (eof_) {
       break;
     }

     if (cur_char_ == '\0') {
       AdvChar();
     } else if (cur_char_ == '\n') {
       current_.type = TOK_NEWLINE;
       current_.text.clear();
       AdvChar();
       return true;
     } else if (cur_char_ == '\\') {
       AdvChar();  // skip backslash
       // This is line continuation so
       // do not generated TOK_NEWLINE at
       // the next \n.
       AdvUntil('\n');
       AdvChar();  // skip \n
     } else if (cur_char_ == '\"') {
       AdvChar();
       StartText();
       // Grab everything until the next quote.
       AdvUntil('\"');
       EndText();
       AdvChar();  // skip quote.
       return true;
     } else {
       StartText();
       AdvText();
       EndText();
       return true;
     }
   }
   current_.type = TOK_END;
   current_.text.clear();
   return false;
 }

 void Tokenizer::AdvChar() {
   pos_++;
   if (pos_ < data_.size()) {
     cur_char_ = data_[pos_];
   } else {
     eof_ = true;
     cur_char_ = '\0';
   }
 }

 void Tokenizer::AdvWhiteSpace() {
   while (cur_char_ == '\t' || cur_char_ == '\r' || cur_char_ == ' ') {
     AdvChar();
   }
 }

 void Tokenizer::AdvUntil(char x) {
   while (!eof_ && cur_char_ != x) {
     AdvChar();
   }
 }

 void Tokenizer::AdvText() {
   while (cur_char_ != '\t' && cur_char_ != '\r' && cur_char_ != '\0' &&
          cur_char_ != ' ' && cur_char_ != '\n' && cur_char_ != '#') {
     AdvChar();
   }
 }

 void Tokenizer::StartText() {
   current_.text.clear();
   tok_start_ = pos_;
   current_.type = TOK_TEXT;
 }

 void Tokenizer::EndText() {
   if (pos_ != tok_start_) {
     current_.text.append(data_, tok_start_, pos_ - tok_start_);
   }
 }

 }  // namespace init
	// Copyright (C) 2015 The Android Open Source Project
	//
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.

	#include "tokenizer.h"

	namespace init {

	Tokenizer::Tokenizer(const std::string& data)
	: data_(data), eof_(false), pos_(0), tok_start_(0) {
	current_.type = TOK_START;

	if (data.size() > 0) {
	cur_char_ = data[0];
	} else {
	eof_ = true;
	cur_char_ = '\0';
	}
	}

	Tokenizer::~Tokenizer() {}

	const Tokenizer::Token& Tokenizer::current() {
	return current_;
	}

	bool Tokenizer::Next() {
	while (!eof_) {
	AdvWhiteSpace();

	// Check for comments.
	if (cur_char_ == '#') {
	AdvChar();
	// Skip rest of line
	while (!eof_ && cur_char_ != '\n') {
	AdvChar();
	}
	}

	if (eof_) {
	break;
	}

	if (cur_char_ == '\0') {
	AdvChar();
	} else if (cur_char_ == '\n') {
	current_.type = TOK_NEWLINE;
	current_.text.clear();
	AdvChar();
	return true;
	} else if (cur_char_ == '\\') {
	AdvChar(); // skip backslash
	// This is line continuation so
	// do not generated TOK_NEWLINE at
	// the next \n.
	AdvUntil('\n');
	AdvChar(); // skip \n
	} else if (cur_char_ == '\"') {
	AdvChar();
	StartText();
	// Grab everything until the next quote.
	AdvUntil('\"');
	EndText();
	AdvChar(); // skip quote.
	return true;
	} else {
	StartText();
	AdvText();
	EndText();
	return true;
	}
	}
	current_.type = TOK_END;
	current_.text.clear();
	return false;
	}

	void Tokenizer::AdvChar() {
	pos_++;
	if (pos_ < data_.size()) {
	cur_char_ = data_[pos_];
	} else {
	eof_ = true;
	cur_char_ = '\0';
	}
	}

	void Tokenizer::AdvWhiteSpace() {
	while (cur_char_ == '\t' \|\| cur_char_ == '\r' \|\| cur_char_ == ' ') {
	AdvChar();
	}
	}

	void Tokenizer::AdvUntil(char x) {
	while (!eof_ && cur_char_ != x) {
	AdvChar();
	}
	}

	void Tokenizer::AdvText() {
	while (cur_char_ != '\t' && cur_char_ != '\r' && cur_char_ != '\0' &&
	cur_char_ != ' ' && cur_char_ != '\n' && cur_char_ != '#') {
	AdvChar();
	}
	}

	void Tokenizer::StartText() {
	current_.text.clear();
	tok_start_ = pos_;
	current_.type = TOK_TEXT;
	}

	void Tokenizer::EndText() {
	if (pos_ != tok_start_) {
	current_.text.append(data_, tok_start_, pos_ - tok_start_);
	}
	}

	} // namespace init