You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
75 lines
2.0 KiB
75 lines
2.0 KiB
4 months ago
|
// Copyright (C) 2015 The Android Open Source Project
|
||
|
//
|
||
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
// you may not use this file except in compliance with the License.
|
||
|
// You may obtain a copy of the License at
|
||
|
//
|
||
|
// http://www.apache.org/licenses/LICENSE-2.0
|
||
|
//
|
||
|
// Unless required by applicable law or agreed to in writing, software
|
||
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
// See the License for the specific language governing permissions and
|
||
|
// limitations under the License.
|
||
|
|
||
|
#ifndef _INIT_PARSER_TOKENIZER_H
|
||
|
#define _INIT_PARSER_TOKENIZER_H
|
||
|
|
||
|
#include <string>
|
||
|
|
||
|
namespace init {
|
||
|
|
||
|
// Used to tokenize a std::string.
// Call Next() to advance through each token until it returns false,
// indicating there are no more tokens left in the string.
// The current token can be accessed with current(), which returns
// a Token.
// Supported tokens are:
//   TOK_START   - Next() has yet to be called
//   TOK_END     - At the end of string
//   TOK_NEWLINE - The end of a line denoted by \n.
//   TOK_TEXT    - A word.
// Comments are denoted with '#' and the tokenizer will ignore
// the rest of the line.
// Double quotes can be used to insert whitespace into words.
// A backslash at the end of a line denotes continuation and
// a TOK_NEWLINE will not be generated for that line.
//
// NOTE(review): data_ is a reference member, so a Tokenizer does not own
// the text it reads. Presumably it is bound to the constructor argument;
// if so, the caller must keep that std::string alive (and should not pass
// a temporary that dies before the last Next()/current() call) -- confirm
// against the constructor definition.
class Tokenizer {
  public:
    // Creates a tokenizer for |data|. See the lifetime note above.
    explicit Tokenizer(const std::string& data);
    ~Tokenizer();

    // Kinds of token; the enumerators take the values 0..3 in the order
    // listed here.
    enum TokenType { TOK_START, TOK_END, TOK_NEWLINE, TOK_TEXT };

    // A single token: its kind plus the associated text.
    // NOTE(review): |text| is presumably only meaningful for TOK_TEXT --
    // confirm against the implementation.
    struct Token {
        TokenType type;
        std::string text;
    };

    // Returns the current token.
    const Token& current();

    // Move to the next token, returns false at the end of input.
    bool Next();

  private:
    // Internal scanning helpers. Their definitions are not part of this
    // header; the names suggest they move the cursor over data_
    // (AdvChar/AdvText/AdvUntil/AdvWhiteSpace) and delimit the text of the
    // token being built (StartText/EndText) -- TODO confirm.
    void GetData();
    void AdvChar();
    void AdvText();
    void AdvUntil(char x);
    void AdvWhiteSpace();
    void StartText();
    void EndText();

    // Input being tokenized. Held by reference, not copied.
    const std::string& data_;
    // Token handed out by current().
    Token current_;

    // Cursor state. NOTE(review): presumably eof_ marks exhausted input,
    // pos_ is an index into data_, cur_char_ caches the character at pos_,
    // and tok_start_ is the index where the current text token began --
    // confirm against the implementation.
    bool eof_;
    size_t pos_;
    char cur_char_;
    size_t tok_start_;
};
|
||
|
|
||
|
} // namespace init
|
||
|
|
||
|
#endif
|