123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402 |
- #ifndef GOOGLE_PROTOBUF_IO_TOKENIZER_H__
- #define GOOGLE_PROTOBUF_IO_TOKENIZER_H__
- #include <string>
- #include <vector>
- #include <google/protobuf/stubs/common.h>
- namespace google {
- namespace protobuf {
- namespace io {
- class ZeroCopyInputStream;
- class ErrorCollector;
- class Tokenizer;
- class LIBPROTOBUF_EXPORT ErrorCollector {
- public:
- inline ErrorCollector() {}
- virtual ~ErrorCollector();
-
-
-
- virtual void AddError(int line, int column, const string& message) = 0;
-
-
-
- virtual void AddWarning(int , int ,
- const string& ) { }
- private:
- GOOGLE_DISALLOW_EVIL_CONSTRUCTORS(ErrorCollector);
- };
- class LIBPROTOBUF_EXPORT Tokenizer {
- public:
-
-
-
- Tokenizer(ZeroCopyInputStream* input, ErrorCollector* error_collector);
- ~Tokenizer();
- enum TokenType {
- TYPE_START,
- TYPE_END,
- TYPE_IDENTIFIER,
-
-
-
- TYPE_INTEGER,
-
-
-
-
-
- TYPE_FLOAT,
-
-
- TYPE_STRING,
-
-
- TYPE_SYMBOL,
-
-
- };
-
- struct Token {
- TokenType type;
- string text;
-
-
-
-
- int line;
- int column;
- int end_column;
- };
-
-
- const Token& current();
-
-
- const Token& previous();
-
-
- bool Next();
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- bool NextWithComments(string* prev_trailing_comments,
- vector<string>* detached_comments,
- string* next_leading_comments);
-
-
-
-
- static double ParseFloat(const string& text);
-
-
-
- static void ParseString(const string& text, string* output);
-
- static void ParseStringAppend(const string& text, string* output);
-
-
-
-
-
- static bool ParseInteger(const string& text, uint64 max_value,
- uint64* output);
-
-
-
-
-
- void set_allow_f_after_float(bool value) { allow_f_after_float_ = value; }
-
- enum CommentStyle {
-
-
- CPP_COMMENT_STYLE,
-
- SH_COMMENT_STYLE
- };
-
- void set_comment_style(CommentStyle style) { comment_style_ = style; }
-
-
- void set_require_space_after_number(bool require) {
- require_space_after_number_ = require;
- }
-
-
- void set_allow_multiline_strings(bool allow) {
- allow_multiline_strings_ = allow;
- }
-
- static bool IsIdentifier(const string& text);
-
- private:
- GOOGLE_DISALLOW_EVIL_CONSTRUCTORS(Tokenizer);
- Token current_;
- Token previous_;
- ZeroCopyInputStream* input_;
- ErrorCollector* error_collector_;
- char current_char_;
- const char* buffer_;
- int buffer_size_;
- int buffer_pos_;
- bool read_error_;
-
- int line_;
- int column_;
-
-
-
-
- string* record_target_;
- int record_start_;
-
- bool allow_f_after_float_;
- CommentStyle comment_style_;
- bool require_space_after_number_;
- bool allow_multiline_strings_;
-
-
- static const int kTabWidth = 8;
-
-
-
- void NextChar();
-
- void Refresh();
- inline void RecordTo(string* target);
- inline void StopRecording();
-
-
- inline void StartToken();
-
-
-
- inline void EndToken();
-
- void AddError(const string& message) {
- error_collector_->AddError(line_, column_, message);
- }
-
-
-
-
-
-
-
- void ConsumeString(char delimiter);
-
-
-
-
-
-
- TokenType ConsumeNumber(bool started_with_zero, bool started_with_dot);
-
- void ConsumeLineComment(string* content);
-
- void ConsumeBlockComment(string* content);
- enum NextCommentStatus {
-
- LINE_COMMENT,
-
- BLOCK_COMMENT,
-
-
- SLASH_NOT_COMMENT,
-
- NO_COMMENT
- };
-
-
- NextCommentStatus TryConsumeCommentStart();
-
-
-
-
-
-
-
-
-
- template<typename CharacterClass>
- inline bool LookingAt();
-
-
-
- template<typename CharacterClass>
- inline bool TryConsumeOne();
-
- inline bool TryConsume(char c);
-
- template<typename CharacterClass>
- inline void ConsumeZeroOrMore();
-
-
-
- template<typename CharacterClass>
- inline void ConsumeOneOrMore(const char* error);
- };
- inline const Tokenizer::Token& Tokenizer::current() {
- return current_;
- }
- inline const Tokenizer::Token& Tokenizer::previous() {
- return previous_;
- }
- inline void Tokenizer::ParseString(const string& text, string* output) {
- output->clear();
- ParseStringAppend(text, output);
- }
- }
- }
- }
- #endif
|