Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 1 | #include "parser.h" |
| 2 | |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 3 | #include <unordered_map> |
| 4 | |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 5 | #include "ast.h" |
| 6 | #include "file.h" |
| 7 | #include "loc.h" |
| 8 | #include "log.h" |
| 9 | #include "string_piece.h" |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 10 | #include "strutil.h" |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 11 | #include "value.h" |
| 12 | |
// Tracks whether the previously parsed line was a rule, which decides if a
// following tab-prefixed line is treated as a command.
enum class ParserState {
  // Tab-prefixed lines are not treated as commands in this state.
  NOT_AFTER_RULE = 0,
  // The previous rule line contained a ':'.
  AFTER_RULE = 1,
  // The previous line went through rule parsing but contained no ':'.
  MAYBE_AFTER_RULE = 2,
};
| 18 | |
| 19 | class Parser { |
| 20 | public: |
| 21 | Parser(StringPiece buf, const char* filename, vector<AST*>* asts) |
| 22 | : buf_(buf), |
| 23 | state_(ParserState::NOT_AFTER_RULE), |
| 24 | out_asts_(asts), |
| 25 | loc_(filename, 0), |
| 26 | fixed_lineno_(false) { |
| 27 | } |
| 28 | |
| 29 | ~Parser() { |
| 30 | } |
| 31 | |
| 32 | void Parse() { |
| 33 | l_ = 0; |
| 34 | |
| 35 | for (l_ = 0; l_ < buf_.size();) { |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 36 | size_t lf_cnt = 0; |
| 37 | size_t e = FindEndOfLine(&lf_cnt); |
Shinichiro Hamaji | 8ee8c37 | 2015-06-16 16:19:40 +0900 | [diff] [blame] | 38 | if (!fixed_lineno_) |
| 39 | loc_.lineno += lf_cnt; |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 40 | StringPiece line(buf_.data() + l_, e - l_); |
| 41 | ParseLine(line); |
| 42 | if (e == buf_.size()) |
| 43 | break; |
| 44 | |
| 45 | l_ = e + 1; |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 46 | } |
| 47 | } |
| 48 | |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 49 | static void Init() { |
| 50 | make_directives_ = new unordered_map<StringPiece, DirectiveHandler>; |
Shinichiro Hamaji | 14b8bea | 2015-06-17 03:14:28 +0900 | [diff] [blame] | 51 | (*make_directives_)["include"] = &Parser::ParseInclude; |
| 52 | (*make_directives_)["-include"] = &Parser::ParseInclude; |
| 53 | (*make_directives_)["sinclude"] = &Parser::ParseInclude; |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 54 | (*make_directives_)["define"] = &Parser::ParseDefine; |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 55 | |
| 56 | shortest_directive_len_ = 9999; |
| 57 | longest_directive_len_ = 0; |
| 58 | for (auto p : *make_directives_) { |
| 59 | size_t len = p.first.size(); |
| 60 | shortest_directive_len_ = min(len, shortest_directive_len_); |
| 61 | longest_directive_len_ = max(len, longest_directive_len_); |
| 62 | } |
| 63 | } |
| 64 | |
| 65 | static void Quit() { |
| 66 | delete make_directives_; |
| 67 | } |
| 68 | |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 69 | private: |
| 70 | void Error(const string& msg) { |
Shinichiro Hamaji | 8ee8c37 | 2015-06-16 16:19:40 +0900 | [diff] [blame] | 71 | ERROR("%s:%d: %s", LOCF(loc_), msg.c_str()); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 72 | } |
| 73 | |
| 74 | size_t FindEndOfLine(size_t* lf_cnt) { |
| 75 | size_t e = l_; |
| 76 | bool prev_backslash = false; |
| 77 | for (; e < buf_.size(); e++) { |
| 78 | char c = buf_[e]; |
| 79 | if (c == '\\') { |
| 80 | prev_backslash = !prev_backslash; |
| 81 | } else if (c == '\n') { |
| 82 | ++*lf_cnt; |
| 83 | if (!prev_backslash) { |
| 84 | return e; |
| 85 | } |
| 86 | } else if (c != '\r') { |
| 87 | prev_backslash = false; |
| 88 | } |
| 89 | } |
| 90 | return e; |
| 91 | } |
| 92 | |
| 93 | void ParseLine(StringPiece line) { |
| 94 | if (line.empty() || (line.size() == 1 && line[0] == '\r')) |
| 95 | return; |
| 96 | |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 97 | if (!define_name_.empty()) { |
| 98 | ParseInsideDefine(line); |
| 99 | return; |
| 100 | } |
| 101 | |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 102 | if (line[0] == '\t' && state_ != ParserState::NOT_AFTER_RULE) { |
| 103 | CommandAST* ast = new CommandAST(); |
| 104 | ast->expr = ParseExpr(line.substr(1), true); |
| 105 | out_asts_->push_back(ast); |
| 106 | return; |
| 107 | } |
| 108 | |
Shinichiro Hamaji | 3275062 | 2015-06-17 14:57:33 +0900 | [diff] [blame^] | 109 | line = TrimLeftSpace(line); |
Shinichiro Hamaji | d4e8193 | 2015-06-17 04:40:45 +0900 | [diff] [blame] | 110 | |
| 111 | if (line[0] == '#') |
| 112 | return; |
| 113 | |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 114 | if (HandleDirective(line)) { |
| 115 | return; |
| 116 | } |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 117 | |
| 118 | size_t sep = line.find_first_of(STRING_PIECE("=:")); |
| 119 | if (sep == string::npos) { |
Shinichiro Hamaji | 14b8bea | 2015-06-17 03:14:28 +0900 | [diff] [blame] | 120 | ParseRule(line, sep); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 121 | } else if (line[sep] == '=') { |
Shinichiro Hamaji | 14b8bea | 2015-06-17 03:14:28 +0900 | [diff] [blame] | 122 | ParseAssign(line, sep); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 123 | } else if (line.get(sep+1) == '=') { |
Shinichiro Hamaji | 14b8bea | 2015-06-17 03:14:28 +0900 | [diff] [blame] | 124 | ParseAssign(line, sep+1); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 125 | } else if (line[sep] == ':') { |
Shinichiro Hamaji | 14b8bea | 2015-06-17 03:14:28 +0900 | [diff] [blame] | 126 | ParseRule(line, sep); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 127 | } else { |
| 128 | CHECK(false); |
| 129 | } |
| 130 | } |
| 131 | |
Shinichiro Hamaji | 14b8bea | 2015-06-17 03:14:28 +0900 | [diff] [blame] | 132 | void ParseRule(StringPiece line, size_t sep) { |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 133 | const bool is_rule = line.find(':') != string::npos; |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 134 | RuleAST* ast = new RuleAST(); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 135 | ast->set_loc(loc_); |
| 136 | |
| 137 | size_t found = line.substr(sep + 1).find_first_of("=;"); |
| 138 | if (found != string::npos) { |
| 139 | found += sep + 1; |
| 140 | ast->term = line[found]; |
Shinichiro Hamaji | 3275062 | 2015-06-17 14:57:33 +0900 | [diff] [blame^] | 141 | ast->after_term = ParseExpr(TrimLeftSpace(line.substr(found + 1)), |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 142 | ast->term == ';'); |
Shinichiro Hamaji | 3275062 | 2015-06-17 14:57:33 +0900 | [diff] [blame^] | 143 | ast->expr = ParseExpr(TrimSpace(line.substr(0, found)), false); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 144 | } else { |
| 145 | ast->term = 0; |
| 146 | ast->after_term = NULL; |
Shinichiro Hamaji | 3275062 | 2015-06-17 14:57:33 +0900 | [diff] [blame^] | 147 | ast->expr = ParseExpr(TrimSpace(line), false); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 148 | } |
| 149 | out_asts_->push_back(ast); |
| 150 | state_ = is_rule ? ParserState::AFTER_RULE : ParserState::MAYBE_AFTER_RULE; |
| 151 | } |
| 152 | |
Shinichiro Hamaji | 14b8bea | 2015-06-17 03:14:28 +0900 | [diff] [blame] | 153 | void ParseAssign(StringPiece line, size_t sep) { |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 154 | if (sep == 0) |
| 155 | Error("*** empty variable name ***"); |
| 156 | AssignOp op = AssignOp::EQ; |
| 157 | size_t lhs_end = sep; |
| 158 | switch (line[sep-1]) { |
| 159 | case ':': |
| 160 | lhs_end--; |
| 161 | op = AssignOp::COLON_EQ; |
| 162 | break; |
| 163 | case '+': |
| 164 | lhs_end--; |
| 165 | op = AssignOp::PLUS_EQ; |
| 166 | break; |
| 167 | case '?': |
| 168 | lhs_end--; |
| 169 | op = AssignOp::QUESTION_EQ; |
| 170 | break; |
| 171 | } |
| 172 | |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 173 | AssignAST* ast = new AssignAST(); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 174 | ast->set_loc(loc_); |
Shinichiro Hamaji | 3275062 | 2015-06-17 14:57:33 +0900 | [diff] [blame^] | 175 | ast->lhs = ParseExpr(TrimSpace(line.substr(0, lhs_end)), false); |
| 176 | ast->rhs = ParseExpr(TrimSpace(line.substr(sep + 1)), false); |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 177 | ast->op = op; |
| 178 | ast->directive = AssignDirective::NONE; |
| 179 | out_asts_->push_back(ast); |
| 180 | state_ = ParserState::NOT_AFTER_RULE; |
| 181 | } |
| 182 | |
Shinichiro Hamaji | 14b8bea | 2015-06-17 03:14:28 +0900 | [diff] [blame] | 183 | void ParseInclude(StringPiece line, StringPiece directive) { |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 184 | IncludeAST* ast = new IncludeAST(); |
| 185 | ast->expr = ParseExpr(line, false); |
Shinichiro Hamaji | efad2dd | 2015-06-17 03:08:02 +0900 | [diff] [blame] | 186 | ast->should_exist = directive[0] == 'i'; |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 187 | out_asts_->push_back(ast); |
| 188 | } |
| 189 | |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 190 | void ParseDefine(StringPiece line, StringPiece) { |
| 191 | if (line.empty()) { |
| 192 | Error("*** empty variable name."); |
| 193 | } |
| 194 | define_name_ = line; |
| 195 | define_start_ = 0; |
| 196 | define_start_line_ = loc_.lineno; |
| 197 | } |
| 198 | |
| 199 | void ParseInsideDefine(StringPiece line) { |
Shinichiro Hamaji | 3275062 | 2015-06-17 14:57:33 +0900 | [diff] [blame^] | 200 | if (TrimLeftSpace(line) != "endef") { |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 201 | if (define_start_ == 0) |
| 202 | define_start_ = l_; |
| 203 | return; |
| 204 | } |
| 205 | |
| 206 | AssignAST* ast = new AssignAST(); |
| 207 | ast->set_loc(Loc(loc_.filename, define_start_line_)); |
| 208 | ast->lhs = ParseExpr(define_name_, false); |
| 209 | StringPiece rhs; |
| 210 | if (define_start_) |
Shinichiro Hamaji | 3275062 | 2015-06-17 14:57:33 +0900 | [diff] [blame^] | 211 | rhs = TrimRightSpace(buf_.substr(define_start_, l_ - define_start_)); |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 212 | ast->rhs = ParseExpr(rhs, false); |
| 213 | ast->op = AssignOp::EQ; |
| 214 | ast->directive = AssignDirective::NONE; |
| 215 | out_asts_->push_back(ast); |
| 216 | define_name_.clear(); |
| 217 | } |
| 218 | |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 219 | bool HandleDirective(StringPiece line) { |
| 220 | if (line.size() < shortest_directive_len_) |
| 221 | return false; |
| 222 | StringPiece prefix = line.substr(0, longest_directive_len_ + 1); |
| 223 | size_t space_index = prefix.find(' '); |
| 224 | if (space_index == string::npos) |
| 225 | return false; |
| 226 | StringPiece directive = prefix.substr(0, space_index); |
| 227 | auto found = make_directives_->find(directive); |
| 228 | if (found == make_directives_->end()) |
| 229 | return false; |
| 230 | |
Shinichiro Hamaji | 3275062 | 2015-06-17 14:57:33 +0900 | [diff] [blame^] | 231 | StringPiece rest = TrimLeftSpace(line.substr(directive.size() + 1)); |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 232 | (this->*found->second)(rest, directive); |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 233 | return true; |
| 234 | } |
| 235 | |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 236 | StringPiece buf_; |
| 237 | size_t l_; |
| 238 | ParserState state_; |
| 239 | |
| 240 | vector<AST*>* out_asts_; |
Shinichiro Hamaji | 810fd03 | 2015-06-17 04:38:03 +0900 | [diff] [blame] | 241 | StringPiece define_name_; |
| 242 | size_t define_start_; |
| 243 | int define_start_line_; |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 244 | |
| 245 | Loc loc_; |
| 246 | bool fixed_lineno_; |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 247 | |
| 248 | typedef void (Parser::*DirectiveHandler)( |
| 249 | StringPiece line, StringPiece directive); |
| 250 | static unordered_map<StringPiece, DirectiveHandler>* make_directives_; |
| 251 | static size_t shortest_directive_len_; |
| 252 | static size_t longest_directive_len_; |
Shinichiro Hamaji | 776ca30 | 2015-06-06 03:52:48 +0900 | [diff] [blame] | 253 | }; |
| 254 | |
| 255 | void Parse(Makefile* mk) { |
| 256 | Parser parser(StringPiece(mk->buf(), mk->len()), |
| 257 | mk->filename().c_str(), |
| 258 | mk->mutable_asts()); |
| 259 | parser.Parse(); |
| 260 | } |
Shinichiro Hamaji | 42b625f | 2015-06-16 23:07:21 +0900 | [diff] [blame] | 261 | |
| 262 | void InitParser() { |
| 263 | Parser::Init(); |
| 264 | } |
| 265 | |
| 266 | void QuitParser() { |
| 267 | Parser::Quit(); |
| 268 | } |
| 269 | |
| 270 | unordered_map<StringPiece, Parser::DirectiveHandler>* Parser::make_directives_; |
| 271 | size_t Parser::shortest_directive_len_; |
| 272 | size_t Parser::longest_directive_len_; |