| package parser |
| |
| import ( |
| "errors" |
| "fmt" |
| "io" |
| "sort" |
| "text/scanner" |
| ) |
| |
// errTooManyErrors is the sentinel value errorf panics with once maxErrors
// errors have been recorded; Parse recovers it to stop parsing early.
var errTooManyErrors = errors.New("too many errors")

// maxErrors is the number of recorded errors at which parsing is aborted.
const maxErrors = 100
| |
// ParseError is an error annotated with the scanner position at which it was
// recorded.
type ParseError struct {
	Err error            // underlying error
	Pos scanner.Position // position reported together with Err
}
| |
| func (e *ParseError) Error() string { |
| return fmt.Sprintf("%s: %s", e.Pos, e.Err) |
| } |
| |
| func (p *parser) Parse() ([]Node, []error) { |
| defer func() { |
| if r := recover(); r != nil { |
| if r == errTooManyErrors { |
| return |
| } |
| panic(r) |
| } |
| }() |
| |
| p.parseLines() |
| p.accept(scanner.EOF) |
| p.nodes = append(p.nodes, p.comments...) |
| sort.Sort(byPosition(p.nodes)) |
| |
| return p.nodes, p.errors |
| } |
| |
| type parser struct { |
| scanner scanner.Scanner |
| tok rune |
| errors []error |
| comments []Node |
| nodes []Node |
| lines []int |
| } |
| |
| func NewParser(filename string, r io.Reader) *parser { |
| p := &parser{} |
| p.lines = []int{0} |
| p.scanner.Init(r) |
| p.scanner.Error = func(sc *scanner.Scanner, msg string) { |
| p.errorf(msg) |
| } |
| p.scanner.Whitespace = 0 |
| p.scanner.IsIdentRune = func(ch rune, i int) bool { |
| return ch > 0 && ch != ':' && ch != '#' && ch != '=' && ch != '+' && ch != '$' && |
| ch != '\\' && ch != '(' && ch != ')' && ch != '{' && ch != '}' && ch != ';' && |
| ch != '|' && ch != '?' && ch != '\r' && !isWhitespace(ch) |
| } |
| p.scanner.Mode = scanner.ScanIdents |
| p.scanner.Filename = filename |
| p.next() |
| return p |
| } |
| |
| func (p *parser) Unpack(pos Pos) scanner.Position { |
| offset := int(pos) |
| line := sort.Search(len(p.lines), func(i int) bool { return p.lines[i] > offset }) - 1 |
| return scanner.Position{ |
| Filename: p.scanner.Filename, |
| Line: line + 1, |
| Column: offset - p.lines[line] + 1, |
| Offset: offset, |
| } |
| } |
| |
| func (p *parser) pos() Pos { |
| pos := p.scanner.Position |
| if !pos.IsValid() { |
| pos = p.scanner.Pos() |
| } |
| return Pos(pos.Offset) |
| } |
| |
| func (p *parser) errorf(format string, args ...interface{}) { |
| err := &ParseError{ |
| Err: fmt.Errorf(format, args...), |
| Pos: p.scanner.Position, |
| } |
| p.errors = append(p.errors, err) |
| if len(p.errors) >= maxErrors { |
| panic(errTooManyErrors) |
| } |
| } |
| |
| func (p *parser) accept(toks ...rune) bool { |
| for _, tok := range toks { |
| if p.tok != tok { |
| p.errorf("expected %s, found %s", scanner.TokenString(tok), |
| scanner.TokenString(p.tok)) |
| return false |
| } |
| p.next() |
| } |
| return true |
| } |
| |
| func (p *parser) next() { |
| if p.tok != scanner.EOF { |
| p.tok = p.scanner.Scan() |
| for p.tok == '\r' { |
| p.tok = p.scanner.Scan() |
| } |
| } |
| if p.tok == '\n' { |
| p.lines = append(p.lines, p.scanner.Position.Offset+1) |
| } |
| } |
| |
| func (p *parser) parseLines() { |
| for { |
| p.ignoreWhitespace() |
| |
| if p.parseDirective() { |
| continue |
| } |
| |
| ident := p.parseExpression('=', '?', ':', '#', '\n') |
| |
| p.ignoreSpaces() |
| |
| switch p.tok { |
| case '?': |
| p.accept('?') |
| if p.tok == '=' { |
| p.parseAssignment("?=", nil, ident) |
| } else { |
| p.errorf("expected = after ?") |
| } |
| case '+': |
| p.accept('+') |
| if p.tok == '=' { |
| p.parseAssignment("+=", nil, ident) |
| } else { |
| p.errorf("expected = after +") |
| } |
| case ':': |
| p.accept(':') |
| switch p.tok { |
| case '=': |
| p.parseAssignment(":=", nil, ident) |
| default: |
| p.parseRule(ident) |
| } |
| case '=': |
| p.parseAssignment("=", nil, ident) |
| case '#', '\n', scanner.EOF: |
| ident.TrimRightSpaces() |
| if v, ok := toVariable(ident); ok { |
| p.nodes = append(p.nodes, &v) |
| } else if !ident.Empty() { |
| p.errorf("expected directive, rule, or assignment after ident " + ident.Dump()) |
| } |
| switch p.tok { |
| case scanner.EOF: |
| return |
| case '\n': |
| p.accept('\n') |
| case '#': |
| p.parseComment() |
| } |
| default: |
| p.errorf("expected assignment or rule definition, found %s\n", |
| p.scanner.TokenText()) |
| return |
| } |
| } |
| } |
| |
| func (p *parser) parseDirective() bool { |
| if p.tok != scanner.Ident || !isDirective(p.scanner.TokenText()) { |
| return false |
| } |
| |
| d := p.scanner.TokenText() |
| pos := p.pos() |
| p.accept(scanner.Ident) |
| endPos := NoPos |
| |
| expression := SimpleMakeString("", pos) |
| |
| switch d { |
| case "endif", "endef", "else": |
| // Nothing |
| case "define": |
| expression, endPos = p.parseDefine() |
| default: |
| p.ignoreSpaces() |
| expression = p.parseExpression() |
| } |
| |
| p.nodes = append(p.nodes, &Directive{ |
| NamePos: pos, |
| Name: d, |
| Args: expression, |
| EndPos: endPos, |
| }) |
| return true |
| } |
| |
| func (p *parser) parseDefine() (*MakeString, Pos) { |
| value := SimpleMakeString("", p.pos()) |
| |
| loop: |
| for { |
| switch p.tok { |
| case scanner.Ident: |
| value.appendString(p.scanner.TokenText()) |
| if p.scanner.TokenText() == "endef" { |
| p.accept(scanner.Ident) |
| break loop |
| } |
| p.accept(scanner.Ident) |
| case '\\': |
| p.parseEscape() |
| switch p.tok { |
| case '\n': |
| value.appendString(" ") |
| case scanner.EOF: |
| p.errorf("expected escaped character, found %s", |
| scanner.TokenString(p.tok)) |
| break loop |
| default: |
| value.appendString(`\` + string(p.tok)) |
| } |
| p.accept(p.tok) |
| //TODO: handle variables inside defines? result depends if |
| //define is used in make or rule context |
| //case '$': |
| // variable := p.parseVariable() |
| // value.appendVariable(variable) |
| case scanner.EOF: |
| p.errorf("unexpected EOF while looking for endef") |
| break loop |
| default: |
| value.appendString(p.scanner.TokenText()) |
| p.accept(p.tok) |
| } |
| } |
| |
| return value, p.pos() |
| } |
| |
| func (p *parser) parseEscape() { |
| p.scanner.Mode = 0 |
| p.accept('\\') |
| p.scanner.Mode = scanner.ScanIdents |
| } |
| |
| func (p *parser) parseExpression(end ...rune) *MakeString { |
| value := SimpleMakeString("", p.pos()) |
| |
| endParen := false |
| for _, r := range end { |
| if r == ')' { |
| endParen = true |
| } |
| } |
| parens := 0 |
| |
| loop: |
| for { |
| if endParen && parens > 0 && p.tok == ')' { |
| parens-- |
| value.appendString(")") |
| p.accept(')') |
| continue |
| } |
| |
| for _, r := range end { |
| if p.tok == r { |
| break loop |
| } |
| } |
| |
| switch p.tok { |
| case '\n': |
| break loop |
| case scanner.Ident: |
| value.appendString(p.scanner.TokenText()) |
| p.accept(scanner.Ident) |
| case '\\': |
| p.parseEscape() |
| switch p.tok { |
| case '\n': |
| value.appendString(" ") |
| case scanner.EOF: |
| p.errorf("expected escaped character, found %s", |
| scanner.TokenString(p.tok)) |
| return value |
| default: |
| value.appendString(`\` + string(p.tok)) |
| } |
| p.accept(p.tok) |
| case '#': |
| p.parseComment() |
| break loop |
| case '$': |
| var variable Variable |
| variable = p.parseVariable() |
| value.appendVariable(variable) |
| case scanner.EOF: |
| break loop |
| case '(': |
| if endParen { |
| parens++ |
| } |
| value.appendString("(") |
| p.accept('(') |
| default: |
| value.appendString(p.scanner.TokenText()) |
| p.accept(p.tok) |
| } |
| } |
| |
| if parens > 0 { |
| p.errorf("expected closing paren %s", value.Dump()) |
| } |
| return value |
| } |
| |
| func (p *parser) parseVariable() Variable { |
| pos := p.pos() |
| p.accept('$') |
| var name *MakeString |
| switch p.tok { |
| case '(': |
| return p.parseBracketedVariable('(', ')', pos) |
| case '{': |
| return p.parseBracketedVariable('{', '}', pos) |
| case '$': |
| name = SimpleMakeString("__builtin_dollar", NoPos) |
| case scanner.EOF: |
| p.errorf("expected variable name, found %s", |
| scanner.TokenString(p.tok)) |
| default: |
| name = p.parseExpression(variableNameEndRunes...) |
| } |
| |
| return p.nameToVariable(name) |
| } |
| |
| func (p *parser) parseBracketedVariable(start, end rune, pos Pos) Variable { |
| p.accept(start) |
| name := p.parseExpression(end) |
| p.accept(end) |
| return p.nameToVariable(name) |
| } |
| |
| func (p *parser) nameToVariable(name *MakeString) Variable { |
| return Variable{ |
| Name: name, |
| } |
| } |
| |
| func (p *parser) parseRule(target *MakeString) { |
| prerequisites, newLine := p.parseRulePrerequisites(target) |
| |
| recipe := "" |
| recipePos := p.pos() |
| loop: |
| for { |
| if newLine { |
| if p.tok == '\t' { |
| p.accept('\t') |
| newLine = false |
| continue loop |
| } else if p.parseDirective() { |
| newLine = false |
| continue |
| } else { |
| break loop |
| } |
| } |
| |
| newLine = false |
| switch p.tok { |
| case '\\': |
| p.parseEscape() |
| recipe += string(p.tok) |
| p.accept(p.tok) |
| case '\n': |
| newLine = true |
| recipe += "\n" |
| p.accept('\n') |
| case scanner.EOF: |
| break loop |
| default: |
| recipe += p.scanner.TokenText() |
| p.accept(p.tok) |
| } |
| } |
| |
| if prerequisites != nil { |
| p.nodes = append(p.nodes, &Rule{ |
| Target: target, |
| Prerequisites: prerequisites, |
| Recipe: recipe, |
| RecipePos: recipePos, |
| }) |
| } |
| } |
| |
| func (p *parser) parseRulePrerequisites(target *MakeString) (*MakeString, bool) { |
| newLine := false |
| |
| p.ignoreSpaces() |
| |
| prerequisites := p.parseExpression('#', '\n', ';', ':', '=') |
| |
| switch p.tok { |
| case '\n': |
| p.accept('\n') |
| newLine = true |
| case '#': |
| p.parseComment() |
| newLine = true |
| case ';': |
| p.accept(';') |
| case ':': |
| p.accept(':') |
| if p.tok == '=' { |
| p.parseAssignment(":=", target, prerequisites) |
| return nil, true |
| } else { |
| more := p.parseExpression('#', '\n', ';') |
| prerequisites.appendMakeString(more) |
| } |
| case '=': |
| p.parseAssignment("=", target, prerequisites) |
| return nil, true |
| default: |
| p.errorf("unexpected token %s after rule prerequisites", scanner.TokenString(p.tok)) |
| } |
| |
| return prerequisites, newLine |
| } |
| |
| func (p *parser) parseComment() { |
| pos := p.pos() |
| p.accept('#') |
| comment := "" |
| loop: |
| for { |
| switch p.tok { |
| case '\\': |
| p.parseEscape() |
| if p.tok == '\n' { |
| comment += "\n" |
| } else { |
| comment += "\\" + p.scanner.TokenText() |
| } |
| p.accept(p.tok) |
| case '\n': |
| p.accept('\n') |
| break loop |
| case scanner.EOF: |
| break loop |
| default: |
| comment += p.scanner.TokenText() |
| p.accept(p.tok) |
| } |
| } |
| |
| p.comments = append(p.comments, &Comment{ |
| CommentPos: pos, |
| Comment: comment, |
| }) |
| } |
| |
| func (p *parser) parseAssignment(t string, target *MakeString, ident *MakeString) { |
| // The value of an assignment is everything including and after the first |
| // non-whitespace character after the = until the end of the logical line, |
| // which may included escaped newlines |
| p.accept('=') |
| value := p.parseExpression() |
| value.TrimLeftSpaces() |
| if ident.EndsWith('+') && t == "=" { |
| ident.TrimRightOne() |
| t = "+=" |
| } |
| |
| ident.TrimRightSpaces() |
| |
| p.nodes = append(p.nodes, &Assignment{ |
| Name: ident, |
| Value: value, |
| Target: target, |
| Type: t, |
| }) |
| } |
| |
// androidMkModule holds a set of name/value string assignments.
// NOTE(review): not referenced in the visible part of this file; confirm it
// is still used.
type androidMkModule struct {
	assignments map[string]string
}
| |
| type androidMkFile struct { |
| assignments map[string]string |
| modules []androidMkModule |
| includes []string |
| } |
| |
// directives lists the keywords that isDirective recognizes. init sorts the
// array, which isDirective relies on to stop searching early.
var directives = [...]string{
	"define",
	"else",
	"endef",
	"endif",
	"ifdef",
	"ifeq",
	"ifndef",
	"ifneq",
	"include",
	"-include",
}
| |
// functions lists the names that isFunctionName recognizes. init sorts the
// array, which isFunctionName relies on to stop searching early.
var functions = [...]string{
	"abspath",
	"addprefix",
	"addsuffix",
	"basename",
	"dir",
	"notdir",
	"subst",
	"suffix",
	"filter",
	"filter-out",
	"findstring",
	"firstword",
	"flavor",
	"join",
	"lastword",
	"patsubst",
	"realpath",
	"shell",
	"sort",
	"strip",
	"wildcard",
	"word",
	"wordlist",
	"words",
	"origin",
	"foreach",
	"call",
	"info",
	"error",
	"warning",
	"if",
	"or",
	"and",
	"value",
	"eval",
	"file",
}
| |
| func init() { |
| sort.Strings(directives[:]) |
| sort.Strings(functions[:]) |
| } |
| |
| func isDirective(s string) bool { |
| for _, d := range directives { |
| if s == d { |
| return true |
| } else if s < d { |
| return false |
| } |
| } |
| return false |
| } |
| |
| func isFunctionName(s string) bool { |
| for _, f := range functions { |
| if s == f { |
| return true |
| } else if s < f { |
| return false |
| } |
| } |
| return false |
| } |
| |
// isWhitespace reports whether ch is a space, a tab or a newline.
func isWhitespace(ch rune) bool {
	switch ch {
	case ' ', '\t', '\n':
		return true
	}
	return false
}
| |
// isValidVariableRune reports whether ch is anything other than
// scanner.Ident, ':', '=' or '#'.
func isValidVariableRune(ch rune) bool {
	switch ch {
	case scanner.Ident, ':', '=', '#':
		return false
	}
	return true
}
| |
var (
	// whitespaceRunes holds the runes isWhitespace treats as whitespace.
	whitespaceRunes = []rune{' ', '\t', '\n'}

	// variableNameEndRunes holds the runes that end an unbracketed variable
	// name in parseVariable: ':', '=', '#', ')', '}' and any whitespace rune.
	variableNameEndRunes = append([]rune{':', '=', '#', ')', '}'}, whitespaceRunes...)
)
| |
| func (p *parser) ignoreSpaces() int { |
| skipped := 0 |
| for p.tok == ' ' || p.tok == '\t' { |
| p.accept(p.tok) |
| skipped++ |
| } |
| return skipped |
| } |
| |
| func (p *parser) ignoreWhitespace() { |
| for isWhitespace(p.tok) { |
| p.accept(p.tok) |
| } |
| } |