mirror of
				https://github.com/robertkrimen/otto
				synced 2025-10-19 19:55:30 +08:00 
			
		
		
		
	
		
			
				
	
	
		
			345 lines
		
	
	
		
			8.0 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			345 lines
		
	
	
		
			8.0 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| /*
 | |
| Package parser implements a parser for JavaScript.
 | |
| 
 | |
|     import (
 | |
|         "github.com/robertkrimen/otto/parser"
 | |
|     )
 | |
| 
 | |
| Parse and return an AST
 | |
| 
 | |
|     filename := "" // A filename is optional
 | |
|     src := `
 | |
|         // Sample xyzzy example
 | |
|         (function(){
 | |
|             if (3.14159 > 0) {
 | |
|                 console.log("Hello, World.");
 | |
|                 return;
 | |
|             }
 | |
| 
 | |
|             var xyzzy = NaN;
 | |
|             console.log("Nothing happens.");
 | |
|             return xyzzy;
 | |
|         })();
 | |
|     `
 | |
| 
 | |
|     // Parse some JavaScript, yielding a *ast.Program and/or an ErrorList
 | |
|     program, err := parser.ParseFile(nil, filename, src, 0)
 | |
| 
 | |
| Warning
 | |
| 
 | |
| The parser and AST interfaces are still works-in-progress (particularly where
 | |
| node types are concerned) and may change in the future.
 | |
| 
 | |
| */
 | |
| package parser
 | |
| 
 | |
| import (
 | |
| 	"bytes"
 | |
| 	"errors"
 | |
| 	"io"
 | |
| 	"io/ioutil"
 | |
| 
 | |
| 	"github.com/robertkrimen/otto/ast"
 | |
| 	"github.com/robertkrimen/otto/file"
 | |
| 	"github.com/robertkrimen/otto/token"
 | |
| )
 | |
| 
 | |
| // A Mode value is a set of flags (or 0). They control optional parser functionality.
 | |
| type Mode uint
 | |
| 
 | |
| const (
 | |
| 	IgnoreRegExpErrors Mode = 1 << iota // Ignore RegExp compatibility errors (allow backtracking)
 | |
| 	StoreComments                       // Store the comments from source to the comments map
 | |
| )
 | |
| 
 | |
| type _parser struct {
 | |
| 	str    string
 | |
| 	length int
 | |
| 	base   int
 | |
| 
 | |
| 	chr       rune // The current character
 | |
| 	chrOffset int  // The offset of current character
 | |
| 	offset    int  // The offset after current character (may be greater than 1)
 | |
| 
 | |
| 	idx     file.Idx    // The index of token
 | |
| 	token   token.Token // The token
 | |
| 	literal string      // The literal of the token, if any
 | |
| 
 | |
| 	scope             *_scope
 | |
| 	insertSemicolon   bool // If we see a newline, then insert an implicit semicolon
 | |
| 	implicitSemicolon bool // An implicit semicolon exists
 | |
| 
 | |
| 	errors ErrorList
 | |
| 
 | |
| 	recover struct {
 | |
| 		// Scratch when trying to seek to the next statement, etc.
 | |
| 		idx   file.Idx
 | |
| 		count int
 | |
| 	}
 | |
| 
 | |
| 	mode Mode
 | |
| 
 | |
| 	file *file.File
 | |
| 
 | |
| 	comments         []*ast.Comment
 | |
| 	commentMap       *ast.CommentMap
 | |
| 	skippedLineBreak bool
 | |
| }
 | |
| 
 | |
| func _newParser(filename, src string, base int) *_parser {
 | |
| 	return &_parser{
 | |
| 		chr:              ' ', // This is set so we can start scanning by skipping whitespace
 | |
| 		str:              src,
 | |
| 		length:           len(src),
 | |
| 		base:             base,
 | |
| 		file:             file.NewFile(filename, src, base),
 | |
| 		comments:         make([]*ast.Comment, 0),
 | |
| 		commentMap:       &ast.CommentMap{},
 | |
| 		skippedLineBreak: false,
 | |
| 	}
 | |
| }
 | |
| 
 | |
| func newParser(filename, src string) *_parser {
 | |
| 	return _newParser(filename, src, 1)
 | |
| }
 | |
| 
 | |
| func ReadSource(filename string, src interface{}) ([]byte, error) {
 | |
| 	if src != nil {
 | |
| 		switch src := src.(type) {
 | |
| 		case string:
 | |
| 			return []byte(src), nil
 | |
| 		case []byte:
 | |
| 			return src, nil
 | |
| 		case *bytes.Buffer:
 | |
| 			if src != nil {
 | |
| 				return src.Bytes(), nil
 | |
| 			}
 | |
| 		case io.Reader:
 | |
| 			var bfr bytes.Buffer
 | |
| 			if _, err := io.Copy(&bfr, src); err != nil {
 | |
| 				return nil, err
 | |
| 			}
 | |
| 			return bfr.Bytes(), nil
 | |
| 		}
 | |
| 		return nil, errors.New("invalid source")
 | |
| 	}
 | |
| 	return ioutil.ReadFile(filename)
 | |
| }
 | |
| 
 | |
| // ParseFile parses the source code of a single JavaScript/ECMAScript source file and returns
 | |
| // the corresponding ast.Program node.
 | |
| //
 | |
| // If fileSet == nil, ParseFile parses source without a FileSet.
 | |
| // If fileSet != nil, ParseFile first adds filename and src to fileSet.
 | |
| //
 | |
| // The filename argument is optional and is used for labelling errors, etc.
 | |
| //
 | |
| // src may be a string, a byte slice, a bytes.Buffer, or an io.Reader, but it MUST always be in UTF-8.
 | |
| //
 | |
| //      // Parse some JavaScript, yielding a *ast.Program and/or an ErrorList
 | |
| //      program, err := parser.ParseFile(nil, "", `if (abc > 1) {}`, 0)
 | |
| //
 | |
| func ParseFile(fileSet *file.FileSet, filename string, src interface{}, mode Mode) (*ast.Program, error) {
 | |
| 	str, err := ReadSource(filename, src)
 | |
| 	if err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 	{
 | |
| 		str := string(str)
 | |
| 
 | |
| 		base := 1
 | |
| 		if fileSet != nil {
 | |
| 			base = fileSet.AddFile(filename, str)
 | |
| 		}
 | |
| 
 | |
| 		parser := _newParser(filename, str, base)
 | |
| 		parser.mode = mode
 | |
| 		return parser.parse()
 | |
| 	}
 | |
| }
 | |
| 
 | |
| // ParseFunction parses a given parameter list and body as a function and returns the
 | |
| // corresponding ast.FunctionLiteral node.
 | |
| //
 | |
| // The parameter list, if any, should be a comma-separated list of identifiers.
 | |
| //
 | |
| func ParseFunction(parameterList, body string) (*ast.FunctionLiteral, error) {
 | |
| 
 | |
| 	src := "(function(" + parameterList + ") {\n" + body + "\n})"
 | |
| 
 | |
| 	parser := _newParser("", src, 1)
 | |
| 	program, err := parser.parse()
 | |
| 	if err != nil {
 | |
| 		return nil, err
 | |
| 	}
 | |
| 
 | |
| 	return program.Body[0].(*ast.ExpressionStatement).Expression.(*ast.FunctionLiteral), nil
 | |
| }
 | |
| 
 | |
| func (self *_parser) slice(idx0, idx1 file.Idx) string {
 | |
| 	from := int(idx0) - self.base
 | |
| 	to := int(idx1) - self.base
 | |
| 	if from >= 0 && to <= len(self.str) {
 | |
| 		return self.str[from:to]
 | |
| 	}
 | |
| 
 | |
| 	return ""
 | |
| }
 | |
| 
 | |
| func (self *_parser) parse() (*ast.Program, error) {
 | |
| 	self.next()
 | |
| 	program := self.parseProgram()
 | |
| 	if false {
 | |
| 		self.errors.Sort()
 | |
| 	}
 | |
| 
 | |
| 	self.addCommentStatements(program, ast.FINAL)
 | |
| 
 | |
| 	return program, self.errors.Err()
 | |
| }
 | |
| 
 | |
| func (self *_parser) next() {
 | |
| 	self.token, self.literal, self.idx = self.scan()
 | |
| }
 | |
| 
 | |
| func (self *_parser) optionalSemicolon() {
 | |
| 	if self.token == token.SEMICOLON {
 | |
| 		self.next()
 | |
| 		return
 | |
| 	}
 | |
| 
 | |
| 	if self.implicitSemicolon {
 | |
| 		self.implicitSemicolon = false
 | |
| 		return
 | |
| 	}
 | |
| 
 | |
| 	if self.token != token.EOF && self.token != token.RIGHT_BRACE {
 | |
| 		self.expect(token.SEMICOLON)
 | |
| 	}
 | |
| }
 | |
| 
 | |
| func (self *_parser) semicolon() {
 | |
| 	if self.token != token.RIGHT_PARENTHESIS && self.token != token.RIGHT_BRACE {
 | |
| 		if self.implicitSemicolon {
 | |
| 			self.implicitSemicolon = false
 | |
| 			return
 | |
| 		}
 | |
| 
 | |
| 		self.expect(token.SEMICOLON)
 | |
| 	}
 | |
| }
 | |
| 
 | |
| func (self *_parser) idxOf(offset int) file.Idx {
 | |
| 	return file.Idx(self.base + offset)
 | |
| }
 | |
| 
 | |
| func (self *_parser) expect(value token.Token) file.Idx {
 | |
| 	idx := self.idx
 | |
| 	if self.token != value {
 | |
| 		self.errorUnexpectedToken(self.token)
 | |
| 	}
 | |
| 	self.next()
 | |
| 	return idx
 | |
| }
 | |
| 
 | |
| func lineCount(str string) (int, int) {
 | |
| 	line, last := 0, -1
 | |
| 	pair := false
 | |
| 	for index, chr := range str {
 | |
| 		switch chr {
 | |
| 		case '\r':
 | |
| 			line += 1
 | |
| 			last = index
 | |
| 			pair = true
 | |
| 			continue
 | |
| 		case '\n':
 | |
| 			if !pair {
 | |
| 				line += 1
 | |
| 			}
 | |
| 			last = index
 | |
| 		case '\u2028', '\u2029':
 | |
| 			line += 1
 | |
| 			last = index + 2
 | |
| 		}
 | |
| 		pair = false
 | |
| 	}
 | |
| 	return line, last
 | |
| }
 | |
| 
 | |
| func (self *_parser) position(idx file.Idx) file.Position {
 | |
| 	position := file.Position{}
 | |
| 	offset := int(idx) - self.base
 | |
| 	str := self.str[:offset]
 | |
| 	position.Filename = self.file.Name()
 | |
| 	line, last := lineCount(str)
 | |
| 	position.Line = 1 + line
 | |
| 	if last >= 0 {
 | |
| 		position.Column = offset - last
 | |
| 	} else {
 | |
| 		position.Column = 1 + len(str)
 | |
| 	}
 | |
| 
 | |
| 	return position
 | |
| }
 | |
| 
 | |
| // findComments finds the following comments.
 | |
| // Comments on the same line will be grouped together and returned.
 | |
| // After the first line break, comments will be added as statement comments.
 | |
| func (self *_parser) findComments(ignoreLineBreak bool) []*ast.Comment {
 | |
| 	if self.mode & StoreComments == 0 {
 | |
| 		return nil
 | |
| 	}
 | |
| 	comments := make([]*ast.Comment, 0)
 | |
| 
 | |
| 
 | |
| 	newline := false
 | |
| 
 | |
| 	for self.implicitSemicolon == false || ignoreLineBreak {
 | |
| 		if self.token != token.COMMENT {
 | |
| 			break
 | |
| 		}
 | |
| 
 | |
| 		comment := &ast.Comment{
 | |
| 			Begin:    self.idx,
 | |
| 			Text:     self.literal,
 | |
| 			Position: ast.TBD,
 | |
| 		}
 | |
| 
 | |
| 		newline = self.skippedLineBreak || newline
 | |
| 
 | |
| 		if newline && !ignoreLineBreak {
 | |
| 			self.comments = append(self.comments, comment)
 | |
| 		} else {
 | |
| 			comments = append(comments, comment)
 | |
| 		}
 | |
| 
 | |
| 		self.next()
 | |
| 	}
 | |
| 
 | |
| 	return comments
 | |
| }
 | |
| 
 | |
| // addCommentStatements will add the previously parsed, not positioned comments to the provided node
 | |
| func (self *_parser) addCommentStatements(node ast.Node, position ast.CommentPosition) {
 | |
| 	if len(self.comments) > 0 {
 | |
| 		self.commentMap.AddComments(node, self.comments, position)
 | |
| 
 | |
| 		// Reset comments
 | |
| 		self.comments = make([]*ast.Comment, 0)
 | |
| 	}
 | |
| }
 | |
| 
 | |
| // fetchComments fetches the current comments, resets the slice and returns the comments
 | |
| func (self *_parser) fetchComments() (comments []*ast.Comment) {
 | |
| 	comments = self.comments
 | |
| 	self.comments = nil
 | |
| 
 | |
| 	return comments
 | |
| }
 | |
| 
 | |
| // consumeComments consumes the current comments and appends them to the provided node
 | |
| func (self *_parser) consumeComments(node ast.Node, position ast.CommentPosition) {
 | |
| 	self.commentMap.AddComments(node, self.comments, position)
 | |
| 	self.comments = nil
 | |
| }
 | 
