parser.go 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408
  1. package parser
  2. import (
  3. "fmt"
  4. "github/runnignwater/monkey/ast"
  5. "github/runnignwater/monkey/lexer"
  6. "github/runnignwater/monkey/token"
  7. "strconv"
  8. )
  9. /**
  10. * @Author: simon
  11. * @Author: ynwdlxm@163.com
  12. * @Date: 2022/10/2 下午9:55
  13. * @Desc:
  14. */
  15. const (
  16. // 优先级常量
  17. _ int = iota
  18. LOWEST
  19. EQUALS // ==
  20. LESSGREATER // > OR <
  21. SUM // +
  22. PRODUCT // *
  23. PREFIX // -X OR !X
  24. CALL // myFunction(X)
  25. )
  26. // 指派 token 类型的优先级
  27. var precedences = map[token.TypeToken]int{
  28. token.EQ: EQUALS,
  29. token.NOT_EQ: EQUALS,
  30. token.GT: LESSGREATER,
  31. token.LT: LESSGREATER,
  32. token.PLUS: SUM,
  33. token.MINUS: SUM,
  34. token.ASTERISK: PRODUCT,
  35. token.SLASH: PRODUCT,
  36. }
  37. type (
  38. prefixParseFn func() ast.Expression
  39. infixParseFn func(expression ast.Expression) ast.Expression
  40. )
  41. type Parser struct {
  42. l *lexer.Lexer // point to the instance of the lexer
  43. errors []string
  44. curToken token.Token // point to the current token
  45. peekToken token.Token // point to the next token
  46. prefixParseFns map[token.TypeToken]prefixParseFn
  47. infixParseFns map[token.TypeToken]infixParseFn
  48. }
  49. func New(l *lexer.Lexer) *Parser {
  50. p := &Parser{
  51. l: l,
  52. errors: []string{},
  53. }
  54. p.prefixParseFns = make(map[token.TypeToken]prefixParseFn)
  55. p.registerPrefix(token.IDENT, p.parseIdentifier)
  56. p.registerPrefix(token.INT, p.parseIntegerLiteral)
  57. p.registerPrefix(token.BANG, p.parsePrefixExpression)
  58. p.registerPrefix(token.MINUS, p.parsePrefixExpression)
  59. p.registerPrefix(token.TRUE, p.parseBoolean)
  60. p.registerPrefix(token.FALSE, p.parseBoolean)
  61. p.registerPrefix(token.LPAREN, p.parseGroupedExpression)
  62. p.registerPrefix(token.IF, p.parseIfExpression)
  63. p.registerPrefix(token.FUNCTION, p.parseFunctionLiteral)
  64. p.infixParseFns = make(map[token.TypeToken]infixParseFn)
  65. p.registerInfix(token.PLUS, p.parseInfixExpression)
  66. p.registerInfix(token.MINUS, p.parseInfixExpression)
  67. p.registerInfix(token.ASTERISK, p.parseInfixExpression)
  68. p.registerInfix(token.SLASH, p.parseInfixExpression)
  69. p.registerInfix(token.EQ, p.parseInfixExpression)
  70. p.registerInfix(token.NOT_EQ, p.parseInfixExpression)
  71. p.registerInfix(token.GT, p.parseInfixExpression)
  72. p.registerInfix(token.LT, p.parseInfixExpression)
  73. // Read two tokens, so curToken and peekToken are both set
  74. p.nextToken()
  75. p.nextToken()
  76. return p
  77. }
  78. func (p *Parser) parseIdentifier() ast.Expression {
  79. return &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  80. }
  81. func (p *Parser) parseBoolean() ast.Expression {
  82. return &ast.Boolean{Token: p.curToken, Value: p.curTokenIs(token.TRUE)}
  83. }
  84. func (p *Parser) parseGroupedExpression() ast.Expression {
  85. defer untrace(trace("parseGroupedExpression"))
  86. p.nextToken()
  87. exp := p.parseExpression(LOWEST)
  88. if !p.expectPeek(token.RPAREN) {
  89. return nil
  90. }
  91. return exp
  92. }
  93. func (p *Parser) parseIfExpression() ast.Expression {
  94. defer untrace(trace("parseIfExpression"))
  95. exp := &ast.IfExpression{Token: p.curToken}
  96. // (
  97. if !p.expectPeek(token.LPAREN) {
  98. return nil
  99. }
  100. p.nextToken()
  101. exp.Condition = p.parseExpression(LOWEST)
  102. // )
  103. if !p.expectPeek(token.RPAREN) {
  104. return nil
  105. }
  106. // {
  107. if !p.expectPeek(token.LBRACE) {
  108. return nil
  109. }
  110. exp.Consequence = p.parseBlockStatement()
  111. // else expression
  112. if p.peekTokenIs(token.ELSE) {
  113. p.nextToken()
  114. if !p.expectPeek(token.LBRACE) {
  115. return nil
  116. }
  117. exp.Alternative = p.parseBlockStatement()
  118. }
  119. return exp
  120. }
  121. func (p *Parser) parseFunctionLiteral() ast.Expression {
  122. lit := &ast.FunctionLiteral{Token: p.curToken}
  123. // (
  124. if !p.expectPeek(token.LPAREN) {
  125. return nil
  126. }
  127. lit.Parameters = p.ParseFunctionParameters()
  128. // {
  129. if !p.expectPeek(token.LBRACE) {
  130. return nil
  131. }
  132. lit.Body = p.parseBlockStatement()
  133. return lit
  134. }
  135. func (p *Parser) parseIntegerLiteral() ast.Expression {
  136. defer untrace(trace("parseIntegerLiteral"))
  137. lit := &ast.IntegerLiteral{Token: p.curToken}
  138. value, err := strconv.ParseInt(p.curToken.Literal, 0, 64)
  139. if err != nil {
  140. msg := fmt.Sprintf("could not parse %q as integer", p.curToken.Literal)
  141. p.errors = append(p.errors, msg)
  142. return nil
  143. }
  144. lit.Value = value
  145. return lit
  146. }
  147. func (p *Parser) parseInfixExpression(left ast.Expression) ast.Expression {
  148. defer untrace(trace("parseInfixExpression"))
  149. exp := &ast.InfixExpression{
  150. Token: p.curToken,
  151. Left: left,
  152. Operator: p.curToken.Literal,
  153. }
  154. precedence := p.curPrecedence()
  155. p.nextToken()
  156. exp.Right = p.parseExpression(precedence)
  157. return exp
  158. }
  159. func (p *Parser) parsePrefixExpression() ast.Expression {
  160. defer untrace(trace("parsePrefixExpression"))
  161. exp := &ast.PrefixExpression{
  162. Token: p.curToken,
  163. Operator: p.curToken.Literal,
  164. }
  165. p.nextToken()
  166. exp.Right = p.parseExpression(PREFIX)
  167. return exp
  168. }
  169. func (p *Parser) parseBlockStatement() *ast.BlockStatement {
  170. defer untrace(trace("parseBlockStatement"))
  171. block := &ast.BlockStatement{Token: p.curToken}
  172. block.Statements = []ast.Statement{}
  173. p.nextToken()
  174. // }
  175. for !p.curTokenIs(token.RBRACE) {
  176. stmt := p.parseStatement()
  177. if stmt != nil {
  178. block.Statements = append(block.Statements, stmt)
  179. }
  180. p.nextToken()
  181. }
  182. return block
  183. }
  184. func (p *Parser) Errors() []string {
  185. return p.errors
  186. }
  187. func (p *Parser) peekError(t token.TypeToken) {
  188. msg := fmt.Sprintf("exepected next token to be %s, got %s instead.", t, p.peekToken.Type)
  189. p.errors = append(p.errors, msg)
  190. }
  191. func (p *Parser) nextToken() {
  192. p.curToken = p.peekToken
  193. p.peekToken = p.l.NextToken()
  194. }
  195. func (p *Parser) ParseProgram() *ast.Program {
  196. program := &ast.Program{}
  197. program.Statements = []ast.Statement{}
  198. for !p.curTokenIs(token.EOF) {
  199. stmt := p.parseStatement()
  200. if stmt != nil {
  201. program.Statements = append(program.Statements, stmt)
  202. }
  203. p.nextToken()
  204. }
  205. return program
  206. }
  207. func (p *Parser) parseStatement() ast.Statement {
  208. switch p.curToken.Type {
  209. case token.LET:
  210. return p.parseLetStatement()
  211. case token.RETURN:
  212. return p.parseReturnStatement()
  213. default:
  214. return p.parseExpressionStatement()
  215. }
  216. }
  217. // let <identifier> = <expression>;
  218. func (p *Parser) parseLetStatement() *ast.LetStatement {
  219. stmt := &ast.LetStatement{Token: p.curToken}
  220. // let
  221. if !p.expectPeek(token.IDENT) {
  222. return nil
  223. }
  224. // identifier
  225. stmt.Name = &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  226. // =
  227. if !p.expectPeek(token.ASSIGN) {
  228. return nil
  229. }
  230. // TODO: we're skipping the expression until we
  231. // we encounter a semicolon
  232. // ;
  233. for !p.curTokenIs(token.SEMICOLON) {
  234. p.nextToken()
  235. }
  236. return stmt
  237. }
  238. // return <expression>;
  239. func (p *Parser) parseReturnStatement() *ast.ReturnStatement {
  240. stmt := &ast.ReturnStatement{Token: p.curToken}
  241. p.nextToken()
  242. // TODO: we're skipping the expressions until we
  243. // encounter a semicolon
  244. for !p.curTokenIs(token.SEMICOLON) {
  245. p.nextToken()
  246. }
  247. return stmt
  248. }
  249. func (p *Parser) parseExpressionStatement() *ast.ExpressionStatement {
  250. defer untrace(trace("parseExpressionStatement"))
  251. stmt := &ast.ExpressionStatement{Token: p.curToken}
  252. stmt.Expression = p.parseExpression(LOWEST)
  253. if p.peekTokenIs(token.SEMICOLON) {
  254. p.nextToken()
  255. }
  256. return stmt
  257. }
  258. func (p *Parser) parseExpression(precedence int) ast.Expression {
  259. defer untrace(trace("parseExpression"))
  260. prefix := p.prefixParseFns[p.curToken.Type]
  261. if prefix == nil {
  262. p.noPrefixParseFnError(p.curToken.Type)
  263. return nil
  264. }
  265. leftExp := prefix()
  266. for !p.peekTokenIs(token.SEMICOLON) && precedence < p.peekPrecedence() {
  267. infix := p.infixParseFns[p.peekToken.Type]
  268. if infix == nil {
  269. return leftExp
  270. }
  271. p.nextToken()
  272. leftExp = infix(leftExp)
  273. }
  274. return leftExp
  275. }
  276. func (p *Parser) curTokenIs(t token.TypeToken) bool {
  277. return p.curToken.Type == t
  278. }
  279. func (p *Parser) peekTokenIs(t token.TypeToken) bool {
  280. return p.peekToken.Type == t
  281. }
  282. func (p *Parser) expectPeek(t token.TypeToken) bool {
  283. if p.peekTokenIs(t) {
  284. p.nextToken()
  285. return true
  286. } else {
  287. p.peekError(t)
  288. return false
  289. }
  290. }
  291. func (p *Parser) registerPrefix(tokenType token.TypeToken, fn prefixParseFn) {
  292. p.prefixParseFns[tokenType] = fn
  293. }
  294. func (p *Parser) registerInfix(tokenType token.TypeToken, fn infixParseFn) {
  295. p.infixParseFns[tokenType] = fn
  296. }
  297. func (p *Parser) noPrefixParseFnError(t token.TypeToken) {
  298. msg := fmt.Sprintf("no prefix parse function for %s found", t)
  299. p.errors = append(p.errors, msg)
  300. }
  301. func (p *Parser) peekPrecedence() int {
  302. if p, ok := precedences[p.peekToken.Type]; ok {
  303. return p
  304. }
  305. return LOWEST
  306. }
  307. func (p *Parser) curPrecedence() int {
  308. if p, ok := precedences[p.curToken.Type]; ok {
  309. return p
  310. }
  311. return LOWEST
  312. }
  313. func (p *Parser) ParseFunctionParameters() []*ast.Identifier {
  314. identifiers := []*ast.Identifier{}
  315. if p.peekTokenIs(token.RPAREN) {
  316. p.nextToken()
  317. return identifiers
  318. }
  319. p.nextToken()
  320. ident := &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  321. identifiers = append(identifiers, ident)
  322. for p.peekTokenIs(token.COMMA) {
  323. p.nextToken() // ,
  324. p.nextToken()
  325. ident := &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  326. identifiers = append(identifiers, ident)
  327. }
  328. // )
  329. if !p.expectPeek(token.RPAREN) {
  330. return nil
  331. }
  332. return identifiers
  333. }