parser.go 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442
  1. package parser
  2. import (
  3. "fmt"
  4. "github/runnignwater/monkey/ast"
  5. "github/runnignwater/monkey/lexer"
  6. "github/runnignwater/monkey/token"
  7. "strconv"
  8. )
  9. /**
  10. * @Author: simon
  11. * @Author: ynwdlxm@163.com
  12. * @Date: 2022/10/2 下午9:55
  13. * @Desc:
  14. */
  15. const (
  16. // 优先级常量
  17. _ int = iota
  18. LOWEST
  19. EQUALS // ==
  20. LESSGREATER // > OR <
  21. SUM // +
  22. PRODUCT // *
  23. PREFIX // -X OR !X
  24. CALL // myFunction(X)
  25. )
  26. // precedences 指派 token 类型的优先级
  27. var precedences = map[token.TypeToken]int{
  28. token.EQ: EQUALS,
  29. token.NOT_EQ: EQUALS,
  30. token.GT: LESSGREATER,
  31. token.LT: LESSGREATER,
  32. token.PLUS: SUM,
  33. token.MINUS: SUM,
  34. token.ASTERISK: PRODUCT,
  35. token.SLASH: PRODUCT,
  36. token.LPAREN: CALL,
  37. }
  38. type (
  39. prefixParseFn func() ast.Expression
  40. infixParseFn func(expression ast.Expression) ast.Expression
  41. )
  42. type Parser struct {
  43. l *lexer.Lexer // point to the instance of the lexer
  44. errors []string
  45. curToken token.Token // point to the current token
  46. peekToken token.Token // point to the next token
  47. prefixParseFns map[token.TypeToken]prefixParseFn
  48. infixParseFns map[token.TypeToken]infixParseFn
  49. }
  50. func New(l *lexer.Lexer) *Parser {
  51. p := &Parser{
  52. l: l,
  53. errors: []string{},
  54. }
  55. p.prefixParseFns = make(map[token.TypeToken]prefixParseFn)
  56. p.registerPrefix(token.IDENT, p.parseIdentifier)
  57. p.registerPrefix(token.INT, p.parseIntegerLiteral)
  58. p.registerPrefix(token.BANG, p.parsePrefixExpression)
  59. p.registerPrefix(token.MINUS, p.parsePrefixExpression)
  60. p.registerPrefix(token.TRUE, p.parseBoolean)
  61. p.registerPrefix(token.FALSE, p.parseBoolean)
  62. p.registerPrefix(token.LPAREN, p.parseGroupedExpression)
  63. p.registerPrefix(token.IF, p.parseIfExpression)
  64. p.registerPrefix(token.FUNCTION, p.parseFunctionLiteral)
  65. p.registerPrefix(token.STRING, p.parseStringLiteral)
  66. p.infixParseFns = make(map[token.TypeToken]infixParseFn)
  67. p.registerInfix(token.PLUS, p.parseInfixExpression)
  68. p.registerInfix(token.MINUS, p.parseInfixExpression)
  69. p.registerInfix(token.ASTERISK, p.parseInfixExpression)
  70. p.registerInfix(token.SLASH, p.parseInfixExpression)
  71. p.registerInfix(token.EQ, p.parseInfixExpression)
  72. p.registerInfix(token.NOT_EQ, p.parseInfixExpression)
  73. p.registerInfix(token.GT, p.parseInfixExpression)
  74. p.registerInfix(token.LT, p.parseInfixExpression)
  75. p.registerInfix(token.LPAREN, p.parseCallExpression)
  76. // Read two tokens, so curToken and peekToken are both set
  77. p.nextToken()
  78. p.nextToken()
  79. return p
  80. }
  81. func (p *Parser) ParseProgram() *ast.Program {
  82. program := &ast.Program{}
  83. program.Statements = []ast.Statement{}
  84. for !p.curTokenIs(token.EOF) {
  85. stmt := p.parseStatement()
  86. if stmt != nil {
  87. program.Statements = append(program.Statements, stmt)
  88. }
  89. p.nextToken()
  90. }
  91. return program
  92. }
  93. func (p *Parser) parseStatement() ast.Statement {
  94. switch p.curToken.Type {
  95. case token.LET:
  96. return p.parseLetStatement()
  97. case token.RETURN:
  98. return p.parseReturnStatement()
  99. default:
  100. return p.parseExpressionStatement()
  101. }
  102. }
  103. func (p *Parser) parseIdentifier() ast.Expression {
  104. return &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  105. }
  106. func (p *Parser) parseBoolean() ast.Expression {
  107. return &ast.Boolean{Token: p.curToken, Value: p.curTokenIs(token.TRUE)}
  108. }
  109. func (p *Parser) parseGroupedExpression() ast.Expression {
  110. defer untrace(trace("parseGroupedExpression"))
  111. p.nextToken()
  112. exp := p.parseExpression(LOWEST)
  113. if !p.expectPeek(token.RPAREN) {
  114. return nil
  115. }
  116. return exp
  117. }
  118. func (p *Parser) parseIfExpression() ast.Expression {
  119. defer untrace(trace("parseIfExpression"))
  120. exp := &ast.IfExpression{Token: p.curToken}
  121. // (
  122. if !p.expectPeek(token.LPAREN) {
  123. return nil
  124. }
  125. p.nextToken()
  126. exp.Condition = p.parseExpression(LOWEST)
  127. // )
  128. if !p.expectPeek(token.RPAREN) {
  129. return nil
  130. }
  131. // {
  132. if !p.expectPeek(token.LBRACE) {
  133. return nil
  134. }
  135. exp.Consequence = p.parseBlockStatement()
  136. // else expression
  137. if p.peekTokenIs(token.ELSE) {
  138. p.nextToken()
  139. if !p.expectPeek(token.LBRACE) {
  140. return nil
  141. }
  142. exp.Alternative = p.parseBlockStatement()
  143. }
  144. return exp
  145. }
  146. func (p *Parser) parseFunctionLiteral() ast.Expression {
  147. lit := &ast.FunctionLiteral{Token: p.curToken}
  148. // (
  149. if !p.expectPeek(token.LPAREN) {
  150. return nil
  151. }
  152. lit.Parameters = p.ParseFunctionParameters()
  153. // {
  154. if !p.expectPeek(token.LBRACE) {
  155. return nil
  156. }
  157. lit.Body = p.parseBlockStatement()
  158. return lit
  159. }
  160. func (p *Parser) parseIntegerLiteral() ast.Expression {
  161. defer untrace(trace("parseIntegerLiteral"))
  162. lit := &ast.IntegerLiteral{Token: p.curToken}
  163. value, err := strconv.ParseInt(p.curToken.Literal, 0, 64)
  164. if err != nil {
  165. msg := fmt.Sprintf("could not parse %q as integer", p.curToken.Literal)
  166. p.errors = append(p.errors, msg)
  167. return nil
  168. }
  169. lit.Value = value
  170. return lit
  171. }
  172. func (p *Parser) parseStringLiteral() ast.Expression {
  173. return &ast.StringLiteral{Token: p.curToken, Value: p.curToken.Literal}
  174. }
  175. func (p *Parser) parseCallExpression(left ast.Expression) ast.Expression {
  176. defer untrace(trace("parseCallExpression"))
  177. // add(2,3) --> Function: add
  178. exp := &ast.CallExpression{Token: p.curToken, Function: left}
  179. exp.Arguments = p.parseCallArguments()
  180. return exp
  181. }
  182. func (p *Parser) parseInfixExpression(left ast.Expression) ast.Expression {
  183. defer untrace(trace("parseInfixExpression"))
  184. exp := &ast.InfixExpression{
  185. Token: p.curToken,
  186. Left: left,
  187. Operator: p.curToken.Literal,
  188. }
  189. precedence := p.curPrecedence()
  190. p.nextToken()
  191. exp.Right = p.parseExpression(precedence)
  192. return exp
  193. }
  194. func (p *Parser) parsePrefixExpression() ast.Expression {
  195. defer untrace(trace("parsePrefixExpression"))
  196. exp := &ast.PrefixExpression{
  197. Token: p.curToken,
  198. Operator: p.curToken.Literal,
  199. }
  200. p.nextToken()
  201. exp.Right = p.parseExpression(PREFIX)
  202. return exp
  203. }
  204. func (p *Parser) parseBlockStatement() *ast.BlockStatement {
  205. defer untrace(trace("parseBlockStatement"))
  206. block := &ast.BlockStatement{Token: p.curToken}
  207. block.Statements = []ast.Statement{}
  208. p.nextToken()
  209. // }
  210. for !p.curTokenIs(token.RBRACE) {
  211. stmt := p.parseStatement()
  212. if stmt != nil {
  213. block.Statements = append(block.Statements, stmt)
  214. }
  215. p.nextToken()
  216. }
  217. return block
  218. }
  219. func (p *Parser) Errors() []string {
  220. return p.errors
  221. }
  222. func (p *Parser) peekError(t token.TypeToken) {
  223. msg := fmt.Sprintf("exepected next token to be %s, got %s instead.", t, p.peekToken.Type)
  224. p.errors = append(p.errors, msg)
  225. }
  226. func (p *Parser) nextToken() {
  227. p.curToken = p.peekToken
  228. p.peekToken = p.l.NextToken()
  229. }
  230. // let <identifier> = <expression>;
  231. func (p *Parser) parseLetStatement() *ast.LetStatement {
  232. stmt := &ast.LetStatement{Token: p.curToken}
  233. // let
  234. if !p.expectPeek(token.IDENT) {
  235. return nil
  236. }
  237. // identifier
  238. stmt.Name = &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  239. // =
  240. if !p.expectPeek(token.ASSIGN) {
  241. return nil
  242. }
  243. p.nextToken()
  244. stmt.Value = p.parseExpression(LOWEST)
  245. // ;
  246. for !p.curTokenIs(token.SEMICOLON) {
  247. p.nextToken()
  248. }
  249. return stmt
  250. }
  251. // return <expression>;
  252. func (p *Parser) parseReturnStatement() *ast.ReturnStatement {
  253. stmt := &ast.ReturnStatement{Token: p.curToken}
  254. p.nextToken()
  255. stmt.ReturnValue = p.parseExpression(LOWEST)
  256. for !p.curTokenIs(token.SEMICOLON) {
  257. p.nextToken()
  258. }
  259. return stmt
  260. }
  261. func (p *Parser) parseExpressionStatement() *ast.ExpressionStatement {
  262. defer untrace(trace("parseExpressionStatement"))
  263. stmt := &ast.ExpressionStatement{Token: p.curToken}
  264. stmt.Expression = p.parseExpression(LOWEST)
  265. if p.peekTokenIs(token.SEMICOLON) {
  266. p.nextToken()
  267. }
  268. return stmt
  269. }
  270. func (p *Parser) parseExpression(precedence int) ast.Expression {
  271. defer untrace(trace("parseExpression"))
  272. prefix := p.prefixParseFns[p.curToken.Type]
  273. if prefix == nil {
  274. p.noPrefixParseFnError(p.curToken.Type)
  275. return nil
  276. }
  277. leftExp := prefix()
  278. for !p.peekTokenIs(token.SEMICOLON) && precedence < p.peekPrecedence() {
  279. infix := p.infixParseFns[p.peekToken.Type]
  280. if infix == nil {
  281. return leftExp
  282. }
  283. p.nextToken()
  284. leftExp = infix(leftExp)
  285. }
  286. return leftExp
  287. }
  288. func (p *Parser) curTokenIs(t token.TypeToken) bool {
  289. return p.curToken.Type == t
  290. }
  291. func (p *Parser) peekTokenIs(t token.TypeToken) bool {
  292. return p.peekToken.Type == t
  293. }
  294. func (p *Parser) expectPeek(t token.TypeToken) bool {
  295. if p.peekTokenIs(t) {
  296. p.nextToken()
  297. return true
  298. } else {
  299. p.peekError(t)
  300. return false
  301. }
  302. }
  303. func (p *Parser) registerPrefix(tokenType token.TypeToken, fn prefixParseFn) {
  304. p.prefixParseFns[tokenType] = fn
  305. }
  306. func (p *Parser) registerInfix(tokenType token.TypeToken, fn infixParseFn) {
  307. p.infixParseFns[tokenType] = fn
  308. }
  309. func (p *Parser) noPrefixParseFnError(t token.TypeToken) {
  310. msg := fmt.Sprintf("no prefix parse function for %s found", t)
  311. p.errors = append(p.errors, msg)
  312. }
  313. func (p *Parser) peekPrecedence() int {
  314. if p, ok := precedences[p.peekToken.Type]; ok {
  315. return p
  316. }
  317. return LOWEST
  318. }
  319. func (p *Parser) curPrecedence() int {
  320. if p, ok := precedences[p.curToken.Type]; ok {
  321. return p
  322. }
  323. return LOWEST
  324. }
  325. func (p *Parser) ParseFunctionParameters() []*ast.Identifier {
  326. identifiers := []*ast.Identifier{}
  327. if p.peekTokenIs(token.RPAREN) {
  328. p.nextToken()
  329. return identifiers
  330. }
  331. p.nextToken()
  332. ident := &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  333. identifiers = append(identifiers, ident)
  334. for p.peekTokenIs(token.COMMA) {
  335. p.nextToken() // ,
  336. p.nextToken()
  337. ident := &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  338. identifiers = append(identifiers, ident)
  339. }
  340. // )
  341. if !p.expectPeek(token.RPAREN) {
  342. return nil
  343. }
  344. return identifiers
  345. }
  346. func (p *Parser) parseCallArguments() []ast.Expression {
  347. args := []ast.Expression{}
  348. // the case (), then null args
  349. if p.peekTokenIs(token.RPAREN) {
  350. p.nextToken()
  351. return args
  352. }
  353. p.nextToken()
  354. args = append(args, p.parseExpression(LOWEST))
  355. for p.peekTokenIs(token.COMMA) {
  356. p.nextToken()
  357. p.nextToken()
  358. args = append(args, p.parseExpression(LOWEST))
  359. }
  360. if !p.expectPeek(token.RPAREN) {
  361. return nil
  362. }
  363. return args
  364. }