parser.go 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514
  1. package parser
  2. import (
  3. "fmt"
  4. "github/runnignwater/monkey/ast"
  5. "github/runnignwater/monkey/lexer"
  6. "github/runnignwater/monkey/token"
  7. "strconv"
  8. )
  9. /**
  10. * @Author: simon
  11. * @Author: ynwdlxm@163.com
  12. * @Date: 2022/10/2 下午9:55
  13. * @Desc:
  14. */
  15. const (
  16. // 优先级常量
  17. _ int = iota
  18. LOWEST
  19. EQUALS // ==
  20. LESSGREATER // > OR <
  21. SUM // +
  22. PRODUCT // *
  23. PREFIX // -X OR !X
  24. CALL // myFunction(X)
  25. INDEX // array[index]
  26. )
  27. // precedences 指派 token 类型的优先级
  28. var precedences = map[token.TypeToken]int{
  29. token.EQ: EQUALS,
  30. token.NOT_EQ: EQUALS,
  31. token.GT: LESSGREATER,
  32. token.LT: LESSGREATER,
  33. token.PLUS: SUM,
  34. token.MINUS: SUM,
  35. token.ASTERISK: PRODUCT,
  36. token.SLASH: PRODUCT,
  37. token.LPAREN: CALL,
  38. token.LBRACKET: INDEX,
  39. }
  40. type (
  41. prefixParseFn func() ast.Expression
  42. infixParseFn func(expression ast.Expression) ast.Expression
  43. )
  44. type Parser struct {
  45. l *lexer.Lexer // point to the instance of the lexer
  46. errors []string
  47. curToken token.Token // point to the current token
  48. peekToken token.Token // point to the next token
  49. prefixParseFns map[token.TypeToken]prefixParseFn
  50. infixParseFns map[token.TypeToken]infixParseFn
  51. }
  52. func New(l *lexer.Lexer) *Parser {
  53. p := &Parser{
  54. l: l,
  55. errors: []string{},
  56. }
  57. p.prefixParseFns = make(map[token.TypeToken]prefixParseFn)
  58. p.registerPrefix(token.IDENT, p.parseIdentifier)
  59. p.registerPrefix(token.INT, p.parseIntegerLiteral)
  60. p.registerPrefix(token.BANG, p.parsePrefixExpression)
  61. p.registerPrefix(token.MINUS, p.parsePrefixExpression)
  62. p.registerPrefix(token.TRUE, p.parseBoolean)
  63. p.registerPrefix(token.FALSE, p.parseBoolean)
  64. p.registerPrefix(token.LPAREN, p.parseGroupedExpression)
  65. p.registerPrefix(token.IF, p.parseIfExpression)
  66. p.registerPrefix(token.FUNCTION, p.parseFunctionLiteral)
  67. p.registerPrefix(token.STRING, p.parseStringLiteral)
  68. p.registerPrefix(token.LBRACKET, p.parseArrayLiteral)
  69. p.registerPrefix(token.LBRACE, p.parseHashLiteral)
  70. p.infixParseFns = make(map[token.TypeToken]infixParseFn)
  71. p.registerInfix(token.PLUS, p.parseInfixExpression)
  72. p.registerInfix(token.MINUS, p.parseInfixExpression)
  73. p.registerInfix(token.ASTERISK, p.parseInfixExpression)
  74. p.registerInfix(token.SLASH, p.parseInfixExpression)
  75. p.registerInfix(token.EQ, p.parseInfixExpression)
  76. p.registerInfix(token.NOT_EQ, p.parseInfixExpression)
  77. p.registerInfix(token.GT, p.parseInfixExpression)
  78. p.registerInfix(token.LT, p.parseInfixExpression)
  79. p.registerInfix(token.LPAREN, p.parseCallExpression)
  80. p.registerInfix(token.LBRACKET, p.parseIndexExpression)
  81. // Read two tokens, so curToken and peekToken are both set
  82. p.nextToken()
  83. p.nextToken()
  84. return p
  85. }
  86. func (p *Parser) ParseProgram() *ast.Program {
  87. program := &ast.Program{}
  88. program.Statements = []ast.Statement{}
  89. for !p.curTokenIs(token.EOF) {
  90. stmt := p.parseStatement()
  91. if stmt != nil {
  92. program.Statements = append(program.Statements, stmt)
  93. }
  94. p.nextToken()
  95. }
  96. return program
  97. }
  98. func (p *Parser) parseStatement() ast.Statement {
  99. switch p.curToken.Type {
  100. case token.LET:
  101. return p.parseLetStatement()
  102. case token.RETURN:
  103. return p.parseReturnStatement()
  104. default:
  105. return p.parseExpressionStatement()
  106. }
  107. }
  108. func (p *Parser) parseIdentifier() ast.Expression {
  109. return &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  110. }
  111. func (p *Parser) parseBoolean() ast.Expression {
  112. return &ast.Boolean{Token: p.curToken, Value: p.curTokenIs(token.TRUE)}
  113. }
  114. func (p *Parser) parseGroupedExpression() ast.Expression {
  115. defer untrace(trace("parseGroupedExpression"))
  116. p.nextToken()
  117. exp := p.parseExpression(LOWEST)
  118. if !p.expectPeek(token.RPAREN) {
  119. return nil
  120. }
  121. return exp
  122. }
  123. func (p *Parser) parseIfExpression() ast.Expression {
  124. defer untrace(trace("parseIfExpression"))
  125. exp := &ast.IfExpression{Token: p.curToken}
  126. // (
  127. if !p.expectPeek(token.LPAREN) {
  128. return nil
  129. }
  130. p.nextToken()
  131. exp.Condition = p.parseExpression(LOWEST)
  132. // )
  133. if !p.expectPeek(token.RPAREN) {
  134. return nil
  135. }
  136. // {
  137. if !p.expectPeek(token.LBRACE) {
  138. return nil
  139. }
  140. exp.Consequence = p.parseBlockStatement()
  141. // else expression
  142. if p.peekTokenIs(token.ELSE) {
  143. p.nextToken()
  144. if !p.expectPeek(token.LBRACE) {
  145. return nil
  146. }
  147. exp.Alternative = p.parseBlockStatement()
  148. }
  149. return exp
  150. }
  151. func (p *Parser) parseFunctionLiteral() ast.Expression {
  152. lit := &ast.FunctionLiteral{Token: p.curToken}
  153. // (
  154. if !p.expectPeek(token.LPAREN) {
  155. return nil
  156. }
  157. lit.Parameters = p.ParseFunctionParameters()
  158. // {
  159. if !p.expectPeek(token.LBRACE) {
  160. return nil
  161. }
  162. lit.Body = p.parseBlockStatement()
  163. return lit
  164. }
  165. func (p *Parser) parseIntegerLiteral() ast.Expression {
  166. defer untrace(trace("parseIntegerLiteral"))
  167. lit := &ast.IntegerLiteral{Token: p.curToken}
  168. value, err := strconv.ParseInt(p.curToken.Literal, 0, 64)
  169. if err != nil {
  170. msg := fmt.Sprintf("could not parse %q as integer", p.curToken.Literal)
  171. p.errors = append(p.errors, msg)
  172. return nil
  173. }
  174. lit.Value = value
  175. return lit
  176. }
  177. func (p *Parser) parseStringLiteral() ast.Expression {
  178. return &ast.StringLiteral{Token: p.curToken, Value: p.curToken.Literal}
  179. }
  180. func (p *Parser) parseArrayLiteral() ast.Expression {
  181. array := &ast.ArrayLiteral{Token: p.curToken}
  182. array.Element = p.parseExpressionList(token.RBRACKET)
  183. return array
  184. }
  185. func (p *Parser) parseHashLiteral() ast.Expression {
  186. hash := &ast.HashLiteral{Token: p.curToken}
  187. hash.Pairs = make(map[ast.Expression]ast.Expression)
  188. for !p.peekTokenIs(token.RBRACE) {
  189. p.nextToken()
  190. key := p.parseExpression(LOWEST)
  191. if !p.expectPeek(token.COLON) {
  192. return nil
  193. }
  194. p.nextToken()
  195. value := p.parseExpression(LOWEST)
  196. hash.Pairs[key] = value
  197. if !p.peekTokenIs(token.RBRACE) && !p.expectPeek(token.COMMA) {
  198. return nil
  199. }
  200. }
  201. if !p.expectPeek(token.RBRACE) {
  202. return nil
  203. }
  204. return hash
  205. }
  206. func (p *Parser) parseCallExpression(left ast.Expression) ast.Expression {
  207. defer untrace(trace("parseCallExpression"))
  208. // add(2,3) --> Function: add
  209. exp := &ast.CallExpression{Token: p.curToken, Function: left}
  210. exp.Arguments = p.parseExpressionList(token.RPAREN)
  211. return exp
  212. }
  213. func (p *Parser) parseIndexExpression(left ast.Expression) ast.Expression {
  214. defer untrace(trace("parseIndexExpression"))
  215. exp := &ast.IndexExpression{Token: p.curToken, Left: left}
  216. p.nextToken()
  217. exp.Index = p.parseExpression(LOWEST)
  218. if !p.expectPeek(token.RBRACKET) {
  219. return nil
  220. }
  221. return exp
  222. }
  223. func (p *Parser) parseInfixExpression(left ast.Expression) ast.Expression {
  224. defer untrace(trace("parseInfixExpression"))
  225. exp := &ast.InfixExpression{
  226. Token: p.curToken,
  227. Left: left,
  228. Operator: p.curToken.Literal,
  229. }
  230. precedence := p.curPrecedence()
  231. p.nextToken()
  232. exp.Right = p.parseExpression(precedence)
  233. return exp
  234. }
  235. func (p *Parser) parsePrefixExpression() ast.Expression {
  236. defer untrace(trace("parsePrefixExpression"))
  237. exp := &ast.PrefixExpression{
  238. Token: p.curToken,
  239. Operator: p.curToken.Literal,
  240. }
  241. p.nextToken()
  242. exp.Right = p.parseExpression(PREFIX)
  243. return exp
  244. }
  245. func (p *Parser) parseBlockStatement() *ast.BlockStatement {
  246. defer untrace(trace("parseBlockStatement"))
  247. block := &ast.BlockStatement{Token: p.curToken}
  248. block.Statements = []ast.Statement{}
  249. p.nextToken()
  250. // }
  251. for !p.curTokenIs(token.RBRACE) {
  252. stmt := p.parseStatement()
  253. if stmt != nil {
  254. block.Statements = append(block.Statements, stmt)
  255. }
  256. p.nextToken()
  257. }
  258. return block
  259. }
  260. func (p *Parser) Errors() []string {
  261. return p.errors
  262. }
  263. func (p *Parser) peekError(t token.TypeToken) {
  264. msg := fmt.Sprintf("exepected next token to be %s, got %s instead.", t, p.peekToken.Type)
  265. p.errors = append(p.errors, msg)
  266. }
  267. func (p *Parser) nextToken() {
  268. p.curToken = p.peekToken
  269. p.peekToken = p.l.NextToken()
  270. }
  271. // let <identifier> = <expression>;
  272. func (p *Parser) parseLetStatement() *ast.LetStatement {
  273. stmt := &ast.LetStatement{Token: p.curToken}
  274. // let
  275. if !p.expectPeek(token.IDENT) {
  276. return nil
  277. }
  278. // identifier
  279. stmt.Name = &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  280. // =
  281. if !p.expectPeek(token.ASSIGN) {
  282. return nil
  283. }
  284. p.nextToken()
  285. stmt.Value = p.parseExpression(LOWEST)
  286. // ;
  287. for !p.curTokenIs(token.SEMICOLON) {
  288. p.nextToken()
  289. }
  290. return stmt
  291. }
  292. // return <expression>;
  293. func (p *Parser) parseReturnStatement() *ast.ReturnStatement {
  294. stmt := &ast.ReturnStatement{Token: p.curToken}
  295. p.nextToken()
  296. stmt.ReturnValue = p.parseExpression(LOWEST)
  297. for !p.curTokenIs(token.SEMICOLON) {
  298. p.nextToken()
  299. }
  300. return stmt
  301. }
  302. func (p *Parser) parseExpressionStatement() *ast.ExpressionStatement {
  303. defer untrace(trace("parseExpressionStatement"))
  304. stmt := &ast.ExpressionStatement{Token: p.curToken}
  305. stmt.Expression = p.parseExpression(LOWEST)
  306. if p.peekTokenIs(token.SEMICOLON) {
  307. p.nextToken()
  308. }
  309. return stmt
  310. }
  311. func (p *Parser) parseExpression(precedence int) ast.Expression {
  312. defer untrace(trace("parseExpression"))
  313. prefix := p.prefixParseFns[p.curToken.Type]
  314. if prefix == nil {
  315. p.noPrefixParseFnError(p.curToken.Type)
  316. return nil
  317. }
  318. leftExp := prefix()
  319. for !p.peekTokenIs(token.SEMICOLON) && precedence < p.peekPrecedence() {
  320. infix := p.infixParseFns[p.peekToken.Type]
  321. if infix == nil {
  322. return leftExp
  323. }
  324. p.nextToken()
  325. leftExp = infix(leftExp)
  326. }
  327. return leftExp
  328. }
  329. func (p *Parser) parseExpressionList(end token.TypeToken) []ast.Expression {
  330. defer untrace(trace("parseExpressionList"))
  331. list := []ast.Expression{}
  332. if p.peekTokenIs(end) {
  333. p.nextToken()
  334. return list
  335. }
  336. p.nextToken()
  337. list = append(list, p.parseExpression(LOWEST))
  338. for p.peekTokenIs(token.COMMA) {
  339. p.nextToken()
  340. p.nextToken()
  341. list = append(list, p.parseExpression(LOWEST))
  342. }
  343. if !p.expectPeek(end) {
  344. return nil
  345. }
  346. return list
  347. }
  348. func (p *Parser) curTokenIs(t token.TypeToken) bool {
  349. return p.curToken.Type == t
  350. }
  351. func (p *Parser) peekTokenIs(t token.TypeToken) bool {
  352. return p.peekToken.Type == t
  353. }
  354. func (p *Parser) expectPeek(t token.TypeToken) bool {
  355. if p.peekTokenIs(t) {
  356. p.nextToken()
  357. return true
  358. } else {
  359. p.peekError(t)
  360. return false
  361. }
  362. }
  363. func (p *Parser) registerPrefix(tokenType token.TypeToken, fn prefixParseFn) {
  364. p.prefixParseFns[tokenType] = fn
  365. }
  366. func (p *Parser) registerInfix(tokenType token.TypeToken, fn infixParseFn) {
  367. p.infixParseFns[tokenType] = fn
  368. }
  369. func (p *Parser) noPrefixParseFnError(t token.TypeToken) {
  370. msg := fmt.Sprintf("no prefix parse function for %s found", t)
  371. p.errors = append(p.errors, msg)
  372. }
  373. func (p *Parser) peekPrecedence() int {
  374. if p, ok := precedences[p.peekToken.Type]; ok {
  375. return p
  376. }
  377. return LOWEST
  378. }
  379. func (p *Parser) curPrecedence() int {
  380. if p, ok := precedences[p.curToken.Type]; ok {
  381. return p
  382. }
  383. return LOWEST
  384. }
  385. func (p *Parser) ParseFunctionParameters() []*ast.Identifier {
  386. identifiers := []*ast.Identifier{}
  387. if p.peekTokenIs(token.RPAREN) {
  388. p.nextToken()
  389. return identifiers
  390. }
  391. p.nextToken()
  392. ident := &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  393. identifiers = append(identifiers, ident)
  394. for p.peekTokenIs(token.COMMA) {
  395. p.nextToken() // ,
  396. p.nextToken()
  397. ident := &ast.Identifier{Token: p.curToken, Value: p.curToken.Literal}
  398. identifiers = append(identifiers, ident)
  399. }
  400. // )
  401. if !p.expectPeek(token.RPAREN) {
  402. return nil
  403. }
  404. return identifiers
  405. }
  406. func (p *Parser) parseCallArguments() []ast.Expression {
  407. args := []ast.Expression{}
  408. // the case (), then null args
  409. if p.peekTokenIs(token.RPAREN) {
  410. p.nextToken()
  411. return args
  412. }
  413. p.nextToken()
  414. args = append(args, p.parseExpression(LOWEST))
  415. for p.peekTokenIs(token.COMMA) {
  416. p.nextToken()
  417. p.nextToken()
  418. args = append(args, p.parseExpression(LOWEST))
  419. }
  420. if !p.expectPeek(token.RPAREN) {
  421. return nil
  422. }
  423. return args
  424. }