class.go 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693
  1. // Package parser provides class diagram parsing based on classDiagram.jison
  2. package parser
  3. import (
  4. "fmt"
  5. "strings"
  6. "mermaid-go/pkg/ast"
  7. "mermaid-go/pkg/lexer"
  8. )
  9. // ClassParser implements class diagram parsing following classDiagram.jison
  10. type ClassParser struct {
  11. tokens []lexer.Token
  12. current int
  13. diagram *ast.ClassDiagram
  14. }
  15. // NewClassParser creates a new class parser
  16. func NewClassParser() *ClassParser {
  17. return &ClassParser{
  18. diagram: ast.NewClassDiagram(),
  19. }
  20. }
  21. // Parse parses class diagram syntax
  22. func (p *ClassParser) Parse(input string) (*ast.ClassDiagram, error) {
  23. // Tokenize
  24. l := lexer.NewLexer(input)
  25. tokens, err := l.Tokenize()
  26. if err != nil {
  27. return nil, fmt.Errorf("lexical analysis failed: %w", err)
  28. }
  29. // Filter tokens
  30. p.tokens = lexer.FilterTokens(tokens)
  31. p.current = 0
  32. p.diagram = ast.NewClassDiagram()
  33. // Parse document
  34. err = p.parseDocument()
  35. if err != nil {
  36. return nil, fmt.Errorf("syntax analysis failed: %w", err)
  37. }
  38. return p.diagram, nil
  39. }
  40. // parseDocument parses the class diagram document
  41. func (p *ClassParser) parseDocument() error {
  42. // Expect classDiagram
  43. if !p.check(lexer.TokenID) || p.peek().Value != "classDiagram" {
  44. return p.error("expected 'classDiagram'")
  45. }
  46. p.advance()
  47. // Parse statements
  48. for !p.isAtEnd() {
  49. if err := p.parseStatement(); err != nil {
  50. return err
  51. }
  52. }
  53. return nil
  54. }
  55. // parseStatement parses individual class diagram statements
  56. func (p *ClassParser) parseStatement() error {
  57. if p.isAtEnd() {
  58. return nil
  59. }
  60. switch {
  61. case p.check(lexer.TokenNewline):
  62. p.advance() // Skip newlines
  63. return nil
  64. case p.checkComment():
  65. return p.parseComment()
  66. case p.check(lexer.TokenClass) || p.checkKeyword("class"):
  67. return p.parseClass()
  68. case p.checkKeyword("direction"):
  69. return p.parseDirection()
  70. case p.checkKeyword("link"):
  71. return p.parseLink()
  72. case p.checkKeyword("click"):
  73. return p.parseClick()
  74. case p.checkKeyword("note"):
  75. return p.parseNote()
  76. case p.checkKeyword("classDef"):
  77. return p.parseClassDef()
  78. case p.check(lexer.TokenID):
  79. // Try to parse as class definition or relation
  80. return p.parseClassOrRelation()
  81. default:
  82. token := p.peek()
  83. return p.error(fmt.Sprintf("unexpected token: %s", token.Value))
  84. }
  85. }
  86. // parseClass parses class statements
  87. func (p *ClassParser) parseClass() error {
  88. // Consume 'class' token
  89. if p.check(lexer.TokenClass) {
  90. p.advance() // consume TokenClass
  91. } else {
  92. p.advance() // consume 'class' keyword
  93. }
  94. if !p.check(lexer.TokenID) {
  95. return p.error("expected class name")
  96. }
  97. className := p.advance().Value
  98. class := &ast.ClassNode{
  99. ID: className,
  100. Label: className,
  101. Type: ast.ClassTypeClass,
  102. Members: make([]*ast.ClassMember, 0),
  103. Methods: make([]*ast.ClassMethod, 0),
  104. Annotations: make([]string, 0),
  105. CssClasses: make([]string, 0),
  106. }
  107. // Check for class body
  108. if p.check(lexer.TokenOpenBrace) {
  109. p.advance() // consume '{'
  110. err := p.parseClassBody(class)
  111. if err != nil {
  112. return err
  113. }
  114. if !p.check(lexer.TokenCloseBrace) {
  115. return p.error("expected '}'")
  116. }
  117. p.advance() // consume '}'
  118. }
  119. p.diagram.Classes[className] = class
  120. return nil
  121. }
  122. // parseClassBody parses the contents of a class body
  123. func (p *ClassParser) parseClassBody(class *ast.ClassNode) error {
  124. for !p.check(lexer.TokenCloseBrace) && !p.isAtEnd() {
  125. if p.check(lexer.TokenNewline) {
  126. p.advance()
  127. continue
  128. }
  129. // Parse member or method
  130. visibility := ast.VisibilityPublic // default
  131. if p.checkVisibility() {
  132. switch p.peek().Value {
  133. case "+":
  134. visibility = ast.VisibilityPublic
  135. case "-":
  136. visibility = ast.VisibilityPrivate
  137. case "#":
  138. visibility = ast.VisibilityProtected
  139. case "~":
  140. visibility = ast.VisibilityPackage
  141. }
  142. p.advance()
  143. }
  144. // Check for annotations like <<interface>>, <<abstract>>
  145. if p.check(lexer.TokenOpenAngle) {
  146. // Look ahead to see if it's << (double angle)
  147. if p.checkNext(lexer.TokenOpenAngle) {
  148. p.advance() // consume first <
  149. p.advance() // consume second <
  150. annotation := ""
  151. for !p.check(lexer.TokenCloseAngle) && !p.isAtEnd() {
  152. if p.check(lexer.TokenID) {
  153. annotation += p.advance().Value
  154. } else {
  155. annotation += p.advance().Value
  156. }
  157. }
  158. // Consume closing >>
  159. if p.check(lexer.TokenCloseAngle) {
  160. p.advance() // consume first >
  161. if p.check(lexer.TokenCloseAngle) {
  162. p.advance() // consume second >
  163. class.Annotations = append(class.Annotations, annotation)
  164. // Update class type based on annotation
  165. switch strings.ToLower(annotation) {
  166. case "interface":
  167. class.Type = ast.ClassTypeInterface
  168. case "abstract":
  169. class.Type = ast.ClassTypeAbstract
  170. case "enumeration", "enum":
  171. class.Type = ast.ClassTypeEnum
  172. }
  173. }
  174. }
  175. continue
  176. }
  177. }
  178. if !p.check(lexer.TokenID) {
  179. return p.error("expected member or method name")
  180. }
  181. name := p.advance().Value
  182. // Check if it's a method (has parentheses)
  183. if p.check(lexer.TokenOpenParen) {
  184. method, err := p.parseMethod(name, visibility)
  185. if err != nil {
  186. return err
  187. }
  188. class.Methods = append(class.Methods, method)
  189. } else {
  190. // It's a member
  191. member, err := p.parseMember(name, visibility)
  192. if err != nil {
  193. return err
  194. }
  195. class.Members = append(class.Members, member)
  196. }
  197. }
  198. return nil
  199. }
  200. // parseMethod parses a method with parameters and return type
  201. func (p *ClassParser) parseMethod(name string, visibility ast.MemberVisibility) (*ast.ClassMethod, error) {
  202. method := &ast.ClassMethod{
  203. Name: name,
  204. Parameters: make([]string, 0),
  205. Visibility: visibility,
  206. }
  207. // Parse opening parenthesis
  208. if !p.check(lexer.TokenOpenParen) {
  209. return nil, p.error("expected '('")
  210. }
  211. p.advance() // consume '('
  212. // Parse parameters
  213. for !p.check(lexer.TokenCloseParen) && !p.isAtEnd() {
  214. if p.check(lexer.TokenID) {
  215. param := p.advance().Value
  216. // Check for parameter type
  217. if p.check(lexer.TokenID) {
  218. paramType := p.advance().Value
  219. method.Parameters = append(method.Parameters, param+" "+paramType)
  220. } else {
  221. method.Parameters = append(method.Parameters, param)
  222. }
  223. }
  224. // Skip commas
  225. if p.check(lexer.TokenComma) {
  226. p.advance()
  227. }
  228. }
  229. if !p.check(lexer.TokenCloseParen) {
  230. return nil, p.error("expected ')'")
  231. }
  232. p.advance() // consume ')'
  233. // Check for return type
  234. if p.check(lexer.TokenID) {
  235. returnType := p.advance().Value
  236. method.Type = returnType
  237. }
  238. return method, nil
  239. }
  240. // parseMember parses a class member/field
  241. func (p *ClassParser) parseMember(name string, visibility ast.MemberVisibility) (*ast.ClassMember, error) {
  242. member := &ast.ClassMember{
  243. Name: name,
  244. Visibility: visibility,
  245. }
  246. // Check for type annotation
  247. if p.check(lexer.TokenID) {
  248. memberType := p.advance().Value
  249. member.Type = memberType
  250. }
  251. return member, nil
  252. }
  253. // parseClassOrRelation parses either a class definition or relationship
  254. func (p *ClassParser) parseClassOrRelation() error {
  255. className := p.advance().Value
  256. // Ensure class exists
  257. p.ensureClass(className)
  258. // Check for relationship operators
  259. if p.checkRelation() {
  260. return p.parseRelation(className)
  261. }
  262. // Check for class body
  263. if p.check(lexer.TokenOpenBrace) {
  264. class := p.diagram.Classes[className]
  265. p.advance() // consume '{'
  266. err := p.parseClassBody(class)
  267. if err != nil {
  268. return err
  269. }
  270. if !p.check(lexer.TokenCloseBrace) {
  271. return p.error("expected '}'")
  272. }
  273. p.advance() // consume '}'
  274. }
  275. return nil
  276. }
  277. // parseRelation parses class relationships
  278. func (p *ClassParser) parseRelation(fromClass string) error {
  279. relationType := p.parseRelationType()
  280. if relationType == "" {
  281. return p.error("expected relationship operator")
  282. }
  283. if !p.check(lexer.TokenID) {
  284. return p.error("expected target class")
  285. }
  286. toClass := p.advance().Value
  287. // Ensure target class exists
  288. p.ensureClass(toClass)
  289. relation := &ast.ClassRelation{
  290. From: fromClass,
  291. To: toClass,
  292. Type: relationType,
  293. }
  294. // Check for label
  295. if p.check(lexer.TokenColon) {
  296. p.advance() // consume ':'
  297. var labelParts []string
  298. for !p.check(lexer.TokenNewline) && !p.isAtEnd() {
  299. labelParts = append(labelParts, p.advance().Value)
  300. }
  301. if len(labelParts) > 0 {
  302. label := strings.TrimSpace(strings.Join(labelParts, " "))
  303. relation.Label = &label
  304. }
  305. }
  306. p.diagram.Relations = append(p.diagram.Relations, relation)
  307. return nil
  308. }
  309. // parseRelationType parses relationship type tokens
  310. func (p *ClassParser) parseRelationType() ast.ClassRelationType {
  311. token := p.peek()
  312. // Check for direct arrow tokens
  313. if p.check(lexer.TokenArrowSolid) {
  314. p.advance() // consume -->
  315. return ast.RelationAssociation
  316. }
  317. if p.check(lexer.TokenArrowDotted) {
  318. p.advance() // consume -.->
  319. return ast.RelationDependency
  320. }
  321. // Check for inheritance: --|>
  322. if token.Value == "--" && p.checkNext(lexer.TokenPipe) && p.checkAt(2, lexer.TokenCloseAngle) {
  323. p.advance() // --
  324. p.advance() // |
  325. p.advance() // >
  326. return ast.RelationInheritance
  327. }
  328. // Check for composition: --*
  329. if token.Value == "--" && p.checkNextValue("*") {
  330. p.advance() // --
  331. p.advance() // *
  332. return ast.RelationComposition
  333. }
  334. // Check for aggregation: --o
  335. if token.Value == "--" && p.checkNextValue("o") {
  336. p.advance() // --
  337. p.advance() // o
  338. return ast.RelationAggregation
  339. }
  340. // Check for association: -->
  341. if token.Value == "--" && p.checkNext(lexer.TokenCloseAngle) {
  342. p.advance() // --
  343. p.advance() // >
  344. return ast.RelationAssociation
  345. }
  346. // Check for realization: ..|>
  347. if token.Value == ".." && p.checkNext(lexer.TokenPipe) && p.checkAt(2, lexer.TokenCloseAngle) {
  348. p.advance() // ..
  349. p.advance() // |
  350. p.advance() // >
  351. return ast.RelationRealization
  352. }
  353. // Check for dependency: ..>
  354. if token.Value == ".." && p.checkNext(lexer.TokenCloseAngle) {
  355. p.advance() // ..
  356. p.advance() // >
  357. return ast.RelationDependency
  358. }
  359. return ""
  360. }
  361. // parseDirection parses direction statements
  362. func (p *ClassParser) parseDirection() error {
  363. p.advance() // consume 'direction'
  364. // Check for direction tokens or ID
  365. var direction string
  366. if p.check(lexer.TokenTD) || p.check(lexer.TokenTB) || p.check(lexer.TokenBT) ||
  367. p.check(lexer.TokenRL) || p.check(lexer.TokenLR) {
  368. direction = p.advance().Value
  369. } else if p.check(lexer.TokenID) {
  370. direction = p.advance().Value
  371. } else {
  372. return p.error("expected direction value (TD, TB, BT, RL, LR)")
  373. }
  374. p.diagram.Direction = direction
  375. return nil
  376. }
  377. // parseLink, parseClick, parseNote, parseClassDef - placeholder implementations
  378. func (p *ClassParser) parseLink() error {
  379. return p.skipToNextStatement()
  380. }
  381. func (p *ClassParser) parseClick() error {
  382. return p.skipToNextStatement()
  383. }
  384. func (p *ClassParser) parseClassDef() error {
  385. return p.skipToNextStatement()
  386. }
  387. // ensureClass ensures a class exists, creating it if needed
  388. func (p *ClassParser) ensureClass(id string) {
  389. if _, exists := p.diagram.Classes[id]; !exists {
  390. class := &ast.ClassNode{
  391. ID: id,
  392. Label: id,
  393. Type: ast.ClassTypeClass,
  394. Members: make([]*ast.ClassMember, 0),
  395. Methods: make([]*ast.ClassMethod, 0),
  396. Annotations: make([]string, 0),
  397. CssClasses: make([]string, 0),
  398. }
  399. p.diagram.Classes[id] = class
  400. }
  401. }
  402. // Helper methods
  403. func (p *ClassParser) check(tokenType lexer.TokenType) bool {
  404. if p.isAtEnd() {
  405. return false
  406. }
  407. return p.peek().Type == tokenType
  408. }
  409. func (p *ClassParser) checkNext(tokenType lexer.TokenType) bool {
  410. if p.current+1 >= len(p.tokens) {
  411. return false
  412. }
  413. return p.tokens[p.current+1].Type == tokenType
  414. }
  415. func (p *ClassParser) checkAt(offset int, tokenType lexer.TokenType) bool {
  416. if p.current+offset >= len(p.tokens) {
  417. return false
  418. }
  419. return p.tokens[p.current+offset].Type == tokenType
  420. }
  421. func (p *ClassParser) checkNextValue(value string) bool {
  422. if p.current+1 >= len(p.tokens) {
  423. return false
  424. }
  425. return p.tokens[p.current+1].Value == value
  426. }
  427. func (p *ClassParser) checkKeyword(keyword string) bool {
  428. if p.isAtEnd() {
  429. return false
  430. }
  431. token := p.peek()
  432. return token.Type == lexer.TokenID && strings.ToLower(token.Value) == strings.ToLower(keyword)
  433. }
  434. func (p *ClassParser) checkVisibility() bool {
  435. if p.isAtEnd() {
  436. return false
  437. }
  438. token := p.peek()
  439. return (token.Value == "+" || token.Value == "-" || token.Value == "#" || token.Value == "~") ||
  440. (token.Type == lexer.TokenPlus || token.Type == lexer.TokenMinus ||
  441. token.Type == lexer.TokenHash || token.Type == lexer.TokenTilde)
  442. }
  443. func (p *ClassParser) checkRelation() bool {
  444. token := p.peek()
  445. // Check for various relation operators
  446. return token.Value == "--" || token.Value == ".." ||
  447. p.check(lexer.TokenArrowSolid) || p.check(lexer.TokenArrowDotted) ||
  448. token.Value == "--|>" || token.Value == "--*" || token.Value == "--o"
  449. }
  450. func (p *ClassParser) advance() lexer.Token {
  451. if !p.isAtEnd() {
  452. p.current++
  453. }
  454. return p.previous()
  455. }
  456. func (p *ClassParser) isAtEnd() bool {
  457. return p.current >= len(p.tokens) || p.peek().Type == lexer.TokenEOF
  458. }
  459. func (p *ClassParser) peek() lexer.Token {
  460. if p.current >= len(p.tokens) {
  461. return lexer.Token{Type: lexer.TokenEOF}
  462. }
  463. return p.tokens[p.current]
  464. }
  465. func (p *ClassParser) previous() lexer.Token {
  466. if p.current <= 0 {
  467. return lexer.Token{Type: lexer.TokenEOF}
  468. }
  469. return p.tokens[p.current-1]
  470. }
  471. func (p *ClassParser) error(message string) error {
  472. token := p.peek()
  473. return fmt.Errorf("parse error at line %d, column %d: %s (got %s)",
  474. token.Line, token.Column, message, token.Type)
  475. }
  476. func (p *ClassParser) skipToNextStatement() error {
  477. for !p.isAtEnd() && !p.check(lexer.TokenNewline) {
  478. p.advance()
  479. }
  480. if p.check(lexer.TokenNewline) {
  481. p.advance()
  482. }
  483. return nil
  484. }
  485. // checkComment checks if current token sequence is a comment (%%)
  486. func (p *ClassParser) checkComment() bool {
  487. return p.check(lexer.TokenPercent) && p.checkNext(lexer.TokenPercent)
  488. }
  489. // parseComment parses comment statements
  490. func (p *ClassParser) parseComment() error {
  491. p.advance() // consume first %
  492. p.advance() // consume second %
  493. // Skip everything until newline
  494. for !p.check(lexer.TokenNewline) && !p.isAtEnd() {
  495. p.advance()
  496. }
  497. if p.check(lexer.TokenNewline) {
  498. p.advance()
  499. }
  500. return nil
  501. }
  502. // Enhanced parseNote to support class-specific notes
  503. func (p *ClassParser) parseNote() error {
  504. p.advance() // consume 'note'
  505. var note *ast.ClassNote
  506. // Check if it's "note for ClassName"
  507. if p.checkKeyword("for") {
  508. p.advance() // consume 'for'
  509. if !p.check(lexer.TokenID) {
  510. return p.error("expected class name after 'note for'")
  511. }
  512. className := p.advance().Value
  513. // Parse note text
  514. text := ""
  515. for !p.check(lexer.TokenNewline) && !p.isAtEnd() {
  516. token := p.advance()
  517. if token.Type == lexer.TokenString {
  518. // Remove quotes from string tokens
  519. val := token.Value
  520. text += val[1 : len(val)-1] // Remove surrounding quotes
  521. } else {
  522. text += token.Value + " "
  523. }
  524. }
  525. note = &ast.ClassNote{
  526. ForClass: &className,
  527. Text: strings.TrimSpace(text),
  528. }
  529. } else {
  530. // General note for the whole diagram
  531. text := ""
  532. for !p.check(lexer.TokenNewline) && !p.isAtEnd() {
  533. token := p.advance()
  534. if token.Type == lexer.TokenString {
  535. // Remove quotes from string tokens
  536. val := token.Value
  537. text += val[1 : len(val)-1] // Remove surrounding quotes
  538. } else {
  539. text += token.Value + " "
  540. }
  541. }
  542. note = &ast.ClassNote{
  543. Text: strings.TrimSpace(text),
  544. }
  545. }
  546. p.diagram.Notes = append(p.diagram.Notes, note)
  547. return nil
  548. }
  549. // parseGeneric parses generic type parameters with ~Type~
  550. func (p *ClassParser) parseGeneric() (*ast.Generic, error) {
  551. if !p.check(lexer.TokenTilde) {
  552. return nil, p.error("expected '~' for generic type")
  553. }
  554. p.advance() // consume ~
  555. if !p.check(lexer.TokenID) {
  556. return nil, p.error("expected generic type name")
  557. }
  558. typeName := p.advance().Value
  559. generic := &ast.Generic{
  560. Name: typeName,
  561. Arguments: make([]*ast.Generic, 0),
  562. }
  563. // Check for nested generics like List<String>
  564. if p.check(lexer.TokenOpenAngle) {
  565. p.advance() // consume <
  566. for !p.check(lexer.TokenCloseAngle) && !p.isAtEnd() {
  567. if p.check(lexer.TokenTilde) {
  568. nestedGeneric, err := p.parseGeneric()
  569. if err != nil {
  570. return nil, err
  571. }
  572. generic.Arguments = append(generic.Arguments, nestedGeneric)
  573. } else if p.check(lexer.TokenID) {
  574. // Simple type argument
  575. argType := p.advance().Value
  576. generic.Arguments = append(generic.Arguments, &ast.Generic{
  577. Name: argType,
  578. })
  579. }
  580. if p.check(lexer.TokenComma) {
  581. p.advance() // consume comma
  582. }
  583. }
  584. if !p.check(lexer.TokenCloseAngle) {
  585. return nil, p.error("expected '>' to close generic")
  586. }
  587. p.advance() // consume >
  588. }
  589. if !p.check(lexer.TokenTilde) {
  590. return nil, p.error("expected closing '~' for generic type")
  591. }
  592. p.advance() // consume closing ~
  593. return generic, nil
  594. }