class.go 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721
  1. // Package parser provides class diagram parsing based on classDiagram.jison
  2. package parser
  3. import (
  4. "fmt"
  5. "strings"
  6. "mermaid-go/pkg/ast"
  7. "mermaid-go/pkg/lexer"
  8. )
  9. // ClassParser implements class diagram parsing following classDiagram.jison
  10. type ClassParser struct {
  11. tokens []lexer.Token
  12. current int
  13. diagram *ast.ClassDiagram
  14. }
  15. // NewClassParser creates a new class parser
  16. func NewClassParser() *ClassParser {
  17. return &ClassParser{
  18. diagram: ast.NewClassDiagram(),
  19. }
  20. }
  21. // Parse parses class diagram syntax
  22. func (p *ClassParser) Parse(input string) (*ast.ClassDiagram, error) {
  23. // Tokenize
  24. l := lexer.NewLexer(input)
  25. tokens, err := l.Tokenize()
  26. if err != nil {
  27. return nil, fmt.Errorf("lexical analysis failed: %w", err)
  28. }
  29. // Filter tokens
  30. p.tokens = lexer.FilterTokens(tokens)
  31. p.current = 0
  32. p.diagram = ast.NewClassDiagram()
  33. // Parse document
  34. err = p.parseDocument()
  35. if err != nil {
  36. return nil, fmt.Errorf("syntax analysis failed: %w", err)
  37. }
  38. return p.diagram, nil
  39. }
  40. // parseDocument parses the class diagram document
  41. func (p *ClassParser) parseDocument() error {
  42. // Expect classDiagram
  43. if !p.check(lexer.TokenID) || p.peek().Value != "classDiagram" {
  44. return p.error("expected 'classDiagram'")
  45. }
  46. p.advance()
  47. // Parse statements
  48. for !p.isAtEnd() {
  49. if err := p.parseStatement(); err != nil {
  50. return err
  51. }
  52. }
  53. return nil
  54. }
  55. // parseStatement parses individual class diagram statements
  56. func (p *ClassParser) parseStatement() error {
  57. if p.isAtEnd() {
  58. return nil
  59. }
  60. switch {
  61. case p.check(lexer.TokenNewline):
  62. p.advance() // Skip newlines
  63. return nil
  64. case p.checkComment():
  65. return p.parseComment()
  66. case p.check(lexer.TokenClass) || p.checkKeyword("class"):
  67. return p.parseClass()
  68. case p.checkKeyword("direction"):
  69. return p.parseDirection()
  70. case p.checkKeyword("link"):
  71. return p.parseLink()
  72. case p.checkKeyword("click"):
  73. return p.parseClick()
  74. case p.checkKeyword("note"):
  75. return p.parseNote()
  76. case p.checkKeyword("classDef"):
  77. return p.parseClassDef()
  78. case p.check(lexer.TokenID):
  79. // Try to parse as class definition or relation
  80. return p.parseClassOrRelation()
  81. default:
  82. token := p.peek()
  83. return p.error(fmt.Sprintf("unexpected token: %s", token.Value))
  84. }
  85. }
  86. // parseClass parses class statements
  87. func (p *ClassParser) parseClass() error {
  88. // Consume 'class' token
  89. if p.check(lexer.TokenClass) {
  90. p.advance() // consume TokenClass
  91. } else {
  92. p.advance() // consume 'class' keyword
  93. }
  94. if !p.check(lexer.TokenID) {
  95. return p.error("expected class name")
  96. }
  97. className := p.advance().Value
  98. class := &ast.ClassNode{
  99. ID: className,
  100. Label: className,
  101. Type: ast.ClassTypeClass,
  102. Members: make([]*ast.ClassMember, 0),
  103. Methods: make([]*ast.ClassMethod, 0),
  104. Annotations: make([]string, 0),
  105. CssClasses: make([]string, 0),
  106. }
  107. // Check for class body
  108. if p.check(lexer.TokenOpenBrace) {
  109. p.advance() // consume '{'
  110. err := p.parseClassBody(class)
  111. if err != nil {
  112. return err
  113. }
  114. if !p.check(lexer.TokenCloseBrace) {
  115. return p.error("expected '}'")
  116. }
  117. p.advance() // consume '}'
  118. }
  119. p.diagram.Classes[className] = class
  120. return nil
  121. }
  122. // parseClassBody parses the contents of a class body
  123. func (p *ClassParser) parseClassBody(class *ast.ClassNode) error {
  124. for !p.check(lexer.TokenCloseBrace) && !p.isAtEnd() {
  125. if p.check(lexer.TokenNewline) {
  126. p.advance()
  127. continue
  128. }
  129. // Parse member or method
  130. visibility := ast.VisibilityPublic // default
  131. if p.checkVisibility() {
  132. switch p.peek().Value {
  133. case "+":
  134. visibility = ast.VisibilityPublic
  135. case "-":
  136. visibility = ast.VisibilityPrivate
  137. case "#":
  138. visibility = ast.VisibilityProtected
  139. case "~":
  140. visibility = ast.VisibilityPackage
  141. }
  142. p.advance()
  143. }
  144. // Check for annotations like <<interface>>, <<abstract>>
  145. if p.check(lexer.TokenOpenAngle) {
  146. // Look ahead to see if it's << (double angle)
  147. if p.checkNext(lexer.TokenOpenAngle) {
  148. p.advance() // consume first <
  149. p.advance() // consume second <
  150. annotation := ""
  151. for !p.check(lexer.TokenCloseAngle) && !p.isAtEnd() {
  152. if p.check(lexer.TokenID) {
  153. annotation += p.advance().Value
  154. } else {
  155. annotation += p.advance().Value
  156. }
  157. }
  158. // Consume closing >>
  159. if p.check(lexer.TokenCloseAngle) {
  160. p.advance() // consume first >
  161. if p.check(lexer.TokenCloseAngle) {
  162. p.advance() // consume second >
  163. class.Annotations = append(class.Annotations, annotation)
  164. // Update class type based on annotation
  165. switch strings.ToLower(annotation) {
  166. case "interface":
  167. class.Type = ast.ClassTypeInterface
  168. case "abstract":
  169. class.Type = ast.ClassTypeAbstract
  170. case "enumeration", "enum":
  171. class.Type = ast.ClassTypeEnum
  172. }
  173. }
  174. }
  175. continue
  176. }
  177. }
  178. if !p.check(lexer.TokenID) {
  179. return p.error("expected member or method name")
  180. }
  181. name := p.advance().Value
  182. // Check if it's a method (has parentheses)
  183. if p.check(lexer.TokenOpenParen) {
  184. method, err := p.parseMethod(name, visibility)
  185. if err != nil {
  186. return err
  187. }
  188. class.Methods = append(class.Methods, method)
  189. } else {
  190. // It's a member
  191. member, err := p.parseMember(name, visibility)
  192. if err != nil {
  193. return err
  194. }
  195. class.Members = append(class.Members, member)
  196. }
  197. }
  198. return nil
  199. }
  200. // parseMethod parses a method with parameters and return type
  201. func (p *ClassParser) parseMethod(name string, visibility ast.MemberVisibility) (*ast.ClassMethod, error) {
  202. method := &ast.ClassMethod{
  203. Name: name,
  204. Parameters: make([]string, 0),
  205. Visibility: visibility,
  206. }
  207. // Parse opening parenthesis
  208. if !p.check(lexer.TokenOpenParen) {
  209. return nil, p.error("expected '('")
  210. }
  211. p.advance() // consume '('
  212. // Parse parameters
  213. for !p.check(lexer.TokenCloseParen) && !p.isAtEnd() {
  214. if p.check(lexer.TokenID) {
  215. param := p.advance().Value
  216. // Check for parameter type
  217. if p.check(lexer.TokenID) {
  218. paramType := p.advance().Value
  219. method.Parameters = append(method.Parameters, param+" "+paramType)
  220. } else {
  221. method.Parameters = append(method.Parameters, param)
  222. }
  223. }
  224. // Skip commas
  225. if p.check(lexer.TokenComma) {
  226. p.advance()
  227. }
  228. }
  229. if !p.check(lexer.TokenCloseParen) {
  230. return nil, p.error("expected ')'")
  231. }
  232. p.advance() // consume ')'
  233. // Check for return type
  234. if p.check(lexer.TokenID) {
  235. returnType := p.advance().Value
  236. method.Type = returnType
  237. }
  238. return method, nil
  239. }
  240. // parseMember parses a class member/field
  241. func (p *ClassParser) parseMember(name string, visibility ast.MemberVisibility) (*ast.ClassMember, error) {
  242. member := &ast.ClassMember{
  243. Name: name,
  244. Visibility: visibility,
  245. }
  246. // Check for type annotation
  247. if p.check(lexer.TokenID) {
  248. memberType := p.advance().Value
  249. member.Type = memberType
  250. }
  251. return member, nil
  252. }
  253. // parseClassOrRelation parses either a class definition or relationship
  254. func (p *ClassParser) parseClassOrRelation() error {
  255. className := p.advance().Value
  256. // Ensure class exists
  257. p.ensureClass(className)
  258. // Check for relationship operators
  259. if p.checkRelation() {
  260. return p.parseRelation(className)
  261. }
  262. // Check for class body
  263. if p.check(lexer.TokenOpenBrace) {
  264. class := p.diagram.Classes[className]
  265. p.advance() // consume '{'
  266. err := p.parseClassBody(class)
  267. if err != nil {
  268. return err
  269. }
  270. if !p.check(lexer.TokenCloseBrace) {
  271. return p.error("expected '}'")
  272. }
  273. p.advance() // consume '}'
  274. }
  275. return nil
  276. }
  277. // parseRelation parses class relationships
  278. func (p *ClassParser) parseRelation(fromClass string) error {
  279. relationType := p.parseRelationType()
  280. if relationType == "" {
  281. return p.error("expected relationship operator")
  282. }
  283. if !p.check(lexer.TokenID) {
  284. return p.error("expected target class")
  285. }
  286. toClass := p.advance().Value
  287. // Ensure target class exists
  288. p.ensureClass(toClass)
  289. relation := &ast.ClassRelation{
  290. From: fromClass,
  291. To: toClass,
  292. Type: relationType,
  293. }
  294. // Check for label
  295. if p.check(lexer.TokenColon) {
  296. p.advance() // consume ':'
  297. var labelParts []string
  298. for !p.check(lexer.TokenNewline) && !p.isAtEnd() {
  299. labelParts = append(labelParts, p.advance().Value)
  300. }
  301. if len(labelParts) > 0 {
  302. label := strings.TrimSpace(strings.Join(labelParts, " "))
  303. relation.Label = &label
  304. }
  305. }
  306. p.diagram.Relations = append(p.diagram.Relations, relation)
  307. return nil
  308. }
  309. // parseRelationType parses relationship type tokens
  310. func (p *ClassParser) parseRelationType() ast.ClassRelationType {
  311. token := p.peek()
  312. // Check for compound class diagram relationship tokens
  313. switch token.Type {
  314. case lexer.TokenClassInheritance:
  315. p.advance()
  316. return ast.RelationInheritance
  317. case lexer.TokenClassComposition:
  318. p.advance()
  319. return ast.RelationComposition
  320. case lexer.TokenClassAggregation:
  321. p.advance()
  322. return ast.RelationAggregation
  323. case lexer.TokenClassAssociation:
  324. p.advance()
  325. return ast.RelationAssociation
  326. case lexer.TokenClassRealization:
  327. p.advance()
  328. return ast.RelationRealization
  329. case lexer.TokenClassDependency:
  330. p.advance()
  331. return ast.RelationDependency
  332. }
  333. // Check for direct arrow tokens (fallback)
  334. if p.check(lexer.TokenArrowSolid) {
  335. p.advance() // consume -->
  336. return ast.RelationAssociation
  337. }
  338. if p.check(lexer.TokenArrowDotted) {
  339. p.advance() // consume -.->
  340. return ast.RelationDependency
  341. }
  342. // Check for inheritance: --|>
  343. if token.Value == "--" && p.checkNext(lexer.TokenPipe) && p.checkAt(2, lexer.TokenCloseAngle) {
  344. p.advance() // --
  345. p.advance() // |
  346. p.advance() // >
  347. return ast.RelationInheritance
  348. }
  349. // Check for composition: --*
  350. if token.Value == "--" && p.checkNextValue("*") {
  351. p.advance() // --
  352. p.advance() // *
  353. return ast.RelationComposition
  354. }
  355. // Check for aggregation: --o
  356. if token.Value == "--" && p.checkNextValue("o") {
  357. p.advance() // --
  358. p.advance() // o
  359. return ast.RelationAggregation
  360. }
  361. // Check for association: -->
  362. if token.Value == "--" && p.checkNext(lexer.TokenCloseAngle) {
  363. p.advance() // --
  364. p.advance() // >
  365. return ast.RelationAssociation
  366. }
  367. // Check for realization: ..|>
  368. if token.Value == ".." && p.checkNext(lexer.TokenPipe) && p.checkAt(2, lexer.TokenCloseAngle) {
  369. p.advance() // ..
  370. p.advance() // |
  371. p.advance() // >
  372. return ast.RelationRealization
  373. }
  374. // Check for dependency: ..>
  375. if token.Value == ".." && p.checkNext(lexer.TokenCloseAngle) {
  376. p.advance() // ..
  377. p.advance() // >
  378. return ast.RelationDependency
  379. }
  380. return ""
  381. }
  382. // parseDirection parses direction statements
  383. func (p *ClassParser) parseDirection() error {
  384. p.advance() // consume 'direction'
  385. // Check for direction tokens or ID
  386. var direction string
  387. if p.check(lexer.TokenTD) || p.check(lexer.TokenTB) || p.check(lexer.TokenBT) ||
  388. p.check(lexer.TokenRL) || p.check(lexer.TokenLR) {
  389. direction = p.advance().Value
  390. } else if p.check(lexer.TokenID) {
  391. direction = p.advance().Value
  392. } else {
  393. return p.error("expected direction value (TD, TB, BT, RL, LR)")
  394. }
  395. p.diagram.Direction = direction
  396. return nil
  397. }
  398. // parseLink, parseClick, parseNote, parseClassDef - placeholder implementations
  399. func (p *ClassParser) parseLink() error {
  400. return p.skipToNextStatement()
  401. }
  402. func (p *ClassParser) parseClick() error {
  403. return p.skipToNextStatement()
  404. }
  405. func (p *ClassParser) parseClassDef() error {
  406. return p.skipToNextStatement()
  407. }
  408. // ensureClass ensures a class exists, creating it if needed
  409. func (p *ClassParser) ensureClass(id string) {
  410. if _, exists := p.diagram.Classes[id]; !exists {
  411. class := &ast.ClassNode{
  412. ID: id,
  413. Label: id,
  414. Type: ast.ClassTypeClass,
  415. Members: make([]*ast.ClassMember, 0),
  416. Methods: make([]*ast.ClassMethod, 0),
  417. Annotations: make([]string, 0),
  418. CssClasses: make([]string, 0),
  419. }
  420. p.diagram.Classes[id] = class
  421. }
  422. }
  423. // Helper methods
  424. func (p *ClassParser) check(tokenType lexer.TokenType) bool {
  425. if p.isAtEnd() {
  426. return false
  427. }
  428. return p.peek().Type == tokenType
  429. }
  430. func (p *ClassParser) checkNext(tokenType lexer.TokenType) bool {
  431. if p.current+1 >= len(p.tokens) {
  432. return false
  433. }
  434. return p.tokens[p.current+1].Type == tokenType
  435. }
  436. func (p *ClassParser) checkAt(offset int, tokenType lexer.TokenType) bool {
  437. if p.current+offset >= len(p.tokens) {
  438. return false
  439. }
  440. return p.tokens[p.current+offset].Type == tokenType
  441. }
  442. func (p *ClassParser) checkNextValue(value string) bool {
  443. if p.current+1 >= len(p.tokens) {
  444. return false
  445. }
  446. return p.tokens[p.current+1].Value == value
  447. }
  448. func (p *ClassParser) checkKeyword(keyword string) bool {
  449. if p.isAtEnd() {
  450. return false
  451. }
  452. token := p.peek()
  453. return token.Type == lexer.TokenID && strings.ToLower(token.Value) == strings.ToLower(keyword)
  454. }
  455. func (p *ClassParser) checkVisibility() bool {
  456. if p.isAtEnd() {
  457. return false
  458. }
  459. token := p.peek()
  460. return (token.Value == "+" || token.Value == "-" || token.Value == "#" || token.Value == "~") ||
  461. (token.Type == lexer.TokenPlus || token.Type == lexer.TokenMinus ||
  462. token.Type == lexer.TokenHash || token.Type == lexer.TokenTilde)
  463. }
  464. func (p *ClassParser) checkRelation() bool {
  465. token := p.peek()
  466. // Check for compound class diagram relationship tokens
  467. switch token.Type {
  468. case lexer.TokenClassInheritance, lexer.TokenClassComposition, lexer.TokenClassAggregation,
  469. lexer.TokenClassAssociation, lexer.TokenClassRealization, lexer.TokenClassDependency:
  470. return true
  471. }
  472. // Check for legacy relation operators
  473. return token.Value == "--" || token.Value == ".." ||
  474. p.check(lexer.TokenArrowSolid) || p.check(lexer.TokenArrowDotted) ||
  475. token.Value == "--|>" || token.Value == "--*" || token.Value == "--o"
  476. }
  477. func (p *ClassParser) advance() lexer.Token {
  478. if !p.isAtEnd() {
  479. p.current++
  480. }
  481. return p.previous()
  482. }
  483. func (p *ClassParser) isAtEnd() bool {
  484. return p.current >= len(p.tokens) || p.peek().Type == lexer.TokenEOF
  485. }
  486. func (p *ClassParser) peek() lexer.Token {
  487. if p.current >= len(p.tokens) {
  488. return lexer.Token{Type: lexer.TokenEOF}
  489. }
  490. return p.tokens[p.current]
  491. }
  492. func (p *ClassParser) previous() lexer.Token {
  493. if p.current <= 0 {
  494. return lexer.Token{Type: lexer.TokenEOF}
  495. }
  496. return p.tokens[p.current-1]
  497. }
  498. func (p *ClassParser) error(message string) error {
  499. token := p.peek()
  500. return fmt.Errorf("parse error at line %d, column %d: %s (got %s)",
  501. token.Line, token.Column, message, token.Type.String())
  502. }
  503. func (p *ClassParser) skipToNextStatement() error {
  504. for !p.isAtEnd() && !p.check(lexer.TokenNewline) {
  505. p.advance()
  506. }
  507. if p.check(lexer.TokenNewline) {
  508. p.advance()
  509. }
  510. return nil
  511. }
  512. // checkComment checks if current token sequence is a comment (%%)
  513. func (p *ClassParser) checkComment() bool {
  514. return p.check(lexer.TokenPercent) && p.checkNext(lexer.TokenPercent)
  515. }
  516. // parseComment parses comment statements
  517. func (p *ClassParser) parseComment() error {
  518. p.advance() // consume first %
  519. p.advance() // consume second %
  520. // Skip everything until newline
  521. for !p.check(lexer.TokenNewline) && !p.isAtEnd() {
  522. p.advance()
  523. }
  524. if p.check(lexer.TokenNewline) {
  525. p.advance()
  526. }
  527. return nil
  528. }
  529. // Enhanced parseNote to support class-specific notes
  530. func (p *ClassParser) parseNote() error {
  531. p.advance() // consume 'note'
  532. var note *ast.ClassNote
  533. // Check if it's "note for ClassName"
  534. if p.checkKeyword("for") {
  535. p.advance() // consume 'for'
  536. if !p.check(lexer.TokenID) {
  537. return p.error("expected class name after 'note for'")
  538. }
  539. className := p.advance().Value
  540. // Parse note text
  541. text := ""
  542. for !p.check(lexer.TokenNewline) && !p.isAtEnd() {
  543. token := p.advance()
  544. if token.Type == lexer.TokenString {
  545. // Remove quotes from string tokens
  546. val := token.Value
  547. text += val[1 : len(val)-1] // Remove surrounding quotes
  548. } else {
  549. text += token.Value + " "
  550. }
  551. }
  552. note = &ast.ClassNote{
  553. ForClass: &className,
  554. Text: strings.TrimSpace(text),
  555. }
  556. } else {
  557. // General note for the whole diagram
  558. text := ""
  559. for !p.check(lexer.TokenNewline) && !p.isAtEnd() {
  560. token := p.advance()
  561. if token.Type == lexer.TokenString {
  562. // Remove quotes from string tokens
  563. val := token.Value
  564. text += val[1 : len(val)-1] // Remove surrounding quotes
  565. } else {
  566. text += token.Value + " "
  567. }
  568. }
  569. note = &ast.ClassNote{
  570. Text: strings.TrimSpace(text),
  571. }
  572. }
  573. p.diagram.Notes = append(p.diagram.Notes, note)
  574. return nil
  575. }
  576. // parseGeneric parses generic type parameters with ~Type~
  577. func (p *ClassParser) parseGeneric() (*ast.Generic, error) {
  578. if !p.check(lexer.TokenTilde) {
  579. return nil, p.error("expected '~' for generic type")
  580. }
  581. p.advance() // consume ~
  582. if !p.check(lexer.TokenID) {
  583. return nil, p.error("expected generic type name")
  584. }
  585. typeName := p.advance().Value
  586. generic := &ast.Generic{
  587. Name: typeName,
  588. Arguments: make([]*ast.Generic, 0),
  589. }
  590. // Check for nested generics like List<String>
  591. if p.check(lexer.TokenOpenAngle) {
  592. p.advance() // consume <
  593. for !p.check(lexer.TokenCloseAngle) && !p.isAtEnd() {
  594. if p.check(lexer.TokenTilde) {
  595. nestedGeneric, err := p.parseGeneric()
  596. if err != nil {
  597. return nil, err
  598. }
  599. generic.Arguments = append(generic.Arguments, nestedGeneric)
  600. } else if p.check(lexer.TokenID) {
  601. // Simple type argument
  602. argType := p.advance().Value
  603. generic.Arguments = append(generic.Arguments, &ast.Generic{
  604. Name: argType,
  605. })
  606. }
  607. if p.check(lexer.TokenComma) {
  608. p.advance() // consume comma
  609. }
  610. }
  611. if !p.check(lexer.TokenCloseAngle) {
  612. return nil, p.error("expected '>' to close generic")
  613. }
  614. p.advance() // consume >
  615. }
  616. if !p.check(lexer.TokenTilde) {
  617. return nil, p.error("expected closing '~' for generic type")
  618. }
  619. p.advance() // consume closing ~
  620. return generic, nil
  621. }