class.go 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487
  1. // Package parser provides class diagram parsing based on classDiagram.jison
  2. package parser
  3. import (
  4. "fmt"
  5. "strings"
  6. "mermaid-go/pkg/ast"
  7. "mermaid-go/pkg/lexer"
  8. )
  9. // ClassParser implements class diagram parsing following classDiagram.jison
  10. type ClassParser struct {
  11. tokens []lexer.Token
  12. current int
  13. diagram *ast.ClassDiagram
  14. }
  15. // NewClassParser creates a new class parser
  16. func NewClassParser() *ClassParser {
  17. return &ClassParser{
  18. diagram: ast.NewClassDiagram(),
  19. }
  20. }
  21. // Parse parses class diagram syntax
  22. func (p *ClassParser) Parse(input string) (*ast.ClassDiagram, error) {
  23. // Tokenize
  24. l := lexer.NewLexer(input)
  25. tokens, err := l.Tokenize()
  26. if err != nil {
  27. return nil, fmt.Errorf("lexical analysis failed: %w", err)
  28. }
  29. // Filter tokens
  30. p.tokens = lexer.FilterTokens(tokens)
  31. p.current = 0
  32. p.diagram = ast.NewClassDiagram()
  33. // Parse document
  34. err = p.parseDocument()
  35. if err != nil {
  36. return nil, fmt.Errorf("syntax analysis failed: %w", err)
  37. }
  38. return p.diagram, nil
  39. }
  40. // parseDocument parses the class diagram document
  41. func (p *ClassParser) parseDocument() error {
  42. // Expect classDiagram
  43. if !p.check(lexer.TokenID) || p.peek().Value != "classDiagram" {
  44. return p.error("expected 'classDiagram'")
  45. }
  46. p.advance()
  47. // Parse statements
  48. for !p.isAtEnd() {
  49. if err := p.parseStatement(); err != nil {
  50. return err
  51. }
  52. }
  53. return nil
  54. }
  55. // parseStatement parses individual class diagram statements
  56. func (p *ClassParser) parseStatement() error {
  57. if p.isAtEnd() {
  58. return nil
  59. }
  60. switch {
  61. case p.check(lexer.TokenNewline):
  62. p.advance() // Skip newlines
  63. return nil
  64. case p.check(lexer.TokenClass) || p.checkKeyword("class"):
  65. return p.parseClass()
  66. case p.checkKeyword("direction"):
  67. return p.parseDirection()
  68. case p.checkKeyword("link"):
  69. return p.parseLink()
  70. case p.checkKeyword("click"):
  71. return p.parseClick()
  72. case p.checkKeyword("note"):
  73. return p.parseNote()
  74. case p.checkKeyword("classDef"):
  75. return p.parseClassDef()
  76. case p.check(lexer.TokenID):
  77. // Try to parse as class definition or relation
  78. return p.parseClassOrRelation()
  79. default:
  80. token := p.peek()
  81. return p.error(fmt.Sprintf("unexpected token: %s", token.Value))
  82. }
  83. }
  84. // parseClass parses class statements
  85. func (p *ClassParser) parseClass() error {
  86. // Consume 'class' token
  87. if p.check(lexer.TokenClass) {
  88. p.advance() // consume TokenClass
  89. } else {
  90. p.advance() // consume 'class' keyword
  91. }
  92. if !p.check(lexer.TokenID) {
  93. return p.error("expected class name")
  94. }
  95. className := p.advance().Value
  96. class := &ast.ClassNode{
  97. ID: className,
  98. Label: className,
  99. Type: ast.ClassTypeClass,
  100. Members: make([]*ast.ClassMember, 0),
  101. Methods: make([]*ast.ClassMethod, 0),
  102. Annotations: make([]string, 0),
  103. CssClasses: make([]string, 0),
  104. }
  105. // Check for class body
  106. if p.check(lexer.TokenOpenBrace) {
  107. p.advance() // consume '{'
  108. err := p.parseClassBody(class)
  109. if err != nil {
  110. return err
  111. }
  112. if !p.check(lexer.TokenCloseBrace) {
  113. return p.error("expected '}'")
  114. }
  115. p.advance() // consume '}'
  116. }
  117. p.diagram.Classes[className] = class
  118. return nil
  119. }
  120. // parseClassBody parses the contents of a class body
  121. func (p *ClassParser) parseClassBody(class *ast.ClassNode) error {
  122. for !p.check(lexer.TokenCloseBrace) && !p.isAtEnd() {
  123. if p.check(lexer.TokenNewline) {
  124. p.advance()
  125. continue
  126. }
  127. // Parse member or method
  128. visibility := ast.VisibilityPublic // default
  129. if p.checkVisibility() {
  130. switch p.peek().Value {
  131. case "+":
  132. visibility = ast.VisibilityPublic
  133. case "-":
  134. visibility = ast.VisibilityPrivate
  135. case "#":
  136. visibility = ast.VisibilityProtected
  137. case "~":
  138. visibility = ast.VisibilityPackage
  139. }
  140. p.advance()
  141. }
  142. if !p.check(lexer.TokenID) {
  143. return p.error("expected member or method name")
  144. }
  145. name := p.advance().Value
  146. var memberType string
  147. // Check for type annotation
  148. if p.check(lexer.TokenColon) {
  149. p.advance() // consume ':'
  150. if p.check(lexer.TokenID) {
  151. memberType = p.advance().Value
  152. }
  153. }
  154. // Check if it's a method (has parentheses)
  155. if p.check(lexer.TokenOpenParen) {
  156. p.advance() // consume '('
  157. method := &ast.ClassMethod{
  158. Name: name,
  159. Type: memberType,
  160. Parameters: make([]string, 0),
  161. Visibility: visibility,
  162. }
  163. // Parse parameters
  164. for !p.check(lexer.TokenCloseParen) && !p.isAtEnd() {
  165. if p.check(lexer.TokenID) {
  166. param := p.advance().Value
  167. method.Parameters = append(method.Parameters, param)
  168. }
  169. if p.check(lexer.TokenComma) {
  170. p.advance()
  171. }
  172. }
  173. if !p.check(lexer.TokenCloseParen) {
  174. return p.error("expected ')'")
  175. }
  176. p.advance() // consume ')'
  177. class.Methods = append(class.Methods, method)
  178. } else {
  179. // It's a member
  180. member := &ast.ClassMember{
  181. Name: name,
  182. Type: memberType,
  183. Visibility: visibility,
  184. }
  185. class.Members = append(class.Members, member)
  186. }
  187. }
  188. return nil
  189. }
  190. // parseClassOrRelation parses either a class definition or relationship
  191. func (p *ClassParser) parseClassOrRelation() error {
  192. className := p.advance().Value
  193. // Ensure class exists
  194. p.ensureClass(className)
  195. // Check for relationship operators
  196. if p.checkRelation() {
  197. return p.parseRelation(className)
  198. }
  199. // Check for class body
  200. if p.check(lexer.TokenOpenBrace) {
  201. class := p.diagram.Classes[className]
  202. p.advance() // consume '{'
  203. err := p.parseClassBody(class)
  204. if err != nil {
  205. return err
  206. }
  207. if !p.check(lexer.TokenCloseBrace) {
  208. return p.error("expected '}'")
  209. }
  210. p.advance() // consume '}'
  211. }
  212. return nil
  213. }
  214. // parseRelation parses class relationships
  215. func (p *ClassParser) parseRelation(fromClass string) error {
  216. relationType := p.parseRelationType()
  217. if relationType == "" {
  218. return p.error("expected relationship operator")
  219. }
  220. if !p.check(lexer.TokenID) {
  221. return p.error("expected target class")
  222. }
  223. toClass := p.advance().Value
  224. // Ensure target class exists
  225. p.ensureClass(toClass)
  226. relation := &ast.ClassRelation{
  227. From: fromClass,
  228. To: toClass,
  229. Type: relationType,
  230. }
  231. // Check for label
  232. if p.check(lexer.TokenColon) {
  233. p.advance() // consume ':'
  234. var labelParts []string
  235. for !p.check(lexer.TokenNewline) && !p.isAtEnd() {
  236. labelParts = append(labelParts, p.advance().Value)
  237. }
  238. if len(labelParts) > 0 {
  239. label := strings.TrimSpace(strings.Join(labelParts, " "))
  240. relation.Label = &label
  241. }
  242. }
  243. p.diagram.Relations = append(p.diagram.Relations, relation)
  244. return nil
  245. }
  246. // parseRelationType parses relationship type tokens
  247. func (p *ClassParser) parseRelationType() ast.ClassRelationType {
  248. token := p.peek()
  249. // Check for direct arrow tokens
  250. if p.check(lexer.TokenArrowSolid) {
  251. p.advance() // consume -->
  252. return ast.RelationAssociation
  253. }
  254. if p.check(lexer.TokenArrowDotted) {
  255. p.advance() // consume -.->
  256. return ast.RelationDependency
  257. }
  258. // Check for inheritance: --|>
  259. if token.Value == "--" && p.checkNext(lexer.TokenPipe) && p.checkAt(2, lexer.TokenCloseAngle) {
  260. p.advance() // --
  261. p.advance() // |
  262. p.advance() // >
  263. return ast.RelationInheritance
  264. }
  265. // Check for composition: --*
  266. if token.Value == "--" && p.checkNextValue("*") {
  267. p.advance() // --
  268. p.advance() // *
  269. return ast.RelationComposition
  270. }
  271. // Check for aggregation: --o
  272. if token.Value == "--" && p.checkNextValue("o") {
  273. p.advance() // --
  274. p.advance() // o
  275. return ast.RelationAggregation
  276. }
  277. // Check for association: -->
  278. if token.Value == "--" && p.checkNext(lexer.TokenCloseAngle) {
  279. p.advance() // --
  280. p.advance() // >
  281. return ast.RelationAssociation
  282. }
  283. // Check for realization: ..|>
  284. if token.Value == ".." && p.checkNext(lexer.TokenPipe) && p.checkAt(2, lexer.TokenCloseAngle) {
  285. p.advance() // ..
  286. p.advance() // |
  287. p.advance() // >
  288. return ast.RelationRealization
  289. }
  290. // Check for dependency: ..>
  291. if token.Value == ".." && p.checkNext(lexer.TokenCloseAngle) {
  292. p.advance() // ..
  293. p.advance() // >
  294. return ast.RelationDependency
  295. }
  296. return ""
  297. }
  298. // parseDirection parses direction statements
  299. func (p *ClassParser) parseDirection() error {
  300. p.advance() // consume 'direction'
  301. if !p.check(lexer.TokenID) {
  302. return p.error("expected direction value")
  303. }
  304. direction := p.advance().Value
  305. p.diagram.Direction = direction
  306. return nil
  307. }
  308. // parseLink, parseClick, parseNote, parseClassDef - placeholder implementations
  309. func (p *ClassParser) parseLink() error {
  310. return p.skipToNextStatement()
  311. }
  312. func (p *ClassParser) parseClick() error {
  313. return p.skipToNextStatement()
  314. }
  315. func (p *ClassParser) parseNote() error {
  316. return p.skipToNextStatement()
  317. }
  318. func (p *ClassParser) parseClassDef() error {
  319. return p.skipToNextStatement()
  320. }
  321. // ensureClass ensures a class exists, creating it if needed
  322. func (p *ClassParser) ensureClass(id string) {
  323. if _, exists := p.diagram.Classes[id]; !exists {
  324. class := &ast.ClassNode{
  325. ID: id,
  326. Label: id,
  327. Type: ast.ClassTypeClass,
  328. Members: make([]*ast.ClassMember, 0),
  329. Methods: make([]*ast.ClassMethod, 0),
  330. Annotations: make([]string, 0),
  331. CssClasses: make([]string, 0),
  332. }
  333. p.diagram.Classes[id] = class
  334. }
  335. }
  336. // Helper methods
  337. func (p *ClassParser) check(tokenType lexer.TokenType) bool {
  338. if p.isAtEnd() {
  339. return false
  340. }
  341. return p.peek().Type == tokenType
  342. }
  343. func (p *ClassParser) checkNext(tokenType lexer.TokenType) bool {
  344. if p.current+1 >= len(p.tokens) {
  345. return false
  346. }
  347. return p.tokens[p.current+1].Type == tokenType
  348. }
  349. func (p *ClassParser) checkAt(offset int, tokenType lexer.TokenType) bool {
  350. if p.current+offset >= len(p.tokens) {
  351. return false
  352. }
  353. return p.tokens[p.current+offset].Type == tokenType
  354. }
  355. func (p *ClassParser) checkNextValue(value string) bool {
  356. if p.current+1 >= len(p.tokens) {
  357. return false
  358. }
  359. return p.tokens[p.current+1].Value == value
  360. }
  361. func (p *ClassParser) checkKeyword(keyword string) bool {
  362. if p.isAtEnd() {
  363. return false
  364. }
  365. token := p.peek()
  366. return token.Type == lexer.TokenID && strings.ToLower(token.Value) == strings.ToLower(keyword)
  367. }
  368. func (p *ClassParser) checkVisibility() bool {
  369. if p.isAtEnd() {
  370. return false
  371. }
  372. token := p.peek()
  373. return token.Value == "+" || token.Value == "-" || token.Value == "#" || token.Value == "~"
  374. }
  375. func (p *ClassParser) checkRelation() bool {
  376. token := p.peek()
  377. // Check for various relation operators
  378. return token.Value == "--" || token.Value == ".." ||
  379. p.check(lexer.TokenArrowSolid) || p.check(lexer.TokenArrowDotted) ||
  380. token.Value == "--|>" || token.Value == "--*" || token.Value == "--o"
  381. }
  382. func (p *ClassParser) advance() lexer.Token {
  383. if !p.isAtEnd() {
  384. p.current++
  385. }
  386. return p.previous()
  387. }
  388. func (p *ClassParser) isAtEnd() bool {
  389. return p.current >= len(p.tokens) || p.peek().Type == lexer.TokenEOF
  390. }
  391. func (p *ClassParser) peek() lexer.Token {
  392. if p.current >= len(p.tokens) {
  393. return lexer.Token{Type: lexer.TokenEOF}
  394. }
  395. return p.tokens[p.current]
  396. }
  397. func (p *ClassParser) previous() lexer.Token {
  398. if p.current <= 0 {
  399. return lexer.Token{Type: lexer.TokenEOF}
  400. }
  401. return p.tokens[p.current-1]
  402. }
  403. func (p *ClassParser) error(message string) error {
  404. token := p.peek()
  405. return fmt.Errorf("parse error at line %d, column %d: %s (got %s)",
  406. token.Line, token.Column, message, token.Type)
  407. }
  408. func (p *ClassParser) skipToNextStatement() error {
  409. for !p.isAtEnd() && !p.check(lexer.TokenNewline) {
  410. p.advance()
  411. }
  412. if p.check(lexer.TokenNewline) {
  413. p.advance()
  414. }
  415. return nil
  416. }