index.js 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641
  1. /*
  2. * md ast - pluggable markdown parser
  3. */
  4. const syntax = {
  5. a:{
  6. paired: true,
  7. recursive: false,
  8. startRegexp: /\[(.*)\]\(/,
  9. endRegexp: /\)/,
  10. content: {
  11. start: {
  12. point: 'end',
  13. offset: 0
  14. },
  15. end: {
  16. point: 'start',
  17. offset: -1
  18. }
  19. },
  20. begin: 0,
  21. forward: {
  22. point: 'end', //start, startEnd, end, endEnd
  23. offset: 1
  24. },
  25. title: {
  26. //index: 1,
  27. recursive: true,
  28. },
  29. onbuild(md, mdTags, buildAST){ //this = {tag: }
  30. }
  31. },
  32. strike: {
  33. paired: true,
  34. recursive: true,
  35. startRegexp: /\~\~\S.*/,
  36. endRegexp: /\~\~\W/,
  37. content: {
  38. start: {
  39. point: 'start',
  40. offset: 2
  41. },
  42. end: {
  43. point: 'start',
  44. offset: 0
  45. }
  46. },
  47. begin: 0,
  48. forward: {
  49. point: 'endEnd', //start, startEnd, end, endEnd
  50. offset: -1
  51. }
  52. },
  53. bold1: {
  54. paired: true,
  55. recursive: true,
  56. startRegexp: /\*\*\S.*/,
  57. endRegexp: /\*\*\W/,
  58. content: {
  59. start: {
  60. point: 'start',
  61. offset: 2
  62. },
  63. end: {
  64. point: 'start',
  65. offset: 0
  66. }
  67. },
  68. begin: 0,
  69. forward: {
  70. point: 'endEnd', //start, startEnd, end, endEnd
  71. offset: -1
  72. }
  73. },
  74. bold2: {
  75. paired: true,
  76. recursive: true,
  77. startRegexp: /\s__\S.*/,
  78. endRegexp: /__\W/,
  79. content: {
  80. start: {
  81. point: 'start',
  82. offset: 3
  83. },
  84. end: {
  85. point: 'start',
  86. offset: 0
  87. }
  88. },
  89. begin: 1,
  90. forward: {
  91. point: 'endEnd', //start, startEnd, end, endEnd
  92. offset: -1
  93. }
  94. },
  95. italic1: {
  96. paired: true,
  97. recursive: true,
  98. startRegexp: /\*\S.*/,
  99. endRegexp: /\S\*[^*]/,
  100. content: {
  101. start: {
  102. point: 'start',
  103. offset: 1
  104. },
  105. end: {
  106. point: 'start',
  107. offset: 1
  108. }
  109. },
  110. begin: 0,
  111. forward: {
  112. point: 'endEnd', //start, startEnd, end, endEnd
  113. offset: -1
  114. }
  115. },
  116. italic2: {
  117. paired: true,
  118. recursive: true,
  119. startRegexp: /\s_\S.*/,
  120. endRegexp: /\S_\W/,
  121. content: {
  122. start: {
  123. point: 'start',
  124. offset: 2
  125. },
  126. end: {
  127. point: 'start',
  128. offset: 1
  129. }
  130. },
  131. begin: 1,
  132. forward: {
  133. point: 'endEnd', //start, startEnd, end, endEnd
  134. offset: -1
  135. }
  136. },
  137. root: {
  138. paired: true,
  139. recursive: true,
  140. startRegexp: /^/,
  141. endRegexp: /$/,
  142. content: {
  143. start: {
  144. point: 'start',
  145. offset: 1
  146. },
  147. end: {
  148. point: 'end',
  149. offset: 0
  150. }
  151. },
  152. begin: 0,
  153. forward: {
  154. point: 'endEnd', //start, startEnd, end, endEnd
  155. offset: -1
  156. }
  157. },
  158. heading6: {
  159. paired: true,
  160. recursive: true,
  161. startRegexp: /\n######[ \t]*(.*)\n/,
  162. endRegexp: /\n#\s/,
  163. content: {
  164. start: {
  165. point: 'end',
  166. offset: -1
  167. },
  168. end: {
  169. point: 'start',
  170. offset: 0
  171. }
  172. },
  173. begin: 0,
  174. forward: {
  175. point: 'end', //start, startEnd, end, endEnd
  176. offset: 0
  177. },
  178. title: {
  179. //index: 1,
  180. recursive: true,
  181. },
  182. onbuild(md, mdTags, buildAST){ //this = {tag: }
  183. }
  184. },
  185. heading5: {
  186. paired: true,
  187. recursive: true,
  188. startRegexp: /\n#####[ \t]*(.*)\n/,
  189. endRegexp: /\n#{1,5}\s/,
  190. content: {
  191. start: {
  192. point: 'end',
  193. offset: -1
  194. },
  195. end: {
  196. point: 'start',
  197. offset: 0
  198. }
  199. },
  200. begin: 0,
  201. forward: {
  202. point: 'end', //start, startEnd, end, endEnd
  203. offset: 0
  204. },
  205. title: {
  206. //index: 1,
  207. recursive: true,
  208. },
  209. onbuild(md, mdTags, buildAST){ //this = {tag: }
  210. }
  211. },
  212. heading4: {
  213. paired: true,
  214. recursive: true,
  215. startRegexp: /\n####[ \t]*(.*)\n/,
  216. endRegexp: /\n#{1,4}\s/,
  217. content: {
  218. start: {
  219. point: 'end',
  220. offset: -1
  221. },
  222. end: {
  223. point: 'start',
  224. offset: 0
  225. }
  226. },
  227. begin: 0,
  228. forward: {
  229. point: 'end', //start, startEnd, end, endEnd
  230. offset: 0
  231. },
  232. title: {
  233. //index: 1,
  234. recursive: true,
  235. },
  236. onbuild(md, mdTags, buildAST){ //this = {tag: }
  237. }
  238. },
  239. heading3: {
  240. paired: true,
  241. recursive: true,
  242. startRegexp: /\n###[ \t]*(.*)\n/,
  243. endRegexp: /\n#{1,3}\s/,
  244. content: {
  245. start: {
  246. point: 'end',
  247. offset: -1
  248. },
  249. end: {
  250. point: 'start',
  251. offset: 0
  252. }
  253. },
  254. begin: 0,
  255. forward: {
  256. point: 'end', //start, startEnd, end, endEnd
  257. offset: 0
  258. },
  259. title: {
  260. //index: 1,
  261. recursive: true,
  262. },
  263. onbuild(md, mdTags, buildAST){ //this = {tag: }
  264. }
  265. },
  266. heading2: {
  267. paired: true,
  268. recursive: true,
  269. startRegexp: /\n##[ \t]*(.*)\n/,
  270. endRegexp: /\n#{1,2}\s/,
  271. content: {
  272. start: {
  273. point: 'end',
  274. offset: -1
  275. },
  276. end: {
  277. point: 'start',
  278. offset: 0
  279. }
  280. },
  281. begin: 0,
  282. forward: {
  283. point: 'end', //start, startEnd, end, endEnd
  284. offset: 0
  285. },
  286. title: {
  287. //index: 1,
  288. recursive: true,
  289. },
  290. onbuild(md, mdTags, buildAST){ //this = {tag: }
  291. }
  292. },
  293. heading1: {
  294. paired: true,
  295. recursive: true,
  296. startRegexp: /\n#[ \t]*(.*)\n/,
  297. endRegexp: /\n#\s/,
  298. content: {
  299. start: {
  300. point: 'end',
  301. offset: -1
  302. },
  303. end: {
  304. point: 'start',
  305. offset: 0
  306. }
  307. },
  308. begin: -1,
  309. forward: {
  310. point: 'end', //start, startEnd, end, endEnd
  311. offset: 0
  312. },
  313. title: {
  314. //index: 1,
  315. recursive: true,
  316. },
  317. onbuild(md, mdTags, buildAST){ //this = {tag: }
  318. }
  319. },
  320. code: {
  321. paired: true,
  322. recursive: false,
  323. startRegexp: /`/,
  324. endRegexp: /`/,
  325. content: {
  326. start: {
  327. point: 'start',
  328. offset: 1
  329. },
  330. end: {
  331. point: 'start',
  332. offset: 0
  333. }
  334. },
  335. begin: 0,
  336. forward: {
  337. point: 'end', //start, startEnd, end, endEnd
  338. offset: 1
  339. }
  340. },
  341. codeMultiLine: {
  342. paired: true,
  343. recursive: false,
  344. startRegexp: /\n```\s*\n/,
  345. endRegexp: /\n```\s*\n/,
  346. content:{
  347. start:{
  348. point: 'end',
  349. offset: 0
  350. },
  351. end:{
  352. point: 'start',
  353. offset: 0
  354. }
  355. },
  356. begin: 1,
  357. forward: {
  358. point: 'endEnd',
  359. offset: 0
  360. },
  361. },
  362. codeLanguage: {
  363. paired: true,
  364. recursive: false,
  365. startRegexp: /\n```(\w+)\s*\n/,
  366. endRegexp: /\n```\s*\n/,
  367. title: {
  368. recursive: false
  369. },
  370. content:{
  371. start:{
  372. point: 'end',
  373. offset: 0
  374. },
  375. end:{
  376. point: 'start',
  377. offset: 0
  378. }
  379. },
  380. begin: 1,
  381. forward: {
  382. point: 'endEnd',
  383. offset: 0
  384. },
  385. },
  386. unOrderedList: {
  387. indent: true,
  388. childName: 'unOrderedListItem',
  389. //paired: true,
  390. recursive: true,
  391. regexp: /-\s*\S/,
  392. content:{
  393. start:{
  394. point: 'end',
  395. offset: -1
  396. },
  397. end:{
  398. point: 'start',
  399. offset: 0
  400. }
  401. },
  402. begin: 1,
  403. forward: {
  404. point: 'end',
  405. offset: 0
  406. }
  407. },
  408. orderedList: {
  409. indent: true,
  410. childName: 'orderedListItem',
  411. //paired: true,
  412. recursive: true,
  413. regexp: /\d+\.\s*\S/,
  414. content:{
  415. start:{
  416. point: 'end',
  417. offset: -1
  418. },
  419. end:{
  420. point: 'start',
  421. offset: 0
  422. }
  423. },
  424. begin: 1,
  425. forward: {
  426. point: 'end',
  427. offset: 0
  428. }
  429. }
  430. }
  431. const indentRegexp = (regexp,count) => new RegExp(`\\n([ \\t]${count === undefined ? '*' : `{${count}}` })` + regexp.toString().slice(1,-1))
  432. const indentEndRegexp = (count) => new RegExp(`\\n([ \\t]${count === undefined ? '*' : `{0,${count}}` })\\S`)
  433. function findNearest(md, mdTags, offset=0){
  434. let nearest, nearestMatch = {index: Infinity};
  435. for (let [mdTag, {paired,
  436. startRegexp,
  437. regexp, indent}] of Object.entries(mdTags)) {
  438. if (mdTag === 'root') continue;
  439. regexp = startRegexp || regexp
  440. regexp = indent ? indentRegexp(regexp) : regexp
  441. let match = md.offsetMatch(offset, regexp)
  442. if (match && match.index < nearestMatch.index){
  443. nearestMatch = match
  444. nearest = mdTag
  445. }
  446. }
  447. return [nearest, nearestMatch]
  448. }
  449. //node:
  450. //{
  451. // tag: 'keyFromSyntax',
  452. // children: [String, Node]
  453. // parent: node
  454. //}
  455. //
  456. String.prototype.offsetMatch = function(offset, ...params){
  457. return this.slice(offset).match(...params)
  458. }
  459. Array.prototype.last = function(amount=-1){
  460. return this[this.length +amount]
  461. }
  462. String.prototype.cutIndent = function(indent){
  463. let lines = this.split('\n').map(line => line.slice(0, indent).match(/^\s*$/) ? line.slice(indent) : line)
  464. return lines.join('\n')
  465. }
  466. function buildAST(md, mdTags=syntax, offset=0, tree={tag: 'root'}, stack=[]){
  467. let currentNode = stack.last() || tree
  468. if (currentNode.tag === 'root') md = '\n' + md + '\n'
  469. currentNode.children = currentNode.children || []
  470. const { children } = currentNode
  471. let {indent, childName, title, recursive, regexp, endRegexp, content: {end: {offset: offsetEnd, point} }, forward } = mdTags[currentNode.tag]
  472. if (indent){
  473. if (currentNode.parent.tag !== currentNode.tag){ //li
  474. let { parent: {children: siblings} } = currentNode
  475. if (siblings.length > 1 && siblings.last(-2).tag === currentNode.tag){
  476. siblings.pop()
  477. currentNode = siblings.last()
  478. }
  479. const { children } = currentNode
  480. const indentLength = currentNode.startMatch[1].length
  481. console.log(indentLength)
  482. currentNode.indentLength = indentLength
  483. endRegexp = indentEndRegexp(indentLength)
  484. let endMatch = md.offsetMatch(offset, endRegexp) || {index: md.length +1, 0: 'zzz'}
  485. let listMD = md.slice(offset, endMatch.index + offset).cutIndent(currentNode.startMatch[0].length -2)
  486. debugger;
  487. const newNode = {tag: childName, startOffset: offset, parent: currentNode, startMatch: currentNode.startMatch}
  488. children.push(newNode)
  489. newNode.children = buildAST(listMD, mdTags).children
  490. newNode.children.forEach(item => item.parent = currentNode)
  491. offset = newNode.endOffset = currentNode.endOffset = endMatch.index + offset
  492. }
  493. }
  494. if (title){
  495. const {index=1, recursive} = title
  496. const {[index]: titleContent } = currentNode.startMatch
  497. if (titleContent && recursive){
  498. currentNode.title = buildAST(titleContent, mdTags).children
  499. currentNode.title.forEach(item => item.parent = currentNode)
  500. }
  501. else {
  502. currentNode.title = [titleContent]
  503. }
  504. }
  505. while(offset < md.length){
  506. const [nearest, nearestMatch] = findNearest(md, mdTags, offset)
  507. let endMatch = md.offsetMatch(offset, endRegexp)
  508. if (!recursive || endMatch) { //if we (should) find closing tag
  509. if (!recursive || !nearest || endMatch.index <= nearestMatch.index ){ //if closing tag closer than new nested tag
  510. endMatch = endMatch || {index: md.length - offset, 0: "zzz"}
  511. currentNode.endContent = offset + endMatch.index + offsetEnd + (point === 'end' ? endMatch[0].length : 0)
  512. offset !== currentNode.endContent && children.push(md.slice(offset, currentNode.endContent))
  513. offset += endMatch.index + forward.offset + (forward.point === 'endEnd' ? endMatch[0].length : 0)
  514. currentNode.endOffset = offset
  515. currentNode.endMatch = endMatch
  516. return currentNode
  517. }
  518. }
  519. if (nearest){ //new nested tag
  520. const {begin,content: {start}} = mdTags[nearest]
  521. if (nearestMatch.index){ //if just text before nested tag
  522. nearestMatch.index + begin > 0 && children.push(md.slice(offset, offset + nearestMatch.index + begin))
  523. offset += nearestMatch.index
  524. }
  525. else { //if new tag right under cursor (offset)
  526. let newNode = {tag: nearest, startOffset: offset, parent: currentNode, startMatch: nearestMatch}
  527. children.push(newNode)
  528. newNode = buildAST(md, mdTags, offset + start.offset + (start.point === 'end' ? nearestMatch[0].length : 0), tree, [...stack, newNode])
  529. offset = newNode.endOffset
  530. }
  531. }
  532. else { //no nearest - rest of line to children as text
  533. children.push(md.slice(offset))
  534. offset = md.length
  535. }
  536. }
  537. return currentNode
  538. }
  539. const Heading = ({react:React, children, title, node: {tag}}) => {
  540. const level = +tag.slice(-1)
  541. const _ = React.createElement.bind(React)
  542. if (isNaN(level)) throw new SyntaxError('wrong heading name')
  543. return _(React.Fragment, null,
  544. _(`h${level}`, null, ...title),
  545. _(`div`, null, ...children)
  546. )
  547. }
  548. const A = ({react:React, children, title}) =>{
  549. const _ = React.createElement.bind(React)
  550. return _("a", {children: title, href: children})
  551. }
  552. const defaultMapMDToComponents = {
  553. heading1: Heading,
  554. heading2: Heading,
  555. heading3: Heading,
  556. heading4: Heading,
  557. heading5: Heading,
  558. heading6: Heading,
  559. strike: "strike",
  560. bold1: "strong",
  561. bold2: "strong",
  562. a: A,
  563. italic1: "i",
  564. italic2: "i",
  565. unOrderedList: 'ul',
  566. orderedList: 'ol',
  567. unOrderedListItem: 'li',
  568. orderedListItem: 'li',
  569. code: 'code',
  570. codeMultiLine: 'pre',
  571. codeLanguage: 'pre',
  572. root: ""
  573. }
  574. function toReact(ast, React, mapMDToComponents=defaultMapMDToComponents){
  575. const gC = (tag, c) => (c = mapMDToComponents[tag]) ? c : (c === "" ? React.Fragment : "span")
  576. const RenderComponent = gC(ast.tag)
  577. const _ = React.createElement.bind(React)
  578. const childToReact = child => typeof child === 'string' ? child :
  579. toReact(child, React, mapMDToComponents)
  580. return _(RenderComponent, {node: ast,
  581. key: Math.random(),
  582. children: ast.children.map(childToReact),
  583. title: ast.title && ast.title.map(childToReact),
  584. react: React})
  585. }
  586. window.module && (module.exports = {
  587. buildAST,
  588. toReact
  589. })
  590. console.log(Object.keys(syntax))
  591. //const md =
  592. //`
  593. //# heading1
  594. //какой-то _текст_
  595. //# heading2
  596. //а тут **шо** цикавого?)))
  597. //`;
  598. //console.log( buildAST(md).children)