index.js 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215
  1. /*
  2. * md ast - pluggable markdown parser
  3. */
  4. const syntax = {
  5. bold: {
  6. paired: true,
  7. recursive: true,
  8. startRegexp: /\*\*\S.*/,
  9. endRegexp: /\S\*\*\W/,
  10. content: {
  11. start: {
  12. point: 'start',
  13. offset: 2
  14. },
  15. end: {
  16. point: 'end',
  17. offset: 1
  18. }
  19. },
  20. begin: 0,
  21. forward: {
  22. point: 'endEnd', //start, startEnd, end, endEnd
  23. offset: -1
  24. }
  25. },
  26. bold2: {
  27. paired: true,
  28. recursive: true,
  29. startRegexp: /\s__\S.*/,
  30. endRegexp: /\S__\s/,
  31. content: {
  32. start: {
  33. point: 'start',
  34. offset: 3
  35. },
  36. end: {
  37. point: 'end',
  38. offset: 1
  39. }
  40. },
  41. begin: 1,
  42. forward: {
  43. point: 'endEnd', //start, startEnd, end, endEnd
  44. offset: -1
  45. }
  46. },
  47. italic: {
  48. paired: true,
  49. recursive: true,
  50. startRegexp: /\*\S.*/,
  51. endRegexp: /\S\*\s/,
  52. content: {
  53. start: {
  54. point: 'start',
  55. offset: 2
  56. },
  57. end: {
  58. point: 'end',
  59. offset: 1
  60. }
  61. },
  62. begin: 0,
  63. forward: {
  64. point: 'endEnd', //start, startEnd, end, endEnd
  65. offset: -1
  66. }
  67. },
  68. italic2: {
  69. paired: true,
  70. recursive: true,
  71. startRegexp: /\s_\S.*/,
  72. endRegexp: /\S_\s/,
  73. content: {
  74. start: {
  75. point: 'start',
  76. offset: 2
  77. },
  78. end: {
  79. point: 'end',
  80. offset: 1
  81. }
  82. },
  83. begin: 1,
  84. forward: {
  85. point: 'endEnd', //start, startEnd, end, endEnd
  86. offset: -1
  87. }
  88. },
  89. root: {
  90. paired: true,
  91. recursive: true,
  92. startRegexp: /^/,
  93. endRegexp: /$/,
  94. content: {
  95. start: {
  96. point: 'start',
  97. offset: 1
  98. },
  99. end: {
  100. point: 'end',
  101. offset: 0
  102. }
  103. },
  104. begin: 0,
  105. forward: {
  106. point: 'endEnd', //start, startEnd, end, endEnd
  107. offset: -1
  108. }
  109. },
  110. heading1: {
  111. paired: true,
  112. recursive: true,
  113. startRegexp: /\n#[ \t]*(.*)\n/,
  114. endRegexp: /\n#/,
  115. content: {
  116. start: {
  117. point: 'end',
  118. offset: 1
  119. },
  120. end: {
  121. point: 'start',
  122. offset: 0
  123. }
  124. },
  125. begin: 1,
  126. forward: {
  127. point: 'endEnd', //start, startEnd, end, endEnd
  128. offset: -1
  129. }
  130. }
  131. }
  132. function findNearest(md, mdTags, offset=0){
  133. let nearest, nearestMatch = {index: Infinity};
  134. for (let [mdTag, {paired,
  135. startRegexp,
  136. rexexp}] of Object.entries(mdTags)) {
  137. if (mdTag === 'root') continue;
  138. let match = md.offsetMatch(offset, startRegexp || regexp)
  139. if (match && match.index < nearestMatch.index){
  140. nearestMatch = match
  141. nearest = mdTag
  142. }
  143. }
  144. return [nearest, nearestMatch]
  145. }
  146. function cutNode(md, match, tagName, {paired, recursive, startRegexp, endRegexp, content: {start, end}, begin, forward}){
  147. //if (paired){
  148. //md.match()
  149. //}
  150. }
  151. //node:
  152. //{
  153. // tag: 'keyFromSyntax',
  154. // children: [String, Node]
  155. // parent: node
  156. //}
  157. //
  158. String.prototype.offsetMatch = function(offset, ...params){
  159. return this.slice(offset).match(...params)
  160. }
  161. Array.prototype.last = function(){
  162. return this[this.length -1]
  163. }
  164. function buildAST(md, mdTags=syntax, offset=0, tree={tag: 'root'}, stack=[]){
  165. const currentNode = stack.last() || tree
  166. currentNode.children = currentNode.children || []
  167. const { children } = currentNode
  168. const { endRegexp, content: {end: {offset: offsetEnd} }, forward } = mdTags[currentNode.tag]
  169. while(offset < md.length){
  170. const [nearest, nearestMatch] = findNearest(md, mdTags, offset)
  171. const endMatch = md.offsetMatch(offset, endRegexp)
  172. if (endMatch) {
  173. if (!nearest || endMatch.index <= nearestMatch.index){
  174. currentNode.endContent = offset + endMatch.index + offsetEnd
  175. children.push(md.slice(offset, currentNode.endContent))
  176. offset += endMatch.index + endMatch[0].length + forward.offset
  177. currentNode.endOffset = offset
  178. return currentNode
  179. }
  180. }
  181. if (nearest){
  182. const {begin,content: {start}} = mdTags[nearest]
  183. if (nearestMatch.index){
  184. children.push(md.slice(offset, offset + nearestMatch.index + begin))
  185. offset += nearestMatch.index
  186. }
  187. else {
  188. const newNode = {tag: nearest, startOffset: offset, parent: currentNode}
  189. children.push(newNode)
  190. buildAST(md, mdTags, offset + start.offset, tree, [...stack, newNode])
  191. offset = newNode.endOffset
  192. }
  193. }
  194. else {
  195. children.push(md.slice(offset))
  196. offset = md.length
  197. }
  198. }
  199. return currentNode
  200. }
  201. debugger;
  202. console.log(buildAST("I just **love _bold text_ adddd**. hahaha").children[1])