UNPKG

@mdast2docx/html

Version:

Extend MDAST by parsing embedded HTML in Markdown. Converts HTML into structured MDAST nodes compatible with @m2d/core for DOCX generation.

4 lines (2 loc) 6.12 kB
import{a as y}from"./chunk-CYY6OEIU.mjs";import{AlignmentType as N,BorderStyle as h}from"docx";var H=["A","ABBR","ACRONYM","B","BDI","BDO","BIG","BR","BUTTON","CITE","CODE","DATA","DATALIST","DEL","DFN","EM","I","IMG","INPUT","INS","KBD","LABEL","MARK","METER","NOSCRIPT","OBJECT","OUTPUT","Q","RUBY","RP","RT","S","SAMP","SCRIPT","SELECT","SLOT","SMALL","SPAN","STRONG","SUB","SUP","svg","TEMPLATE","TEXTAREA","TIME","U","TT","VAR","WBR"],O={A:"link",B:"strong",BR:"break",EM:"emphasis",STRONG:"strong",I:"emphasis",IMG:"image",DEL:"delete",S:"delete"},I=["solid","dashed","dotted","double","none","ridge","groove","inset","outset"],D=t=>{var r;if(!t)return{};let n={},e=t.match(/border(-\w+)?:\s*[^;]+/gi);if(!e)return{};for(let s of e){let[a,p]=s.split(":").map(d=>d.trim()),o=p.split(/\s+/),u=(r=o.find(d=>d.endsWith("px")))==null?void 0:r.replace("px",""),i=o.find(d=>I.includes(d.toLowerCase())),c=o.find(d=>!d.endsWith("px")&&!I.includes(d.toLowerCase())),l=a==="border"?"border":a.replace("border-","");n[l]={...u?{width:parseInt(u,1)}:{},...i?{style:i}:{},...c?{color:c}:{}}}return n},k={solid:h.SINGLE,dashed:h.DASHED,dotted:h.DOTTED,double:h.DOUBLE,none:h.NONE,ridge:h.THREE_D_EMBOSS,groove:h.THREE_D_ENGRAVE,inset:h.INSET,outset:h.OUTSET},g=t=>{if(!t||!Object.keys(t).length)return;let{width:n,color:e,style:r}=t,s={style:r?k[r]:h.SINGLE};return n&&(s.size=n),e&&(s.color=y(e)),s},b=(t,n=!0)=>{var d,f;let e={};if(!(t instanceof HTMLElement||t instanceof SVGElement))return e;let{textAlign:r,fontWeight:s,fontStyle:a,textDecoration:p,textTransform:o,color:u}=t.style,i=t.getAttribute("style"),c=D(i);if(e.style=i!=null?i:void 0,n&&c.border)e.border=g(c.border);else if(Object.keys(c).length){let B={...c.border,...c.left},A={...c.border,...c.right},C={...c.border,...c.top},R={...c.border,...c.bottom};e.border={left:g(B),right:g(A),top:g(C),bottom:g(R)}}switch(r&&(Object.keys(N).includes(r)?e.alignment=r:r==="justify"&&(e.alignment=N.JUSTIFIED)),(/bold/.test(s)||parseInt(s)>=500)&&(e.bold=!0),/(italic|oblique)/.test(a)&&(e.italics=!0),p){case"underline":e.underline={};break;case"overline":e.emphasisMark={};break;case"line-through":e.strike=!0;break}o==="uppercase"&&(e.allCaps=!0),o==="lowercase"&&(e.smallCaps=!0),u&&(e.color=y(u));let l=t.tagName;return l==="SUP"?e.superScript=!0:l==="SUB"?e.subScript=!0:["STRONG","B"].includes(l)?e.bold=!0:["EM","I"].includes(l)?e.italics=!0:["DEL","S"].includes(l)?e.strike=!0:["U","INS"].includes(l)?e.underline={}:l==="MARK"?(e.highlight="yellow",e.emphasisMark={}):l==="PRE"?e.pre=!0:l==="INPUT"&&(e.type=t.type,e.name=t.name,e.value=(d=t.value)!=null?d:t.defaultValue,e.checked=(f=t.checked)!=null?f:t.defaultChecked),e.tag=l.toLowerCase(),e},m=(t,n=!1)=>{var p,o,u,i,c,l;if(!(t instanceof HTMLElement||t instanceof SVGElement))return{type:"text",value:(o=n?t.textContent:(p=t.textContent)==null?void 0:p.replace(/^\s+|\s+$/g," "))!=null?o:""};let e=Array.from(t.childNodes).map(d=>m(d,n)),r=b(t),s=t.getAttributeNames().reduce((d,f)=>({...d,[f]:t.getAttribute(f)}),{}),a=t.tagName;switch(a){case"BR":return{type:"break"};case"IMG":return{type:"image",url:(u=s.src)!=null?u:"",alt:(i=s.alt)!=null?i:"",data:{...r,...s}};case"svg":return{type:"svg",value:t.outerHTML,data:r};case"EM":case"I":case"STRONG":case"B":case"DEL":case"S":return{type:O[a],children:e,data:r};case"A":return{type:"link",url:(c=s.href)!=null?c:"",children:e,data:r};case"INPUT":return/(radio|checkbox)/.test(t.type)?{type:"checkbox",data:r}:{type:"text",value:(l=r.value)!=null?l:`_${t.value||"_".repeat(20)}_`,data:{...r,border:{style:h.OUTSET}}}}return{type:"fragment",children:e,data:r}},T=(t,n)=>{let e=Array.from(t.childNodes),r=[],s=[];for(let a of e)(a instanceof HTMLElement||a instanceof SVGElement)&&!H.includes(a.tagName)?(s.length&&(r.push({type:"paragraph",children:s.map(p=>m(p,n==null?void 0:n.pre))}),s.length=0),r.push(v(a))):s.push(a);return s.length&&r.push({type:"paragraph",children:s.map(a=>m(a,n==null?void 0:n.pre))}),r.length===1?{...r[0],data:{...n,...r[0].data}}:{type:"fragment",children:r,data:n}},M=(t,n)=>Array.from(t.children).map(e=>{let r={...n,...b(e)};return e.tagName==="TR"?{type:"tableRow",children:Array.from(e.children).map(s=>({type:"tableCell",children:[T(s,{...r,tag:void 0})],data:{...r,tag:s.tagName.toLowerCase()}})),data:r}:M(e,r)}).flat(),E={style:"single"},P={left:E,right:E,top:E,bottom:E},v=t=>{let n=b(t),e=t.tagName;switch(e){case"H1":case"H2":case"H3":case"H4":case"H5":case"H6":return{type:"heading",depth:parseInt(e[1]),children:Array.from(t.childNodes).map(r=>m(r)),data:n};case"PRE":case"P":case"DIV":case"DETAILS":case"SUMMARY":case"FORM":case"LI":return T(t,n);case"UL":case"OL":return{type:"list",ordered:e==="OL",children:Array.from(t.childNodes).map(r=>({type:"listItem",children:[T(r)],data:n}))};case"HR":return{type:"thematicBreak",data:n};case"BLOCKQUOTE":return{type:"blockquote",children:Array.from(t.childNodes).map(r=>T(r)),data:n};case"TABLE":return{type:"table",children:M(t),data:n};case"STYLE":return{type:"paragraph",children:[{type:"text",value:`Not supported yet! ${t.textContent}`}],data:{...n,pre:!0,border:P}}}return{type:"paragraph",children:[m(t)],data:n}},L=t=>{var s,a,p;let n=(a=(s=t.value)==null?void 0:s.trim())!=null?a:"",e=n.split(" ")[0].slice(1),r=document.createElement("div");r.innerHTML=n.endsWith("/>")?n:`${n}</${e}>`,Object.assign(t,{...m(r.children[0]),children:(p=t.children)!=null?p:[]})},S=(t,n=!0)=>{var s,a,p;let e=[],r=[];for(let o of t.children){if((s=o.children)!=null&&s.length&&S(o,!1),o.type==="html"&&/^<[^>]*[^/]>$/.test(o.value)){let i=o.value.split(" ")[0].replace(/^<|>$/g,"");if(i[0]==="/"){let c=r.shift();if(!c)throw new Error(`Invalid HTML: ${o.value}`);L(c),((p=(a=r[0])==null?void 0:a.children)!=null?p:e).push(c)}else r.unshift({...o,children:[],tag:i})}else r.length?r[0].children.push(o):e.push(o);let u=o.type==="html"&&/^<[^>]*\/>$/.test(o.value);if(u&&!n)L(o);else if(u&&n||o.type==="html"&&!/^<[^>]*>$/.test(o.value)){let i=document.createElement("div");i.innerHTML=o.value,Object.assign(o,T(i))}}t.children=e},G=()=>({preprocess:S});export{G as htmlPlugin};