html2json.js
5.25 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
/**
 * Build a lookup table from a comma-separated list of names.
 *
 * The table has no prototype, so only the listed names are ever found in it;
 * inherited names such as "constructor" or "toString" are not reported as
 * members.
 *
 * @param {string} list - Comma-separated names, e.g. "br,hr,img".
 * @returns {Object} Prototype-less object with `true` stored under each name.
 */
function e(list) {
    var table = Object.create(null);
    var names = list.split(",");
    for (var k = 0; k < names.length; k++) {
        table[names[k]] = true;
    }
    return table;
}
/**
 * Remove the XML declaration and doctype line from an HTML string.
 *
 * Three patterns are applied in turn, each removing only its first match:
 * an `<?xml ... ?>` declaration, a lowercase `!doctype` tag and an uppercase
 * `!DOCTYPE` tag. Every pattern requires the match to be immediately followed
 * by a "\n"; input without that newline is returned unchanged.
 *
 * @param {string} html - Markup to clean.
 * @returns {string} Markup with the matched lines removed.
 */
function t(html) {
    var patterns = [
        /<\?xml.*\?>\n/,
        /<.*!doctype.*\>\n/,
        /<.*!DOCTYPE.*\>\n/
    ];
    var result = html;
    for (var k = 0; k < patterns.length; k++) {
        result = result.replace(patterns[k], "");
    }
    return result;
}
/**
 * Compact an HTML string before parsing.
 *
 * Steps, in order:
 *   1. drop every run of "\n" (together with one directly preceding "\r"),
 *   2. drop `<!-- ... -->` comments,
 *   3. drop C-style block comments,
 *   4. drop spaces that sit directly in front of a "<".
 *
 * @param {string} html - Markup to compact.
 * @returns {string} The compacted markup.
 */
function r(html) {
    var withoutLineBreaks = html.replace(/\r?\n+/g, "");
    var withoutHtmlComments = withoutLineBreaks.replace(/<!--.*?-->/gi, "");
    var withoutBlockComments = withoutHtmlComments.replace(/\/\*.*?\*\//gi, "");
    return withoutBlockComments.replace(/[ ]+</gi, "<");
}
/**
 * Split a run of text into plain-text nodes and emoji nodes.
 *
 * Reads the module-level emoji settings `a`, `o` and `i` (assigned by
 * `emojisInit`). When `a` is empty or `i` is missing, the whole string is
 * returned as a single text node.
 *
 * Otherwise every `[name]` is rewritten to `:name:` and the string is split
 * on ":". A segment that is an own key of `i` with a truthy value becomes an
 * emoji element; every other segment (including empty ones) becomes a text
 * node. Note that ":" acts purely as a delimiter here, so literal colons do
 * not appear in the output.
 *
 * Only own keys of `i` are considered, so text such as "[constructor]" is not
 * mistaken for an emoji through `Object.prototype`.
 *
 * @param {string} str - Text content to split.
 * @returns {Array<Object>} Nodes of the form `{node: "text", text}` or
 *     `{node: "element", tag: "emoji", text, baseSrc}`.
 */
function s(str) {
    if (a.length === 0 || !i) {
        return [ { node: "text", text: str } ];
    }

    var segments = str
        .replace(/\[([^\[\]]+)\]/g, ":$1:")
        .split(new RegExp("[:]"));
    var nodes = [];

    for (var k = 0; k < segments.length; k++) {
        var segment = segments[k];
        var emoji = Object.prototype.hasOwnProperty.call(i, segment) ? i[segment] : undefined;

        if (emoji) {
            nodes.push({
                node: "element",
                tag: "emoji",
                text: emoji,
                baseSrc: o
            });
        } else {
            nodes.push({
                node: "text",
                text: segment
            });
        }
    }
    return nodes;
}
// Second argument handed to wxDiscode.urlToHttpUrl when <img> sources are rewritten.
var n = "https";

// Emoji settings; all three are reassigned by emojisInit.
// `a` gates emoji handling (an empty value disables it), `o` is copied onto
// every emoji node as `baseSrc`, and `i` maps emoji names to their values.
var a = "";
var o = "";
var i = {};

// Project helpers: wxDiscode provides strDiscode/urlToHttpUrl, htmlparser is
// the function that drives the start/end/chars/comment callbacks.
var l = require("./wxDiscode.js");
var d = require("./htmlparser.js");

// Tag tables used to choose a node's tagType; they are consulted in this
// order: block, then inline, then closeSelf.
var c = e("br,a,code,address,article,applet,aside,audio,blockquote,button,canvas,center,dd,del,dir,div,dl,dt,fieldset,figcaption,figure,footer,form,frameset,h1,h2,h3,h4,h5,h6,header,hgroup,hr,iframe,ins,isindex,li,map,menu,noframes,noscript,object,ol,output,p,pre,section,script,table,tbody,td,tfoot,th,thead,tr,ul,video");
var u = e("abbr,acronym,applet,b,basefont,bdo,big,button,cite,del,dfn,em,font,i,iframe,img,input,ins,kbd,label,map,object,q,s,samp,script,select,small,span,strike,strong,sub,sup,textarea,tt,u,var");
var p = e("colgroup,dd,dt,li,options,p,td,tfoot,th,thead,tr");
module.exports = {
html2json: function(e, a) {
e = r(e = t(e)), e = l.strDiscode(e);
var o = [], i = {
node: a,
nodes: [],
images: [],
imageUrls: []
}, g = 0;
return d(e, {
start: function(e, t, r) {
var s = {
node: "element",
tag: e
};
if (0 === o.length ? (s.index = g.toString(), g += 1) : (void 0 === (x = o[0]).nodes && (x.nodes = []),
s.index = x.index + "." + x.nodes.length), c[e] ? s.tagType = "block" : u[e] ? s.tagType = "inline" : p[e] && (s.tagType = "closeSelf"),
0 !== t.length && (s.attr = t.reduce(function(e, t) {
var r = t.name, n = t.value;
//return "class" == r && (console.dir(n), s.classStr = n), "style" == r && (console.dir(n),
return "class" == r && ( s.classStr = n), "style" == r && (
s.styleStr = n), n.match(/ /) && (n = n.split(" ")), e[r] ? Array.isArray(e[r]) ? e[r].push(n) : e[r] = [ e[r], n ] : e[r] = n,
e;
}, {})), "img" === s.tag) {
s.imgIndex = i.images.length;
var d = s.attr.src;
"" == d[0] && d.splice(0, 1), d = l.urlToHttpUrl(d, n), s.attr.src = d, s.from = a,
i.images.push(s), i.imageUrls.push(d);
}
if ("font" === s.tag) {
var m = [ "x-small", "small", "medium", "large", "x-large", "xx-large", "-webkit-xxx-large" ], f = {
color: "color",
face: "font-family",
size: "font-size"
};
s.attr.style || (s.attr.style = []), s.styleStr || (s.styleStr = "");
for (var h in f) if (s.attr[h]) {
var v = "size" === h ? m[s.attr[h] - 1] : s.attr[h];
s.attr.style.push(f[h]), s.attr.style.push(v), s.styleStr += f[h] + ": " + v + ";";
}
}
if ("source" === s.tag && (i.source = s.attr.src), r) {
var x = o[0] || i;
void 0 === x.nodes && (x.nodes = []), x.nodes.push(s);
} else o.unshift(s);
},
end: function(e) {
var t = o.shift();
if (t.tag !== e && console.error("invalid state: mismatch end tag"), "video" === t.tag && i.source && (t.attr.src = i.source,
delete i.source), 0 === o.length) i.nodes.push(t); else {
var r = o[0];
void 0 === r.nodes && (r.nodes = []), r.nodes.push(t);
}
},
chars: function(e) {
var t = {
node: "text",
text: e,
textArray: s(e)
};
if (0 === o.length) t.index = g.toString(), g += 1, i.nodes.push(t); else {
var r = o[0];
void 0 === r.nodes && (r.nodes = []), t.index = r.index + "." + r.nodes.length,
r.nodes.push(t);
}
},
comment: function(e) {}
}), i;
},
emojisInit: function() {
var e = arguments.length > 0 && void 0 !== arguments[0] ? arguments[0] : "", t = arguments.length > 1 && void 0 !== arguments[1] ? arguments[1] : "/wxParse/emojis/", r = arguments[2];
a = e, o = t, i = r;
}
};