wangeditor
Version:
wangEditor - 轻量级 web 富文本编辑器,配置方便,使用简单,开源免费
169 lines (148 loc) • 5.82 kB
JavaScript
// Copyright 2004 Erik Arvidsson. All Rights Reserved.
//
// This code is triple licensed using Apache Software License 2.0,
// Mozilla Public License or GNU Public License
//
///////////////////////////////////////////////////////////////////////////////
//
// Licensed under the Apache License, Version 2.0 (the "License"); you may not
// use this file except in compliance with the License. You may obtain a copy
// of the License at http://www.apache.org/licenses/LICENSE-2.0
//
///////////////////////////////////////////////////////////////////////////////
//
// The contents of this file are subject to the Mozilla Public License
// Version 1.1 (the "License"); you may not use this file except in
// compliance with the License. You may obtain a copy of the License at
// http://www.mozilla.org/MPL/
//
// Software distributed under the License is distributed on an "AS IS"
// basis, WITHOUT WARRANTY OF ANY KIND, either express or implied. See the
// License for the specific language governing rights and limitations
// under the License.
//
// The Original Code is Simple HTML Parser.
//
// The Initial Developer of the Original Code is Erik Arvidsson.
// Portions created by Erik Arvidssson are Copyright (C) 2004. All Rights
// Reserved.
//
///////////////////////////////////////////////////////////////////////////////
//
// This program is free software; you can redistribute it and/or
// modify it under the terms of the GNU General Public License
// as published by the Free Software Foundation; either version 2
// of the License, or (at your option) any later version.
//
// This program is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with this program; if not, write to the Free Software
// Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
//
///////////////////////////////////////////////////////////////////////////////
/*
var handler ={
startElement: function (sTagName, oAttrs) {},
endElement: function (sTagName) {},
characters: function (s) {},
comment: function (s) {}
};
*/
function SimpleHtmlParser() {}
SimpleHtmlParser.prototype = {
handler: null,
// regexps
startTagRe: /^<([^>\s\/]+)((\s+[^=>\s]+(\s*=\s*((\"[^"]*\")|(\'[^']*\')|[^>\s]+))?)*)\s*\/?\s*>/m,
endTagRe: /^<\/([^>\s]+)[^>]*>/m,
attrRe: /([^=\s]+)(\s*=\s*((\"([^"]*)\")|(\'([^']*)\')|[^>\s]+))?/gm,
parse: function (s, oHandler) {
if (oHandler) this.contentHandler = oHandler
var i = 0
var res, lc, lm, rc, index
var treatAsChars = false
var oThis = this
while (s.length > 0) {
// Comment
if (s.substring(0, 4) == '<!--') {
index = s.indexOf('-->')
if (index != -1) {
this.contentHandler.comment(s.substring(4, index))
s = s.substring(index + 3)
treatAsChars = false
} else {
treatAsChars = true
}
}
// end tag
else if (s.substring(0, 2) == '</') {
if (this.endTagRe.test(s)) {
lc = RegExp.leftContext
lm = RegExp.lastMatch
rc = RegExp.rightContext
lm.replace(this.endTagRe, function () {
return oThis.parseEndTag.apply(oThis, arguments)
})
s = rc
treatAsChars = false
} else {
treatAsChars = true
}
}
// start tag
else if (s.charAt(0) == '<') {
if (this.startTagRe.test(s)) {
lc = RegExp.leftContext
lm = RegExp.lastMatch
rc = RegExp.rightContext
lm.replace(this.startTagRe, function () {
return oThis.parseStartTag.apply(oThis, arguments)
})
s = rc
treatAsChars = false
} else {
treatAsChars = true
}
}
if (treatAsChars) {
index = s.indexOf('<')
if (index == -1) {
this.contentHandler.characters(s)
s = ''
} else {
this.contentHandler.characters(s.substring(0, index))
s = s.substring(index)
}
}
treatAsChars = true
}
},
parseStartTag: function (sTag, sTagName, sRest) {
var attrs = this.parseAttributes(sTagName, sRest)
this.contentHandler.startElement(sTagName, attrs)
},
parseEndTag: function (sTag, sTagName) {
this.contentHandler.endElement(sTagName)
},
parseAttributes: function (sTagName, s) {
var oThis = this
var attrs = []
s.replace(this.attrRe, function (a0, a1, a2, a3, a4, a5, a6, a7) {
attrs.push(oThis.parseAttribute(sTagName, a0, a1, a2, a3, a4, a5, a6, a7))
})
return attrs
},
parseAttribute: function (sTagName, sAttribute, sName) {
var value = ''
if (arguments[7]) value = arguments[8]
else if (arguments[5]) value = arguments[6]
else if (arguments[3]) value = arguments[4]
var empty = !value && !arguments[3]
return { name: sName, value: empty ? null : value }
},
}
// export default SimpleHtmlParser
module.exports = SimpleHtmlParser