2012-09-18 23:23:16 +08:00
|
|
|
|
/**
|
|
|
|
|
|
* 过滤XSS攻击
|
|
|
|
|
|
*
|
|
|
|
|
|
* @author 老雷<leizongmin@gmail.com>
|
|
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
|
|
|
|
* 默认HTML标签白名单
|
|
|
|
|
|
* 标签名=>属性列表
|
|
|
|
|
|
*/
|
|
|
|
|
|
var defaultWhiteList = {
|
2013-05-27 10:54:02 +08:00
|
|
|
|
h1: [],
|
|
|
|
|
|
h2: [],
|
|
|
|
|
|
h3: [],
|
|
|
|
|
|
h4: [],
|
|
|
|
|
|
h5: [],
|
|
|
|
|
|
h6: [],
|
|
|
|
|
|
hr: [],
|
|
|
|
|
|
span: [],
|
|
|
|
|
|
strong: [],
|
|
|
|
|
|
b: [],
|
|
|
|
|
|
i: [],
|
2012-09-19 09:04:23 +08:00
|
|
|
|
br: [],
|
2013-05-27 10:54:02 +08:00
|
|
|
|
p: [],
|
|
|
|
|
|
pre: [],
|
|
|
|
|
|
code: [],
|
|
|
|
|
|
a: ['target', 'href', 'title'],
|
2013-07-11 22:55:41 +08:00
|
|
|
|
img: ['src', 'alt', 'title', 'width', 'height'],
|
2013-05-27 10:54:02 +08:00
|
|
|
|
div: [],
|
|
|
|
|
|
table: ['width', 'border'],
|
2013-07-11 22:58:23 +08:00
|
|
|
|
tr: ['rowspan'],
|
2013-05-27 10:54:02 +08:00
|
|
|
|
td: ['width', 'colspan'],
|
|
|
|
|
|
th: ['width', 'colspan'],
|
|
|
|
|
|
tbody: [],
|
2013-08-15 12:57:00 +08:00
|
|
|
|
thead: [],
|
2013-05-27 10:54:02 +08:00
|
|
|
|
ul: [],
|
|
|
|
|
|
li: [],
|
|
|
|
|
|
ol: [],
|
|
|
|
|
|
dl: [],
|
|
|
|
|
|
dt: [],
|
|
|
|
|
|
em: [],
|
|
|
|
|
|
cite: [],
|
|
|
|
|
|
section:[],
|
|
|
|
|
|
header: [],
|
|
|
|
|
|
footer: [],
|
|
|
|
|
|
blockquote: [],
|
2012-10-18 12:57:58 +08:00
|
|
|
|
audio: ['autoplay', 'controls', 'loop', 'preload', 'src'],
|
2013-11-05 17:47:36 +08:00
|
|
|
|
video: ['autoplay', 'controls', 'loop', 'preload', 'src', 'height', 'width']
|
2012-09-18 23:23:16 +08:00
|
|
|
|
};
|
|
|
|
|
|
|
2013-05-07 12:50:56 +08:00
|
|
|
|
// 正则表达式
|
|
|
|
|
|
var REGEXP_LT = /</g;
|
|
|
|
|
|
var REGEXP_GT = />/g;
|
|
|
|
|
|
var REGEXP_QUOTE = /"/g;
|
|
|
|
|
|
var REGEXP_ATTR_NAME = /[^a-zA-Z0-9_:\.\-]/img;
|
2013-12-24 12:06:52 +08:00
|
|
|
|
var REGEXP_ATTR_VALUE_1 = /&#([a-zA-Z0-9]*);?/img;
|
2013-12-24 12:23:47 +08:00
|
|
|
|
var REGEXP_ATTR_VALUE_COLON = /:?/img;
|
|
|
|
|
|
var REGEXP_ATTR_VALUE_NEWLINE = /&newline;?/img;
|
2013-05-07 12:50:56 +08:00
|
|
|
|
var REGEXP_DEFAULT_ON_TAG_ATTR_1 = /\/\*|\*\//mg;
|
2013-12-24 13:13:28 +08:00
|
|
|
|
var REGEXP_DEFAULT_ON_TAG_ATTR_2 = /^[\s"'`]*((j\s*a\s*v\s*a|v\s*b|l\s*i\s*v\s*e)\s*s\s*c\s*r\s*i\s*p\s*t\s*|m\s*o\s*c\s*h\s*a)\:/ig;
|
2013-05-07 12:50:56 +08:00
|
|
|
|
var REGEXP_DEFAULT_ON_TAG_ATTR_3 = /\/\*|\*\//mg;
|
2013-12-24 13:13:28 +08:00
|
|
|
|
var REGEXP_DEFAULT_ON_TAG_ATTR_4 = /((j\s*a\s*v\s*a|v\s*b|l\s*i\s*v\s*e)\s*s\s*c\s*r\s*i\s*p\s*t\s*|m\s*o\s*c\s*h\s*a)\:/ig;
|
2013-12-24 13:38:57 +08:00
|
|
|
|
var REGEXP_DEFAULT_ON_TAG_ATTR_5 = /^[\s"'`]*(d\s*a\s*t\s*a\s*)\:/ig;
|
|
|
|
|
|
var REGEXP_DEFAULT_ON_TAG_ATTR_6 = /^[\s"'`]*(d\s*a\s*t\s*a\s*)\:\s*image\//ig;
|
2013-05-07 12:50:56 +08:00
|
|
|
|
|
|
|
|
|
|
|
2012-09-19 08:03:16 +08:00
|
|
|
|
/**
|
|
|
|
|
|
* 过滤属性值
|
2013-09-15 23:03:05 +08:00
|
|
|
|
* 仅针对已经在白名单中的标签属性,用来替换默认的过滤属性值程序
|
2012-09-19 19:30:21 +08:00
|
|
|
|
*
|
2013-05-07 13:30:00 +08:00
|
|
|
|
* @param {String} tag 标签名
|
|
|
|
|
|
* @param {String} attr 属性名
|
|
|
|
|
|
* @param {String} value 属性值
|
|
|
|
|
|
* @return {String} 若不需要修改属性值,不返回任何值
|
2012-09-19 08:03:16 +08:00
|
|
|
|
*/
|
2013-05-07 12:50:56 +08:00
|
|
|
|
function defaultOnTagAttr (tag, attr, value) {
|
2012-09-19 09:04:23 +08:00
|
|
|
|
if (attr === 'href' || attr === 'src') {
|
2013-12-24 13:38:57 +08:00
|
|
|
|
// 过滤 href 和 src 属性
|
|
|
|
|
|
// javascript:
|
2013-05-07 12:50:56 +08:00
|
|
|
|
REGEXP_DEFAULT_ON_TAG_ATTR_1.lastIndex = 0;
|
|
|
|
|
|
if (REGEXP_DEFAULT_ON_TAG_ATTR_1.test(value)) {
|
2012-09-19 08:03:16 +08:00
|
|
|
|
return '#';
|
|
|
|
|
|
}
|
2013-12-24 13:38:57 +08:00
|
|
|
|
// /*注释*/
|
2013-05-07 12:50:56 +08:00
|
|
|
|
REGEXP_DEFAULT_ON_TAG_ATTR_2.lastIndex = 0;
|
|
|
|
|
|
if (REGEXP_DEFAULT_ON_TAG_ATTR_2.test(value)) {
|
2012-09-19 11:10:16 +08:00
|
|
|
|
return '#';
|
|
|
|
|
|
}
|
2013-12-24 13:38:57 +08:00
|
|
|
|
// data:
|
|
|
|
|
|
REGEXP_DEFAULT_ON_TAG_ATTR_5.lastIndex = 0;
|
|
|
|
|
|
if (REGEXP_DEFAULT_ON_TAG_ATTR_5.test(value)) {
|
|
|
|
|
|
// 允许 data: image/* 类型
|
|
|
|
|
|
REGEXP_DEFAULT_ON_TAG_ATTR_6.lastIndex = 0;
|
|
|
|
|
|
if (!REGEXP_DEFAULT_ON_TAG_ATTR_6.test(value)) {
|
|
|
|
|
|
return '#';
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2012-09-19 11:10:16 +08:00
|
|
|
|
} else if (attr === 'style') {
|
2013-12-24 13:38:57 +08:00
|
|
|
|
// 过滤 style 属性 (这个xss漏洞较老了,可能已经不适用)
|
|
|
|
|
|
// javascript:
|
2013-05-07 12:50:56 +08:00
|
|
|
|
REGEXP_DEFAULT_ON_TAG_ATTR_3.lastIndex = 0;
|
|
|
|
|
|
if (REGEXP_DEFAULT_ON_TAG_ATTR_3.test(value)) {
|
2012-09-19 11:10:16 +08:00
|
|
|
|
return '#';
|
|
|
|
|
|
}
|
2013-12-24 13:38:57 +08:00
|
|
|
|
// /*注释*/
|
2013-05-07 12:50:56 +08:00
|
|
|
|
REGEXP_DEFAULT_ON_TAG_ATTR_4.lastIndex = 0;
|
|
|
|
|
|
if (REGEXP_DEFAULT_ON_TAG_ATTR_4.test(value)) {
|
2012-09-19 11:10:16 +08:00
|
|
|
|
return '';
|
|
|
|
|
|
}
|
2012-09-19 08:03:16 +08:00
|
|
|
|
}
|
2013-05-07 13:30:00 +08:00
|
|
|
|
}
|
2012-09-18 23:23:16 +08:00
|
|
|
|
|
2012-09-19 19:56:20 +08:00
|
|
|
|
/**
|
|
|
|
|
|
* 过滤非白名单的标签
|
|
|
|
|
|
*
|
2013-05-07 13:30:00 +08:00
|
|
|
|
* @param {String} tag 标签名
|
|
|
|
|
|
* @param {String} html 标签HTML代码(包括属性值)
|
|
|
|
|
|
* @param {Object} options 更多属性:
|
2012-09-20 20:30:32 +08:00
|
|
|
|
* position:在返回的HTML代码中的开始位置
|
|
|
|
|
|
* originalPosition:在原HTML代码中的开始位置
|
|
|
|
|
|
* isClosing:是否为闭合标签,如</a>
|
2013-05-07 13:30:00 +08:00
|
|
|
|
* @return {String} 若不返回任何值,则默认替换<>为<>
|
2012-09-19 19:56:20 +08:00
|
|
|
|
*/
|
2013-05-07 12:50:56 +08:00
|
|
|
|
function defaultOnIgnoreTag (tag, html, options) {
|
2012-09-19 19:56:20 +08:00
|
|
|
|
return noTag(html);
|
2013-05-07 13:30:00 +08:00
|
|
|
|
}
|
2012-09-19 19:56:20 +08:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
|
* 转换<>为< >
|
|
|
|
|
|
*
|
2013-05-07 13:30:00 +08:00
|
|
|
|
* @param {String} text
|
|
|
|
|
|
* @return {String}
|
2012-09-19 19:56:20 +08:00
|
|
|
|
*/
|
2013-05-07 12:50:56 +08:00
|
|
|
|
function noTag (text) {
|
|
|
|
|
|
return text.replace(REGEXP_LT, '<').replace(REGEXP_GT, '>');
|
2013-05-07 13:30:00 +08:00
|
|
|
|
}
|
2012-09-19 19:56:20 +08:00
|
|
|
|
|
2013-05-08 16:21:46 +08:00
|
|
|
|
/**
|
2013-12-24 11:36:14 +08:00
|
|
|
|
* 清除不可见字符
|
|
|
|
|
|
*
|
|
|
|
|
|
* @param {String} str
|
|
|
|
|
|
* @return {String}
|
|
|
|
|
|
*/
|
|
|
|
|
|
function clearNonPrintableCharacter (str) {
|
|
|
|
|
|
var str2 = '';
|
|
|
|
|
|
for (var i = 0, len = str.length; i < len; i++) {
|
|
|
|
|
|
str2 += str.charCodeAt(i) < 32 ? ' ' : str.charAt(i);
|
|
|
|
|
|
}
|
|
|
|
|
|
return str2.trim();
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
|
* 对双引号进行转义
|
|
|
|
|
|
*
|
|
|
|
|
|
* @param {String} str
|
|
|
|
|
|
* @return {String} str
|
|
|
|
|
|
*/
|
|
|
|
|
|
function escapeQuotes (str) {
|
|
|
|
|
|
return str.replace(REGEXP_QUOTE, '"e;');
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
|
* 对html实体编码进行转义
|
|
|
|
|
|
*
|
|
|
|
|
|
* @param {String} str
|
|
|
|
|
|
* @return {String}
|
|
|
|
|
|
*/
|
|
|
|
|
|
function escapeHtmlEntities (str) {
|
2013-12-24 12:06:52 +08:00
|
|
|
|
return str.replace(REGEXP_ATTR_VALUE_1, function replaceUnicode (str, code) {
|
|
|
|
|
|
return (code[0] === 'x' || code[0] === 'X')
|
|
|
|
|
|
? String.fromCharCode(parseInt(code.substr(1), 16))
|
|
|
|
|
|
: String.fromCharCode(parseInt(code, 10));
|
|
|
|
|
|
});
|
2013-12-24 11:36:14 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
2013-12-24 12:23:47 +08:00
|
|
|
|
/**
|
|
|
|
|
|
* 对html5新增的危险实体编码进行转义
|
|
|
|
|
|
*
|
|
|
|
|
|
* @param {String} str
|
|
|
|
|
|
* @return {String}
|
|
|
|
|
|
*/
|
|
|
|
|
|
function escapeDangerHtml5Entities (str) {
|
|
|
|
|
|
return str.replace(REGEXP_ATTR_VALUE_COLON, ':')
|
|
|
|
|
|
.replace(REGEXP_ATTR_VALUE_NEWLINE, ' ');
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2013-12-24 11:36:14 +08:00
|
|
|
|
/**
|
|
|
|
|
|
* 对属性值进行转义
|
2013-05-08 16:21:46 +08:00
|
|
|
|
*
|
2013-12-24 11:36:14 +08:00
|
|
|
|
* @param {String} str
|
|
|
|
|
|
* @return {String}
|
2013-05-08 16:21:46 +08:00
|
|
|
|
*/
|
2013-12-24 11:36:14 +08:00
|
|
|
|
function safeAttrValue (str) {
|
|
|
|
|
|
// 去掉两边的空白字符
|
|
|
|
|
|
str = str.trim();
|
|
|
|
|
|
|
|
|
|
|
|
// 过滤双引号
|
|
|
|
|
|
str = escapeQuotes(str);
|
|
|
|
|
|
|
2013-12-24 12:23:47 +08:00
|
|
|
|
// 转换HTML实体编码
|
2013-12-24 11:36:14 +08:00
|
|
|
|
str = escapeHtmlEntities(str);
|
|
|
|
|
|
|
2013-12-24 12:23:47 +08:00
|
|
|
|
// 转换危险的HTML5新增实体编码
|
|
|
|
|
|
str = escapeDangerHtml5Entities(str);
|
|
|
|
|
|
|
2013-12-24 11:36:14 +08:00
|
|
|
|
// 清除不可见字符
|
|
|
|
|
|
str = clearNonPrintableCharacter(str);
|
|
|
|
|
|
|
|
|
|
|
|
return str;
|
2013-05-08 16:21:46 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
/**
|
|
|
|
|
|
* XSS过滤对象
|
|
|
|
|
|
*
|
|
|
|
|
|
* @param {Object} options 选项:whiteList, onTagAttr, onIgnoreTag
|
|
|
|
|
|
*/
|
|
|
|
|
|
function FilterXSS (options) {
|
|
|
|
|
|
'use strict';
|
2013-05-07 12:50:56 +08:00
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
this.options = options = options || {};
|
|
|
|
|
|
this.whiteList = options.whiteList || exports.whiteList;
|
|
|
|
|
|
this.onTagAttr = options.onTagAttr || exports.onTagAttr;
|
|
|
|
|
|
this.onIgnoreTag = options.onIgnoreTag || exports.onIgnoreTag;
|
|
|
|
|
|
}
|
2013-05-07 12:50:56 +08:00
|
|
|
|
|
2012-09-18 23:23:16 +08:00
|
|
|
|
/**
|
2013-05-07 13:30:00 +08:00
|
|
|
|
* 过滤不合法的属性
|
2012-09-18 23:23:16 +08:00
|
|
|
|
*
|
2013-05-07 13:30:00 +08:00
|
|
|
|
* @param {String} tagName 标签名称
|
|
|
|
|
|
* @param {String} attrs 标签属性部分
|
|
|
|
|
|
* @return {String}
|
2012-09-18 23:23:16 +08:00
|
|
|
|
*/
|
2013-05-07 13:30:00 +08:00
|
|
|
|
FilterXSS.prototype.filterAttributes = function (tagName, attrs) {
|
2012-09-18 23:23:16 +08:00
|
|
|
|
'use strict';
|
|
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
tagName = tagName.toLowerCase();
|
|
|
|
|
|
var me = this;
|
|
|
|
|
|
var whites = this.whiteList[tagName];
|
2012-09-18 23:23:16 +08:00
|
|
|
|
var lastPos = 0;
|
2013-05-07 13:46:49 +08:00
|
|
|
|
var _attrs = '';
|
2013-05-07 13:30:00 +08:00
|
|
|
|
var tmpName = false;
|
|
|
|
|
|
var hasSprit = false;
|
2013-05-07 13:46:49 +08:00
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
var addAttr = function (name, value) {
|
|
|
|
|
|
name = name.trim();
|
|
|
|
|
|
if (!hasSprit && name === '/') {
|
|
|
|
|
|
hasSprit = true;
|
|
|
|
|
|
return;
|
2013-11-05 17:47:36 +08:00
|
|
|
|
}
|
2013-05-07 13:30:00 +08:00
|
|
|
|
name = name.replace(REGEXP_ATTR_NAME, '').toLowerCase();
|
|
|
|
|
|
if (name.length < 1) return;
|
|
|
|
|
|
if (whites.indexOf(name) !== -1) {
|
|
|
|
|
|
if (value) {
|
2013-12-24 11:36:14 +08:00
|
|
|
|
// 先对属性值进行转义
|
|
|
|
|
|
value = safeAttrValue(value);
|
|
|
|
|
|
// 使用用户自定义的 onTagAttr 再过滤
|
2013-05-07 13:30:00 +08:00
|
|
|
|
var newValue = me.onTagAttr(tagName, name, value);
|
2013-05-08 16:23:16 +08:00
|
|
|
|
if (typeof newValue !== 'undefined') {
|
2013-05-07 13:30:00 +08:00
|
|
|
|
value = newValue;
|
2012-09-18 23:23:16 +08:00
|
|
|
|
}
|
2012-09-19 09:04:23 +08:00
|
|
|
|
}
|
2013-05-07 13:46:49 +08:00
|
|
|
|
_attrs += name + (value ? '="' + value + '"' : '') + ' ';
|
2013-05-07 13:30:00 +08:00
|
|
|
|
}
|
|
|
|
|
|
};
|
2013-05-07 13:46:49 +08:00
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
for (var i = 0, len = attrs.length; i < len; i++) {
|
2013-11-05 17:47:36 +08:00
|
|
|
|
var c = attrs.charAt(i),v;
|
2013-05-07 13:30:00 +08:00
|
|
|
|
if (tmpName === false && c === '=') {
|
|
|
|
|
|
tmpName = attrs.slice(lastPos, i);
|
|
|
|
|
|
lastPos = i + 1;
|
|
|
|
|
|
continue;
|
|
|
|
|
|
}
|
|
|
|
|
|
if (tmpName !== false) {
|
|
|
|
|
|
if (i === lastPos && (c === '"' || c === "'")) {
|
|
|
|
|
|
var j = attrs.indexOf(c, i + 1);
|
|
|
|
|
|
if (j === -1) {
|
|
|
|
|
|
break;
|
2012-09-19 09:04:23 +08:00
|
|
|
|
} else {
|
2013-11-05 17:47:36 +08:00
|
|
|
|
v = attrs.slice(lastPos + 1, j).trim();
|
2012-09-19 09:04:23 +08:00
|
|
|
|
addAttr(tmpName, v);
|
2013-05-07 13:30:00 +08:00
|
|
|
|
tmpName = false;
|
|
|
|
|
|
i = j;
|
|
|
|
|
|
lastPos = i + 1;
|
|
|
|
|
|
continue;
|
2012-09-18 23:23:16 +08:00
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2013-05-07 13:30:00 +08:00
|
|
|
|
if (c === ' ') {
|
2013-11-05 17:47:36 +08:00
|
|
|
|
v = attrs.slice(lastPos, i).trim();
|
2012-09-19 09:04:23 +08:00
|
|
|
|
if (tmpName === false) {
|
2013-05-07 13:30:00 +08:00
|
|
|
|
addAttr(v);
|
2012-09-19 09:04:23 +08:00
|
|
|
|
} else {
|
2013-05-07 13:30:00 +08:00
|
|
|
|
addAttr(tmpName, v);
|
2012-09-19 09:04:23 +08:00
|
|
|
|
}
|
2013-05-07 13:30:00 +08:00
|
|
|
|
tmpName = false;
|
|
|
|
|
|
lastPos = i + 1;
|
|
|
|
|
|
continue;
|
2012-09-18 23:23:16 +08:00
|
|
|
|
}
|
2013-05-07 13:30:00 +08:00
|
|
|
|
}
|
2013-05-07 13:46:49 +08:00
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
if (lastPos < attrs.length) {
|
|
|
|
|
|
if (tmpName === false) {
|
|
|
|
|
|
addAttr(attrs.slice(lastPos));
|
|
|
|
|
|
} else {
|
|
|
|
|
|
addAttr(tmpName, attrs.slice(lastPos));
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2013-05-07 13:46:49 +08:00
|
|
|
|
if (hasSprit) _attrs += '/';
|
2013-11-05 15:27:35 +08:00
|
|
|
|
|
2013-05-07 13:46:49 +08:00
|
|
|
|
return _attrs.trim();
|
2013-05-07 13:30:00 +08:00
|
|
|
|
};
|
2012-09-18 23:23:16 +08:00
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
/**
|
|
|
|
|
|
* 检查标签是否合法
|
|
|
|
|
|
*
|
|
|
|
|
|
* @param {String} tag 标签文本,如“<a”
|
|
|
|
|
|
* @param {Number} currentPos 原HTML的当前位置
|
|
|
|
|
|
* @param {Number} targetPos 生成的HTML的当前位置
|
|
|
|
|
|
*/
|
|
|
|
|
|
FilterXSS.prototype.addNewTag = function (tag, currentPos, targetPos) {
|
|
|
|
|
|
'use strict';
|
|
|
|
|
|
|
|
|
|
|
|
var rethtml = '';
|
2013-11-05 17:47:36 +08:00
|
|
|
|
var tagName;
|
|
|
|
|
|
var hasSprit;
|
2013-05-07 13:30:00 +08:00
|
|
|
|
var spos = tag.slice(0, 2) === '</' ? 2 : 1;
|
2013-11-05 15:27:35 +08:00
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
var i = tag.indexOf(' ');
|
|
|
|
|
|
if (i === -1) {
|
2013-11-05 17:47:36 +08:00
|
|
|
|
tagName = tag.slice(spos, tag.length - 1).trim();
|
2013-05-07 13:30:00 +08:00
|
|
|
|
} else {
|
2013-11-05 17:47:36 +08:00
|
|
|
|
tagName = tag.slice(spos, i + 1).trim();
|
2013-05-07 13:30:00 +08:00
|
|
|
|
}
|
|
|
|
|
|
tagName = tagName.toLowerCase();
|
2013-11-05 15:40:17 +08:00
|
|
|
|
|
|
|
|
|
|
// 检查标签是否以“/”结尾
|
|
|
|
|
|
if (tagName.slice(-1) === '/') {
|
|
|
|
|
|
tagName = tagName.slice(0, -1);
|
2013-11-05 17:47:36 +08:00
|
|
|
|
hasSprit = true;
|
2013-11-05 15:40:17 +08:00
|
|
|
|
} else {
|
2013-11-05 17:47:36 +08:00
|
|
|
|
hasSprit = false;
|
2013-11-05 15:40:17 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
if (tagName in this.whiteList) {
|
|
|
|
|
|
// 过滤不合法的属性
|
2012-09-18 23:23:16 +08:00
|
|
|
|
if (i === -1) {
|
2013-11-05 15:40:17 +08:00
|
|
|
|
rethtml += tag.slice(0, spos) + tagName + (hasSprit ? ' />' : '>');
|
2012-09-18 23:23:16 +08:00
|
|
|
|
} else {
|
2013-05-07 13:30:00 +08:00
|
|
|
|
var attrs = this.filterAttributes(tagName, tag.slice(i + 1, tag.length - 1).trim());
|
|
|
|
|
|
rethtml += tag.slice(0, spos) + tagName + (attrs.length > 0 ? ' ' + attrs : '') + '>';
|
2012-09-18 23:23:16 +08:00
|
|
|
|
}
|
2013-05-07 13:30:00 +08:00
|
|
|
|
} else {
|
|
|
|
|
|
// 过滤不合法的标签
|
|
|
|
|
|
var options = {
|
|
|
|
|
|
isClosing: (spos === 2),
|
|
|
|
|
|
position: targetPos,
|
|
|
|
|
|
originalPosition: currentPos - tag.length + 1
|
|
|
|
|
|
};
|
|
|
|
|
|
var tagHtml = this.onIgnoreTag(tagName, tag, options);
|
2013-05-08 16:23:16 +08:00
|
|
|
|
if (typeof tagHtml === 'undefined') {
|
2013-05-07 13:30:00 +08:00
|
|
|
|
tagHtml = noTag(tag);
|
2012-09-18 23:23:16 +08:00
|
|
|
|
}
|
2013-05-07 13:30:00 +08:00
|
|
|
|
rethtml += tagHtml;
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
return rethtml;
|
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
|
* 开始处理
|
|
|
|
|
|
*
|
|
|
|
|
|
* @param {String} html
|
|
|
|
|
|
* @return {String}
|
|
|
|
|
|
*/
|
|
|
|
|
|
FilterXSS.prototype.process = function (html) {
|
|
|
|
|
|
'use strict';
|
|
|
|
|
|
|
|
|
|
|
|
var rethtml = '';
|
|
|
|
|
|
var lastPos = 0;
|
|
|
|
|
|
var tagStart = false;
|
|
|
|
|
|
var quoteStart = false;
|
|
|
|
|
|
var currentPos = 0;
|
2013-11-05 18:16:02 +08:00
|
|
|
|
var len = 0;
|
2012-09-18 23:23:16 +08:00
|
|
|
|
|
|
|
|
|
|
// 逐个分析字符
|
2013-11-05 17:47:36 +08:00
|
|
|
|
for (currentPos = 0, len = html.length; currentPos < len; currentPos++) {
|
|
|
|
|
|
var c = html.charAt(currentPos);
|
2012-09-18 23:23:16 +08:00
|
|
|
|
if (tagStart === false) {
|
|
|
|
|
|
if (c === '<') {
|
2012-09-20 20:30:32 +08:00
|
|
|
|
tagStart = currentPos;
|
2012-09-18 23:23:16 +08:00
|
|
|
|
continue;
|
|
|
|
|
|
}
|
|
|
|
|
|
} else {
|
|
|
|
|
|
if (quoteStart === false) {
|
|
|
|
|
|
if (c === '<') {
|
2012-09-20 20:30:32 +08:00
|
|
|
|
rethtml += noTag(html.slice(lastPos, currentPos));
|
|
|
|
|
|
tagStart = currentPos;
|
|
|
|
|
|
lastPos = currentPos;
|
2012-09-18 23:23:16 +08:00
|
|
|
|
continue;
|
|
|
|
|
|
}
|
|
|
|
|
|
if (c === '>') {
|
2013-05-07 13:30:00 +08:00
|
|
|
|
rethtml += noTag(html.slice(lastPos, tagStart));
|
|
|
|
|
|
rethtml += this.addNewTag(html.slice(tagStart, currentPos + 1), currentPos, rethtml.length);
|
|
|
|
|
|
lastPos = currentPos + 1;
|
2012-09-18 23:23:16 +08:00
|
|
|
|
tagStart = false;
|
|
|
|
|
|
continue;
|
|
|
|
|
|
}
|
|
|
|
|
|
if (c === '"' || c === "'") {
|
|
|
|
|
|
quoteStart = c;
|
|
|
|
|
|
continue;
|
|
|
|
|
|
}
|
|
|
|
|
|
} else {
|
|
|
|
|
|
if (c === quoteStart) {
|
|
|
|
|
|
quoteStart = false;
|
|
|
|
|
|
continue;
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
if (lastPos < html.length) {
|
|
|
|
|
|
rethtml += noTag(html.substr(lastPos));
|
|
|
|
|
|
}
|
2013-05-07 13:30:00 +08:00
|
|
|
|
|
2012-09-18 23:23:16 +08:00
|
|
|
|
return rethtml;
|
|
|
|
|
|
};
|
|
|
|
|
|
|
2013-05-07 13:30:00 +08:00
|
|
|
|
/**
|
|
|
|
|
|
* XSS过滤
|
|
|
|
|
|
*
|
|
|
|
|
|
* @param {String} html 要过滤的HTML代码
|
|
|
|
|
|
* @param {Object} options 选项:whiteList, onTagAttr, onIgnoreTag
|
|
|
|
|
|
* @return {String}
|
|
|
|
|
|
*/
|
|
|
|
|
|
function filterXSS (html, options) {
|
|
|
|
|
|
var xss = new FilterXSS(options);
|
|
|
|
|
|
return xss.process(html);
|
2013-11-05 17:47:36 +08:00
|
|
|
|
}
|
2013-05-07 13:30:00 +08:00
|
|
|
|
|
2012-09-19 19:56:20 +08:00
|
|
|
|
// 默认配置
|
2013-05-07 12:50:56 +08:00
|
|
|
|
exports = module.exports = filterXSS;
|
2013-05-07 13:30:00 +08:00
|
|
|
|
exports.FilterXSS = FilterXSS;
|
2012-09-18 23:23:16 +08:00
|
|
|
|
exports.whiteList = defaultWhiteList;
|
2012-09-19 08:03:16 +08:00
|
|
|
|
exports.onTagAttr = defaultOnTagAttr;
|
2012-09-19 19:56:20 +08:00
|
|
|
|
exports.onIgnoreTag = defaultOnIgnoreTag;
|
2012-09-20 20:55:42 +08:00
|
|
|
|
|
|
|
|
|
|
// 工具函数
|
|
|
|
|
|
exports.utils = require('./utils');
|
2013-04-19 16:31:22 +08:00
|
|
|
|
|
|
|
|
|
|
// 在浏览器端使用
|
|
|
|
|
|
if (typeof window !== 'undefined') {
|
2013-11-05 17:47:36 +08:00
|
|
|
|
if(!Array.indexOf){
|
|
|
|
|
|
Array.prototype.indexOf = function(item){
|
|
|
|
|
|
for(var i=0;i<this.length;i++){
|
|
|
|
|
|
if(this[i] == item) return i;
|
|
|
|
|
|
}
|
|
|
|
|
|
return -1;
|
|
|
|
|
|
};
|
|
|
|
|
|
}
|
|
|
|
|
|
if(!Array.forEach){
|
|
|
|
|
|
Array.prototype.forEach = function(fn){
|
2013-11-05 18:16:02 +08:00
|
|
|
|
for(var i=0;i<this.length;i++) fn(this[i],i,this);
|
2013-11-05 17:47:36 +08:00
|
|
|
|
};
|
|
|
|
|
|
}
|
|
|
|
|
|
if(!String.trim){
|
|
|
|
|
|
String.prototype.trim = function(){
|
2013-11-05 18:16:02 +08:00
|
|
|
|
return this.replace(/(^\s*)|(\s*$)/g,"");
|
2013-11-05 17:47:36 +08:00
|
|
|
|
};
|
|
|
|
|
|
}
|
2013-04-19 16:31:22 +08:00
|
|
|
|
window.filterXSS = module.exports;
|
|
|
|
|
|
}
|