具体方法如下:

HtmlAttributeFilter.class.php

1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24

25

26

27

28

29

30

31

32

33

34

35

36

37

38

39

40

41

42

43

44

45

46

47

48

49

50

51

52

53

54

55

56

57

58

59

60

61

62

63

64

65

66

67

68

69

70

71

72

73

74

75

76

77

78

79

80

81

82

83

84

85

86

87

88

89

90

91

92

93

94

95

96

97

98

99

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

/**
 * HTML Attribute Filter
 *
 * Date:   2013-09-22
 * Author: fdipzone
 * ver:    1.0
 *
 * Strips every attribute from the tags of an HTML fragment except those that
 * are explicitly allowed, either globally (setAllow) or per tag
 * (setException). Tags listed via setIgnore are left untouched.
 *
 * Func:
 * public  strip             filter the attributes of an HTML string
 * public  setAllow          set the globally allowed attributes
 * public  setException      set per-tag exceptions
 * public  setIgnore         set the tags that are not filtered
 * private findElements      find the elements that need processing
 * private findAttributes    parse the attributes of those elements
 * private removeAttributes  rewrite the elements without the disallowed attributes
 * private isException       check whether an attribute is a per-tag exception
 * private createAttributes  append one attribute to an attribute string
 */
class HtmlAttributeFilter
{
    /** @var mixed Source string (lower-cased once processing starts). */
    private $_str = '';

    /** @var array Attributes kept on every tag, e.g. array('id', 'class', 'title'). */
    private $_allow = array();

    /** @var array Per-tag exceptions, e.g. array('a' => array('href', 'class'), 'span' => array('class')). */
    private $_exception = array();

    /** @var array Tags that are not filtered at all, e.g. array('span', 'img'). */
    private $_ignore = array();

    /**
     * Process an HTML string and drop every attribute that is not allowed.
     *
     * NOTE: the whole input is lower-cased before processing, so tag names,
     * attribute names, attribute values and text content all come back in
     * lower case. Allow / exception / ignore lists must therefore be given
     * in lower case.
     *
     * @param string $str Source string
     * @return string Filtered string; a non-string or empty input is returned unchanged
     */
    public function strip($str)
    {
        $this->_str = $str;

        if (is_string($this->_str) && strlen($this->_str) > 0) {
            $this->_str = strtolower($this->_str); // normalise to lower case

            $res = $this->findElements();
            if (is_string($res)) {
                // Nothing to process: findElements() handed the string back.
                return $res;
            }

            $nodes = $this->findAttributes($res);
            $this->removeAttributes($nodes);
        }

        return $this->_str;
    }

    /**
     * Set the attributes that are allowed on every tag.
     *
     * @param array $param Lower-case attribute names
     */
    public function setAllow($param = array())
    {
        $this->_allow = $param;
    }

    /**
     * Set the per-tag exceptions.
     *
     * @param array $param Map of lower-case tag name => list of allowed attribute names
     */
    public function setException($param = array())
    {
        $this->_exception = $param;
    }

    /**
     * Set the tags that are skipped entirely (none of their attributes are filtered).
     *
     * @param array $param Lower-case tag names
     */
    public function setIgnore($param = array())
    {
        $this->_ignore = $param;
    }

    /**
     * Find the opening tags that carry something after the tag name and are
     * not on the ignore list.
     *
     * @return array|string List of nodes (literal, name, attributes), or the
     *                      current string when there is nothing to process
     */
    private function findElements()
    {
        $nodes = array();

        preg_match_all("/<([^ !\/\>\n]+)([^>]*)>/i", $this->_str, $elements);

        foreach ($elements[1] as $el_key => $element_name) {
            $attributes = $elements[2][$el_key];

            // Tags without any attribute text need no rewriting.
            if ($attributes === '') {
                continue;
            }

            if (is_array($this->_ignore) && !in_array($element_name, $this->_ignore, true)) {
                $nodes[] = array(
                    'literal'    => $elements[0][$el_key],
                    'name'       => $element_name,
                    'attributes' => $attributes,
                );
            }
        }

        // empty() instead of $nodes[0] avoids an undefined-offset notice.
        if (empty($nodes)) {
            return $this->_str;
        }

        return $nodes;
    }

    /**
     * Parse the raw attribute text of every node into name/value pairs.
     *
     * Handles double-quoted, single-quoted and unquoted values. Attributes
     * without a value (e.g. "disabled") are not matched and are therefore
     * always dropped.
     *
     * @param array $nodes Nodes produced by findElements()
     * @return array The same nodes with 'attributes' replaced by a list of
     *               array('literal', 'name', 'value'), or null when none was found
     */
    private function findAttributes($nodes)
    {
        // (?| ... ) is a branch-reset group: whichever quoting style matches,
        // the value always lands in capture group 2.
        $pattern = '/([^\s=\/"\'<>]+)\s*=\s*(?|"([^"]*)"|\'([^\']*)\'|([^\s"\'>]+))/';

        $parsed = array();

        foreach ($nodes as $node) {
            $atts = null;

            if (preg_match_all($pattern, $node['attributes'], $attributes)) {
                $atts = array();
                foreach ($attributes[1] as $att_key => $attribute_name) {
                    $atts[] = array(
                        'literal' => $attributes[0][$att_key],
                        'name'    => $attribute_name,
                        'value'   => $attributes[2][$att_key],
                    );
                }
            }

            $node['attributes'] = $atts;
            $parsed[] = $node;
        }

        return $parsed;
    }

    /**
     * Rewrite every node in the working string, keeping only the allowed attributes.
     *
     * @param array $nodes Nodes produced by findAttributes()
     */
    private function removeAttributes($nodes)
    {
        foreach ($nodes as $node) {
            $node_name = $node['name'];
            $new_attributes = '';

            if (is_array($node['attributes'])) {
                foreach ($node['attributes'] as $attribute) {
                    $allowed = is_array($this->_allow)
                        && in_array($attribute['name'], $this->_allow, true);

                    if ($allowed || $this->isException($node_name, $attribute['name'], $this->_exception)) {
                        $new_attributes = $this->createAttributes(
                            $new_attributes,
                            $attribute['name'],
                            $attribute['value']
                        );
                    }
                }
            }

            $replacement = ($new_attributes) ? "<$node_name $new_attributes>" : "<$node_name>";

            // Literal replacement: neither the original tag nor the attribute
            // values are interpreted as regex syntax or back-references.
            $this->_str = str_replace($node['literal'], $replacement, $this->_str);
        }
    }

    /**
     * Check whether an attribute is allowed on a specific element by exception.
     *
     * @param string $element_name   Element name
     * @param string $attribute_name Attribute name
     * @param array  $exceptions     Map of element name => allowed attribute names
     * @return boolean
     */
    private function isException($element_name, $attribute_name, $exceptions)
    {
        if (!is_array($exceptions) || !array_key_exists($element_name, $exceptions)) {
            return false;
        }

        $allowed = $exceptions[$element_name];

        return is_array($allowed) && in_array($attribute_name, $allowed, true);
    }

    /**
     * Append one name="value" pair to an attribute string.
     *
     * @param string $new_attributes Attribute string built so far
     * @param string $name           Attribute name
     * @param string $value          Attribute value
     * @return string
     */
    private function createAttributes($new_attributes, $name, $value)
    {
        if ($new_attributes) {
            $new_attributes .= " ";
        }

        // The value is always emitted in double quotes, so a double quote
        // inside it (possible for single-quoted input) must be encoded.
        $value = str_replace('"', '&quot;', $value);

        $new_attributes .= "$name=\"$value\"";

        return $new_attributes;
    }
} // class end

?>

demo示例代码如下:

1

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

// Demo: filter a sample fragment with HtmlAttributeFilter and print the
// source and the filtered result, both HTML-escaped for display.
require('HtmlAttributeFilter.class.php');

// Illustrative sample markup. It exercises the globally allowed "id", the
// per-tag exceptions for <a> and <ul>, and the ignored <img> tag.
$str = '<div class="bd clearfix" id="index_hilite_ul"><ul class="list"><li><img src="logo.png" width="118" height="148"><a class="text" href="http://www.example.com" onclick="track()"><strong class="t">yuna</strong></a></li></ul></div>';

$obj = new HtmlAttributeFilter();

// Allow the id attribute on every tag.
$obj->setAllow(array('id'));

$obj->setException(array(
    'a'  => array('href'),  // <a> may additionally keep href
    'ul' => array('class'), // <ul> may additionally keep class
));

// <img> is ignored: none of its attributes are filtered.
$obj->setIgnore(array('img'));

echo "source str:\n";

echo htmlspecialchars($str) . "\n\n";

echo "filter str:\n";

echo htmlspecialchars($obj->strip($str));

?>

09-14 22:04