pictcode / lib / Cake / Utility / Sanitize.php @ 9ddbf630
履歴 | 表示 | アノテート | ダウンロード (7.365 KB)
1 |
<?php
|
---|---|
2 |
/**
|
3 |
* Washes strings from unwanted noise.
|
4 |
*
|
5 |
* Helpful methods to make unsafe strings usable.
|
6 |
*
|
7 |
* CakePHP(tm) : Rapid Development Framework (http://cakephp.org)
|
8 |
* Copyright (c) Cake Software Foundation, Inc. (http://cakefoundation.org)
|
9 |
*
|
10 |
* Licensed under The MIT License
|
11 |
* For full copyright and license information, please see the LICENSE.txt
|
12 |
* Redistributions of files must retain the above copyright notice.
|
13 |
*
|
14 |
* @copyright Copyright (c) Cake Software Foundation, Inc. (http://cakefoundation.org)
|
15 |
* @link http://cakephp.org CakePHP(tm) Project
|
16 |
* @package Cake.Utility
|
17 |
* @since CakePHP(tm) v 0.10.0.1076
|
18 |
* @license http://www.opensource.org/licenses/mit-license.php MIT License
|
19 |
*/
|
20 |
|
21 |
App::uses('ConnectionManager', 'Model'); |
22 |
|
23 |
/**
|
24 |
* Data Sanitization.
|
25 |
*
|
26 |
* Removal of alphanumeric characters, SQL-safe slash-added strings, HTML-friendly strings,
|
27 |
* and all of the above on arrays.
|
28 |
*
|
29 |
* @package Cake.Utility
|
30 |
* @deprecated 3.0.0 Deprecated since version 2.4
|
31 |
*/
|
32 |
class Sanitize { |
33 |
|
34 |
/**
|
35 |
* Removes any non-alphanumeric characters.
|
36 |
*
|
37 |
* @param string $string String to sanitize
|
38 |
* @param array $allowed An array of additional characters that are not to be removed.
|
39 |
* @return string Sanitized string
|
40 |
*/
|
41 |
public static function paranoid($string, $allowed = array()) { |
42 |
$allow = null; |
43 |
if (!empty($allowed)) { |
44 |
foreach ($allowed as $value) { |
45 |
$allow .= "\\$value"; |
46 |
} |
47 |
} |
48 |
|
49 |
if (!is_array($string)) { |
50 |
return preg_replace("/[^{$allow}a-zA-Z0-9]/", '', $string); |
51 |
} |
52 |
|
53 |
$cleaned = array(); |
54 |
foreach ($string as $key => $clean) { |
55 |
$cleaned[$key] = preg_replace("/[^{$allow}a-zA-Z0-9]/", '', $clean); |
56 |
} |
57 |
|
58 |
return $cleaned; |
59 |
} |
60 |
|
61 |
/**
|
62 |
* Makes a string SQL-safe.
|
63 |
*
|
64 |
* @param string $string String to sanitize
|
65 |
* @param string $connection Database connection being used
|
66 |
* @return string SQL safe string
|
67 |
*/
|
68 |
public static function escape($string, $connection = 'default') { |
69 |
if (is_numeric($string) || $string === null || is_bool($string)) { |
70 |
return $string; |
71 |
} |
72 |
$db = ConnectionManager::getDataSource($connection); |
73 |
$string = $db->value($string, 'string'); |
74 |
$start = 1; |
75 |
if ($string{0} === 'N') { |
76 |
$start = 2; |
77 |
} |
78 |
|
79 |
return substr(substr($string, $start), 0, -1); |
80 |
} |
81 |
|
82 |
/**
|
83 |
* Returns given string safe for display as HTML. Renders entities.
|
84 |
*
|
85 |
* strip_tags() does not validating HTML syntax or structure, so it might strip whole passages
|
86 |
* with broken HTML.
|
87 |
*
|
88 |
* ### Options:
|
89 |
*
|
90 |
* - remove (boolean) if true strips all HTML tags before encoding
|
91 |
* - charset (string) the charset used to encode the string
|
92 |
* - quotes (int) see http://php.net/manual/en/function.htmlentities.php
|
93 |
* - double (boolean) double encode html entities
|
94 |
*
|
95 |
* @param string $string String from where to strip tags
|
96 |
* @param array $options Array of options to use.
|
97 |
* @return string Sanitized string
|
98 |
*/
|
99 |
public static function html($string, $options = array()) { |
100 |
static $defaultCharset = false; |
101 |
if ($defaultCharset === false) { |
102 |
$defaultCharset = Configure::read('App.encoding'); |
103 |
if ($defaultCharset === null) { |
104 |
$defaultCharset = 'UTF-8'; |
105 |
} |
106 |
} |
107 |
$defaults = array( |
108 |
'remove' => false, |
109 |
'charset' => $defaultCharset, |
110 |
'quotes' => ENT_QUOTES, |
111 |
'double' => true |
112 |
); |
113 |
|
114 |
$options += $defaults; |
115 |
|
116 |
if ($options['remove']) { |
117 |
$string = strip_tags($string); |
118 |
} |
119 |
|
120 |
return htmlentities($string, $options['quotes'], $options['charset'], $options['double']); |
121 |
} |
122 |
|
123 |
/**
|
124 |
* Strips extra whitespace from output
|
125 |
*
|
126 |
* @param string $str String to sanitize
|
127 |
* @return string whitespace sanitized string
|
128 |
*/
|
129 |
public static function stripWhitespace($str) { |
130 |
return preg_replace('/\s{2,}/u', ' ', preg_replace('/[\n\r\t]+/', '', $str)); |
131 |
} |
132 |
|
133 |
/**
|
134 |
* Strips image tags from output
|
135 |
*
|
136 |
* @param string $str String to sanitize
|
137 |
* @return string Sting with images stripped.
|
138 |
*/
|
139 |
public static function stripImages($str) { |
140 |
$preg = array( |
141 |
'/(<a[^>]*>)(<img[^>]+alt=")([^"]*)("[^>]*>)(<\/a>)/i' => '$1$3$5<br />', |
142 |
'/(<img[^>]+alt=")([^"]*)("[^>]*>)/i' => '$2<br />', |
143 |
'/<img[^>]*>/i' => '' |
144 |
); |
145 |
|
146 |
return preg_replace(array_keys($preg), array_values($preg), $str); |
147 |
} |
148 |
|
149 |
/**
|
150 |
* Strips scripts and stylesheets from output
|
151 |
*
|
152 |
* @param string $str String to sanitize
|
153 |
* @return string String with <link>, <img>, <script>, <style> elements and html comments removed.
|
154 |
*/
|
155 |
public static function stripScripts($str) { |
156 |
$regex =
|
157 |
'/(<link[^>]+rel="[^"]*stylesheet"[^>]*>|' .
|
158 |
'<img[^>]*>|style="[^"]*")|' .
|
159 |
'<script[^>]*>.*?<\/script>|' .
|
160 |
'<style[^>]*>.*?<\/style>|' .
|
161 |
'<!--.*?-->/is';
|
162 |
return preg_replace($regex, '', $str); |
163 |
} |
164 |
|
165 |
/**
|
166 |
* Strips extra whitespace, images, scripts and stylesheets from output
|
167 |
*
|
168 |
* @param string $str String to sanitize
|
169 |
* @return string sanitized string
|
170 |
*/
|
171 |
public static function stripAll($str) { |
172 |
return Sanitize::stripScripts( |
173 |
Sanitize::stripImages(
|
174 |
Sanitize::stripWhitespace($str) |
175 |
) |
176 |
); |
177 |
} |
178 |
|
179 |
/**
|
180 |
* Strips the specified tags from output. First parameter is string from
|
181 |
* where to remove tags. All subsequent parameters are tags.
|
182 |
*
|
183 |
* Ex.`$clean = Sanitize::stripTags($dirty, 'b', 'p', 'div');`
|
184 |
*
|
185 |
* Will remove all `<b>`, `<p>`, and `<div>` tags from the $dirty string.
|
186 |
*
|
187 |
* @param string $str String to sanitize.
|
188 |
* @return string sanitized String
|
189 |
*/
|
190 |
public static function stripTags($str) { |
191 |
$params = func_get_args(); |
192 |
|
193 |
for ($i = 1, $count = count($params); $i < $count; $i++) { |
194 |
$str = preg_replace('/<' . $params[$i] . '\b[^>]*>/i', '', $str); |
195 |
$str = preg_replace('/<\/' . $params[$i] . '[^>]*>/i', '', $str); |
196 |
} |
197 |
return $str; |
198 |
} |
199 |
|
200 |
/**
|
201 |
* Sanitizes given array or value for safe input. Use the options to specify
|
202 |
* the connection to use, and what filters should be applied (with a boolean
|
203 |
* value). Valid filters:
|
204 |
*
|
205 |
* - odd_spaces - removes any non space whitespace characters
|
206 |
* - encode - Encode any html entities. Encode must be true for the `remove_html` to work.
|
207 |
* - dollar - Escape `$` with `\$`
|
208 |
* - carriage - Remove `\r`
|
209 |
* - unicode -
|
210 |
* - escape - Should the string be SQL escaped.
|
211 |
* - backslash -
|
212 |
* - remove_html - Strip HTML with strip_tags. `encode` must be true for this option to work.
|
213 |
*
|
214 |
* @param string|array $data Data to sanitize
|
215 |
* @param string|array $options If string, DB connection being used, otherwise set of options
|
216 |
* @return mixed Sanitized data
|
217 |
*/
|
218 |
public static function clean($data, $options = array()) { |
219 |
if (empty($data)) { |
220 |
return $data; |
221 |
} |
222 |
|
223 |
if (!is_array($options)) { |
224 |
$options = array('connection' => $options); |
225 |
} |
226 |
|
227 |
$options += array( |
228 |
'connection' => 'default', |
229 |
'odd_spaces' => true, |
230 |
'remove_html' => false, |
231 |
'encode' => true, |
232 |
'dollar' => true, |
233 |
'carriage' => true, |
234 |
'unicode' => true, |
235 |
'escape' => true, |
236 |
'backslash' => true |
237 |
); |
238 |
|
239 |
if (is_array($data)) { |
240 |
foreach ($data as $key => $val) { |
241 |
$data[$key] = Sanitize::clean($val, $options); |
242 |
} |
243 |
return $data; |
244 |
} |
245 |
|
246 |
if ($options['odd_spaces']) { |
247 |
$data = str_replace(chr(0xCA), '', $data); |
248 |
} |
249 |
if ($options['encode']) { |
250 |
$data = Sanitize::html($data, array('remove' => $options['remove_html'])); |
251 |
} |
252 |
if ($options['dollar']) { |
253 |
$data = str_replace("\\\$", "$", $data); |
254 |
} |
255 |
if ($options['carriage']) { |
256 |
$data = str_replace("\r", "", $data); |
257 |
} |
258 |
if ($options['unicode']) { |
259 |
$data = preg_replace("/&#([0-9]+);/s", "&#\\1;", $data); |
260 |
} |
261 |
if ($options['escape']) { |
262 |
$data = Sanitize::escape($data, $options['connection']); |
263 |
} |
264 |
if ($options['backslash']) { |
265 |
$data = preg_replace("/\\\(?!&#|\?#)/", "\\", $data); |
266 |
} |
267 |
return $data; |
268 |
} |
269 |
} |