3 * FILTREATMENT CLASS FILE
6 * @author Cristian Năvălici {@link http://www.lemonsoftware.eu} lemonsoftware [at] gmail [.] com
7 * @version 1.31 17 March 2008
8 * @license http://opensource.org/licenses/gpl-license.php GNU Public License
9 * @package Filtreatment
13 //error_reporting(E_ALL);
16 * constant used in float comparisons
18 define('EPSILON', 1.0e-8);
23 * This class can be used to sanitize user input and to guard against
24 * most known vulnerabilities.
25 * It requires at least PHP 5.0.
27 * @package Filtreatment
/**
 * Do some settings at init.
 *
 * Defines the MAGICQUOTES constant (only if it is not defined yet): TRUE when
 * magic_quotes_gpc is active, FALSE otherwise.
 *
 * get_magic_quotes_gpc() always returns FALSE since PHP 5.4 and no longer
 * exists in PHP 8.0, so it is only consulted on interpreters that can still
 * have the feature switched on.
 */
function __construct() {
    if ( defined('MAGICQUOTES') ) {
        return;
    }

    // Never reach the removed function on modern PHP versions.
    $can_have_magic_quotes = version_compare(PHP_VERSION, '5.4.0', '<');

    define('MAGICQUOTES', ( $can_have_magic_quotes && get_magic_quotes_gpc() ) ? TRUE : FALSE);
}
51 //-----------------------------------------------------------------------------
/**
 * CHECKS FOR AN INTEGER
 *
 * The input is cast to int. If $this->minval and/or $this->maxval are set,
 * the cast value is additionally compared against them (bounds inclusive).
 * A bound that casts to 0 is treated as "not set".
 *
 * NOTE: because the function can return 0 also as a valid result, check the
 * return value with ===
 *
 * @param int $input - what to check/transform
 * @return int|bool - the integer value, or FALSE when it violates a bound
 */
function ft_integer($input) {
    $input_c = (int)$input;
    $mnval = (int)$this->minval;
    $mxval = (int)$this->maxval;

    // no bounds configured: the cast value is the result
    if ( !$mnval && !$mxval ) {
        return $input_c;
    }

    if ( $mnval && $mxval ) {
        // check if they are in order (min < max)
        if ( $mnval > $mxval ) {
            // NOTE(review): the body of this branch was not visible in the
            // reviewed excerpt; swapping the bounds is assumed - confirm.
            $tmp = $mnval;
            $mnval = $mxval;
            $mxval = $tmp;
        }

        // Compare the cast value, not the raw input: a non-numeric string
        // would otherwise be compared as a string and could slip through.
        return ( ($input_c >= $mnval) && ($input_c <= $mxval) ) ? $input_c : FALSE;
    }

    // only one bound set
    if ( $mnval ) {
        return ( $input_c >= $mnval ) ? $input_c : FALSE;
    }

    return ( $input_c <= $mxval ) ? $input_c : FALSE;
}
87 //-----------------------------------------------------------------------------
/**
 * CHECKS FOR A FLOAT
 *
 * The input is cast to float. If $this->minval and/or $this->maxval are set,
 * the cast value is additionally compared against them with ft_realcmp()
 * (bounds inclusive). A bound that casts to 0.0 is treated as "not set".
 *
 * NOTE: because the function can return 0.0 also as a valid result, check the
 * return value with ===
 *
 * @param float $input - what to check/transform
 * @return float|bool - the float value, or FALSE when it violates a bound
 */
function ft_float($input) {
    $input_c = (float)$input;
    $mnval = (float)$this->minval;
    $mxval = (float)$this->maxval;

    // no bounds configured: the cast value is the result
    if ( !$mnval && !$mxval ) {
        return $input_c;
    }

    if ( $mnval && $mxval ) {
        // check if they are in order (min < max)
        if ( $this->ft_realcmp($mnval, $mxval) > 0 ) {
            // NOTE(review): the body of this branch was not visible in the
            // reviewed excerpt; swapping the bounds is assumed - confirm.
            $tmp = $mnval;
            $mnval = $mxval;
            $mxval = $tmp;
        }

        // Keep both checks as booleans: storing the value itself in the
        // flag made an in-range 0.0 look like a failed check.
        $not_above_max = ( $this->ft_realcmp($input_c, $mxval) <= 0 );
        $not_below_min = ( $this->ft_realcmp($input_c, $mnval) >= 0 );

        return ( $not_above_max && $not_below_min ) ? $input_c : FALSE;
    }

    // only one value set
    if ( $mnval ) {
        return ( $this->ft_realcmp($input_c, $mnval) >= 0 ) ? $input_c : FALSE;
    }

    return ( $this->ft_realcmp($input_c, $mxval) <= 0 ) ? $input_c : FALSE;
}
134 //-----------------------------------------------------------------------------
/**
 * CHECKS FOR A VALID DATE
 *
 * The date must be in YYYY-MM-DD format (month and day may have one or two
 * digits), with nothing before or after it, and must name an existing
 * calendar day.
 *
 * @param string $str - date in requested format
 * @return string|bool - the string itself, only for a valid date; FALSE otherwise
 */
function ft_validdate($str) {
    // Anchored pattern (D: "$" matches only at the very end) so that
    // surrounding garbage is rejected; the groups replace the old split().
    if ( !is_string($str) || !preg_match('/^([0-9]{4})-([0-9]{1,2})-([0-9]{1,2})$/D', $str, $parts) ) {
        return FALSE;
    }

    $yy = (int)$parts[1];
    $mm = (int)$parts[2];
    $dd = (int)$parts[3];

    return checkdate($mm, $dd, $yy) ? $str : FALSE;
}
155 //-----------------------------------------------------------------------------
/**
 * CHECKS FOR A VALID EMAIL ADDRESS
 *
 * Syntax check only: exactly one "@", a local part of at most 64 characters
 * made of valid dot-separated atoms (or quoted strings), and a domain that is
 * either a numeric IP (optionally in brackets) or at least two valid labels.
 *
 * @param string $email - email to validate
 * @return string|bool - the string itself, only for a valid email; FALSE otherwise
 */
function ft_email($email) {
    // NOTE(review): the guard around stripslashes() was not visible in the
    // reviewed excerpt; it is assumed to depend on MAGICQUOTES - confirm.
    // The result is now stored back into $email (it used to be discarded).
    if ( defined('MAGICQUOTES') && MAGICQUOTES ) {
        $email = stripslashes($email);
    }

    // check for @ symbol and maximum allowed lengths
    if ( !preg_match('/^[^@]{1,64}@[^@]{1,255}$/D', $email) ) {
        return FALSE;
    }

    // split for sections
    $email_array = explode("@", $email);
    $local_array = explode(".", $email_array[0]);

    // every dot-separated piece of the local part must be an atom or a quoted string
    $local_pattern = '@^(([A-Za-z0-9!#$%&\'*+/=?^_`{|}~-][A-Za-z0-9!#$%&\'*+/=?^_`{|}~.-]{0,63})|("[^(\\\\|")]{0,62}"))$@D';
    foreach ( $local_array as $local_part ) {
        if ( !preg_match($local_pattern, $local_part) ) {
            return FALSE;
        }
    }

    // verify if domain is IP. If not, it must be a valid domain name
    if ( !preg_match('/^\[?[0-9.]+\]?$/D', $email_array[1]) ) {
        $domain_array = explode(".", $email_array[1]);
        if ( count($domain_array) < 2 ) {
            return FALSE;
        }

        $label_pattern = '/^(([A-Za-z0-9][A-Za-z0-9-]{0,61}[A-Za-z0-9])|([A-Za-z0-9]+))$/D';
        foreach ( $domain_array as $label ) {
            if ( !preg_match($label_pattern, $label) ) {
                return FALSE;
            }
        }
    }

    return $email;
}
197 //-----------------------------------------------------------------------------
/**
 * PREPARES THE INPUT FOR DATABASE
 *
 * Works with mysql/postgresql. Numbers and numeric strings are returned
 * untouched; everything else is escaped with the driver's escape function.
 * The escaped string is NOT wrapped in quotes - the calling code is expected
 * to add them.
 *
 * NOTE: mysql_real_escape_string() requires that a valid mysql connection
 * (mysql_connect()) exists to work. The function no longer exists in PHP 7+;
 * in that case FALSE is returned instead of triggering a fatal error.
 *
 * @param string $value - value to sanitize
 * @param string $db_type - allows two constants MYSQL | PGSQL
 * @return string|bool $value sanitized value, or FALSE when it cannot be escaped
 */
function ft_dbsql($value, $db_type = 'MYSQL') {
    // NOTE(review): the guard around stripslashes() was not visible in the
    // reviewed excerpt; it is assumed to depend on MAGICQUOTES - confirm.
    if ( defined('MAGICQUOTES') && MAGICQUOTES ) {
        $value = stripslashes($value);
    }

    // Escape if not a number or a numeric string
    if ( is_numeric($value) ) {
        return $value;
    }

    switch ( $db_type ) {
        case 'MYSQL':
            if ( !function_exists('mysql_real_escape_string') ) {
                return FALSE;
            }
            return mysql_real_escape_string($value);

        case 'PGSQL':
            if ( !function_exists('pg_escape_string') ) {
                return FALSE;
            }
            return pg_escape_string($value);
    }

    // NOTE(review): no handling for other $db_type values was visible in the
    // reviewed excerpt. Handing back an unescaped string would be unsafe, so
    // unsupported types are rejected - confirm against callers.
    return FALSE;
}
230 //-----------------------------------------------------------------------------
/**
 * WORKS ON A STRING WITH REGEX EXPRESSION
 *
 * Checks a string for specified characters, or strips everything else.
 *
 * @param string $value - variable to sanitize
 * @param string $regex - is in a special form detailed below:
 *                        it contains ONLY allowed characters, ANY other character making the string invalid
 *                        it must NOT contain the begin/end delimiters /[... ]/
 *                        eg: 0-9, 0-9A-Za-z, AERS
 * @param int $cv - 1 (verify only) or 2 (remove the disallowed characters);
 *                  any other value behaves like 1
 * @return string|bool the string if the check succeeds ($cv = 1), the string with
 *                     disallowed characters removed ($cv = 2), FALSE otherwise
 */
function ft_strregex($value, $regex, $cv = 1) {
    // chr(1) is used as the pattern delimiter so that a "/" (escaped or not)
    // inside $regex cannot terminate the pattern early.
    $regexfull = "\x01[^" . $regex . "]\x01";

    // function of $cv might be a clean up operation, or just verifying
    if ( $cv == 2 ) {
        // cleanup the string; NULL signals a broken pattern
        $cleaned = preg_replace($regexfull, '', $value);
        return ( $cleaned === NULL ) ? FALSE : $cleaned;
    }

    // Verification ($cv = 1, not specified, or wrong). Only an explicit
    // "no disallowed character found" (0) passes: preg_match() returns FALSE
    // for a broken pattern and that must not count as valid input.
    return ( preg_match($regexfull, $value) === 0 ) ? $value : FALSE;
}
270 //-----------------------------------------------------------------------------
/**
 * XSS CLEANUP
 *
 * Runs the string through a series of pattern-based filters (see the step
 * comments below) and returns the filtered string.
 *
 * NOTE all credit goes to codeigniter.com
 *
 * @param string $str - string to check
 * @param string $charset - character set (default ISO-8859-1)
 * @return string|bool $value sanitized string
 */
function ft_xss($str, $charset = 'ISO-8859-1') {
    // The "u" modifier makes PCRE reject subjects that are not valid UTF-8
    // (the whole string would become NULL), so it is only applied when the
    // subject really is valid UTF-8.
    $utf8 = ( is_string($str) && preg_match('//u', $str) === 1 ) ? 'u' : '';

    /*
     * Remove Null Characters
     *
     * This prevents sandwiching null characters
     * between ascii characters, like Java\0script.
     */
    $str = preg_replace('/\0+/', '', $str);
    $str = preg_replace('/(\\\\0)+/', '', $str);

    /*
     * Validate standard character entities
     *
     * Add a semicolon if missing. We do this to enable
     * the conversion of entities to ASCII later.
     */
    $str = preg_replace('#(&\#*\w+)[\x00-\x20]+;#' . $utf8, "\\1;", $str);

    /*
     * Validate UTF16 two byte encoding (x00)
     *
     * Just as above, adds a semicolon if missing.
     */
    $str = preg_replace('#(&\#x*)([0-9A-F]+);*#i' . $utf8, "\\1\\2;", $str);

    /*
     * URL Decode
     *
     * Just in case stuff like this is submitted:
     *
     * <a href="http://%77%77%77%2E%67%6F%6F%67%6C%65%2E%63%6F%6D">Google</a>
     *
     * Note: Normally urldecode() would be easier but it removes plus signs
     */
    $str = preg_replace("/%u0([a-z0-9]{3})/i", "&#x\\1;", $str);
    $str = preg_replace("/%([a-z0-9]{2})/i", "&#x\\1;", $str);

    /*
     * Convert character entities to ASCII
     *
     * This permits our tests below to work reliably.
     * We only convert entities that are within tags since
     * these are the ones that will pose security problems.
     */
    if ( preg_match_all("/<(.+?)>/si", $str, $matches) ) {
        foreach ( $matches[1] as $inside_tag ) {
            $str = str_replace($inside_tag, html_entity_decode($inside_tag, ENT_COMPAT, $charset), $str);
        }
    }

    /*
     * Convert all tabs to spaces
     *
     * This prevents strings like this: ja	vascript
     * Note: we deal with spaces between characters later.
     */
    $str = preg_replace("#\t+#", " ", $str);

    /*
     * Makes PHP tags safe
     *
     * Note: XML tags are inadvertently replaced too, but it doesn't seem
     * to pose a problem.
     * The replacements must be entity-encoded; with identical search and
     * replace lists this step would do nothing.
     */
    $str = str_replace(array('<?php', '<?PHP', '<?', '?>'), array('&lt;?php', '&lt;?PHP', '&lt;?', '?&gt;'), $str);

    /*
     * Compact any exploded words
     *
     * This corrects words like: j a v a s c r i p t
     * These words are compacted back to their correct state.
     */
    $words = array('javascript', 'vbscript', 'script', 'applet', 'alert', 'document', 'write', 'cookie', 'window');
    foreach ( $words as $word ) {
        // "j\s*a\s*v\s*a..." - the letters of the word with optional whitespace in between
        $temp = implode('\s*', str_split($word));

        $str = preg_replace('#' . $temp . '#s', $word, $str);
        $str = preg_replace('#' . ucfirst($temp) . '#s', ucfirst($word), $str);
    }

    /*
     * Remove disallowed Javascript in links or img tags
     */
    $str = preg_replace("#<a.+?href=.*?(alert\(|alert&\#40;|javascript\:|window\.|document\.|\.cookie|<script|<xss).*?\>.*?</a>#si", "", $str);
    $str = preg_replace("#<img.+?src=.*?(alert\(|alert&\#40;|javascript\:|window\.|document\.|\.cookie|<script|<xss).*?\>#si", "", $str);
    $str = preg_replace("#<(script|xss).*?\>#si", "", $str);

    /*
     * Remove JavaScript Event Handlers
     *
     * Note: This code is a little blunt. It removes
     * the event handler and anything up to the closing >,
     * but it's unlikely to be a problem.
     */
    $str = preg_replace('#(<[^>]+.*?)(onblur|onchange|onclick|onfocus|onload|onmouseover|onmouseup|onmousedown|onselect|onsubmit|onunload|onkeypress|onkeydown|onkeyup|onresize)[^>]*>#iU', "\\1>", $str);

    /*
     * Sanitize naughty HTML elements
     *
     * If a tag containing any of the words in the list
     * below is found, the tag gets converted to entities.
     *
     * So this: <blink>
     * Becomes: &lt;blink&gt;
     */
    $str = preg_replace('#<(/*\s*)(alert|applet|basefont|base|behavior|bgsound|blink|body|embed|expression|form|frameset|frame|head|html|ilayer|iframe|input|layer|link|meta|object|plaintext|style|script|textarea|title|xml|xss)([^>]*)>#is', "&lt;\\1\\2\\3&gt;", $str);

    /*
     * Sanitize naughty scripting elements
     *
     * Similar to above, only instead of looking for
     * tags it looks for PHP and JavaScript commands
     * that are disallowed. Rather than removing the
     * code, it simply converts the parenthesis to entities
     * rendering the code un-executable.
     *
     * For example: eval('some code')
     * Becomes:     eval&#40;'some code'&#41;
     */
    $str = preg_replace('#(alert|cmd|passthru|eval|exec|system|fopen|fsockopen|file|file_get_contents|readfile|unlink)(\s*)\((.*?)\)#si', "\\1\\2&#40;\\3&#41;", $str);

    /*
     * Final clean up
     *
     * This adds a bit of extra precaution in case
     * something got through the above filters
     */
    // NOTE(review): only these five entries were visible in the reviewed
    // excerpt; verify against the complete file whether the list is longer.
    $bad = array(
        'document.cookie' => '',
        'document.write'  => '',
        'window.location' => '',
        "javascript\s*:"  => '',
        "Redirect\s+302"  => '',
    );

    foreach ( $bad as $key => $val ) {
        $str = preg_replace("#" . $key . "#i", $val, $str);
    }

    return $str;
}
445 //-----------------------------------------------------------------------------
/**
 * DISPLAYS OR RETURNS THE STORED ERROR MESSAGE
 *
 * The message in $this->error (empty string when there is none) is passed
 * through ft_xss() before it is used.
 *
 * @param int $mode - if 1 then echo the string (wrapped in <br /> tags);
 *                    if 2 then return the string
 * @return string|null - the filtered message when it is returned rather than echoed
 */
function display_error($mode = 1) {
    // !empty() also covers the case where no error was ever stored
    $errstr = !empty($this->error) ? $this->error : '';
    $safe = $this->ft_xss($errstr);

    // NOTE(review): the branch statements were not visible in the reviewed
    // excerpt; "1 echoes, anything else returns" is assumed - confirm.
    if ( $mode == 1 ) {
        echo '<br />' . $safe . '<br />';
        return;
    }

    return $safe;
}
462 //-----------------------------------------------------------------------------
/**
 * REAL COMPARISON BETWEEN FLOATS
 *
 * Two values whose difference is smaller than EPSILON count as equal.
 *
 * @param float $r1
 * @param float $r2
 * @return int 0 - for ==, 1 for r1 > r2, -1 for r1 < r2
 */
function ft_realcmp($r1, $r2) {
    // Cast first so that non-numeric strings do not abort the subtraction.
    $diff = (float)$r1 - (float)$r2;

    if ( abs($diff) < EPSILON ) {
        return 0;
    }

    return ( $diff < 0 ) ? -1 : 1;
}
480 //-----------------------------------------------------------------------------