<?php /** * @copyright Copyright (c) 2009-2021 Ryan Demmer. All rights reserved * @license GNU/GPL 2 or later - http://www.gnu.org/licenses/old-licenses/gpl-2.0.html * JCE is free software. This version may have been modified pursuant * to the GNU General Public License, and as distributed it includes or * is derivative of works licensed under the GNU General Public License or * other free or open source software licenses */ defined('_JEXEC') or die('RESTRICTED'); /* Set internal character encoding to UTF-8 */ if (function_exists('mb_internal_encoding')) { mb_internal_encoding("UTF-8"); } abstract class WFUtility { /** * Multi-byte-safe pathinfo replacement. * Drop-in replacement for pathinfo(), but multibyte- and cross-platform-safe. * * From PHPMailer - https://github.com/PHPMailer/PHPMailer/blob/v6.1.4/src/PHPMailer.php#L4256-L4302 * * @see http://www.php.net/manual/en/function.pathinfo.php#107461 * * @param string $path A filename or path, does not need to exist as a file * @param int|string $options Either a PATHINFO_* constant, * or a string name to return only the specified piece * * @return string|array */ public static function mb_pathinfo($path, $options = null) { // check if multibyte string, use pathname() if not if (function_exists('mb_strlen')) { if (mb_strlen($path) === strlen($path)) { return pathinfo($path, $options); } } $ret = array('dirname' => '', 'basename' => '', 'extension' => '', 'filename' => ''); $pathinfo = array(); if (preg_match('#^(.*?)[\\\\/]*(([^/\\\\]*?)(\.([^.\\\\/]+?)|))[\\\\/.]*$#m', $path, $pathinfo)) { if (array_key_exists(1, $pathinfo)) { $ret['dirname'] = $pathinfo[1]; } if (array_key_exists(2, $pathinfo)) { $ret['basename'] = $pathinfo[2]; } if (array_key_exists(5, $pathinfo)) { $ret['extension'] = $pathinfo[5]; } if (array_key_exists(3, $pathinfo)) { $ret['filename'] = $pathinfo[3]; } } switch ($options) { case PATHINFO_DIRNAME: case 'dirname': return $ret['dirname']; case PATHINFO_BASENAME: case 'basename': return $ret['basename']; case PATHINFO_EXTENSION: case 'extension': return $ret['extension']; case PATHINFO_FILENAME: case 'filename': return $ret['filename']; default: return $ret; } } /** * Get the file extension from a path * * @param string $path The file path * @return string The file extension */ public static function getExtension($path) { $dot = strrpos($path, '.') + 1; return substr($path, $dot); } /** * Remove the extension from a file name or path * * @param string $path The file path * @return string The file path without the extension */ public static function stripExtension($path) { return preg_replace('#\.[^.]*$#', '', $path); } /** * Get the file name * * @param string $path The file path * @return string The file name without the path or extension */ public static function getFilename($path) { // check if multibyte string, use basename() if not if (function_exists('mb_strlen')) { if (mb_strlen($path) === strlen($path)) { return pathinfo($path, PATHINFO_FILENAME); } } // get basename $path = self::mb_basename($path); // remove name without extension return self::stripExtension($path); } public static function cleanPath($path, $ds = DIRECTORY_SEPARATOR, $prefix = '') { $path = trim(rawurldecode($path)); // check for UNC path on IIS and set prefix if ($ds == '\\' && strlen($path) > 1) { if ($path[0] == '\\' && $path[1] == '\\') { $prefix = '\\'; } } // clean path, removing double slashes, replacing back/forward slashes with DIRECTORY_SEPARATOR $path = preg_replace('#[/\\\\]+#', $ds, $path); // return path with prefix if any return $prefix . $path; } /** * Append a DIRECTORY_SEPARATOR to the path if required. * * @param string $path the path * @param string $ds optional directory seperator * * @return string path with trailing DIRECTORY_SEPARATOR */ public static function fixPath($path, $ds = DIRECTORY_SEPARATOR) { return self::cleanPath($path . $ds); } private static function checkCharValue($string) { // null byte check if (strstr($string, "\x00")) { return false; } if (preg_match('#([^\w\.\-\/\\\\\s ])#i', $string, $matches)) { foreach ($matches as $match) { // not a safe UTF-8 character if (ord($match) < 127) { return false; } } } return true; } public static function checkPath($path) { $path = urldecode($path); if (self::checkCharValue($path) === false || strpos($path, '..') !== false) { throw new InvalidArgumentException('Invalid path'); } } /** * Concat two paths together. Basically $a + $b. * * @param string $a path one * @param string $b path two * @param string $ds optional directory seperator * * @return string $a DIRECTORY_SEPARATOR $b */ public static function makePath($a, $b, $ds = DIRECTORY_SEPARATOR) { return self::cleanPath($a . $ds . $b, $ds); } private static function utf8_latin_to_ascii($subject) { static $CHARS = null; if (is_null($CHARS)) { $CHARS = array( 'À' => 'A', 'Á' => 'A', 'Â' => 'A', 'Ã' => 'A', 'Ä' => 'A', 'Å' => 'A', 'Æ' => 'AE', 'Ç' => 'C', 'È' => 'E', 'É' => 'E', 'Ê' => 'E', 'Ë' => 'E', 'Ì' => 'I', 'Í' => 'I', 'Î' => 'I', 'Ï' => 'I', 'Ð' => 'D', 'Ñ' => 'N', 'Ò' => 'O', 'Ó' => 'O', 'Ô' => 'O', 'Õ' => 'O', 'Ö' => 'O', 'Ø' => 'O', 'Ù' => 'U', 'Ú' => 'U', 'Û' => 'U', 'Ü' => 'U', 'Ý' => 'Y', 'ß' => 's', 'à' => 'a', 'á' => 'a', 'â' => 'a', 'ã' => 'a', 'ä' => 'a', 'å' => 'a', 'æ' => 'ae', 'ç' => 'c', 'è' => 'e', 'é' => 'e', 'ê' => 'e', 'ë' => 'e', 'ì' => 'i', 'í' => 'i', 'î' => 'i', 'ï' => 'i', 'ñ' => 'n', 'ò' => 'o', 'ó' => 'o', 'ô' => 'o', 'õ' => 'o', 'ö' => 'o', 'ø' => 'o', 'ù' => 'u', 'ú' => 'u', 'û' => 'u', 'ü' => 'u', 'ý' => 'y', 'ÿ' => 'y', 'Ā' => 'A', 'ā' => 'a', 'Ă' => 'A', 'ă' => 'a', 'Ą' => 'A', 'ą' => 'a', 'Ć' => 'C', 'ć' => 'c', 'Ĉ' => 'C', 'ĉ' => 'c', 'Ċ' => 'C', 'ċ' => 'c', 'Č' => 'C', 'č' => 'c', 'Ď' => 'D', 'ď' => 'd', 'Đ' => 'D', 'đ' => 'd', 'Ē' => 'E', 'ē' => 'e', 'Ĕ' => 'E', 'ĕ' => 'e', 'Ė' => 'E', 'ė' => 'e', 'Ę' => 'E', 'ę' => 'e', 'Ě' => 'E', 'ě' => 'e', 'Ĝ' => 'G', 'ĝ' => 'g', 'Ğ' => 'G', 'ğ' => 'g', 'Ġ' => 'G', 'ġ' => 'g', 'Ģ' => 'G', 'ģ' => 'g', 'Ĥ' => 'H', 'ĥ' => 'h', 'Ħ' => 'H', 'ħ' => 'h', 'Ĩ' => 'I', 'ĩ' => 'i', 'Ī' => 'I', 'ī' => 'i', 'Ĭ' => 'I', 'ĭ' => 'i', 'Į' => 'I', 'į' => 'i', 'İ' => 'I', 'ı' => 'i', 'IJ' => 'IJ', 'ij' => 'ij', 'Ĵ' => 'J', 'ĵ' => 'j', 'Ķ' => 'K', 'ķ' => 'k', 'Ĺ' => 'L', 'ĺ' => 'l', 'Ļ' => 'L', 'ļ' => 'l', 'Ľ' => 'L', 'ľ' => 'l', 'Ŀ' => 'L', 'ŀ' => 'l', 'Ł' => 'l', 'ł' => 'l', 'Ń' => 'N', 'ń' => 'n', 'Ņ' => 'N', 'ņ' => 'n', 'Ň' => 'N', 'ň' => 'n', 'ʼn' => 'n', 'Ō' => 'O', 'ō' => 'o', 'Ŏ' => 'O', 'ŏ' => 'o', 'Ő' => 'O', 'ő' => 'o', 'Œ' => 'OE', 'œ' => 'oe', 'Ŕ' => 'R', 'ŕ' => 'r', 'Ŗ' => 'R', 'ŗ' => 'r', 'Ř' => 'R', 'ř' => 'r', 'Ś' => 'S', 'ś' => 's', 'Ŝ' => 'S', 'ŝ' => 's', 'Ş' => 'S', 'ş' => 's', 'Š' => 'S', 'š' => 's', 'Ţ' => 'T', 'ţ' => 't', 'Ť' => 'T', 'ť' => 't', 'Ŧ' => 'T', 'ŧ' => 't', 'Ũ' => 'U', 'ũ' => 'u', 'Ū' => 'U', 'ū' => 'u', 'Ŭ' => 'U', 'ŭ' => 'u', 'Ů' => 'U', 'ů' => 'u', 'Ű' => 'U', 'ű' => 'u', 'Ų' => 'U', 'ų' => 'u', 'Ŵ' => 'W', 'ŵ' => 'w', 'Ŷ' => 'Y', 'ŷ' => 'y', 'Ÿ' => 'Y', 'Ź' => 'Z', 'ź' => 'z', 'Ż' => 'Z', 'ż' => 'z', 'Ž' => 'Z', 'ž' => 'z', 'ſ' => 's', 'ƒ' => 'f', 'Ơ' => 'O', 'ơ' => 'o', 'Ư' => 'U', 'ư' => 'u', 'Ǎ' => 'A', 'ǎ' => 'a', 'Ǐ' => 'I', 'ǐ' => 'i', 'Ǒ' => 'O', 'ǒ' => 'o', 'Ǔ' => 'U', 'ǔ' => 'u', 'Ǖ' => 'U', 'ǖ' => 'u', 'Ǘ' => 'U', 'ǘ' => 'u', 'Ǚ' => 'U', 'ǚ' => 'u', 'Ǜ' => 'U', 'ǜ' => 'u', 'Ǻ' => 'A', 'ǻ' => 'a', 'Ǽ' => 'AE', 'ǽ' => 'ae', 'Ǿ' => 'O', 'ǿ' => 'o', ); } if (function_exists('transliterator_transliterate')) { if (is_array($subject)) { /*array_walk($subject, function (&$string) { $string = WFUtility::utf8_latin_to_ascii($string); });*/ for ($i = 0; $i < count($subject); $i++) { $subject[$i] = WFUtility::utf8_latin_to_ascii($subject[$i]); } return $subject; } $transformed = transliterator_transliterate('Any-Latin; Latin-ASCII;', $subject); if ($transformed !== false) { return $transformed; } return str_replace(array_keys($CHARS), array_values($CHARS), $subject); } return str_replace(array_keys($CHARS), array_values($CHARS), $subject); } protected static function changeCase($string, $case) { if (!function_exists('mb_strtolower') || !function_exists('mb_strtoupper')) { return $string; } if (is_array($string)) { for ($i = 0; $i < count($string); $i++) { $string[$i] = WFUtility::changeCase($string[$i], $case); } } else { switch ($case) { case 'lowercase': $string = mb_strtolower($string); break; case 'uppercase': $string = mb_strtoupper($string); break; } } return $string; } private static function cleanUTF8($string) { // remove some common characters $string = preg_replace('#[\+\\\/\?\#%&<>"\'=\[\]\{\},;@\^\(\)£€$~]#', '', $string); $result = ''; $length = strlen($string); for ($i = 0; $i < $length; $i++) { $char = $string[$i]; // only process on possible restricted characters or utf-8 letters/numbers if (preg_match('#[^\w\.\-\s ]#', $char)) { // skip any character less than 127, eg: &?@* etc. if (ord($char) < 127) { continue; } } $result .= $char; } return $result; } /** * Makes file name safe to use. * * @param mixed The name of the file (not full path) * * @return mixed The sanitised string or array */ public static function makeSafe($subject, $mode = 'utf-8', $spaces = '_', $case = '') { $search = array(); // set default mode if none is passed in if (empty($mode)) { $mode = 'utf-8'; } if (!function_exists('mb_internal_encoding')) { $mode = 'ascii'; } // trim if (is_array($subject)) { $subject = array_map('trim', $subject); } else { $subject = trim($subject); } // replace spaces with specified character or space if (is_string($spaces)) { $subject = preg_replace('#[\s ]+#', $spaces, $subject); } if ($mode === 'utf-8') { $search[] = '#[^\pL\pM\pN_\.\-\s ]#u'; } else { $subject = self::utf8_latin_to_ascii($subject); $search[] = '#[^a-zA-Z0-9_\.\-\s ]#'; } // remove multiple . characters $search[] = '#(\.){2,}#'; // strip leading period $search[] = '#^\.#'; // strip trailing period $search[] = '#\.$#'; // strip whitespace $search[] = '#^\s*|\s*$#'; // only for utf-8 to avoid PCRE errors - PCRE must be at least version 5 if ($mode == 'utf-8') { try { // perform pcre replacement $result = preg_replace($search, '', $subject); } catch (Exception $e) { // try ascii return self::makeSafe($subject, 'ascii'); } // try ascii if (is_null($result) || $result === false) { return self::makeSafe($subject, 'ascii'); } if ($case) { // change case $result = self::changeCase($result, $case); } return $result; } $result = preg_replace($search, '', $subject); if ($case) { // change case $result = self::changeCase($result, $case); } return $result; } /** * Format the file size, limits to Mb. * * @param int $size the raw filesize * * @return string formated file size */ public static function formatSize($size) { if ($size < 1024) { return $size . ' ' . WFText::_('WF_LABEL_BYTES'); } elseif ($size >= 1024 && $size < 1024 * 1024) { return sprintf('%01.2f', $size / 1024.0) . ' ' . WFText::_('WF_LABEL_KB'); } else { return sprintf('%01.2f', $size / (1024.0 * 1024)) . ' ' . WFText::_('WF_LABEL_MB'); } } /** * Format the date. * * @param int $date the unix datestamp * * @return string formated date */ public static function formatDate($date, $format = '%d/%m/%Y, %H:%M') { return strftime($format, $date); } /** * Get the modified date of a file. * * @return Formatted modified date * * @param string $file Absolute path to file */ public static function getDate($file) { return self::formatDate(@filemtime($file)); } /** * Get the size of a file. * * @return Formatted filesize value * * @param string $file Absolute path to file */ public static function getSize($file) { return self::formatSize(@filesize($file)); } /** * Multi-byte-safe dirname replacement. * https://gist.github.com/tcyrus/257a1ed93c5e115b7b33426d029b5c5f * * @param string $path A Path * @param int $levels The number of parent directories to go up. * @return string The path of a parent directory. */ public static function mb_dirname($path) { // check if multibyte string, use dirname() if not if (function_exists('mb_strlen')) { if (mb_strlen($path) === strlen($path)) { return dirname($path); } } // clean $path = self::cleanPath($path, '/'); // get last slash position $slash = strrpos($path, '/') + 1; // return dirname return substr($path, 0, $slash); } public static function mb_basename($path, $ext = '') { // check if multibyte string, use basename() if not if (function_exists('mb_strlen')) { if (mb_strlen($path) === strlen($path)) { return basename($path, $ext); } } // clean $path = self::cleanPath($path, '/'); // split path $parts = explode('/', $path); // return basename $path = end($parts); if ($ext === '.' . self::getExtension($path)) { $path = self::stripExtension($path); } return $path; } public static function convertEncoding($string) { if (!function_exists('mb_detect_encoding')) { // From http://w3.org/International/questions/qa-forms-utf-8.html $isUTF8 = preg_match('%^(?: [\x09\x0A\x0D\x20-\x7E] # ASCII | [\xC2-\xDF][\x80-\xBF] # non-overlong 2-byte | \xE0[\xA0-\xBF][\x80-\xBF] # excluding overlongs | [\xE1-\xEC\xEE\xEF][\x80-\xBF]{2} # straight 3-byte | \xED[\x80-\x9F][\x80-\xBF] # excluding surrogates | \xF0[\x90-\xBF][\x80-\xBF]{2} # planes 1-3 | [\xF1-\xF3][\x80-\xBF]{3} # planes 4-15 | \xF4[\x80-\x8F][\x80-\xBF]{2} # plane 16 )*$%xs', $string); if (!$isUTF8) { return utf8_encode($string); } return $string; } // get encoding $encoding = mb_detect_encoding($string, "auto", true); // return existing string if it is already utf-8 if ($encoding === 'UTF-8') { return $string; } // invalid encoding, so make a "safe" string if ($encoding === false) { return preg_replace('#[^a-zA-Z0-9_\.\-\s ]#', '', $string); } // convert to utf-8 and return return mb_convert_encoding($string, 'UTF-8', $encoding); } public static function isUtf8($string) { if (!function_exists('mb_detect_encoding')) { // From http://w3.org/International/questions/qa-forms-utf-8.html return preg_match('%^(?: [\x09\x0A\x0D\x20-\x7E] # ASCII | [\xC2-\xDF][\x80-\xBF] # non-overlong 2-byte | \xE0[\xA0-\xBF][\x80-\xBF] # excluding overlongs | [\xE1-\xEC\xEE\xEF][\x80-\xBF]{2} # straight 3-byte | \xED[\x80-\x9F][\x80-\xBF] # excluding surrogates | \xF0[\x90-\xBF][\x80-\xBF]{2} # planes 1-3 | [\xF1-\xF3][\x80-\xBF]{3} # planes 4-15 | \xF4[\x80-\x8F][\x80-\xBF]{2} # plane 16 )*$%xs', $string); } return mb_detect_encoding($string, 'UTF-8', true); } /** * Convert size value to bytes. */ public static function convertSize($value) { $unit = ''; preg_match('#([0-9]+)\s?([a-z]*)#i', $value, $matches); if (isset($matches[1])) { $value = (int) $matches[1]; } if (isset($matches[2])) { $unit = $matches[2]; // extract first character only, eg: g, m, k if ($unit) { $unit = strtolower($unit[0]); } } $value = intval($value); // Convert to bytes switch ($unit) { case 'g': $value = $value * 1073741824; break; case 'm': $value = $value * 1048576; break; case 'k': $value = $value * 1024; break; } return $value; } /** * Checks an upload for suspicious naming, potential PHP contents, valid image and HTML tags. */ public static function isSafeFile($file) { // null byte check if (strstr($file['name'], "\x00")) { @unlink($file['tmp_name']); throw new InvalidArgumentException('The file name contains a null byte.'); } // check name for invalid extensions if (self::validateFileName($file['name']) !== true) { @unlink($file['tmp_name']); throw new InvalidArgumentException('The file name contains an invalid extension.'); } $isImage = preg_match('#\.(jpeg|jpg|jpe|png|gif|wbmp|bmp|tiff|tif|webp|psd|swc|iff|jpc|jp2|jpx|jb2|xbm|ico|xcf|odg)$#i', $file['name']); // check file for <?php tags $fp = @fopen($file['tmp_name'], 'r'); if ($fp !== false) { $data = ''; while (!feof($fp)) { $data .= @fread($fp, 131072); // we can only reliably check for the full <?php tag here (short tags conflict with valid exif xml data), so users are reminded to disable short_open_tag if (stripos($data, '<?php') !== false) { @unlink($file['tmp_name']); throw new InvalidArgumentException('The file contains PHP code.'); } // check for `__HALT_COMPILER()` phar stub if (stripos($data, '__HALT_COMPILER()') !== false) { @unlink($file['tmp_name']); throw new InvalidArgumentException('The file contains PHP code.'); } $data = substr($data, -10); } fclose($fp); } // validate image if ($isImage && @getimagesize($file['tmp_name']) === false) { @unlink($file['tmp_name']); throw new InvalidArgumentException('The file is not a valid image.'); } return true; } /** * Check file name for extensions. * * @param type $name * * @return bool */ public static function validateFileName($name) { if (empty($name) && (string) $name !== "0") { return false; } // list of invalid extensions $executable = array( 'php', 'php3', 'php4', 'php5', 'php6', 'php7', 'phar', 'js', 'exe', 'phtml', 'java', 'perl', 'py', 'asp', 'dll', 'go', 'ade', 'adp', 'bat', 'chm', 'cmd', 'com', 'cpl', 'hta', 'ins', 'isp', 'jse', 'lib', 'mde', 'msc', 'msp', 'mst', 'pif', 'scr', 'sct', 'shb', 'sys', 'vb', 'vbe', 'vbs', 'vxd', 'wsc', 'wsf', 'wsh', 'svg', ); // get file parts, eg: ['image', 'php', 'jpg'] $parts = explode('.', $name); // remove extension array_pop($parts); // remove name array_shift($parts); // no extensions in file name if (empty($parts)) { return true; } // lowercase it array_map('strtolower', $parts); // check for extension in file name, eg: image.php.jpg foreach ($executable as $extension) { if (in_array($extension, $parts)) { return false; } } return true; } /** * Method to determine if an array is an associative array. * * @param array An array to test * * @return bool True if the array is an associative array * * @link https://www.php.net/manual/en/function.is-array.php#84488 */ public static function is_associative_array($array) { if (!is_array($array)) { return false; } $i = count($array); while ($i > 0) { if (!array_key_exists(--$i, $array)) { return true; } } return false; } public static function isJson($value) { // value must be a string if (!$value || !is_string($value)) { return false; } // trim $value = trim($value); if (!$value) { return false; } // quick syntax check if ($value[0] !== '{' && $value[0] !== '[') { return false; } // full check using json_decode json_decode($value); return json_last_error() == JSON_ERROR_NONE; } /** * array_merge_recursive does indeed merge arrays, but it converts values with duplicate * keys to arrays rather than overwriting the value in the first array with the duplicate * value in the second array, as array_merge does. I.e., with array_merge_recursive, * this happens (documented behavior):. * * array_merge_recursive(array('key' => 'org value'), array('key' => 'new value')); * => array('key' => array('org value', 'new value')); * * array_merge_recursive_distinct does not change the datatypes of the values in the arrays. * Matching keys' values in the second array overwrite those in the first array, as is the * case with array_merge, i.e.: * * array_merge_recursive_distinct(array('key' => 'org value'), array('key' => 'new value')); * => array('key' => array('new value')); * * Parameters are passed by reference, though only for performance reasons. They're not * altered by this function. * * @param array $array1 * @param array $array2 * @param boolean $ignore_empty_string * * @return array * * @author Daniel <daniel (at) danielsmedegaardbuus (dot) dk> * @author Gabriel Sobrinho <gabriel (dot) sobrinho (at) gmail (dot) com> */ public static function array_merge_recursive_distinct(array $array1, array $array2, $ignore_empty_string = false) { $merged = $array1; foreach ($array2 as $key => $value) { if (self::is_associative_array($value) && array_key_exists($key, $merged) && self::is_associative_array($merged[$key])) { $merged[$key] = self::array_merge_recursive_distinct($merged[$key], $value, $ignore_empty_string); } else { if (is_null($value)) { continue; } if (array_key_exists($key, $merged) && $ignore_empty_string && $value === "") { continue; } $merged[$key] = $value; } } return $merged; } }