MOON
Server: Apache
System: Linux res.emeff.ca 3.10.0-962.3.2.lve1.5.24.10.el7.x86_64 #1 SMP Wed Mar 20 07:36:02 EDT 2019 x86_64
User: accemeff (1004)
PHP: 7.0.33
Disabled: NONE
Upload Files
File: /home/accemeff/vendor/craftcms/cms/src/helpers/Search.php
<?php
/**
 * @link https://craftcms.com/
 * @copyright Copyright (c) Pixel & Tonic, Inc.
 * @license https://craftcms.github.io/license/
 */

namespace craft\helpers;

use Craft;

/**
 * Search helper.
 *
 * @author Pixel & Tonic, Inc. <support@pixelandtonic.com>
 * @since 3.0
 */
class Search
{
    // Properties
    // =========================================================================

    /**
     * @var array Character mappings
     * @see _getCharMap()
     */
    private static $_charMaps = [];

    // Public Methods
    // =========================================================================

    /**
     * Normalizes search keywords.
     *
     * @param string[]|string $str The dirty keywords
     * @param array $ignore Ignore words to strip out
     * @param bool $processCharMap Whether to remove punctuation and diacritics (default is true)
     * @param string|null The language that the character map should be based on, if `$processCharMap` is `true`.
     * @return string The cleansed keywords.
     */
    public static function normalizeKeywords($str, array $ignore = [], bool $processCharMap = true, string $language = null): string
    {
        // Flatten
        if (is_array($str)) {
            $str = StringHelper::toString($str, ' ');
        }

        // Get rid of tags
        $str = strip_tags($str);

        // Convert non-breaking spaces entities to regular ones
        $str = str_replace(['&nbsp;', '&#160;', '&#xa0;'], ' ', $str);

        // Get rid of entities
        $str = preg_replace('/&#?[a-z0-9]{2,8};/i', '', $str);

        // Normalize to lowercase
        $str = mb_strtolower($str);

        if ($processCharMap) {
            // Remove punctuation and diacritics
            $str = strtr($str, self::_getCharMap($language ?? Craft::$app->language));
        }

        // Remove ignore-words?
        if (is_array($ignore) && !empty($ignore)) {
            foreach ($ignore as $word) {
                $word = preg_quote(static::normalizeKeywords($word, [], true, $language), '/');
                $str = preg_replace("/\b{$word}\b/u", '', $str);
            }
        }

        // Strip out new lines and superfluous spaces
        $str = preg_replace('/[\n\r]+/u', ' ', $str);
        $str = preg_replace('/\s{2,}/u', ' ', $str);

        // Trim white space
        $str = trim($str);

        return $str;
    }

    // Private Methods
    // =========================================================================

    /**
     * Get array of chars to be used for conversion.
     *
     * @param string $language
     * @return array
     */
    private static function _getCharMap(string $language): array
    {
        if (isset(self::$_charMaps[$language])) {
            return self::$_charMaps[$language];
        }

        // This will replace accented chars with non-accented chars
        $map = StringHelper::asciiCharMap(true, $language);

        // Replace punctuation with a space
        foreach (self::_getPunctuation() as $value) {
            $map[$value] = ' ';
        }

        return self::$_charMaps[$language] = $map;
    }

    /**
     * Returns the asciiPunctuation array.
     *
     * @return array
     */
    private static function _getPunctuation(): array
    {
        // Keep local copy
        static $asciiPunctuation = [];

        if (empty($asciiPunctuation)) {
            $asciiPunctuation = [
                '!',
                '"',
                '#',
                '&',
                '\'',
                '(',
                ')',
                '*',
                '+',
                ',',
                '-',
                '.',
                '/',
                ':',
                ';',
                '<',
                '>',
                '?',
                '@',
                '[',
                '\\',
                ']',
                '^',
                '{',
                '|',
                '}',
                '~',
                '¡',
                '¢',
                '£',
                '¤',
                '¥',
                '¦',
                '§',
                '¨',
                '©',
                'ª',
                '«',
                '¬',
                '®',
                '¯',
                '°',
                '±',
                '²',
                '³',
                '´',
                'µ',
                '¶',
                '·',
                '¸',
                '¹',
                'º',
                '»',
                '¼',
                '½',
                '¾',
                '¿',
                '×',
                'ƒ',
                'ˆ',
                '˜',
                '–',
                '—',
                '―',
                '‘',
                '’',
                '‚',
                '“',
                '”',
                '„',
                '†',
                '‡',
                '•',
                '‣',
                '…',
                '‰',
                '′',
                '″',
                '‹',
                '›',
                '‼',
                '‾',
                '⁄',
                '€',
                '™',
                '←',
                '↑',
                '→',
                '↓',
                '↔',
                '↵',
                '⇐',
                '⇑',
                '⇒',
                '⇓',
                '⇔',
                '∀',
                '∂',
                '∃',
                '∅',
                '∇',
                '∈',
                '∉',
                '∋',
                '∏',
                '∑',
                '−',
                '∗',
                '√',
                '∝',
                '∞',
                '∠',
                '∧',
                '∨',
                '∩',
                '∪',
                '∫',
                '∴',
                '∼',
                '≅',
                '≈',
                '≠',
                '≡',
                '≤',
                '≥',
                '⊂',
                '⊃',
                '⊄',
                '⊆',
                '⊇',
                '⊕',
                '⊗',
                '⊥',
                '⋅',
                '⌈',
                '⌉',
                '⌊',
                '⌋',
                '〈',
                '〉',
                '◊',
                '♠',
                '♣',
                '♥',
                '♦'
            ];
        }

        return $asciiPunctuation;
    }
}