more_fields-2.2.19/src/Truncator.php

src/Truncator.php
<?php

namespace Drupal\more_fields;

use DOMDocument;

class InvalidHtmlException extends \Exception
{
}

if (function_exists('grapheme_strlen')) {
    function ht_strlen($string)
    {
        return grapheme_strlen($string);
    }
    function ht_substr($string, $from, $to = 2147483647)
    {
        return grapheme_substr($string, $from, $to);
    }
} else if (function_exists('mb_strlen')) {
    function ht_strlen($string)
    {
        return mb_strlen($string);
    }
    function ht_substr($string, $from, $to = 2147483647)
    {
        return mb_substr($string, $from, $to);
    }
} else if (function_exists('iconv_strlen')) {
    function ht_strlen($string)
    {
        return iconv_strlen($string);
    }
    function ht_substr($string, $from, $to = 2147483647)
    {
        return iconv_substr($string, $from, $to);
    }
} else {
    function ht_strlen($string)
    {
        return strlen($string);
    }
    function ht_substr($string, $from, $to = 2147483647)
    {
        return substr($string, $from, $to);
    }
}

if (function_exists('mb_strtolower')) {
    function ht_strtolower($string)
    {
        return mb_strtolower($string);
    }
    function ht_strtoupper($string)
    {
        return mb_strtoupper($string);
    }
} else {
    function ht_strtolower($string)
    {
        return strtolower($string);
    }
    function ht_strtoupper($string)
    {
        return strtoupper($string);
    }
}

class Truncator
{

    public static $default_options = array(
        'ellipsis' => '…',
        'length_in_chars' => false,
    );

    // These tags are allowed to have an ellipsis inside
    public static $ellipsable_tags = array(
        'p', 'ol', 'ul', 'li',
        'div', 'header', 'article', 'nav',
        'section', 'footer', 'aside',
        'dd', 'dt', 'dl',
    );

    public static $self_closing_tags = array(
        'br', 'hr', 'img',
    );

    /**
     * Truncate given HTML string to specified length.
     * If length_in_chars is false it's trimmed by number
     * of words, otherwise by number of characters.
     *
     * @param  string        $html
     * @param  integer       $length
     * @param  string|array  $opts
     * @return string
     */
    public static function truncate($html, $length, $opts = array())
    {
        if (is_string($opts)) $opts = array('ellipsis' => $opts);
        $opts = array_merge(static::$default_options, $opts);
        // wrap the html in case it consists of adjacent nodes like <p>foo</p><p>bar</p>
        $html = "<div>" . static::utf8_for_xml($html) . "</div>";

        $root_node = null;

        // Parse using HTML5Lib if it's available.
        if (class_exists('Masterminds\HTML5')) {
            try {
                $html5 = new \Masterminds\HTML5();
                $doc = $html5->loadHTML($html);
                $root_node = $doc->documentElement->lastChild;
            } catch (\Exception $e) {;
            }
        }

        if ($root_node === null) {
            // HTML5Lib not available so we'll have to use DOMDocument
            // We'll only be able to parse HTML5 if it's valid XML
            $doc = new DOMDocument;
            $doc->formatOutput = false;
            $doc->preserveWhitespace = true;
            // loadHTML will fail with HTML5 tags (article, nav, etc)
            // so we need to suppress errors and if it fails to parse we
            // retry with the XML parser instead
            $prev_use_errors = libxml_use_internal_errors(true);
            if ($doc->loadHTML($html)) {
                $root_node = $doc->documentElement->lastChild->lastChild;
            } else if ($doc->loadXML($html)) {
                $root_node = $doc->documentElement;
            } else {
                libxml_use_internal_errors($prev_use_errors);
                throw new InvalidHtmlException;
            }
            libxml_use_internal_errors($prev_use_errors);
        }

        list($text, $_, $opts) = static::_truncate_node($doc, $root_node, $length, $opts);
        $text = ht_substr(ht_substr($text, 0, -6), 5);
        return $text;
    }

    protected static function _truncate_node($doc, $node, $length, $opts)
    {
        if ($length === 0 && !static::ellipsable($node)) {
            return array('', 1, $opts);
        }
        list($inner, $remaining, $opts) = static::_inner_truncate($doc, $node, $length, $opts);
        if (0 === ht_strlen($inner)) {
            return array(in_array(ht_strtolower($node->nodeName), static::$self_closing_tags) ? $doc->saveXML($node) : "", $length - $remaining, $opts);
        }
        while ($node->firstChild) {
            $node->removeChild($node->firstChild);
        }
        $newNode = $doc->createDocumentFragment();
        $newNode->appendXml($inner);
        $node->appendChild($newNode);
        return array($doc->saveXML($node), $length - $remaining, $opts);
    }

    protected static function _inner_truncate($doc, $node, $length, $opts)
    {
        $inner = '';
        $remaining = $length;
        foreach ($node->childNodes as $childNode) {
            if ($childNode->nodeType === XML_ELEMENT_NODE) {
                list($txt, $nb, $opts) = static::_truncate_node($doc, $childNode, $remaining, $opts);
            } else if ($childNode->nodeType === XML_TEXT_NODE) {
                list($txt, $nb, $opts) = static::_truncate_text($doc, $childNode, $remaining, $opts);
            } else {
                $txt = '';
                $nb  = 0;
            }
            $remaining -= $nb;
            $inner .= $txt;
            if ($remaining < 0) {
                if (static::ellipsable($node)) {
                    $inner = preg_replace('/(?:[\s\pP]+|(?:&(?:[a-z]+|#[0-9]+);?))*$/u', '', $inner) . $opts['ellipsis'];
                    $opts['ellipsis'] = '';
                    $opts['was_truncated'] = true;
                }
                break;
            }
        }
        return array($inner, $remaining, $opts);
    }

    protected static function _truncate_text($doc, $node, $length, $opts)
    {
        $xhtml = $node->ownerDocument->saveXML($node);
        preg_match_all('/\s*\S+/', $xhtml, $words);
        $words = $words[0];
        if ($opts['length_in_chars']) {
            $count = ht_strlen($xhtml);
            if ($count <= $length && $length > 0) {
                return array($xhtml, $count, $opts);
            }
            if (count($words) > 1) {
                $content = '';

                foreach ($words as $word) {
                    if (ht_strlen($content) + ht_strlen($word) > $length) {
                        break;
                    }

                    $content .= $word;
                }

                return array($content, $count, $opts);
            }
            return array(ht_substr($node->textContent, 0, $length), $count, $opts);
        } else {
            $count = count($words);
            if ($count <= $length && $length > 0) {
                return array($xhtml, $count, $opts);
            }
            return array(implode('', array_slice($words, 0, $length)), $count, $opts);
        }
    }

    protected static function ellipsable($node)
    {
        return ($node instanceof DOMDocument)
            || in_array(ht_strtolower($node->nodeName), static::$ellipsable_tags);
    }

    protected static function utf8_for_xml($string)
    {
        return preg_replace('/[^\x{0009}\x{000a}\x{000d}\x{0020}-\x{D7FF}\x{E000}-\x{FFFD}]+/u', ' ', $string);
    }
}

Главная | Обратная связь

drupal hosting | друпал хостинг | it patrol .inc