.
 *
 */
namespace Friendica\Content\Text;
use DOMDocument;
use DOMXPath;
use Friendica\Content\Widget\ContactBlock;
use Friendica\Core\Hook;
use Friendica\Core\Renderer;
use Friendica\DI;
use Friendica\Model\Contact;
use Friendica\Util\Network;
use Friendica\Util\Proxy as ProxyUtils;
use Friendica\Util\Strings;
use Friendica\Util\XML;
use League\HTMLToMarkdown\HtmlConverter;
class HTML
{
	public static function sanitizeCSS($input)
	{
		$cleaned = "";
		$input = strtolower($input);
		for ($i = 0; $i < strlen($input); $i++) {
			$char = substr($input, $i, 1);
			if (($char >= "a") && ($char <= "z")) {
				$cleaned .= $char;
			}
			if (!(strpos(" #;:0123456789-_.%", $char) === false)) {
				$cleaned .= $char;
			}
		}
		return $cleaned;
	}
	/**
	 * Search all instances of a specific HTML tag node in the provided DOM document and replaces them with BBCode text nodes.
	 *
	 * @see HTML::tagToBBCodeSub()
	 */
	private static function tagToBBCode(DOMDocument $doc, string $tag, array $attributes, string $startbb, string $endbb, bool $ignoreChildren = false)
	{
		do {
			$done = self::tagToBBCodeSub($doc, $tag, $attributes, $startbb, $endbb, $ignoreChildren);
		} while ($done);
	}
	/**
	 * Search the first specific HTML tag node in the provided DOM document and replaces it with BBCode text nodes.
	 *
	 * @param DOMDocument $doc
	 * @param string      $tag            HTML tag name
	 * @param array       $attributes     Array of attributes to match and optionally use the value from
	 * @param string      $startbb        BBCode tag opening
	 * @param string      $endbb          BBCode tag closing
	 * @param bool        $ignoreChildren If set to false, the HTML tag children will be appended as text inside the BBCode tag
	 *                                    Otherwise, they will be entirely ignored. Useful for simple BBCode that draw their
	 *                                    inner value from an attribute value and disregard the tag children.
	 * @return bool Whether a replacement was done
	 */
	private static function tagToBBCodeSub(DOMDocument $doc, string $tag, array $attributes, string $startbb, string $endbb, bool $ignoreChildren = false)
	{
		$savestart = str_replace('$', '\x01', $startbb);
		$replace = false;
		$xpath = new DOMXPath($doc);
		/** @var \DOMNode[] $list */
		$list = $xpath->query("//" . $tag);
		foreach ($list as $node) {
			$attr = [];
			if ($node->attributes->length) {
				foreach ($node->attributes as $attribute) {
					$attr[$attribute->name] = $attribute->value;
				}
			}
			$replace = true;
			$startbb = $savestart;
			$i = 0;
			foreach ($attributes as $attribute => $value) {
				$startbb = str_replace('\x01' . ++$i, '$1', $startbb);
				if (strpos('*' . $startbb, '$1') > 0) {
					if ($replace && (@$attr[$attribute] != '')) {
						$startbb = preg_replace($value, $startbb, $attr[$attribute], -1, $count);
						// If nothing could be changed
						if ($count == 0) {
							$replace = false;
						}
					} else {
						$replace = false;
					}
				} else {
					if (@$attr[$attribute] != $value) {
						$replace = false;
					}
				}
			}
			if ($replace) {
				$StartCode = $doc->createTextNode($startbb);
				$EndCode = $doc->createTextNode($endbb);
				$node->parentNode->insertBefore($StartCode, $node);
				if (!$ignoreChildren && $node->hasChildNodes()) {
					/** @var \DOMNode $child */
					foreach ($node->childNodes as $key => $child) {
						/* Remove empty text nodes at the start or at the end of the children list */
						if ($key > 0 && $key < $node->childNodes->length - 1 || $child->nodeName != '#text' || trim($child->nodeValue)) {
							$newNode = $child->cloneNode(true);
							$node->parentNode->insertBefore($newNode, $node);
						}
					}
				}
				$node->parentNode->insertBefore($EndCode, $node);
				$node->parentNode->removeChild($node);
			}
		}
		return $replace;
	}
	/**
	 * Converter for HTML to BBCode
	 *
	 * Made by: ike@piratenpartei.de
	 * Originally made for the syncom project: http://wiki.piratenpartei.de/Syncom
	 *                    https://github.com/annando/Syncom
	 *
	 * @param string $message
	 * @param string $basepath
	 * @return string
	 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
	 */
	public static function toBBCode($message, $basepath = '')
	{
		$message = str_replace("\r", "", $message);
		// Removing code blocks before the whitespace removal processing below
		$codeblocks = [];
		$message = preg_replace_callback(
			'#
(.*)",
				"
",
				" ",
			],
			$message
		);
		// remove namespaces
		$message = preg_replace('=<(\w+):(.+?)>=', '', $message);
		$message = preg_replace('=(\w+):(.+?)>=', ' ', $message);
		$doc = new DOMDocument();
		$doc->preserveWhiteSpace = false;
		$message = mb_convert_encoding($message, 'HTML-ENTITIES', "UTF-8");
		@$doc->loadHTML($message, LIBXML_HTML_NODEFDTD);
		XML::deleteNode($doc, 'style');
		XML::deleteNode($doc, 'head');
		XML::deleteNode($doc, 'title');
		XML::deleteNode($doc, 'meta');
		XML::deleteNode($doc, 'xml');
		XML::deleteNode($doc, 'removeme');
		$xpath = new DomXPath($doc);
		$list = $xpath->query("//pre");
		foreach ($list as $node) {
			// Ensure to escape unescaped & - they will otherwise raise a warning
			$safe_value = preg_replace('/&(?!\w+;)/', '&', $node->nodeValue);
			$node->nodeValue = str_replace("\n", "\r", $safe_value);
		}
		$message = $doc->saveHTML();
		$message = str_replace(["\n<", ">\n", "\r", "\n", "\xC3\x82\xC2\xA0"], ["<", ">", "(.*?)<\/a>/is';
		preg_match_all($pattern, $message, $result, PREG_SET_ORDER);
		$urls = [];
		foreach ($result as $treffer) {
			$ignore = false;
			// A list of some links that should be ignored
			$list = ["/user/", "/tag/", "/group/", "/profile/", "/search?search=", "/search?tag=", "mailto:", "/u/", "/node/",
				"//plus.google.com/", "//twitter.com/"];
			foreach ($list as $listitem) {
				if (strpos($treffer[1], $listitem) !== false) {
					$ignore = true;
				}
			}
			if ((strpos($treffer[1], "//twitter.com/") !== false) && (strpos($treffer[1], "/status/") !== false)) {
				$ignore = false;
			}
			if ((strpos($treffer[1], "//plus.google.com/") !== false) && (strpos($treffer[1], "/posts") !== false)) {
				$ignore = false;
			}
			if ((strpos($treffer[1], "//plus.google.com/") !== false) && (strpos($treffer[1], "/photos") !== false)) {
				$ignore = false;
			}
			$ignore = $ignore || strpos($treffer[1], '#') === 0;
			if (!$ignore) {
				$urls[$treffer[1]] = $treffer[1];
			}
		}
		return $urls;
	}
	/**
	 * @param string $html
	 * @param int    $wraplength Ensures individual lines aren't longer than this many characters. Doesn't break words.
	 * @param bool   $compact    True: Completely strips image tags; False: Keeps image URLs
	 * @return string
	 */
	public static function toPlaintext(string $html, $wraplength = 75, $compact = false)
	{
		$message = str_replace("\r", "", $html);
		$doc = new DOMDocument();
		$doc->preserveWhiteSpace = false;
		$message = mb_convert_encoding($message, 'HTML-ENTITIES', "UTF-8");
		@$doc->loadHTML($message, LIBXML_HTML_NODEFDTD);
		$message = $doc->saveHTML();
		// Remove eventual UTF-8 BOM
		$message = str_replace("\xC3\x82\xC2\xA0", "", $message);
		// Collecting all links
		$urls = self::collectURLs($message);
		@$doc->loadHTML($message, LIBXML_HTML_NODEFDTD);
		self::tagToBBCode($doc, 'html', [], '', '');
		self::tagToBBCode($doc, 'body', [], '', '');
		if ($compact) {
			self::tagToBBCode($doc, 'blockquote', [], "»", "«");
		} else {
			self::tagToBBCode($doc, 'blockquote', [], '[quote]', "[/quote]\n");
		}
		self::tagToBBCode($doc, 'br', [], "\n", '');
		self::tagToBBCode($doc, 'span', [], "", "");
		self::tagToBBCode($doc, 'pre', [], "", "");
		self::tagToBBCode($doc, 'div', [], "\r", "\r");
		self::tagToBBCode($doc, 'p', [], "\n", "\n");
		self::tagToBBCode($doc, 'li', [], "\n* ", "\n");
		self::tagToBBCode($doc, 'hr', [], "\n" . str_repeat("-", 70) . "\n", "");
		self::tagToBBCode($doc, 'tr', [], "\n", "");
		self::tagToBBCode($doc, 'td', [], "\t", "");
		self::tagToBBCode($doc, 'h1', [], "\n\n*", "*\n");
		self::tagToBBCode($doc, 'h2', [], "\n\n*", "*\n");
		self::tagToBBCode($doc, 'h3', [], "\n\n*", "*\n");
		self::tagToBBCode($doc, 'h4', [], "\n\n*", "*\n");
		self::tagToBBCode($doc, 'h5', [], "\n\n*", "*\n");
		self::tagToBBCode($doc, 'h6', [], "\n\n*", "*\n");
		if (!$compact) {
			self::tagToBBCode($doc, 'img', ['src' => '/(.+)/'], ' [img]$1', '[/img] ');
		} else {
			self::tagToBBCode($doc, 'img', ['src' => '/(.+)/'], ' ', ' ');
		}
		self::tagToBBCode($doc, 'iframe', ['src' => '/(.+)/'], ' $1 ', '');
		$message = $doc->saveHTML();
		if (!$compact) {
			$message = str_replace("[img]", "", $message);
			$message = str_replace("[/img]", "", $message);
		}
		// was ersetze ich da?
		// Irgendein stoerrisches UTF-Zeug
		$message = str_replace(chr(194) . chr(160), ' ', $message);
		$message = str_replace(" ", " ", $message);
		// Aufeinanderfolgende DIVs
		$message = preg_replace('=\r *\r=i', "\n", $message);
		$message = str_replace("\r", "\n", $message);
		$message = strip_tags($message);
		$message = html_entity_decode($message, ENT_QUOTES, 'UTF-8');
		if (!$compact && ($message != '')) {
			foreach ($urls as $id => $url) {
				if ($url != '' && strpos($message, $url) === false) {
					$message .= "\n" . $url . ' ';
				}
			}
		}
		$message = str_replace("\n«", "«\n", $message);
		$message = str_replace("»\n", "\n»", $message);
		do {
			$oldmessage = $message;
			$message = str_replace("\n\n\n", "\n\n", $message);
		} while ($oldmessage != $message);
		$message = self::quoteLevel(trim($message), $wraplength);
		return trim($message);
	}
	/**
	 * Converts provided HTML code to Markdown. The hardwrap parameter maximizes
	 * compatibility with Diaspora in spite of the Markdown standards.
	 *
	 * @param string $html
	 * @return string
	 */
	public static function toMarkdown($html)
	{
		$converter = new HtmlConverter(['hard_break' => true]);
		$markdown = $converter->convert($html);
		return $markdown;
	}
	/**
	 * Convert video HTML to BBCode tags
	 *
	 * @param string $s
	 * @return string
	 */
	public static function toBBCodeVideo($s)
	{
		$s = preg_replace(
			'#]+>(.*?)https?://www.youtube.com/((?:v|cp)/[A-Za-z0-9\-_=]+)(.*?) #ism',
			'[youtube]$2[/youtube]',
			$s
		);
	
		$s = preg_replace(
			'##ism',
			'[youtube]$2[/youtube]',
			$s
		);
	
		$s = preg_replace(
			'##ism',
			'[vimeo]$2[/vimeo]',
			$s
		);
	
		return $s;
	}
	
	/**
	 * transform link href and img src from relative to absolute
	 *
	 * @param string $text
	 * @param string $base base url
	 * @return string
	 */
	public static function relToAbs($text, $base)
	{
		if (empty($base)) {
			return $text;
		}
	
		$base = rtrim($base, '/');
	
		$base2 = $base . "/";
	
		// Replace links
		$pattern = "/]*) href=\"(?!http|https|\/)([^\"]*)\"/";
		$replace = " ]*) href=\"(?!http|https)([^\"]*)\"/";
		$replace = " ]*) src=\"(?!http|https|\/)([^\"]*)\"/";
		$replace = " $1 ', $s);
		$s = preg_replace("/\<(.*?)(src|href)=(.*?)\&\;(.*?)\>/ism", '<$1$2=$3&$4>', $s);
		return $s;
	}
	/**
	 * Given a HTML text and a set of filtering reasons, adds a content hiding header with the provided reasons
	 *
	 * Reasons are expected to have been translated already.
	 *
	 * @param string $html
	 * @param array  $reasons
	 * @return string
	 * @throws \Friendica\Network\HTTPException\InternalServerErrorException
	 */
	public static function applyContentFilter($html, array $reasons)
	{
		if (count($reasons)) {
			$tpl = Renderer::getMarkupTemplate('wall/content_filter.tpl');
			$html = Renderer::replaceMacros($tpl, [
				'$reasons'   => $reasons,
				'$rnd'       => Strings::getRandomHex(8),
				'$openclose' => DI::l10n()->t('Click to open/close'),
				'$html'      => $html
			]);
		}
		return $html;
	}
	/**
	 * replace html amp entity with amp char
	 * @param string $s
	 * @return string
	 */
	public static function unamp($s)
	{
		return str_replace('&', '&', $s);
	}
}