File Metadata

Created: Thu, Nov 21, 19:17

PhutilRemarkupRuleHyperlink.php
View Options

	<?php

	/**
	 * Remarkup rule which turns URIs appearing in text into HTML hyperlinks.
	 *
	 * Three forms are recognized, in this order:
	 *
	 *   - `<proto://...>`: linked exactly, the angle brackets are dropped.
	 *   - `(proto://...)`: linked exactly, the parentheses are preserved.
	 *   - bare `proto://...` delimited by whitespace or the start/end of a line
	 *     or string: linked after stripping trailing punctuation and an
	 *     unbalanced closing parenthesis.
	 *
	 * Only URIs whose protocol is enabled in the engine's
	 * 'uri.allowed-protocols' configuration are linked; anything else is emitted
	 * as escaped text.
	 *
	 * @group markup
	 * @concrete-extensible (TODO only needed by Facebook at the moment)
	 */
	class PhutilRemarkupRuleHyperlink
	  extends PhutilRemarkupRule {

	  /**
	   * Apply the hyperlink rule to a block of text.
	   *
	   * @param  string Text to process.
	   * @return string Text with each recognized URI replaced by whatever the
	   *                engine's storeText() returned for the rendered link.
	   */
	  public function apply($text) {

	    // Hyperlinks with explicit "<>" around them get linked exactly, without
	    // the "<>". Angle brackets are basically special and mean "this is a URL
	    // with weird characters". This is assumed to be reasonable because they
	    // don't appear in normal text or normal URLs.
	    $text = preg_replace_callback(
	      '@[<](\w{3,}://.+?)[>]@',
	      array($this, 'markupHyperlink'),
	      $text);

	    // Hyperlinks with explicit "()" around them get linked exactly, with the
	    // "()". This is similar to angle brackets, except that people use parens
	    // in normal text so we preserve them in the output text. The parens are
	    // matched with lookarounds so they are not consumed by the replacement.
	    $text = preg_replace_callback(
	      '@(?<=\\()(\w{3,}://.+?)(?=\\))@',
	      array($this, 'markupHyperlink'),
	      $text);

	    // Anything else we match "ungreedily", which means we'll look for
	    // stuff that's probably punctuation or otherwise not part of the URL and
	    // not link it. This lets someone write "Quick! Go to
	    // http://www.example.com/!". We also apply some paren balancing rules.
	    // The URL must be delimited by whitespace or the start/end of the text;
	    // the "|" here is regex alternation and must NOT be escaped.
	    $text = preg_replace_callback(
	      '@(?<=^|\s)(\w{3,}://\S+)(?=\s|$)@',
	      array($this, 'markupHyperlinkUngreedy'),
	      $text);

	    return $text;
	  }

	  /**
	   * preg_replace_callback() handler which links a matched URI if its protocol
	   * is allowed, and otherwise emits it as escaped plain text.
	   *
	   * @param  array  Regex matches; index 1 holds the URI.
	   * @return wild   Result of the engine's storeText() call.
	   */
	  protected function markupHyperlink($matches) {

	    // Map of protocol => enabled flag; defaults to an empty map, in which
	    // case nothing is linked.
	    $protocols = $this->getEngine()->getConfig(
	      'uri.allowed-protocols',
	      array());

	    $protocol = id(new PhutilURI($matches[1]))->getProtocol();
	    if (!idx($protocols, $protocol)) {
	      // If this URI doesn't use a whitelisted protocol, don't link it. This
	      // is primarily intended to prevent javascript:// silliness.
	      return $this->getEngine()->storeText(phutil_escape_html($matches[1]));
	    }

	    return $this->storeRenderedHyperlink($matches[1]);
	  }

	  /**
	   * Render a link and hand the markup to the engine's storeText().
	   *
	   * @param  string URI to link.
	   * @return wild   Result of the engine's storeText() call.
	   */
	  protected function storeRenderedHyperlink($link) {
	    return $this->getEngine()->storeText($this->renderHyperlink($link));
	  }

	  /**
	   * Build the anchor tag for a URI. The URI is used as both the href and the
	   * (HTML-escaped) link text, and the link opens in a new window.
	   *
	   * @param  string URI to link.
	   * @return string Rendered "a" tag.
	   */
	  protected function renderHyperlink($link) {
	    return phutil_render_tag(
	      'a',
	      array(
	        'href'    => $link,
	        'target'  => '_blank',
	      ),
	      phutil_escape_html($link));
	  }

	  /**
	   * preg_replace_callback() handler for bare URIs. Trims characters from the
	   * end of the match which are probably not part of the URI, links the
	   * remainder, and re-appends the trimmed characters unlinked.
	   *
	   * @param  array  Regex matches; index 1 holds the candidate URI.
	   * @return string Linked URI followed by any trimmed trailing characters.
	   */
	  private function markupHyperlinkUngreedy($matches) {
	    $match = $matches[1];
	    $tail = null;
	    $trailing = null;

	    // Peel off sentence punctuation at the end of the match.
	    if (preg_match('/[;,.:!?]+$/', $match, $trailing)) {
	      $tail = $trailing[0];
	      $match = substr($match, 0, -strlen($tail));
	    }

	    // If there's a closing paren at the end but no balancing open paren in
	    // the URL, don't link the close paren. This is an attempt to gracefully
	    // handle the two common paren cases, Wikipedia links and English language
	    // parentheticals, e.g.:
	    //
	    //  http://en.wikipedia.org/wiki/Noun_(disambiguation)
	    //  (see also http://www.example.com)
	    //
	    // We could apply a craftier heuristic here which tries to actually balance
	    // the parens, but this is probably sufficient.
	    if (preg_match('/\\)$/', $match) && !preg_match('/\\(/', $match)) {
	      $tail = ')'.$tail;
	      $match = substr($match, 0, -1);
	    }

	    return $this->markupHyperlink(array(null, $match)).$tail;
	  }

	}

PhutilRemarkupRuleHyperlink.php
No OneTemporary
Actions

File Metadata

PhutilRemarkupRuleHyperlink.php
View Options

Event Timeline

PhutilRemarkupRuleHyperlink.phpNo OneTemporaryActions

File Metadata

PhutilRemarkupRuleHyperlink.phpView Options

Event Timeline

PhutilRemarkupRuleHyperlink.php
No OneTemporary
Actions

PhutilRemarkupRuleHyperlink.php
View Options