Page Menu
Home
c4science
Search
Configure Global Search
Log In
Files
F100477448
PhutilRemarkupHyperlinkRule.php
No One
Temporary
Actions
Download File
Edit File
Delete File
View Transforms
Subscribe
Mute Notifications
Award Token
Subscribers
None
File Metadata
Details
File Info
Storage
Attached
Created
Fri, Jan 31, 02:51
Size
3 KB
Mime Type
text/x-php
Expires
Sun, Feb 2, 02:51 (2 d)
Engine
blob
Format
Raw Data
Handle
23972108
Attached To
rPHU libphutil
PhutilRemarkupHyperlinkRule.php
View Options
<?php
/**
 * Remarkup rule which turns bare URIs in text into hyperlinks.
 *
 * Two forms are recognized:
 *
 *   - `<http://example.com/weird path>`: a URI wrapped in angle brackets is
 *     taken exactly as written, minus the brackets.
 *   - `http://example.com/`: a bare URI, from which trailing punctuation and
 *     an unbalanced closing paren are trimmed before linking.
 *
 * Only URIs whose protocol appears in the engine's `uri.allowed-protocols`
 * configuration are linked; anything else is stored as plain text.
 */
final class PhutilRemarkupHyperlinkRule extends PhutilRemarkupRule {

  /**
   * Return the priority value of this rule.
   *
   * @return float Always 400.0. (Presumably used by the engine to order
   *               rules relative to each other -- confirm against
   *               PhutilRemarkupRule.)
   */
  public function getPriority() {
    return 400.0;
  }

  /**
   * Replace URIs in a block of text with whatever the engine returns from
   * `storeText()` for them.
   *
   * @param  string Text to scan for URIs.
   * @return string Text with recognized URIs replaced.
   */
  public function apply($text) {
    // Hyperlinks with explicit "<>" around them get linked exactly, without
    // the "<>". Angle brackets are basically special and mean "this is a URL
    // with weird characters". This is assumed to be reasonable because they
    // don't appear in normal text or normal URLs.
    $text = preg_replace_callback(
      '@<(\w{3,}://[^\s'.PhutilRemarkupBlockStorage::MAGIC_BYTE.']+?)>@',
      array($this, 'markupHyperlink'),
      $text);

    // Anything else we match "ungreedily", which means we'll look for
    // stuff that's probably punctuation or otherwise not part of the URL and
    // not link it. This lets someone write "Quick! Go to
    // http://www.example.com/!". We also apply some paren balancing rules.

    // NOTE: We're explicitly avoiding capturing stored blocks, so text like
    // `http://www.example.com/[[x | y]]` doesn't get aggressively captured.
    $text = preg_replace_callback(
      '@(\w{3,}://[^\s'.PhutilRemarkupBlockStorage::MAGIC_BYTE.']+)@',
      array($this, 'markupHyperlinkUngreedy'),
      $text);

    return $text;
  }

  /**
   * Link a matched URI if its protocol is allowed, otherwise store it as
   * plain text.
   *
   * Only `$matches[1]` is read. Because the return value replaces the whole
   * regex match, a URI written as `<uri>` loses its angle brackets whether
   * or not it ends up linked.
   *
   * @param  array Regex match array; index 1 holds the URI.
   * @return wild  Result of the engine's `storeText()` call.
   */
  protected function markupHyperlink($matches) {
    $uri = $matches[1];

    $protocols = $this->getEngine()->getConfig(
      'uri.allowed-protocols',
      array());

    $protocol = id(new PhutilURI($uri))->getProtocol();
    if (!idx($protocols, $protocol)) {
      // If this URI doesn't use a whitelisted protocol, don't link it. This
      // is primarily intended to prevent javascript:// silliness.
      return $this->getEngine()->storeText($uri);
    }

    return $this->storeRenderedHyperlink($uri);
  }

  /**
   * Render a URI as a hyperlink and hand the result to the engine's
   * `storeText()`.
   *
   * @param  string URI to link.
   * @return wild   Result of the engine's `storeText()` call.
   */
  protected function storeRenderedHyperlink($link) {
    return $this->getEngine()->storeText($this->renderHyperlink($link));
  }

  /**
   * Produce the output for a single URI.
   *
   * The URI is returned unchanged when the engine is in text mode or has the
   * `toc` state set; otherwise it is wrapped in an `<a>` tag.
   *
   * @param  string URI to render.
   * @return wild   The raw URI, or the result of `phutil_tag()`.
   */
  protected function renderHyperlink($link) {
    $engine = $this->getEngine();

    if ($engine->isTextMode() || $engine->getState('toc')) {
      return $link;
    }

    return phutil_tag(
      'a',
      array(
        'href' => $link,
        'class' => 'remarkup-link',
        'target' => '_blank',
        // The link opens in a new browsing context and points at a
        // user-supplied URI, so don't give the target page a handle on this
        // window (window.opener) or leak the referring URI to it.
        'rel' => 'noreferrer',
      ),
      $link);
  }

  /**
   * Link a bare URI, leaving trailing punctuation and an unbalanced closing
   * paren outside the link.
   *
   * @param  array Regex match array; index 1 holds the candidate URI.
   * @return wild  Result of `hsprintf()` combining the link and the trimmed
   *               tail.
   */
  protected function markupHyperlinkUngreedy($matches) {
    $match = $matches[1];
    $tail = null;

    // Peel sentence punctuation off the end of the match; it is re-emitted
    // after the link rather than as part of it.
    $trailing = null;
    if (preg_match('/[;,.:!?]+$/', $match, $trailing)) {
      $tail = $trailing[0];
      $match = substr($match, 0, -strlen($tail));
    }

    // If there's a closing paren at the end but no balancing open paren in
    // the URL, don't link the close paren. This is an attempt to gracefully
    // handle the two common paren cases, Wikipedia links and English language
    // parentheticals, e.g.:
    //
    //  http://en.wikipedia.org/wiki/Noun_(disambiguation)
    //  (see also http://www.example.com)
    //
    // We could apply a craftier heuristic here which tries to actually balance
    // the parens, but this is probably sufficient.
    $ends_with_close = (substr($match, -1) === ')');
    if ($ends_with_close && strpos($match, '(') === false) {
      $tail = ')'.$tail;
      $match = substr($match, 0, -1);
    }

    // Reuse the common protocol check; it only reads index 1 of the array.
    return hsprintf(
      '%s%s',
      $this->markupHyperlink(array(null, $match)),
      $tail);
  }

}
Event Timeline
Log In to Comment