diff options
author | Cash Costello <cash.costello@gmail.com> | 2013-04-20 09:10:50 -0700 |
---|---|---|
committer | Cash Costello <cash.costello@gmail.com> | 2013-04-20 09:10:50 -0700 |
commit | 392a3c7c94bfbe4d462d0cac1e89d6d87c4c06e4 (patch) | |
tree | bfd9741ec9c161dd987d3df91b055d3316a313bf /engine/lib | |
parent | 39886afeec37309963be57551699c7bfc3f6c37b (diff) | |
parent | 164ff10b46d5917c7ab6ad068abf10e492464691 (diff) | |
download | elgg-392a3c7c94bfbe4d462d0cac1e89d6d87c4c06e4.tar.gz elgg-392a3c7c94bfbe4d462d0cac1e89d6d87c4c06e4.tar.bz2 |
Merge pull request #5385 from cash/parse_urls
Fixes #5369 allows ! in urls and adds unit tests
Diffstat (limited to 'engine/lib')
-rw-r--r-- | engine/lib/output.php | 25 |
1 files changed, 15 insertions, 10 deletions
diff --git a/engine/lib/output.php b/engine/lib/output.php index c5a04989b..6905b9b71 100644 --- a/engine/lib/output.php +++ b/engine/lib/output.php @@ -13,28 +13,33 @@ * @param string $text The input string * * @return string The output string with formatted links - **/ + */ function parse_urls($text) { + + // URI specification: http://www.ietf.org/rfc/rfc3986.txt + // This varies from the specification in the following ways: + // * Supports non-ascii characters + // * Does not allow parentheses and single quotes + // * Cuts off commas, exclamation points, and periods off as last character + // @todo this causes problems with <attr = "val"> // must be in <attr="val"> format (no space). // By default htmlawed rewrites tags to this format. // if PHP supported conditional negative lookbehinds we could use this: // $r = preg_replace_callback('/(?<!=)(?<![ ])?(?<!["\'])((ht|f)tps?:\/\/[^\s\r\n\t<>"\'\!\(\),]+)/i', - // - // we can put , in the list of excluded char but need to keep . because of domain names. - // it is removed in the callback. - $r = preg_replace_callback('/(?<!=)(?<!["\'])((ht|f)tps?:\/\/[^\s\r\n\t<>"\'\!\(\),]+)/i', + $r = preg_replace_callback('/(?<!=)(?<!["\'])((ht|f)tps?:\/\/[^\s\r\n\t<>"\'\(\)]+)/i', create_function( '$matches', ' $url = $matches[1]; - $period = \'\'; - if (substr($url, -1, 1) == \'.\') { - $period = \'.\'; - $url = trim($url, \'.\'); + $punc = \'\'; + $last = substr($url, -1, 1); + if (in_array($last, array(".", "!", ","))) { + $punc = $last; + $url = rtrim($url, ".!,"); } $urltext = str_replace("/", "/<wbr />", $url); - return "<a href=\"$url\">$urltext</a>$period"; + return "<a href=\"$url\" rel=\"nofollow\">$urltext</a>$punc"; ' ), $text); |