| Línea 1... |
Línea 1... |
| 1 |
<?php
|
1 |
<?php
|
| 2 |
|
- |
|
| 3 |
// This file is part of Moodle - http://moodle.org/
|
2 |
// This file is part of Moodle - http://moodle.org/
|
| 4 |
//
|
3 |
//
|
| 5 |
// Moodle is free software: you can redistribute it and/or modify
|
4 |
// Moodle is free software: you can redistribute it and/or modify
|
| 6 |
// it under the terms of the GNU General Public License as published by
|
5 |
// it under the terms of the GNU General Public License as published by
|
| 7 |
// the Free Software Foundation, either version 3 of the License, or
|
6 |
// the Free Software Foundation, either version 3 of the License, or
|
| Línea 14... |
Línea 13... |
| 14 |
//
|
13 |
//
|
| 15 |
// You should have received a copy of the GNU General Public License
|
14 |
// You should have received a copy of the GNU General Public License
|
| 16 |
// along with Moodle. If not, see <http://www.gnu.org/licenses/>.
|
15 |
// along with Moodle. If not, see <http://www.gnu.org/licenses/>.
|
| Línea 17... |
Línea 16... |
| 17 |
|
16 |
|
| 18 |
/**
|
17 |
/**
|
| 19 |
* Filter converting URLs in the text to HTML links
|
18 |
* File only retained to prevent fatal errors in code that tries to require/include this.
|
| - |
|
19 |
*
|
| 20 |
*
|
20 |
* @todo MDL-82708 delete this file as part of Moodle 6.0 development.
|
| 21 |
* @package filter
|
21 |
* @deprecated This file is no longer required in Moodle 4.5+.
|
| 22 |
* @subpackage urltolink
|
22 |
* @package filter_urltolink
|
| 23 |
* @copyright 2010 David Mudrak <david@moodle.com>
|
23 |
* @copyright David Mudrak <david@moodle.com>
|
| 24 |
* @license http://www.gnu.org/copyleft/gpl.html GNU GPL v3 or later
|
24 |
* @license http://www.gnu.org/copyleft/gpl.html GNU GPL v3 or later
|
| 25 |
*/
|
- |
|
| 26 |
|
25 |
*/
|
| Línea 27... |
Línea -... |
| 27 |
// Stop execution immediately unless the MOODLE_INTERNAL constant has been defined.
defined('MOODLE_INTERNAL') || die();
|
- |
|
| 28 |
|
- |
|
| 29 |
class filter_urltolink extends moodle_text_filter {

    /**
     * @var array global configuration for this filter
     *
     * This might eventually be moved into the parent class if it turns out
     * to be useful for other filters, too.
     */
    protected static $globalconfig;

    /**
     * Apply the filter to the text.
     *
     * The text is returned untouched when no 'originalformat' option is given, or when
     * that format is not listed in the 'formats' setting of filter_urltolink.
     *
     * @see filter_manager::apply_filter_chain()
     * @param string $text to be processed by the filter
     * @param array $options filter options
     * @return string text after processing
     */
    public function filter($text, array $options = array()) {
        if (!isset($options['originalformat'])) {
            // If the format is not specified, we are probably called by {@see format_string()}.
            // In that case, it would be dangerous to replace the URL with a link because it
            // could be stripped. Therefore, we do nothing.
            return $text;
        }

        // NOTE(review): the comparison is deliberately left loose. The configured formats are
        // strings produced by explode(), while the format is presumably passed as an integer
        // constant - confirm before switching to a strict in_array().
        $enabledformats = explode(',', get_config('filter_urltolink', 'formats'));
        if (in_array($options['originalformat'], $enabledformats)) {
            $this->convert_urls_into_links($text);
        }

        return $text;
    }

    // Internal implementation starts here.

    /**
     * Given some text this function converts any URLs it finds into HTML links.
     *
     * Content of existing <a> elements and of <span class="nolink"> elements is set aside
     * first and restored afterwards, so it is never modified. When the 'embedimages'
     * setting is enabled, links generated here that point to jpg/png/gif files are passed
     * to filter_urltolink_img_callback().
     *
     * @param string $text Passed in by reference. The string to be searched for urls.
     */
    protected function convert_urls_into_links(&$text) {
        // Tags whose content must be ignored. See MDL-21168 for more info. A better way to
        // ignore tags whether or not they are escaped partially or completely would be
        // desirable, e.g. an <a href="blah"> tag whose angle brackets and/or quotes are
        // entity-encoded.
        $filterignoretagsopen = array('<a\s[^>]+?>', '<span[^>]+?class="nolink"[^>]*?>');
        $filterignoretagsclose = array('</a>', '</span>');
        $ignoretags = [];
        filter_save_ignore_tags($text, $filterignoretagsopen, $filterignoretagsclose, $ignoretags);

        // Check if we support unicode modifiers in regular expressions. Cache it.
        // Original RFC regex from: http://www.bytemycode.com/snippets/snippet/796/
        // Various ideas from: http://alanstorm.com/url_regex_explained
        // Unicode check, negative assertion and other bits from Moodle.
        static $unicoderegexp;
        if (!isset($unicoderegexp)) {
            // This will fail silently, returning false, when the pattern cannot be compiled
            // (the warning is suppressed on purpose).
            $unicoderegexp = @preg_match('/\pL/u', 'a');
        }

        // TODO MDL-21296 - use of unicode modifiers may cause a timeout.
        // Capture groups: 1 = "s" of https (or empty), 2 = "www." (or empty).
        $urlstart = '(?:http(s)?://|(?<!://)(www\.))';
        $domainsegment = '(?:[\pLl0-9][\pLl0-9-]*[\pLl0-9]|[\pLl0-9])';
        $numericip = '(?:(?:[0-9]{1,3}\.){3}[0-9]{1,3})';
        $port = '(?::\d*)';
        $pathchar = '(?:[\pL0-9\.!$&\'\(\)*+,;=_~:@-]|%[a-f0-9]{2})';
        $path = "(?:/$pathchar*)*";
        $querystring = '(?:\?(?:[\pL0-9\.!$&\'\(\)*+,;=_~:@/?-]|%[a-fA-F0-9]{2})*)';
        $fragment = '(?:\#(?:[\pL0-9\.!$&\'\(\)*+,;=_~:@/?-]|%[a-fA-F0-9]{2})*)';

        // Trailing look-behind: the matched URL must not end with one of ] ) , . ;
        // so that punctuation following a URL does not become part of the link.
        $lookbehindend = "(?<![]),.;])";

        // Capture groups: 3 = host (domain name or numeric IP), 4 = port, path, query and fragment.
        $regex = "$urlstart((?:$domainsegment\.)+$domainsegment|$numericip)" .
                "($port?$path$querystring?$fragment?)$lookbehindend";
        if ($unicoderegexp) {
            $regex = '#' . $regex . '#ui';
        } else {
            // No unicode support: downgrade the unicode letter properties to plain a-z.
            // This is a literal substitution, so str_replace() is used; preg_replace() would
            // reject these needles as patterns (no delimiters) and return null. The longer
            // needle goes first so that '\pLl' is not left behind as 'a-zl'.
            $regex = '#' . str_replace(array('\pLl', '\pL'), 'a-z', $regex) . '#i';
        }

        // Locate any HTML tags.
        $matches = preg_split('/(<[^<|>]*>)/i', $text, -1, PREG_SPLIT_NO_EMPTY | PREG_SPLIT_DELIM_CAPTURE);

        // Iterate through the tokenized text to handle chunks (html and content).
        foreach ($matches as $idx => $chunk) {
            // Nothing to do. We skip completely any html chunk.
            if (strpos(trim($chunk), '<') === 0) {
                continue;
            }

            // Nothing to do. We skip any content chunk having any of these attributes.
            if (preg_match('#(background=")|(action=")|(style="background)|(href=")|(src=")|(url [(])#', $chunk)) {
                continue;
            }

            // Arrived here, we want to process every word in this chunk.
            $words = explode(' ', $chunk);

            foreach ($words as $idx2 => $word) {
                // ReDoS protection. Do not process a word that is too large.
                if (strlen($word) >= 4096) {
                    continue;
                }

                $linked = preg_replace($regex, '<a href="http$1://$2$3$4" class="_blanktarget">$0</a>', $word);

                // On a PCRE error (e.g. invalid UTF-8 with the "u" modifier) preg_replace()
                // returns null. Keep the original word instead of silently dropping it.
                if ($linked !== null) {
                    $words[$idx2] = $linked;
                }
            }

            // Copy the result back to the array.
            $matches[$idx] = implode(' ', $words);
        }

        $text = implode('', $matches);

        if (!empty($ignoretags)) {
            // Reversed so "progressive" str_replace() will solve some nesting problems.
            $ignoretags = array_reverse($ignoretags);
            $text = str_replace(array_keys($ignoretags), $ignoretags, $text);
        }

        if (get_config('filter_urltolink', 'embedimages')) {
            // Now try to inject the images, this code was originally in the mediaplugin filter.
            // This may be useful only if somebody relies on the fact that URLs in FORMAT_MOODLE
            // text get converted to links which in turn change to real images.
            $search = '/<a href="([^"]+\.(jpg|png|gif))" class="_blanktarget">([^>]*)<\/a>/is';
            $text = preg_replace_callback($search, 'filter_urltolink_img_callback', $text);
        }
    }
}
|
- |
|
| 161 |
|
- |
|
| 162 |
|
- |
|
| 163 |
/**
|
- |
|
| 164 |
* Change links to images into embedded images.
|
- |
|
| 165 |
*
|
- |
|
| 166 |
* This plugin is intended for automatic conversion of image URLs when FORMAT_MOODLE used.
|
- |
|
| 167 |
*
|
- |
|
| 168 |
* @param $link
|
- |
|
| 169 |
* @return string
|
- |
|
| 170 |
*/
|
- |
|
| 171 |
function filter_urltolink_img_callback($link) {
|
26 |
defined('MOODLE_INTERNAL') || die();
|
| 172 |
if ($link[1] !== $link[3]) {
|
- |
|
| 173 |
// this is not a link created by this filter, because the url does not match the text
|
- |
|
| 174 |
return $link[0];
|
- |
|
| 175 |
}
|
- |
|