2007-07-09 21:12:16 +00:00
|
|
|
<?php
|
|
|
|
/**
|
|
|
|
* Global Search Engine for Moodle
|
2008-03-31 22:22:20 +00:00
|
|
|
*
|
|
|
|
* @package search
|
|
|
|
* @category core
|
|
|
|
* @subpackage document_wrappers
|
|
|
|
* @author Valery Fremaux [valery.fremaux@club-internet.fr] > 1.8
|
|
|
|
* @date 2008/03/31
|
|
|
|
* @license http://www.gnu.org/copyleft/gpl.html GNU Public License
|
2007-07-09 21:12:16 +00:00
|
|
|
*
|
|
|
|
* this is a format handler for getting text out of an XML file (by stripping its tags)
|
|
|
|
* so it can be indexed by Lucene search engine
|
|
|
|
*/
|
|
|
|
|
2008-03-31 22:22:20 +00:00
|
|
|
/**
* Extracts the text content of an XML file so that it can be indexed.
*
* The file is read from below $CFG->dataroot, every XML tag ("<...>") is
* replaced by a single space and, when $CFG->block_search_limit_index_body
* is set, the result is passed through shorten() with that limit.
*
* @param object $resource resource record; its course and reference fields
*        locate the file below $CFG->dataroot when $directfile is empty
* @param string $directfile optional path, relative to $CFG->dataroot, that
*        is read instead of the file designated by $resource
* @uses $CFG
* @return string|null the extracted text, an empty string when the file is
*         missing or cannot be read, or null when the current user does not
*         hold the moodle/site:doanything capability
*/
function get_text_for_indexing_xml(&$resource, $directfile = ''){
    global $CFG;

    // SECURITY : do not allow non admin execute anything on system !!
    if (!has_capability('moodle/site:doanything', get_context_instance(CONTEXT_SYSTEM))) return;

    // work out which file to read; the loose comparison is kept on purpose
    // so that callers passing null still fall back to the resource's file
    if ($directfile == ''){
        $path = "{$CFG->dataroot}/{$resource->course}/{$resource->reference}";
    } else {
        $path = "{$CFG->dataroot}/{$directfile}";
    }

    // a missing or unreadable file yields no indexable text; checking first
    // avoids feeding a false read result into the string functions below
    if (!is_file($path) || !is_readable($path)){
        return '';
    }

    // just get text
    $text = file_get_contents($path);
    if ($text === false){
        return '';
    }

    // filter out all xml tags
    $text = preg_replace("/<[^>]*>/", ' ', $text);

    if (!empty($CFG->block_search_limit_index_body)){
        $text = shorten($text, $CFG->block_search_limit_index_body);
    }
    return $text;
}
|
|
|
|
?>
|