2007-07-09 21:12:16 +00:00
|
|
|
<?php
|
|
|
|
/**
|
|
|
|
* Global Search Engine for Moodle
|
2008-03-31 22:22:20 +00:00
|
|
|
*
|
|
|
|
* @package search
|
|
|
|
* @category core
|
|
|
|
* @subpackage document_wrappers
|
|
|
|
* @author Valery Fremaux [valery.fremaux@club-internet.fr] > 1.8
|
|
|
|
* @date 2008/03/31
|
|
|
|
* @license http://www.gnu.org/copyleft/gpl.html GNU Public License
|
2007-07-09 21:12:16 +00:00
|
|
|
*
|
|
|
|
* this is a format handler for getting text out of a proprietary binary format
|
|
|
|
* so it can be indexed by Lucene search engine
|
|
|
|
*/
|
|
|
|
|
2008-03-31 22:22:20 +00:00
|
|
|
/**
 * MS Word extractor.
 *
 * Runs the external Word-to-text converter configured in
 * $CFG->block_search_word_to_text_cmd against the file designated by the
 * resource, captures what the converter prints on stdout and returns it
 * converted to UTF-8 so it can be handed to the indexer.
 *
 * The file is looked up at {$CFG->dataroot}/{$resource->course}/{$resource->reference}.
 * When $CFG->block_search_usemoodleroot is set, the converter command is
 * resolved relative to $CFG->dirroot.
 *
 * @param object $resource the resource record; its course and reference fields are read
 * @uses CFG, USER
 * @return string|null the extracted text, an empty string when the converter
 *                     is not configured, not found or produced no output,
 *                     or null when the current user is not an administrator
 */
function get_text_for_indexing_doc(&$resource){
    global $CFG, $USER;

    // SECURITY : do not allow non admin execute anything on system !!
    if (!isadmin($USER->id)) return;

    // nothing can be done until the search block configuration has defined the converter
    if (empty($CFG->block_search_word_to_text_cmd)){
        mtrace('Error with MSWord to text converter command : command not set up. Execute once search block configuration.');
        return '';
    }

    $moodleroot = (!empty($CFG->block_search_usemoodleroot)) ? "{$CFG->dirroot}/" : '' ;
    $converter = "{$moodleroot}{$CFG->block_search_word_to_text_cmd}";

    if (!file_exists($converter)){
        mtrace('Error with MSWord to text converter command : executable not found.');
        // return the same empty text as the other error paths instead of falling through
        return '';
    }

    // call the Word to text converter over stdout and capture the output.
    // escapeshellarg() already adds the quoting the shell needs : wrapping its
    // result in a second pair of quotes would make the quotes part of the file name.
    $file = $CFG->dataroot.'/'.$resource->course.'/'.$resource->reference;
    $text_converter_cmd = escapeshellarg($converter).' '.escapeshellarg($file);

    // optional "NAME=value" environment setting required by some converters
    if (!empty($CFG->block_search_word_to_text_env)){
        putenv($CFG->block_search_word_to_text_env);
    }

    $result = shell_exec($text_converter_cmd);

    // shell_exec() gives null (or false) on failure or when nothing was printed ;
    // test explicitly so that a document whose whole text is "0" is not rejected
    if (!is_string($result) || $result === ''){
        mtrace('Error with MSWord to text converter command : execution failed.');
        return '';
    }

    return mb_convert_encoding($result, 'UTF-8', 'auto');
}
|
|
|
|
?>
|