mirror of
				https://github.com/ezyang/htmlpurifier.git
				synced 2025-10-20 16:26:15 +02:00 
			
		
		
		
	git-svn-id: http://htmlpurifier.org/svnroot/html_purifier/trunk@30 48356398-32a2-884e-a903-53898d9a118a
		
			
				
	
	
		
			119 lines
		
	
	
		
			2.6 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
			
		
		
	
	
			119 lines
		
	
	
		
			2.6 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
| <?php
 | |
| 
 | |
| // test our parser versus HTMLSax parser
 | |
| 
 | |
| set_time_limit(5);
 | |
| 
 | |
| // PEAR
 | |
| require_once 'Benchmark/Timer.php';
 | |
| require_once 'XML/HTMLSax3.php';
 | |
| require_once 'Text/Password.php';
 | |
| 
 | |
| require_once '../MarkupFragment.php';
 | |
| require_once '../HTML_Lexer.php';
 | |
| 
 | |
/**
 * Benchmark timer that renders its profiling data as a single HTML table row.
 *
 * The row consists of the case name followed by one right-aligned cell per
 * profiling marker (other than 'Start' and 'Stop'), each showing that
 * marker's share of the total elapsed time as a percentage.
 */
class TinyTimer extends Benchmark_Timer
{

    /**
     * Label of the benchmarked case, already passed through htmlentities().
     */
    var $name;

    /**
     * Constructor (PHP 4 style: named after the class).
     *
     * @param string $name Human-readable case label; escaped before storage.
     * @param bool   $auto Forwarded unchanged to the Benchmark_Timer constructor.
     */
    function TinyTimer($name, $auto = false) {
        $this->name = htmlentities($name);
        $this->Benchmark_Timer($auto);
    }

    /**
     * Builds the table row for this timer.
     *
     * @return string A '<tr>...</tr>' fragment: the name cell followed by one
     *                percentage cell per marker.
     */
    function getOutput() {

        $total  = $this->TimeElapsed();
        $result = $this->getProfiling();

        $out = '<tr>';

        // $this->name was escaped in the constructor, so it is safe to embed.
        $out .= "<td>{$this->name}</td>";

        foreach ($result as $v) {
            // 'Start' and 'Stop' are bookkeeping markers (presumably the ones
            // recorded by start()/stop()), not measured sections.
            if ($v['name'] == 'Start' || $v['name'] == 'Stop') continue;

            // A zero total (timer resolution too coarse for a very fast run)
            // would make the division fail; report 0% for that case instead.
            $perc = ($total == 0) ? 0 : (($v['diff'] * 100) / $total);

            $out .= '<td align="right">' . number_format($perc, 2, '.', '') .
                   "%</td>";
        }

        $out .= '</tr>';

        return $out;
    }
}
 | |
| 
 | |
| ?>
 | |
| <html>
 | |
| <head>
 | |
| <title>Benchmark: HTML_Lexer versus HTMLSax</title>
 | |
| </head>
 | |
| <body>
 | |
| <h1>Benchmark: HTML_Lexer versus HTMLSax</h1>
 | |
| <table border="1">
 | |
| <tr><th>Case</th><th>HTML_Lexer</th><th>HTML_Lexer_Sax</th></tr>
 | |
| <?php
 | |
| 
 | |
| 
 | |
/**
 * Runs one document through both lexers and prints the timing row.
 *
 * A TinyTimer is started, HTML_Lexer tokenizes the document and a marker is
 * set, then HTML_Lexer_Sax does the same, after which the timer is stopped
 * and displayed.
 *
 * @param string $name     Label for the benchmark case.
 * @param string $document HTML text handed to each lexer's tokenizeHTML().
 */
function do_benchmark($name, $document) {
    $stopwatch = new TinyTimer($name);
    $stopwatch->start();

    // First contender: HTML_Lexer.
    $parser = new HTML_Lexer();
    $lexer_result = $parser->tokenizeHTML($document);
    $stopwatch->setMarker('HTML_Lexer');

    // Second contender: HTML_Lexer_Sax. The same variable is reused on
    // purpose so object lifetimes match across both timed sections.
    $parser = new HTML_Lexer_Sax();
    $sax_result = $parser->tokenizeHTML($document);
    $stopwatch->setMarker('HTML_Lexer_Sax');

    $stopwatch->stop();
    $stopwatch->display();
}
 | |
| 
 | |
// sample of html pages

$dir = 'samples/HTML_Lexer';
$dh  = opendir($dir);

// opendir() returns false (and raises its own warning) when the directory
// cannot be opened; skip the sample files rather than feed false to readdir().
if ($dh !== false) {
    while (false !== ($filename = readdir($dh))) {

        // Only benchmark files whose name ends in ".html". A suffix
        // comparison is used because strpos() finds the FIRST occurrence,
        // which wrongly rejects names such as "page.html.html".
        if (substr($filename, -5) !== '.html') continue;

        $document = file_get_contents($dir . '/' . $filename);
        // Unreadable file: nothing to benchmark.
        if ($document === false) continue;

        do_benchmark("File: $filename", $document);

    }
    closedir($dh);
}

// crashers

// Malformed fragments (unterminated attribute value, stray quote).
$snippets = array();
$snippets[] = '<a href="foo>';
$snippets[] = '<a "=>';

foreach ($snippets as $snippet) {
    do_benchmark($snippet, $snippet);
}

// random input

// $random is kept in the global scope because it is echoed after the table.
$random = Text_Password::create(80, 'unpronounceable', 'qwerty <>="\'');

do_benchmark('Random input', $random);
 | |
| 
 | |
| ?></table>
 | |
| 
 | |
| <?php
 | |
| 
 | |
// Show the random string that was benchmarked, escaped for HTML display.
echo '<div>Random input was: ',
     '<span colspan="4" style="font-family:monospace;">',
     htmlentities($random),
     '</span></div>';
 | |
| 
 | |
| ?>
 | |
| 
 | |
| 
 | |
| </body></html>
 |