diff options
Diffstat (limited to 'ext/tidy/examples/urlgrab5.php')
-rw-r--r-- | ext/tidy/examples/urlgrab5.php | 39 |
1 files changed, 0 insertions, 39 deletions
<?php
/*
 * urlgrab5.php
 *
 * A simple command-line utility to extract all of the URLs contained
 * within <A HREF> tags from a document.
 *
 * NOTE: Only works with tidy for PHP 5, please see urlgrab.php for tidy for PHP 4.3.x
 *
 * By: John Coggeshall <john@php.net>
 *
 * Usage: php urlgrab5.php <file>
 *
 */

/**
 * Recursively collect the href value of every <a> element at or below $node.
 *
 * @param tidyNode   $node Node at which the depth-first walk starts.
 * @param array|null $urls Accumulator, passed by reference. Any non-array
 *                         value (including the default NULL) is replaced by
 *                         an empty array; hrefs found are appended to it, so
 *                         a caller-supplied variable also receives the result.
 *
 * @return array The hrefs gathered so far, in document order.
 */
function dump_nodes(tidyNode $node, &$urls = NULL) {

    if (!is_array($urls)) {
        $urls = array();
    }

    // Only anchors that actually carry an href contribute a URL. Anchors
    // such as <a name="top"> have no href entry (or no attribute array at
    // all), and reading it blindly would raise a notice and append NULL.
    if (isset($node->id)
        && $node->id === TIDY_TAG_A
        && isset($node->attribute['href'])) {
        $urls[] = $node->attribute['href'];
    }

    if ($node->hasChildren()) {
        foreach ($node->child as $c) {
            // $urls is shared by reference, so the recursive call appends
            // straight into the same list; its return value is not needed.
            dump_nodes($c, $urls);
        }
    }

    return $urls;
}

// ---- command-line driver -------------------------------------------------

// Without a file argument there is nothing to parse; say so instead of
// handing NULL to tidy.
if (!isset($_SERVER['argv'][1])) {
    fwrite(STDERR, "Usage: php urlgrab5.php <file>\n");
    exit(1);
}

$a = tidy_parse_file($_SERVER['argv'][1]);

// tidy_parse_file() yields a non-object on failure; calling a method on that
// would be a fatal error.
if (!is_object($a)) {
    fwrite(STDERR, "urlgrab5.php: unable to parse '" . $_SERVER['argv'][1] . "'\n");
    exit(1);
}

$a->cleanRepair();

// html() is only handed to dump_nodes() when it really is a node, because
// the tidyNode type hint rejects anything else.
$html = $a->html();
print_r(($html instanceof tidyNode) ? dump_nodes($html) : array());