提取HTML标签

作者:网络 来源:佚名 更新时间:2008-02-08 13:58:46 点击:
<?php
/*********************************
*
* 作者: 徐祖宁 (唠叨)
* 邮箱: [email protected]
* 开发: 2002.07
*
*
* 函数: tags
* 功能: 从文件中提取html标签
*
* 入口:
* $filename 文件名
* $tag 标签名
* 返回:
* 数组,每项为:
* tagname string
* text string
* attrs array
*
* 示例:
* print_r(tags("test1.htm","a"));
* print_r("http://localhost/index.htm","img");
*
*/

function tags($filename,$tag) {
$buffer = join("",file($filename));
$buffer = eregi_replace(" ","",$buffer);
$tagkey = sql_regcase($tag);
$buffer = eregi_replace("<$tagkey "," <$tag ",$buffer);
$ar = split(" ",$buffer);

foreach($ar as $v) {
if(! eregi("<$tagkey ",$v)) continue;
eregi("<$tagkey ([^>]*)((.*)</$tagkey)?",$v,$regs);
$p[tagname] = strtoupper($tag);
if($regs[3])
$p[text] = $regs[3];
$s = trim(eregi_replace("[ ]+"," ",$regs[1]))." ";
$s = eregi_replace(" *= *","=",$s);

$a = split(" ",$s);
for($i=0;$i<count($a);$i++) {
$ch = array();
if(eregi("=["']",$a[$i])) {
$j = $i+1;
while(!eregi("["']$",$a[$i])) {
$a[$i] .= " ".$a[$j];
unset($a[$j]);
}
}
}
foreach($a as $k) {
$name = strtoupper(strtok($k,"="));
$value = strtok("

商业源码热门下载www.html.org.cn