几种获取 HTML 字符串中所有 a 链接地址的代码
// Sample HTML fragment containing one single-quoted and one double-quoted href.
// The inner double quotes are escaped so the literal no longer terminates early.
$ss = "<a href='1.gif'>d</a>adfxx<a href=\"dir.html\">dir</a>";
// Dump the list of href values that gethref() extracts from the sample.
print_r(gethref($ss));
/**
 * Collect the href value of every <a> tag found in an HTML string.
 *
 * Handles double-quoted, single-quoted and unquoted attribute values, and
 * tolerates other attributes or line breaks before the href attribute.
 *
 * @param string $temp HTML fragment to scan.
 *
 * @return array List of href values in document order; empty when there are
 *               no links or the regular expression engine reports an error.
 */
function gethref($temp)
{
    // "~" is the delimiter so "/" needs no escaping inside the pattern.
    // "<a\s" requires whitespace after the tag name, so <abbr>, <area> etc. are
    // not mistaken for anchors. The branch-reset group (?|...) makes all three
    // quoting styles land in capture group 1.
    $pattern = '~<a\s(?:[^>]*?\s)?href\s*=\s*(?|"([^"]*)"|\'([^\']*)\'|([^\s"\'>]+))~i';

    // preg_match_all() returns 0 for "no match" and false on error; both yield an empty list.
    if (!preg_match_all($pattern, (string) $temp, $a)) {
        return [];
    }

    return $a[1];
}
// Strip every <a> element from $ss, keeping only its inner text
// (presumably the intent of this snippet — the original note is garbled).
// The opening tag and its attributes are matched outside the capture group,
// so no residue such as " href='1.gif'>" is left in the result.
$htm = preg_replace('@<a\b[^>]*>(.*?)</a>@is', '$1', $ss);
print_r($htm);
// More complete extraction: download a page and print, for every link, the
// attributes before href, the href attribute itself, the link text and the
// closing tag name, separated by "||".
$url = "http://www.phprm.com";
// The second parameter of file_get_contents() is the boolean $use_include_path,
// not an fopen()-style mode, so the stray "r" argument is dropped.
$html = file_get_contents($url);
if ($html === false) {
    // The download failed (a warning has already been raised); there is nothing to scan.
    echo "Unable to fetch " . htmlspecialchars($url, ENT_QUOTES | ENT_SUBSTITUTE, 'UTF-8') . "<br>";
} else {
    // Capture groups keep their original numbering (2, 3, 4, 6, 8 are printed).
    // Group 2 is now confined to a single tag instead of the greedy "(.*)", so
    // several links on one line are reported separately.
    preg_match_all('/(<a)(\s(?:[^>]*?\s)?)(href=)([^>]*)(>)([^<]*)(<)([^>]*)(>)/i', $html, $matches);
    foreach (array_keys($matches[0]) as $i) {
        $line = "|||" . $matches[2][$i] . "||" . $matches[3][$i] . $matches[4][$i]
            . "||" . $matches[6][$i] . "||" . $matches[8][$i];
        // The fragments come from a remote page: escape them before echoing into HTML.
        // NOTE(review): assumes the page is UTF-8; convert other encodings first.
        echo htmlspecialchars($line, ENT_QUOTES | ENT_SUBSTITUTE, 'UTF-8') . "<br>";
    }
}
// Extract every double-quoted href value from the article string $str; the
// matched addresses end up in $fstr[0].
// NOTE(review): $str is not defined in the visible code — it must be set before this line.
// "~" is used as the delimiter because the original "/" inside the character
// class ended the pattern early. The value is read up to the closing quote so
// URLs containing "-", "?", "=" or "%" are not truncated.
preg_match_all('~(?<=href=")[^"]*~', $str, $fstr);
// Tutorial link: http://www.phprm.com/develop/fs4328.html
随意转载~但请保留教程地址★