几种获取 HTML 字符串中所有 a 链接地址的代码
/**
 * Collect the href value of every <a> tag found in an HTML string.
 *
 * Handles double-quoted, single-quoted and unquoted attribute values and
 * matches the tag name case-insensitively. Only the opening tag is
 * inspected, so an anchor without a closing </a> is reported as well.
 *
 * @param string $temp HTML fragment to scan.
 * @return array href values in document order; empty when nothing matches.
 */
function gethref($temp)
{
    // "\b" keeps other tags that merely start with "a" (<abbr>, <area>, ...)
    // from matching. "(?| ... )" is a branch-reset group: whichever quoting
    // style matches, the value always lands in capture group 1.
    $pattern = '~<a\b[^>]*?\shref\s*=\s*(?|"([^"]*)"|\'([^\']*)\'|([^\s>"\']+))~i';

    preg_match_all($pattern, (string) $temp, $a);

    return isset($a[1]) ? $a[1] : [];
}

// --- Snippet 1: list the href of every anchor in a sample string ---------
// The inner double quotes must be escaped; left bare they end the literal.
$ss = "<a href='1.gif'>d</a>adfxx<a href=\"dir.html\">dir</a>";
print_r(gethref($ss));

// --- Snippet 2: unwrap every anchor element ------------------------------
// Each <a ...>...</a> is replaced by whatever sits between "<a" and "</a>"
// (the attributes, the closing ">" and the link text).
$htm = preg_replace('@<a(.*?)</a>@is', '$1', $ss);
print_r($htm);

// --- Snippet 3: a more complete link extraction from a live page ---------
$url = "http://www.phprm.com";

// The second argument of file_get_contents() is the boolean
// $use_include_path, not an fopen()-style mode, so the stray "r" is dropped.
// A timeout keeps the script from hanging on an unreachable host.
$context = stream_context_create(['http' => ['timeout' => 10]]);
$html = file_get_contents($url, false, $context);

if ($html !== false) {
    preg_match_all('/(<a)(.*)(href=)([^>]*)(>)([^<]*)(<)([^>]*)(>)/', $html, $matches);

    // Hoist the count so it is not recomputed on every iteration.
    $total = isset($matches[0]) ? count($matches[0]) : 0;

    // NOTE(review): the captured fragments come from a remote page and are
    // echoed without HTML escaping - acceptable for a demo, not for
    // untrusted pages rendered in a browser.
    for ($i = 0; $i < $total; $i++) {
        echo "|||" . $matches[2][$i]
            . "||" . $matches[3][$i] . $matches[4][$i]
            . "||" . $matches[6][$i]
            . "||" . $matches[8][$i] . "<br>";
    }
}

// --- Snippet 4: extract all link addresses from an article string --------
// $str was never defined in this snippet; fall back to the sample string
// unless the including script already supplied one.
$str = isset($str) ? $str : $ss;

// The look-behind anchors the match right after href=" (double-quoted
// values only); the class then consumes word characters, ".", ":" and "/".
// "~" is used as delimiter because the class itself contains "/".
// The matched addresses end up in $fstr[0].
preg_match_all('~(?<=href=")[\w.:/]*~', $str, $fstr);
教程链接:http://www.phprm.com/develop/fs4328.html
随意转载~但请保留教程地址★