这是个采集程序。每个标题不一定在同一行的,我想截取下面红色部分,再放到一个数组里。
$arr1 = array('
<div class="title">
<a href="123.php">标题一</a>
</div>
<div class="title">
<a href="456.php">标题二</a>
</div>
');preg_match_all('/<div class="title">(.*)<\/div>/iU', $arr1[1], $arr1);print_r($arr1[1]); //输出是空的我不是专业程序员,请高人们指点指点。急啊!!!
$arr1 = array('
<div class="title">
<a href="123.php">标题一</a>
</div>
<div class="title">
<a href="456.php">标题二</a>
</div>
');preg_match_all('/<div class="title">(.*)<\/div>/iU', $arr1[1], $arr1);print_r($arr1[1]); //输出是空的我不是专业程序员,请高人们指点指点。急啊!!!
<div class="title">
<a href="123.php">标题一</a>
</div>
<div class="title">
<a href="456.php">标题二</a>
</div>
');
preg_match_all('/<div class\="title">[\r\n]+(.*?)[\r\n]+<\/div>/', $arr[0], $arr1);
print_r($arr1[1]);
preg_match_all('/<div class\="title">[\r\n\s]*(.*?)[\r\n\s]*<\/div>/iU', $arr[0], $arr1);
<div class="cf">
<a id="hover"
href="thread?tid=16n8n9" class="title">title1</a>
</div>谁能帮解决一下,加我QQ125405677
<div class="title">
<a href="123.php">标题一</a>
</div>
<div class="title">
<a href="456.php">标题二</a>
</div>
');preg_match_all('/a .+a>/isU', $arr1[0], $r);print_r($r);Array
(
[0] => Array
(
[0] => a href="123.php">标题一</a>
[1] => a href="456.php">标题二</a>
))
<meta http-equiv="Content-Type" content="text/html;charset=utf-8">
<div class="cf">
<a id="hover"
href="thread?tid=16n8n9" class="title">title1</a>
</div>
<div class="title">
<a href="123.php">标题一</a>
</div>
<div class="title">
<a href="456.php">标题二</a>
</div>';
$html = new DOMDocument();
$html-> loadHTML($str);$nodes = $html->getElementsByTagName('a');$arr = Array();
foreach($nodes as $n) $arr[] = Array('href'=> $n->getAttribute('href'), 'title' => $n->nodeValue);echo '<pre>';
print_r($arr);Array
(
[0] => Array
(
[href] => thread?tid=16n8n9
[title] => title1
) [1] => Array
(
[href] => 123.php
[title] => 标题一
) [2] => Array
(
[href] => 456.php
[title] => 标题二
))