-3

我正在使用简单的 html dom 将数据从站点抓取到我的数据库中并显示在我的网页上。但是每次我运行文件时,重复的数据也会插入到数据库中。我怎样才能继续检查数据库中是否已经存在数据?这是我的抓取文件:

 <?php

 $con=mysqli_connect("localhost","root","","crawling");\

 mysql_connect("localhost", "root", "")or die("cannot connect"); 
 mysql_select_db("crawling")or die("cannot select DB");


 include "domcrawl.php";
 $url="http://www.bgr.in/category/reviews/";
 $html=file_get_html($url);
 //$arr=$html->find('table[class=findList] tbody tr td[class=result_text]');
 $m=$html->find('img');

 $b=$html->find('a');

 $c=$html->find('p');  

 $imghead = $b[21]->innertext;

 $img = $m[3];

 $imgtext = $c[0];


 $sql = sprintf("INSERT INTO image1
 ( head, image, text, name)
 VALUES
 ( '%s', '%s', '%s', '%s')",

 mysql_real_escape_string($imghead),
 mysql_real_escape_string($img),
 mysql_real_escape_string($imgtext),
mysql_real_escape_string("gm")
);
 mysql_query($sql);





 $sql = "SELECT head FROM image1 WHERE name='gm'";
 $sql1 = "SELECT image FROM image1 WHERE name='gm'";
 $sql2 = "SELECT text FROM image1 WHERE name='gm'";
 $result = mysql_query("$sql");
 $result1 = mysql_query("$sql1");
 $result2 = mysql_query("$sql2");

  $head_get= mysql_result($result, 0);
 $img_get= mysql_result($result1, 0);
 $text_get= mysql_result($result2, 0);
 echo "<br><br>";

 echo $head_get;
 echo "<br><br>";
 echo $img_get;
 echo $text_get;


  ?>
4

2 回答 2

1

在获取对象属性之前必须检查,在您的情况下,它正在查找空对象

$link = $node->getElementsByTagName('link')->item(0);
if(!empty($link)){
 $nodeValue = $link->nodeValue,
}

'link' => $nodeValue;

同样为所有人做

于 2013-09-29T18:49:27.510 回答
0

假设'date' => $node->getElementsByTagName('pubDate')->item(0)->nodeValue是第 11 行,似乎没有带有 tag 的元素pubDate,这就是$node->getElementsByTagName('pubDate')->item(0)返回nullor的原因false

于 2013-09-29T18:46:40.517 回答