1

我写了一个页面,它将扫描一个站点,然后从源代码中提取某些代码。该部分工作成功,但是我想在多个页面上运行它并将详细信息转储到数据库中。我正在努力让循环正常工作,这就是我目前拥有的:

// Scrapes today's meeting index on $host for race-page links, extracts runner
// numbers, ratings and location details from a fetched race page, and inserts
// the result into the `ratings` table.
date_default_timezone_set("australia/sydney");

$host = 'http://www.tabonline.com.au/';
// NOTE(review): d, m and Y are written unquoted here, i.e. as constants rather
// than the format strings 'd', 'm' and 'Y'.
$day = date(d);
$month = date(m);
$year = date(Y);
$slash = '/';
$mtgraces = '/mtgraces.html';

//Gallops Meetings on Todays racing page
// Fetch <host><Y>/<m>/<d>/mtgraces.html and turn every captured href into an
// absolute URL under the same dated directory.
$content = file_get_contents($host . $year . "/". $month . "/" . $day . $mtgraces);
preg_match_all('#<a[^<>]+href\s*=\s*[\'"](.R[0-9]+.html*)[\'"]#i', $content, $matches);
foreach ($matches[1] as $url) $links[] =  "$host$year$slash$month$slash$day$slash$url";

//get the runners from each page

// NOTE(review): this for has no braces, so only the single statement that
// follows it is the loop body; everything from the first preg_match_all()
// onwards runs once, after the loop has finished.
for($c=0; $c<count($links); $c++)

// NOTE(review): the index used here is $i while the loop counter is $c; $i is
// not assigned anywhere before this line in the snippet.
$racepage = file_get_contents($links[$i]);
preg_match_all('#<td align="right" height="18"><font color="\#ffffff">[0-9]{1,2}</font></td>#', $racepage, $number);
preg_match_all('#<font color="\#00ffff">[0-9]{1,3}</font>#', $racepage, $rating);
preg_match_all('#<B>[\w]+([\s][A-Z]+)?</B>#', $racepage, $location);
preg_match_all('#<B>[\w]+\s[0-9]+</B>#', $racepage, $locationcode);

//strip tags for storage in DB
// Each group below joins the full matches with commas, strips the markup from
// the joined string, then splits it back into a list.

$number_data = implode(",", $number[0]);
$dbnumber = strip_tags($number_data);
$final_number = explode(",", $dbnumber);

$rating_data = implode(",", $rating[0]);
$dbrating = strip_tags($rating_data);
$final_rating = explode(",", $dbrating);

$location_data = implode(",", $location[0]);
$dblocation = strip_tags($location_data);
$final_location = explode(",", $dblocation);

$locationcode_data = implode(",", $locationcode[0]);
$dblocationcode = strip_tags($locationcode_data);
$final_locationcode = explode(",", $dblocationcode);

//Insert into database
// One value tuple per entry in $final_number; every tuple reuses the first
// location and the first location code.

 $data = array(); 
for($i=0; $i<count($final_number); $i++)
{
    $data[] = "('" . $final_location[0] . "', '" . $final_locationcode[0] . "', '" . $final_number[$i] . "', '" . $final_rating[$i] . "')";
}

// NOTE(review): $queries is not assigned anywhere in this snippet and the
// branch body is empty; $data looks like the intended variable - confirm.
if(count($queries) == 0)
{
    # Nothing passed
    # exit
}


// Single multi-row INSERT built from the tuples collected above.
$query = "insert into ratings(location, location_code, tab_no, rating) values " . implode(", ", $data); 


$hostname = "%hostname%";   // eg. mysql.yourdomain.com (unique)
$username = "%username%";   // the username specified when setting-up the database
$password = "%password";   // the password specified when setting-up the database
$database = "%database";   // the database name chosen when setting-up the database (unique)
mysql_connect($hostname,$username,$password);
mysql_select_db($database) or die("Unable to select database");

mysql_query($query) OR die(mysql_error())

目前,此输出为我提供了站点列表($links变量)中最后一页的正确内容。最终,我希望它遍历整个$links变量,然后使用该$query变量将该数据导入数据库,以便我可以对其进行进一步分析。

希望我表达清楚了,也希望您能看出我哪里做错了。

4

3 回答 3

1

嗯……这里有几个问题……

for($c=0; $c<count($links); $c++)

这个循环正在执行下一行:

$racepage = file_get_contents($links[$i]);

但是,$i 没有定义,我怀疑你想要 $c。此外,您需要在各个部分周围放置一些大括号......现在,这是未经测试的,但我认为您想要类似的东西:

// Scrapes today's meeting index for race-page links, extracts every runner's
// number and rating (plus the page's location and location code) from each
// race page, and stores all runners with a single multi-row INSERT.
date_default_timezone_set("australia/sydney");


$host = 'http://www.tabonline.com.au/';
// Today's pages live under <host>/<YYYY>/<MM>/<DD>/. The date() format has to
// be a quoted string; bare d / m / Y are constants, not format strings.
$base = $host . date('Y/m/d') . '/';


//Gallops Meetings on Todays racing page
$links = array();   // initialised so the loop below is safe when nothing matches
$content = file_get_contents($base . 'mtgraces.html');
if ($content !== false)
{
  preg_match_all('#<a[^<>]+href\s*=\s*[\'"](.R[0-9]+.html*)[\'"]#i', $content, $matches);
  foreach ($matches[1] as $url)
    $links[] = $base . $url;
}


//get the runners from each page
// $data collects one SQL value tuple per runner, across all pages.
$data = array();

foreach ($links as $link)
{
  $racepage = file_get_contents($link);
  if ($racepage === false)
    continue;   // page could not be fetched; carry on with the next link

  preg_match_all('#<td align="right" height="18"><font color="\#ffffff">[0-9]{1,2}</font></td>#', $racepage, $number);
  preg_match_all('#<font color="\#00ffff">[0-9]{1,3}</font>#', $racepage, $rating);
  preg_match_all('#<B>[\w]+([\s][A-Z]+)?</B>#', $racepage, $location);
  preg_match_all('#<B>[\w]+\s[0-9]+</B>#', $racepage, $locationcode);

  //strip tags for storage in DB
  // Index 0 of each result holds the list of full matches. Stripping each
  // match individually keeps the lists flat and leaves them empty (instead of
  // holding one blank entry) when a page has no matches.
  $page_numbers       = array_map('strip_tags', $number[0]);
  $page_ratings       = array_map('strip_tags', $rating[0]);
  $page_locations     = array_map('strip_tags', $location[0]);
  $page_locationcodes = array_map('strip_tags', $locationcode[0]);

  // The first <B> matches on the page are used as its location / location code.
  $page_location     = isset($page_locations[0]) ? $page_locations[0] : '';
  $page_locationcode = isset($page_locationcodes[0]) ? $page_locationcodes[0] : '';

  // Build the tuples here, while this page's location is still at hand, so
  // each runner is paired with its own page rather than with the first one.
  // The patterns above only admit \w, whitespace and digit characters, so no
  // value can contain a quote; escape the values (or switch to a prepared
  // statement) if the patterns are ever loosened.
  foreach ($page_numbers as $i => $tab_no)
  {
    $runner_rating = isset($page_ratings[$i]) ? $page_ratings[$i] : '';
    $data[] = "('" . $page_location . "', '" . $page_locationcode . "', '" . $tab_no . "', '" . $runner_rating . "')";
  }
}


//Insert into database
// Only touch the database when at least one runner was found.
if(count($data) != 0)
{
  $query = "insert into ratings(location, location_code, tab_no, rating) values " . implode(", ", $data);
  $hostname = "%hostname%";   // eg. mysql.yourdomain.com (unique)
  $username = "%username%";   // the username specified when setting-up the database
  $password = "%password";   // the password specified when setting-up the database
  $database = "%database";   // the database name chosen when setting-up the database (unique)
  // NOTE(review): the mysql_* extension was removed in PHP 7; move to mysqli or PDO when upgrading.
  mysql_connect($hostname,$username,$password) or die(mysql_error());
  mysql_select_db($database) or die("Unable to select database");
  mysql_query($query) OR die(mysql_error());
}
于 2009-09-28T01:45:22.170 回答
0

$final_number 是您从比赛页面链接中获得的东西,对吗?您在循环条件中使用了 $i<count($final_number)。我认为您应该在那里改用 $i<count($links),因为您要插入的是每个链接的一行。你可以做的是把下面这一行:

$data[] = "('" . $final_location[0] . "', '" . $final_locationcode[0] . "', '" . $final_number[$i] . "', '" . $final_rating[$i] . "')";

……移到 for($c=0; $c<count($links); $c++) 循环体的底部,这将使您的代码从该点开始看起来像这样(注意 $data=array() 在循环之前定义):

// Fetches every race page in $links (built earlier in the script), extracts
// the values for that page and queues one row per link for a single INSERT.
$data = array();
for($c=0; $c<count($links); $c++)
{
  $racepage = file_get_contents($links[$c]);
  if ($racepage === false)
    continue;   // page could not be fetched; carry on with the next link

  preg_match_all('#<td align="right" height="18"><font color="\#ffffff">[0-9]{1,2}</font></td>#', $racepage, $number);
  preg_match_all('#<font color="\#00ffff">[0-9]{1,3}</font>#', $racepage, $rating);
  preg_match_all('#<B>[\w]+([\s][A-Z]+)?</B>#', $racepage, $location);
  preg_match_all('#<B>[\w]+\s[0-9]+</B>#', $racepage, $locationcode);

  //strip tags for storage in DB
  // These are plain per-page lists, overwritten on every iteration. Appending
  // them to an outer array would make [0] below an array belonging to the
  // first page instead of a value from the current page.
  $final_number = array_map('strip_tags', $number[0]);
  $final_rating = array_map('strip_tags', $rating[0]);
  $final_location = array_map('strip_tags', $location[0]);
  $final_locationcode = array_map('strip_tags', $locationcode[0]);

  if (count($final_number) == 0)
    continue;   // nothing matched on this page, so there is no row to queue

  // One row per link, built from the first value of each kind on this page.
  // NOTE(review): a page listing several runners contributes only its first
  // number/rating here; loop over $final_number if every runner must be stored.
  $row_location = isset($final_location[0]) ? $final_location[0] : '';
  $row_locationcode = isset($final_locationcode[0]) ? $final_locationcode[0] : '';
  $row_rating = isset($final_rating[0]) ? $final_rating[0] : '';
  $data[] = "('" . $row_location . "', '" . $row_locationcode . "', '" . $final_number[0] . "', '" . $row_rating . "')";
}

// Only touch the database when at least one row was queued.
if(count($data) != 0)
{
  $query = "insert into ratings(location, location_code, tab_no, rating) values " . implode(", ", $data);
  $hostname = "%hostname%";   // eg. mysql.yourdomain.com (unique)
  $username = "%username%";   // the username specified when setting-up the database
  $password = "%password";   // the password specified when setting-up the database
  $database = "%database";   // the database name chosen when setting-up the database (unique)
  mysql_connect($hostname,$username,$password) or die(mysql_error());
  mysql_select_db($database) or die("Unable to select database");
  mysql_query($query) OR die(mysql_error());
}

我认为这段代码仍然存在一些问题。
编辑:我也注意到这一行

$number_data = implode(",", $number[0]);

$number[0] 难道不是字符串而不是数组吗?因为 $number 是匹配字符串的数组,所以 $number[0] 会是整个匹配的字符串。这同样适用于“number_data”、“rating_data”、“location_data”和“locationcode_data”,因此您可以这样写:

$number_data = strip_tags($number[0]);

然后在创建插入数据时:

$data[] = "('" . $final_location . "', '" . $final_locationcode . "', '" . $final_number . "', '" . $final_rating . "')";
于 2009-09-28T02:58:51.307 回答
0

我已经设法弄清楚了!

我需要将全部内容放在 for 循环中,所以它看起来像这样:

// Database credentials and connection: set up once, before the loop, and
// reused for every page's INSERT.
$hostname = "%HOSTNAME";   // eg. mysql.yourdomain.com (unique)
$username = "%username%";   // the username specified when setting-up the database
$password = "%password%";   // the password specified when setting-up the database
$database = "%database%";   // the database name chosen when setting-up the database (unique)
mysql_connect($hostname,$username,$password) or die(mysql_error());
mysql_select_db($database) or die("Unable to select database");

// Fetch each race page in $links (built earlier in the script), extract its
// runners and insert them; one multi-row INSERT per page.
for($c=0; $c<count($links); $c++)
{
    $racepage = file_get_contents($links[$c]);
    if ($racepage === false) {
        continue;   // page could not be fetched; carry on with the next link
    }

    preg_match_all('#<td align="right" height="18"><font color="\#ffffff">[0-9]{1,2}</font></td>#', $racepage, $number);
    preg_match_all('#<font color="\#00ffff">[0-9]{1,3}</font>#', $racepage, $rating);
    preg_match_all('#<B>[\w]+([\s][A-Z]+)?</B>#', $racepage, $location);
    preg_match_all('#<B>[\w]+\s[0-9]+</B>#', $racepage, $locationcode);

    //strip tags for storage in DB
    // Index 0 of each result holds the list of full matches. Stripping each
    // match individually leaves the list empty (rather than holding a single
    // blank entry) when the page has no matches.
    $final_number = array_map('strip_tags', $number[0]);
    $final_rating = array_map('strip_tags', $rating[0]);
    $final_location = array_map('strip_tags', $location[0]);
    $final_locationcode = array_map('strip_tags', $locationcode[0]);

    // The first <B> matches on the page are used as its location / location code.
    $page_location = isset($final_location[0]) ? $final_location[0] : '';
    $page_locationcode = isset($final_locationcode[0]) ? $final_locationcode[0] : '';

    //Insert into database
    // One value tuple per runner on this page. The patterns above only admit
    // \w, whitespace and digit characters, so no value can contain a quote;
    // escape the values if the patterns are ever loosened.
    $data = array();
    foreach ($final_number as $i => $tab_no)
    {
        $runner_rating = isset($final_rating[$i]) ? $final_rating[$i] : '';
        $data[] = "('" . $page_location . "', '" . $page_locationcode . "', '" . $tab_no . "', '" . $runner_rating . "')";
    }

    if (count($data) == 0) {
        continue;   // no runners on this page; an INSERT with no tuples would be invalid SQL
    }

    $query = "insert into ratings(location, location_code, tab_no, rating) values " . implode(", ", $data);

    mysql_query($query) OR die(mysql_error());
}

谢谢大家的帮助,这里似乎是一个很棒的社区。我一定会密切关注它以获取更多修复。

于 2009-09-28T05:41:50.073 回答