抓取豆瓣电影TOP250的PHP代码
时间:2021-07-01 10:21:17
帮助过:22人阅读
// Request the listing in steps of 25 (start = 0, 25, ..., 225) and print
// every title that parsePage() extracts from each page.
for ($start = 0; $start < 250; $start += 25) {
    $url = "http://movie.douban.com/top250?start=$start&filter=&type=";
    $titles = parsePage($url);

    if ($titles !== false) {
        // Page parsed: hand each title to the numbering printer.
        foreach ($titles as $title) {
            printTitle($title);
        }
        continue;
    }

    // parsePage() reported a failure: print the URL that could not be processed.
    echo $url, "\n";
}
-
-
/**
 * Read one listing page and return the movie titles found in it.
 *
 * Each title is converted from UTF-8 to GBK before it is returned
 * (presumably so it displays correctly on a GBK console -- confirm).
 *
 * @param string $url     Address (or local path) readable by file_get_contents().
 * @param string $pattern PCRE pattern whose first capture group is the title text.
 *                        NOTE(review): the snippet as published used '/([^<]+)/s',
 *                        which captures every run of text outside "<" instead of
 *                        just titles; its tag anchors appear to have been stripped
 *                        when the code was posted. The default assumes titles are
 *                        wrapped in <span class="title">...</span> -- confirm
 *                        against the live page markup.
 *
 * @return array|false List of titles (possibly empty), or false when the page
 *                     cannot be read or the pattern fails to execute.
 */
function parsePage($url, $pattern = '/<span class="title">([^<]+)<\/span>/s') {
    $html = file_get_contents($url);
    if ($html === false) {
        return false;
    }

    if (preg_match_all($pattern, $html, $matches) === false) {
        return false;
    }

    // A caller-supplied pattern without a capture group yields no group 1.
    $captured = isset($matches[1]) ? $matches[1] : array();

    $titles = array();
    foreach ($captured as $item) {
        $converted = iconv('utf-8', 'gbk', $item);
        // iconv() returns false for text GBK cannot represent; keep the
        // unconverted string rather than pushing false into the result list.
        $titles[] = ($converted === false) ? $item : $converted;
    }
    return $titles;
}
-
-
// Running tally of printed titles, shared with printTitle() through `global`.
// NOTE(review): this assignment sits after the paging loop in the file, so it
// executes only once that loop has finished; during the loop printTitle()
// starts from the unset (null) global, which still increments to 1.
$count = 0;

/**
 * Print one title on its own line, prefixed with its running number.
 *
 * The number is right-aligned in a three-character column and is stored in
 * the global $count, which is incremented on every call.
 *
 * @param string $title Title text to print.
 */
function printTitle($title) {
    global $count;
    $count++;
    echo sprintf("%3d %s\n", $count, $title);
}
|
PHP