| 注册
请输入搜索内容

热门搜索

Java Linux MySQL PHP JavaScript Hibernate jQuery Nginx
jopen
9年前发布

抓取豆瓣电影TOP250的PHP代码

// Fetches the Douban movie Top 250 list page by page and prints a numbered
// list of the movie titles found on each page.

// Running counter shared with printTitle(). It is initialised before the
// crawl loop so the first increment starts from a defined value instead of
// relying on incrementing an unset global.
$count = 0;

// Walk the list by advancing the "start" offset in steps of 25 up to 250.
for ($start = 0; $start < 250; $start += 25) {
    $url = "http://movie.douban.com/top250?start=$start&filter=&type=";
    $titles = parsePage($url);
    if ($titles === false) {
        // Report the page that could not be downloaded or parsed.
        echo $url, "\n";
    } else {
        foreach ($titles as $title) {
            printTitle($title);
        }
    }
}

/**
 * Downloads one list page and returns the movie titles found on it.
 *
 * @param string $url Address of the page to fetch.
 *
 * @return array|false List of titles (GBK-encoded where conversion succeeded),
 *                     or false when the download failed or no title was found.
 */
function parsePage($url)
{
    $html = file_get_contents($url);
    if ($html === false) {
        return false;
    }

    return extractTitles($html);
}

/**
 * Extracts the title captured after each anchor from a page's HTML.
 *
 * @param string $html Raw page markup, expected to be UTF-8.
 *
 * @return array|false List of titles, or false when the pattern failed or
 *                     matched nothing.
 */
function extractTitles($html)
{
    // preg_match_all() returns false on a regex error and 0 when nothing
    // matched; both mean the page did not contain a usable title list.
    if (!preg_match_all('/<a.+?<span class="title">([^<]+)/s', $html, $matches)) {
        return false;
    }

    $titles = array();
    foreach ($matches[1] as $item) {
        $converted = iconv('utf-8', 'gbk', $item);
        // iconv() returns false when a character has no GBK representation;
        // keep the original text rather than printing an empty title.
        $titles[] = ($converted === false) ? $item : $converted;
    }

    return $titles;
}

/**
 * Prints one title prefixed with its running position in the overall list.
 *
 * @param string $title Title text to print.
 *
 * @return void
 */
function printTitle($title)
{
    global $count;

    ++$count;
    printf("%3d %s\n", $count, $title);
}