代码来自本人博客:
http://www.taoniwu.com/archives/3234.html各位大神如果有什么好的建议,感谢提出~~~~~
- ?class Collection{
- protected $url; //采集地址
- protected $prefix; //重命名文件前缀
- protected $style; //需要采集的图片格式,传入一个数组
- const prel = '/(?:http?|https?):\/\/(?:[^\.\/\(\)\?]+)\.(?:[^\.\/]+)\.(?:com|cn|net|org)\/(?:[^\.:\"\'\(\)\?]+)\.(jpg|png|gif)/i'; //采集规则
- //构造函数
- function __construct($url,$prefix,$style){
- switch($this->checkdata($url,$prefix,$style)){
- case 1:
- echo '';
- exit;
- break;
- case 2:
- echo '';
- exit;
- break;
- case 3:
- echo '';
- exit;
- break;
- case 4:
- echo '';
- exit;
- }
- $this->url = $url;
- $this->prefix = $prefix;
- $this->style = $style;
- }
- //开始采集数据
- public function action(){
- $url = $this->checkurl();
- $imgurl = $this->collecturl($url);
- $this->savafile($imgurl);
- }
- //url处理
- protected function checkurl(){
- $munprel = '/\([0-9]+,[0-9]+\)/i';
- $myurl;
- if(preg_match($munprel,$this->url,$arr)){
- $temp = substr($arr[0],1,strlen($arr[0])-2);
- $mymunber = explode(',',$temp);
- $temparr = explode($arr[0],$this->url);
- for($i=$mymunber[0];$i<=$mymunber[1];$i++){
- $myurl[] = $temparr[0].$i.$temparr[1];
- }
- }else{
- $myurl = $this->url;
- }
- return $myurl;
- }
- //文件保存
- protected function savafile($imgurl){
- if(!empty($imgurl)){
- foreach($imgurl[0] as $key=>$value){
- $filename = '';
- if(in_array($imgurl[1][$key],$this->style)){
- $size = @getimagesize($value);
- if($size === false){
- continue;
- }
- list($w,$h,$t,$a) = $size;
- if($w<200 || $h<200){
- continue;
- }
- ob_start();
- readfile($value);
- $obj = ob_get_contents();
- ob_end_clean();
- $dir = 'F:/php/';
- if(!is_dir($dir)){
- mkdir($dir,0777);
- }
- if(!empty($this->prefix)){
- $filename = $dir.$this->prefix.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
- }else{
- $filename = $dir.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
- }
- $fo = @fopen($filename,'wb');
- if($fo === false){
- echo '';
- exit;
- }
- $fw = fwrite($fo,$obj);
- echo ''.$filename.'采集成功';
- }
- }
- }
- }
-
- //地址采集函数,包括图片后缀名
- protected function collecturl($url){
- set_time_limit(0);
- if(is_array($url)){
- $arr = array();
- $imgkey = array();
- foreach($url as $value){
- $code = file_get_contents($value);
- preg_match_all(self::prel,$code,$arrimg);
- $arr = array_merge($arr,$arrimg[0]);
- $imgkey = array_merge($imgkey,$arrimg[1]);
- }
- return array($arr,$imgkey);
- }else{
- $code = file_get_contents($url);
- preg_match_all(self::prel,$code,$arrimg);
- return $arrimg;
- }
- }
- //检验数据
- private function checkdata($url,$prefix,$style){
- if(empty($url)){
- return 1;
- }elseif(!is_array($style)){
- return 2;
- }elseif(count($style)==0){
- return 3;
- }elseif(stripos($prefix,'.') !== false || stripos($prefix,'/') !== false || stripos($prefix,'|') !== false){
- return 4;
- }
- }
- }
-
-
-
-
-
-
-
- ?>
- class Collection{
- protected $url; //采集地址
- protected $prefix; //重命名文件前缀
- protected $style; //需要采集的图片格式,传入一个数组
- const prel = '/(?:http?|https?):\/\/(?:[^\.\/\(\)\?]+)\.(?:[^\.\/]+)\.(?:com|cn|net|org)\/(?:[^\.:\"\'\(\)\?]+)\.(jpg|png|gif)/i'; //采集规则
- //构造函数
- function __construct($url,$prefix,$style){
- switch($this->checkdata($url,$prefix,$style)){
- case 1:
- echo '';
- exit;
- break;
- case 2:
- echo '';
- exit;
- break;
- case 3:
- echo '';
- exit;
- break;
- case 4:
- echo '';
- exit;
- }
- $this->url = $url;
- $this->prefix = $prefix;
- $this->style = $style;
- }
- //开始采集数据
- public function action(){
- $url = $this->checkurl();
- $imgurl = $this->collecturl($url);
- $this->savafile($imgurl);
- }
- //url处理
- protected function checkurl(){
- $munprel = '/\([0-9]+,[0-9]+\)/i';
- $myurl;
- if(preg_match($munprel,$this->url,$arr)){
- $temp = substr($arr[0],1,strlen($arr[0])-2);
- $mymunber = explode(',',$temp);
- $temparr = explode($arr[0],$this->url);
- for($i=$mymunber[0];$i<=$mymunber[1];$i++){
- $myurl[] = $temparr[0].$i.$temparr[1];
- }
- }else{
- $myurl = $this->url;
- }
- return $myurl;
- }
- //文件保存
- protected function savafile($imgurl){
- if(!empty($imgurl)){
- foreach($imgurl[0] as $key=>$value){
- $filename = '';
- if(in_array($imgurl[1][$key],$this->style)){
- $size = @getimagesize($value);
- if($size === false){
- continue;
- }
- list($w,$h,$t,$a) = $size;
- if($w<200 || $h<200){
- continue;
- }
- ob_start();
- readfile($value);
- $obj = ob_get_contents();
- ob_end_clean();
- $dir = 'F:/php/';
- if(!is_dir($dir)){
- mkdir($dir,0777);
- }
- if(!empty($this->prefix)){
- $filename = $dir.$this->prefix.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
- }else{
- $filename = $dir.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
- }
- $fo = @fopen($filename,'wb');
- if($fo === false){
- echo '';
- exit;
- }
- $fw = fwrite($fo,$obj);
- echo ''.$filename.'采集成功';
- }
- }
- }
- }
-
- //地址采集函数,包括图片后缀名
- protected function collecturl($url){
- set_time_limit(0);
- if(is_array($url)){
- $arr = array();
- $imgkey = array();
- foreach($url as $value){
- $code = file_get_contents($value);
- preg_match_all(self::prel,$code,$arrimg);
- $arr = array_merge($arr,$arrimg[0]);
- $imgkey = array_merge($imgkey,$arrimg[1]);
- }
- return array($arr,$imgkey);
- }else{
- $code = file_get_contents($url);
- preg_match_all(self::prel,$code,$arrimg);
- return $arrimg;
- }
- }
- //检验数据
- private function checkdata($url,$prefix,$style){
- if(empty($url)){
- return 1;
- }elseif(!is_array($style)){
- return 2;
- }elseif(count($style)==0){
- return 3;
- }elseif(stripos($prefix,'.') !== false || stripos($prefix,'/') !== false || stripos($prefix,'|') !== false){
- return 4;
- }
- }
- }
|