1. collection.class.php

<?php
class Collection{
	protected $url;				//采集地址
	protected $prefix;			//重命名文件前缀
	protected $style;			//需要采集的图片格式,传入一个数组
	const prel = '/(?:http?|https?):\/\/(?:[^\.\/\(\)\?]+)\.(?:[^\.\/]+)\.(?:com|cn|net|org)\/(?:[^\.:\"\'\(\)\?]+)\.(jpg|png|gif)/i';			//采集规则
	//构造函数
	function __construct($url,$prefix,$style){
		switch($this->checkdata($url,$prefix,$style)){
			case 1:
				echo '<script>alert("采集地址不能为空!")</script>';
				exit;
				break;
			case 2:
				echo '<script>alert("需要采集的图片格式,应该为数组!")</script>';
				exit;
				break;
			case 3:
				echo '<script>alert("需要采集的图片格式,不能为空!")</script>';
				exit;
				break;
			case 4:
				echo '<script>alert("文件名不能含有. / |或用空格开头!")</script>';
				exit;
		}
		$this->url = $url;
		$this->prefix = $prefix;
		$this->style = $style;
	}
	//开始采集数据
	public function action(){
		$url = $this->checkurl();
		$imgurl = $this->collecturl($url);
		$this->savafile($imgurl);
	}
	//url处理
	protected function checkurl(){
		$munprel = '/\([0-9]+,[0-9]+\)/i';
		$myurl;
		if(preg_match($munprel,$this->url,$arr)){
			$temp = substr($arr[0],1,strlen($arr[0])-2);
			$mymunber = explode(',',$temp);
			$temparr = explode($arr[0],$this->url);
			for($i=$mymunber[0];$i<=$mymunber[1];$i++){
				$myurl[] = $temparr[0].$i.$temparr[1];
			}
		}else{
			$myurl = $this->url;
		}
		return $myurl;
	}
	//文件保存
	protected function savafile($imgurl){
		if(!empty($imgurl)){
			foreach($imgurl[0] as $key=>$value){
				$filename = '';
				if(in_array($imgurl[1][$key],$this->style)){
				    $size = @getimagesize($value);
					if($size === false){
						continue;
					}
					list($w,$h,$t,$a) = $size;
					if($w<200 || $h<200){
						continue;
					} 
					ob_start();
					readfile($value);
					$obj = ob_get_contents();
					ob_end_clean();
					$dir = 'F:/php/';
					if(!is_dir($dir)){
						mkdir($dir,0777);
					}
					if(!empty($this->prefix)){
						$filename = $dir.$this->prefix.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
					}else{
						$filename = $dir.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
					}
					$fo = @fopen($filename,'wb');
					if($fo === false){
						echo '<script>alert("创建文件失败,文件目录不可写!")</script>';
						exit;
					}
					$fw = fwrite($fo,$obj);
					echo '<p style="width:350px;background:#ddd;">'.$filename.'采集成功</p>';
				}
			}
		}
	}
	
	//地址采集函数,包括图片后缀名
	protected function collecturl($url){
		set_time_limit(0);
		if(is_array($url)){
			$arr = array();
			$imgkey = array();
			foreach($url as $value){
				$code = file_get_contents($value);
				preg_match_all(self::prel,$code,$arrimg);
				$arr = array_merge($arr,$arrimg[0]);
				$imgkey = array_merge($imgkey,$arrimg[1]);
			}
			return array($arr,$imgkey);
		}else{
			$code = file_get_contents($url);
			preg_match_all(self::prel,$code,$arrimg);
			return $arrimg;
		}
	}
	//检验数据
	private function checkdata($url,$prefix,$style){
		if(empty($url)){
			return 1;
		}elseif(!is_array($style)){
			return 2;
		}elseif(count($style)==0){
			return 3;
		}elseif(stripos($prefix,'.') !== false || stripos($prefix,'/') !== false || stripos($prefix,'|') !== false){
			return 4;
		}
	}
}
	
	
	
	
	
	
	
?>
登录后复制


2. PHP图片采集程序--图片采集类

class Collection{
	protected $url;				//采集地址
	protected $prefix;			//重命名文件前缀
	protected $style;			//需要采集的图片格式,传入一个数组
	const prel = '/(?:http?|https?):\/\/(?:[^\.\/\(\)\?]+)\.(?:[^\.\/]+)\.(?:com|cn|net|org)\/(?:[^\.:\"\'\(\)\?]+)\.(jpg|png|gif)/i';			//采集规则
	//构造函数
	function __construct($url,$prefix,$style){
		switch($this->checkdata($url,$prefix,$style)){
			case 1:
				echo '<script>alert("采集地址不能为空!")</script>';
				exit;
				break;
			case 2:
				echo '<script>alert("需要采集的图片格式,应该为数组!")</script>';
				exit;
				break;
			case 3:
				echo '<script>alert("需要采集的图片格式,不能为空!")</script>';
				exit;
				break;
			case 4:
				echo '<script>alert("文件名不能含有. / |或用空格开头!")</script>';
				exit;
		}
		$this->url = $url;
		$this->prefix = $prefix;
		$this->style = $style;
	}
	//开始采集数据
	public function action(){
		$url = $this->checkurl();
		$imgurl = $this->collecturl($url);
		$this->savafile($imgurl);
	}
	//url处理
	protected function checkurl(){
		$munprel = '/\([0-9]+,[0-9]+\)/i';
		$myurl;
		if(preg_match($munprel,$this->url,$arr)){
			$temp = substr($arr[0],1,strlen($arr[0])-2);
			$mymunber = explode(',',$temp);
			$temparr = explode($arr[0],$this->url);
			for($i=$mymunber[0];$i<=$mymunber[1];$i++){
				$myurl[] = $temparr[0].$i.$temparr[1];
			}
		}else{
			$myurl = $this->url;
		}
		return $myurl;
	}
	//文件保存
	protected function savafile($imgurl){
		if(!empty($imgurl)){
			foreach($imgurl[0] as $key=>$value){
				$filename = '';
				if(in_array($imgurl[1][$key],$this->style)){
				    $size = @getimagesize($value);
					if($size === false){
						continue;
					}
					list($w,$h,$t,$a) = $size;
					if($w<200 || $h<200){
						continue;
					} 
					ob_start();
					readfile($value);
					$obj = ob_get_contents();
					ob_end_clean();
					$dir = 'F:/php/';
					if(!is_dir($dir)){
						mkdir($dir,0777);
					}
					if(!empty($this->prefix)){
						$filename = $dir.$this->prefix.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
					}else{
						$filename = $dir.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
					}
					$fo = @fopen($filename,'wb');
					if($fo === false){
						echo '<script>alert("创建文件失败,文件目录不可写!")</script>';
						exit;
					}
					$fw = fwrite($fo,$obj);
					echo '<p style="width:350px;background:#ddd;">'.$filename.'采集成功</p>';
				}
			}
		}
	}
	
	//地址采集函数,包括图片后缀名
	protected function collecturl($url){
		set_time_limit(0);
		if(is_array($url)){
			$arr = array();
			$imgkey = array();
			foreach($url as $value){
				$code = file_get_contents($value);
				preg_match_all(self::prel,$code,$arrimg);
				$arr = array_merge($arr,$arrimg[0]);
				$imgkey = array_merge($imgkey,$arrimg[1]);
			}
			return array($arr,$imgkey);
		}else{
			$code = file_get_contents($url);
			preg_match_all(self::prel,$code,$arrimg);
			return $arrimg;
		}
	}
	//检验数据
	private function checkdata($url,$prefix,$style){
		if(empty($url)){
			return 1;
		}elseif(!is_array($style)){
			return 2;
		}elseif(count($style)==0){
			return 3;
		}elseif(stripos($prefix,'.') !== false || stripos($prefix,'/') !== false || stripos($prefix,'|') !== false){
			return 4;
		}
	}
}
登录后复制
09-15 09:01