PHP图片采集程序--图片采集类

<?php
class Collection{
    protected $url;             //采集地址
    protected $prefix;          //重命名文件前缀
    protected $style;           //需要采集的图片格式,传入一个数组
    const prel = '/(?:http?|https?):\/\/(?:[^\.\/\(\)\?]+)\.(?:[^\.\/]+)\.(?:com|cn|net|org)\/(?:[^\.:\"\'\(\)\?]+)\.(jpg|png|gif)/i';          //采集规则
    //构造函数
    function __construct($url,$prefix,$style){
        switch($this->checkdata($url,$prefix,$style)){
            case 1:
                echo '<script>alert("采集地址不能为空!")</script>';
                exit;
                break;
            case 2:
                echo '<script>alert("需要采集的图片格式,应该为数组!")</script>';
                exit;
                break;
            case 3:
                echo '<script>alert("需要采集的图片格式,不能为空!")</script>';
                exit;
                break;
            case 4:
                echo '<script>alert("文件名不能含有. / |或用空格开头!")</script>';
                exit;
        }
        $this->url = $url;
        $this->prefix = $prefix;
        $this->style = $style;
    }
    //开始采集数据
    public function action(){
        $url = $this->checkurl();
        $imgurl = $this->collecturl($url);
        $this->savafile($imgurl);
    }
    //url处理
    protected function checkurl(){
        $munprel = '/\([0-9]+,[0-9]+\)/i';
        $myurl;
        if(preg_match($munprel,$this->url,$arr)){
            $temp = substr($arr[0],1,strlen($arr[0])-2);
            $mymunber = explode(',',$temp);
            $temparr = explode($arr[0],$this->url);
            for($i=$mymunber[0];$i<=$mymunber[1];$i++){
                $myurl[] = $temparr[0].$i.$temparr[1];
            }
        }else{
            $myurl = $this->url;
        }
        return $myurl;
    }
    //文件保存
    protected function savafile($imgurl){
        if(!empty($imgurl)){
            foreach($imgurl[0] as $key=>$value){
                $filename = '';
                if(in_array($imgurl[1][$key],$this->style)){
                    $size = @getimagesize($value);
                    if($size === false){
                        continue;
                    }
                    list($w,$h,$t,$a) = $size;
                    if($w<200 || $h<200){
                        continue;
                    } 
                    ob_start();
                    readfile($value);
                    $obj = ob_get_contents();
                    ob_end_clean();
                    $dir = 'F:/php/';
                    if(!is_dir($dir)){
                        mkdir($dir,0777);
                    }
                    if(!empty($this->prefix)){
                        $filename = $dir.$this->prefix.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
                    }else{
                        $filename = $dir.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
                    }
                    $fo = @fopen($filename,'wb');
                    if($fo === false){
                        echo '<script>alert("创建文件失败,文件目录不可写!")</script>';
                        exit;
                    }
                    $fw = fwrite($fo,$obj);
                    echo '<div style="width:350px;background:#ddd;">'.$filename.'采集成功</div>';
                }
            }
        }
    }
     
    //地址采集函数,包括图片后缀名
    protected function collecturl($url){
        set_time_limit(0);
        if(is_array($url)){
            $arr = array();
            $imgkey = array();
            foreach($url as $value){
                $code = file_get_contents($value);
                preg_match_all(self::prel,$code,$arrimg);
                $arr = array_merge($arr,$arrimg[0]);
                $imgkey = array_merge($imgkey,$arrimg[1]);
            }
            return array($arr,$imgkey);
        }else{
            $code = file_get_contents($url);
            preg_match_all(self::prel,$code,$arrimg);
            return $arrimg;
        }
    }
    //检验数据
    private function checkdata($url,$prefix,$style){
        if(empty($url)){
            return 1;
        }elseif(!is_array($style)){
            return 2;
        }elseif(count($style)==0){
            return 3;
        }elseif(stripos($prefix,'.') !== false || stripos($prefix,'/') !== false || stripos($prefix,'|') !== false){
            return 4;
        }
    }
}
     
     
     
     
     
     
     
?>
class Collection{
    protected $url;             //采集地址
    protected $prefix;          //重命名文件前缀
    protected $style;           //需要采集的图片格式,传入一个数组
    const prel = '/(?:http?|https?):\/\/(?:[^\.\/\(\)\?]+)\.(?:[^\.\/]+)\.(?:com|cn|net|org)\/(?:[^\.:\"\'\(\)\?]+)\.(jpg|png|gif)/i';          //采集规则
    //构造函数
    function __construct($url,$prefix,$style){
        switch($this->checkdata($url,$prefix,$style)){
            case 1:
                echo '<script>alert("采集地址不能为空!")</script>';
                exit;
                break;
            case 2:
                echo '<script>alert("需要采集的图片格式,应该为数组!")</script>';
                exit;
                break;
            case 3:
                echo '<script>alert("需要采集的图片格式,不能为空!")</script>';
                exit;
                break;
            case 4:
                echo '<script>alert("文件名不能含有. / |或用空格开头!")</script>';
                exit;
        }
        $this->url = $url;
        $this->prefix = $prefix;
        $this->style = $style;
    }
    //开始采集数据
    public function action(){
        $url = $this->checkurl();
        $imgurl = $this->collecturl($url);
        $this->savafile($imgurl);
    }
    //url处理
    protected function checkurl(){
        $munprel = '/\([0-9]+,[0-9]+\)/i';
        $myurl;
        if(preg_match($munprel,$this->url,$arr)){
            $temp = substr($arr[0],1,strlen($arr[0])-2);
            $mymunber = explode(',',$temp);
            $temparr = explode($arr[0],$this->url);
            for($i=$mymunber[0];$i<=$mymunber[1];$i++){
                $myurl[] = $temparr[0].$i.$temparr[1];
            }
        }else{
            $myurl = $this->url;
        }
        return $myurl;
    }
    //文件保存
    protected function savafile($imgurl){
        if(!empty($imgurl)){
            foreach($imgurl[0] as $key=>$value){
                $filename = '';
                if(in_array($imgurl[1][$key],$this->style)){
                    $size = @getimagesize($value);
                    if($size === false){
                        continue;
                    }
                    list($w,$h,$t,$a) = $size;
                    if($w<200 || $h<200){
                        continue;
                    } 
                    ob_start();
                    readfile($value);
                    $obj = ob_get_contents();
                    ob_end_clean();
                    $dir = 'F:/php/';
                    if(!is_dir($dir)){
                        mkdir($dir,0777);
                    }
                    if(!empty($this->prefix)){
                        $filename = $dir.$this->prefix.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
                    }else{
                        $filename = $dir.date('Ymd').rand(10000,99999).'.'.$imgurl[1][$key];
                    }
                    $fo = @fopen($filename,'wb');
                    if($fo === false){
                        echo '<script>alert("创建文件失败,文件目录不可写!")</script>';
                        exit;
                    }
                    $fw = fwrite($fo,$obj);
                    echo '<div style="width:350px;background:#ddd;">'.$filename.'采集成功</div>';
                }
            }
        }
    }
     
    //地址采集函数,包括图片后缀名
    protected function collecturl($url){
        set_time_limit(0);
        if(is_array($url)){
            $arr = array();
            $imgkey = array();
            foreach($url as $value){
                $code = file_get_contents($value);
                preg_match_all(self::prel,$code,$arrimg);
                $arr = array_merge($arr,$arrimg[0]);
                $imgkey = array_merge($imgkey,$arrimg[1]);
            }
            return array($arr,$imgkey);
        }else{
            $code = file_get_contents($url);
            preg_match_all(self::prel,$code,$arrimg);
            return $arrimg;
        }
    }
    //检验数据
    private function checkdata($url,$prefix,$style){
        if(empty($url)){
            return 1;
        }elseif(!is_array($style)){
            return 2;
        }elseif(count($style)==0){
            return 3;
        }elseif(stripos($prefix,'.') !== false || stripos($prefix,'/') !== false || stripos($prefix,'|') !== false){
            return 4;
        }
    }
}

 

posted on 2016-05-09 15:13  岩_生  阅读(355)  评论(0编辑  收藏  举报

导航