php 获取优酷视频的真实地址(2014.6月新算法)

  上个礼拜发现优酷改版了,各种过滤优酷广告的插件都失效了,于是我百度了一下(谷歌也不能用了)发现优酷改算法了,在ckplayer论坛发现有人在6月25号发了个php 的优酷代理文件,下载下来发现,能用但只能获取mp4格式的视频地址,而且php还加密了,没办法查看源码,后来通过微盾解密发现其中的源码,结合以前自己写的一个优酷视频解析类。。。。

感谢    3shi大大 具体分析请见 3shi大大的文章  优酷视频真实地址解析  (当然现在不能用了,主要看分析

 

ps.  新算法是从别人那里解密出来的所以有可能存在错误,当然也没有注释,不过我试了几个视频都可以解析。

 

下面是源码:

文件名为:youku.class.php

  1 <?php
  2 
  3 class Youku {
  4 
  5     const USER_AGENT = "Mozilla/5.0 (Windows NT 5.1) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/34.0.1847.116 Safari/537.36";
  6     const REFERER = "http://www.youku.com";
  7     const FORM_ENCODE = "GBK";
  8     const TO_ENCODE = "UTF-8";
  9     private static $base = "http://v.youku.com/player/getPlaylist/VideoIDS/";
 10     private static $source = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ/\\:._-1234567890";
 11     private static $sz = '-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,-1,62,-1,-1,-1,63,52,53,54,55,56,57,58,59,60,61,-1,-1,-1,-1,-1,-1,-1,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,-1,-1,-1,-1,-1,-1,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,-1,-1,-1,-1,-1';
 12     private static $str = 'ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/';
 13 
 14     public static function parse($url){
 15         preg_match("#id\_([\w=]+)#", $url, $matches); //id里可以有=号
 16         if (empty($matches)){
 17             $html = self::_cget($url);
 18             preg_match("#videoId2\s*=\s*\'(\w+)\'#", $html, $matches);
 19             if(!$matches) return false;
 20         }
 21         //根据you vid 获取相应的视频地址
 22         return self::_getYouku(trim($matches[1]));
 23     }
 24     /**
 25      * [_cget curl获取数据]
 26      * @param  [type]  $url     [url地址]
 27      * @param  boolean $convert [是否转换编码]
 28      * @param  integer $timeout [超时时间]
 29      * @return [type]           [description]
 30      */
 31     public static function _cget($url,$convert=false,$timeout=10){
 32         $ch=curl_init($url);
 33         curl_setopt($ch,CURLOPT_RETURNTRANSFER,1);
 34         curl_setopt($ch,CURLOPT_TIMEOUT,$timeout);
 35         curl_setopt($ch,CURLOPT_CONNECTTIMEOUT,$timeout);
 36         curl_setopt($ch,CURLOPT_USERAGENT,self::USER_AGENT);
 37         curl_setopt($ch,CURLOPT_REFERER,self::REFERER);       
 38         curl_setopt($ch,CURLOPT_FOLLOWLOCATION,1); //跟随301跳转
 39         curl_setopt($ch,CURLOPT_AUTOREFERER,1); //自动设置referer              
 40         $res=curl_exec($ch);
 41         curl_close($ch);
 42         if($convert){
 43             $res=mb_convert_encoding($res,self::TO_ENCODE,self::FORM_ENCODE);
 44         }
 45         return $res;
 46     }    
 47 
 48     //start 获得优酷视频需要用到的方法
 49     private static function getSid(){
 50         $sid = time().(mt_rand(0,9000)+10000);
 51         return $sid;
 52     }
 53 
 54     private static function getKey($key1,$key2){
 55         $a = hexdec($key1);
 56         $b = $a ^0xA55AA5A5;
 57         $b = dechex($b);
 58         return $key2.$b;
 59     }
 60 
 61     private static function getFileid($fileId,$seed){
 62         $mixed = self::getMixString($seed);
 63         $ids = explode("*",rtrim($fileId,'*')); //去掉末尾的*号分割为数组
 64         $realId = "";
 65         for ($i=0;$i<count($ids);$i++){
 66             $idx = $ids[$i];
 67             $realId .= substr($mixed,$idx,1);
 68         }  
 69         return $realId;
 70     } 
 71 
 72     private static function getMixString($seed){
 73         $mixed = "";
 74         $source = self::$source;
 75         $len = strlen($source);
 76         for($i=0;$i<$len;$i++){
 77             $seed = ($seed * 211 + 30031)%65536;
 78             $index = ($seed / 65536 * strlen($source));
 79             $c = substr($source,$index,1);
 80             $mixed .= $c;
 81             $source = str_replace($c,"",$source);
 82         }
 83         return $mixed;
 84     }
 85 
 86     private static function yk_d($a){
 87         if (!$a) {
 88             return '';
 89         }
 90         $f = strlen($a);
 91         $b = 0;
 92         $str = self::$str;
 93         for ($c = ''; $b < $f;) {
 94             $e = self::charCodeAt($a, $b++) & 255;
 95             if ($b == $f) {
 96                 $c .= self::charAt($str, $e >> 2);
 97                 $c .= self::charAt($str, ($e & 3) << 4);
 98                 $c .= '==';
 99                 break;
100             }
101             $g = self::charCodeAt($a, $b++);
102             if ($b == $f) {
103                 $c .= self::charAt($str, $e >> 2);
104                 $c .= self::charAt($str, ($e & 3) << 4 | ($g & 240) >> 4);
105                 $c .= self::charAt($str, ($g & 15) << 2);
106                 $c .= '=';
107                 break;
108             }
109             $h = self::charCodeAt($a, $b++);
110             $c .= self::charAt($str, $e >> 2);
111             $c .= self::charAt($str, ($e & 3) << 4 | ($g & 240) >> 4);
112             $c .= self::charAt($str, ($g & 15) << 2 | ($h & 192) >> 6);
113             $c .= self::charAt($str, $h & 63);
114         }
115         return $c;
116     }
117     private static function yk_na($a){
118         if (!$a) {
119             return '';
120         }
121 
122         $h = explode(',', self::$sz);
123         $i = strlen($a);
124         $f = 0;
125         for ($e = ''; $f < $i;) {
126             do {
127                 $c = $h[self::charCodeAt($a, $f++) & 255];
128             } while ($f < $i && -1 == $c);
129             if (-1 == $c) {
130                 break;
131             }
132             do {
133                 $b = $h[self::charCodeAt($a, $f++) & 255];
134             } while ($f < $i && -1 == $b);
135             if (-1 == $b) {
136                 break;
137             }
138             $e .= self::fromCharCode($c << 2 | ($b & 48) >> 4);
139             do {
140                 $c = self::charCodeAt($a, $f++) & 255;
141                 if (61 == $c) {
142                     return $e;
143                 }
144                 $c = $h[$c];
145             } while ($f < $i && -1 == $c);
146             if (-1 == $c) {
147                 break;
148             }
149             $e .= self::fromCharCode(($b & 15) << 4 | ($c & 60) >> 2);
150             do {
151                 $b = self::charCodeAt($a, $f++) & 255;
152                 if (61 == $b) {
153                     return $e;
154                 }
155                 $b = $h[$b];
156             } while ($f < $i && -1 == $b);
157             if (-1 == $b) {
158                 break;
159             }
160             $e .= self::fromCharCode(($c & 3) << 6 | $b);
161         }
162         return $e;
163     }
164     private static function yk_e($a, $c){
165         for ($f = 0, $i, $e = '', $h = 0; 256 > $h; $h++) {
166             $b[$h] = $h;
167         }
168         for ($h = 0; 256 > $h; $h++) {
169             $f = (($f + $b[$h]) + self::charCodeAt($a, $h % strlen($a))) % 256;
170             $i = $b[$h];
171             $b[$h] = $b[$f];
172             $b[$f] = $i;
173         }
174         for ($q = ($f = ($h = 0)); $q < strlen($c); $q++) {
175             $h = ($h + 1) % 256;
176             $f = ($f + $b[$h]) % 256;
177             $i = $b[$h];
178             $b[$h] = $b[$f];
179             $b[$f] = $i;
180             $e .= self::fromCharCode(self::charCodeAt($c, $q) ^ $b[($b[$h] + $b[$f]) % 256]);
181         }
182         return $e;
183     }
184     
185     private static function fromCharCode($codes){
186         if (is_scalar($codes)) {
187             $codes = func_get_args();
188         }
189         $str = '';
190         foreach ($codes as $code) {
191             $str .= chr($code);
192         }
193         return $str;
194     }
195     private static function charCodeAt($str, $index){
196         static $charCode = array();
197         $key = md5($str);
198         $index = $index + 1;
199         if (isset($charCode[$key])) {
200             return $charCode[$key][$index];
201         }
202         $charCode[$key] = unpack('C*', $str);
203         return $charCode[$key][$index];
204     }
205 
206     private static function charAt($str, $index = 0){
207         return substr($str, $index, 1);
208     }
209 
210 
211     /**
212      * [_getYouku description]
213      * @param  [type] $vid [视频id]
214      * @return [type]      [description]
215      */
216     public static function _getYouku($vid){
217         //$link = "http://v.youku.com/player/getPlayList/VideoIDS/{$vid}/Pf/4"; //获取视频信息json 有些视频获取不全(土豆网的 火影忍者)
218         $blink = self::$base.$vid;
219         $link = $blink."/Pf/4/ctype/12/ev/1";
220         $retval = self::_cget($link);
221         $bretval = self::_cget($blink);
222         if ($retval) {
223             $rs = json_decode($retval, true);
224             $brs = json_decode($bretval, true);
225             if(!empty($rs['data'][0]['error'])){
226                 return false;  //有错误返回false
227             }
228             $data = array();
229             $streamtypes = $rs['data'][0]['streamtypes'];  //可以输出的视频清晰度
230             $streamfileids = $rs['data'][0]['streamfileids'];
231             $seed = $rs['data'][0]['seed'];
232             $segs = $rs['data'][0]['segs'];
233             $ip = $rs['data'][0]['ip'];
234             $bsegs =  $brs['data'][0]['segs'];
235             list($sid, $token) = explode('_', self::yk_e('becaf9be', self::yk_na($rs['data'][0]['ep'])));
236             foreach ($segs as $key=>$val) {
237                 if(in_array($key,$streamtypes)){
238                     foreach($val as $k=> $v){
239                         $no = strtoupper(dechex($v['no'])); //转换为16进制 大写
240                         if(strlen($no) == 1){
241                             $no ="0".$no;  //no 为每段视频序号
242                         }
243                         //构建视频地址K值
244                         $_k = $v['k'];
245                         if ((!$_k || $_k == '') || $_k == '-1') {
246                             $_k = $bsegs[$key][$k]['k'];
247                         }
248                         $fileId = self::getFileid($streamfileids[$key],$seed);
249                         $fileId = substr($fileId,0,8).$no.substr($fileId,10);
250                         $ep = urlencode(iconv('gbk', 'UTF-8', self::yk_d(self::yk_e('bf7e5f01', ((($sid . '_') . $fileId) . '_') . $token))));
251                         //判断后缀类型 、获得后缀
252                         $typeArray = array("flv"=>"flv","mp4"=>"mp4","hd2"=>"flv","3gphd"=>"mp4","3gp"=>"flv","hd3"=>"flv");
253                         //判断视频清晰度  
254                         $sharpness = array("flv"=>"normal","flvhd"=>"normal","mp4"=>"high","hd2"=>"super","3gphd"=>"high","3gp"=>"normal","hd3"=>"original"); //清晰度 数组
255                         $fileType = $typeArray[$key];
256                         $data[$sharpness[$key]][$k] = "http://k.youku.com/player/getFlvPath/sid/".$sid."_00/st/{$fileType}/fileid/".$fileId."?K=".$_k."&hd=1&myp=0&ts=".((((($v['seconds'].'&ypp=0&ctype=12&ev=1&token=').$token).'&oip=').$ip).'&ep=').$ep;;
257                     }
258                 }
259             }
260             //返回 图片 标题 链接  时长  视频地址
261             $data['img'] = $rs['data'][0]['logo'];
262             $data['title'] = $rs['data'][0]['title'];
263             $data['seconds'] = $rs['data'][0]['seconds'];
264             return $data;
265         } else {
266             return false;
267         }
268     }
269     //end  获得优酷视频需要用到的方法
270 }

引入这个类就可以使用: 输出一个带有各种清晰度的 视频url 的数组。

1 require "youku.class.php";
2 $url = "http://v.youku.com/v_show/id_XNzM1NjQ0Mzgw.html";
3 $data = Youku::parse($url);
4 print_r($data);
posted @ 2014-07-07 16:18  keygle  阅读(14926)  评论(30编辑  收藏  举报