通过JAVA获取优酷、土豆、酷6、6间房等视频

通过JAVA获取优酷、土豆、酷6、6间房等视频

通过JAVA获取优酷、土豆、酷6、6间房、56视频,现在很多社会网站都有这个功能,用户输入优酷、土豆、酷6、6间房、56视频地址后,能找到对应的视频及视频的缩略图,有些社区网站还能获取到视频的时长。
比如:新浪微博就有这个功能,当用户输入优酷、土豆、酷6、6间房、56视频网址后,就能获取到相应的视频地址及视频的缩略图。

代码如下:
import  org.jsoup.Jsoup;
import  org.jsoup.nodes.Document;
import  org.jsoup.nodes.Element;
import  org.jsoup.select.Elements;

public   class  VideoUtil {
    
    
/**
     * 获取视频信息
     * 
@param  url
     * 
@return
     
*/
    
public   static  Video getVideoInfo(String url){
        Video video 
=   new  Video();
        
        
if (url.indexOf( " v.youku.com " ) !=- 1 ){
            
try  {
                video 
=  getYouKuVideo(url);
            } 
catch  (Exception e) {
                video 
=   null ;
            }
        }
else   if (url.indexOf( " tudou.com " ) !=- 1 ){
            
try  {
                video 
=  getTudouVideo(url);
            } 
catch  (Exception e) {
                video 
=   null ;
            }
        }
else   if (url.indexOf( " v.ku6.com " ) !=- 1 ){
            
try  {
                video 
=  getKu6Video(url);
            } 
catch  (Exception e) {
                video 
=   null ;
            }
        }
else   if (url.indexOf( " 6.cn " ) !=- 1 ){
            
try  {
                video 
=  get6Video(url);
            } 
catch  (Exception e) {
                video 
=   null ;
            }
        }
else   if (url.indexOf( " 56.com " ) !=- 1 ){
            
try  {
                video 
=  get56Video(url);
            } 
catch  (Exception e) {
                video 
=   null ;
            }
        }
        
        
return  video;
    }
    
    
    
/**
     * 获取优酷视频
     * 
@param  url  视频URL
     
*/
    
public   static  Video getYouKuVideo(String url)  throws  Exception{
        Document doc 
=  getURLContent(url);
        
        
/**
         *获取视频缩略图 
         
*/
        String pic 
=  getElementAttrById(doc,  " s_sina " " href " );
        
int  local  =  pic.indexOf( " pic= " );
        pic 
=  pic.substring(local + 4 );
        
        
/**
         * 获取视频地址
         
*/         
        String flash 
=  getElementAttrById(doc,  " link2 " " value " );
        
        
/**
         * 获取视频时间
         
*/     
        String time 
=  getElementAttrById(doc,  " download " " href " );
        String []arrays 
=  time.split( " \\| " );
        time 
=  arrays[ 4 ];
        
        Video video 
=   new  Video();
        video.setPic(pic);
        video.setFlash(flash);
        video.setTime(time);
        
        
return  video;
    }
    
    
    
/**
     * 获取土豆视频
     * 
@param  url  视频URL
     
*/
    
public   static  Video getTudouVideo(String url)  throws  Exception{
        Document doc 
=  getURLContent(url);
        String content 
=  doc.html();
        
int  beginLocal  =  content.indexOf( " <script>document.domain " );
        
int  endLocal  =  content.indexOf( " </script> " );
        content 
=  content.substring(beginLocal, endLocal);
        
        
/**
         * 获取视频地址
         
*/     
        String flash 
=  getScriptVarByName( " iid_code " , content);
        flash 
=   " http://www.tudou.com/v/ "   +  flash  +   " /v.swf " ;
        
        
/**
         *获取视频缩略图 
         
*/
        String pic 
=  getScriptVarByName( " thumbnail " , content);
        
        
/**
         * 获取视频时间
         
*/     
        String time 
=  getScriptVarByName( " time " , content);

        Video video 
=   new  Video();
        video.setPic(pic);
        video.setFlash(flash);
        video.setTime(time);
        
        
return  video;
    }
    
    
    
/**
     * 获取酷6视频
     * 
@param  url  视频URL
     
*/
    
public   static  Video getKu6Video(String url)  throws  Exception{
        Document doc 
=  getURLContent(url);
        
        
/**
         * 获取视频地址
         
*/
        Element flashEt 
=  doc.getElementById( " outSideSwfCode " );
        String flash 
=  flashEt.attr( " value " );
        
        
/**
         * 获取视频缩略图
         
*/
        Element picEt 
=  doc.getElementById( " plVideosList " );
        String time 
=   null ;
        String pic 
=   null ;
        
if (picEt != null ){
            Elements pics 
=  picEt.getElementsByTag( " img " );
            pic 
=  pics.get( 0 ).attr( " src " );
            
            
/**
             * 获取视频时长
             
*/
            Element timeEt 
=  picEt.select( " span.review>cite " ).first(); 
            time 
=  timeEt.text();
        }
else {
            pic 
=  doc.getElementsByClass( " s_pic " ).first().text();
        }
        
        Video video 
=   new  Video();
        video.setPic(pic);
        video.setFlash(flash);
        video.setTime(time);
        
        
return  video;
        
    }
    
    
    
/**
     * 获取6间房视频
     * 
@param  url  视频URL
     
*/
    
public   static  Video get6Video(String url)  throws  Exception{
        Document doc 
=  getURLContent(url);
        
        
/**
         * 获取视频缩略图
         
*/
        Element picEt 
=  doc.getElementsByClass( " summary " ).first();
        String pic 
=  picEt.getElementsByTag( " img " ).first().attr( " src " );
        
        
/**
         * 获取视频时长
         
*/
        String time 
=  getVideoTime(doc, url,  " watchUserVideo " );
        
if (time == null ){
            time 
=  getVideoTime(doc, url,  " watchRelVideo " );
        }
        
        
/**
         * 获取视频地址
         
*/
        Element flashEt 
=  doc.getElementById( " video-share-code " );
        doc 
=  Jsoup.parse(flashEt.attr( " value " ));  
        String flash 
=  doc.select( " embed " ).attr( " src " );
        
        Video video 
=   new  Video();
        video.setPic(pic);
        video.setFlash(flash);
        video.setTime(time);
        
        
return  video;
    }
    
    
    
/**
     * 获取56视频
     * 
@param  url  视频URL
     
*/
    
public   static  Video get56Video(String url)  throws  Exception{
        Document doc 
=  getURLContent(url);
        String content 
=  doc.html();
        
        
/**
         * 获取视频缩略图
         
*/
        
int  begin  =  content.indexOf( " \ " img\ " :\ "" );
        content  =  content.substring(begin + 7 , begin + 200 );
        
int  end  =  content.indexOf( " \ " }; " );
        String pic  =  content.substring( 0 , end).trim();
        pic 
=  pic.replaceAll( " \\\\ " "" );        
        
        
/**
         * 获取视频地址
         
*/
        String flash 
=   " http://player.56.com "   +  url.substring(url.lastIndexOf( " / " ), url.lastIndexOf( " .html " ))  +   " .swf " ;
        
        Video video 
=   new  Video();
        video.setPic(pic);
        video.setFlash(flash);
        
        
return  video;
    }

    
/**
     * 获取6间房视频时长    
     
*/
    
private   static  String getVideoTime(Document doc, String url, String id) {
        String time 
=   null ;
        
        Element timeEt 
=  doc.getElementById(id); 
        Elements links 
=  timeEt.select( " dt > a " );
        
        
        
for  (Element link : links) {
          String linkHref 
=  link.attr( " href " );
          
if (linkHref.equalsIgnoreCase(url)){
              time 
=  link.parent().getElementsByTag( " em " ).first().text();
              
break ;
          }
        }
        
return  time;
    }
    
            
    
/**
     * 获取script某个变量的值
     * 
@param  name  变量名称
     * 
@return    返回获取的值 
     
*/
    
private   static  String getScriptVarByName(String name, String content){
        String script 
=  content;
        
        
int  begin  =  script.indexOf(name);
        
        script 
=  script.substring(begin + name.length() + 2 );
        
        
int  end  =  script.indexOf( " , " );
        
        script 
=  script.substring( 0 ,end);
        
        String result
= script.replaceAll( " ' " "" );
        result 
=  result.trim();
        
        
return  result;
    }
    
    
    
/**
     * 根据HTML的ID键及属于名,获取属于值
     * 
@param  id  HTML的ID键
     * 
@param  attrName  属于名
     * 
@return   返回属性值
     
*/
    
private   static  String getElementAttrById(Document doc, String id, String attrName) throws  Exception{
        Element et 
=  doc.getElementById(id);
        String attrValue 
=  et.attr(attrName);
        
        
return  attrValue;
    }
    
    
    
    
/**
     * 获取网页的内容
     
*/
    
private   static  Document getURLContent(String url)  throws  Exception{
        Document doc 
=  Jsoup.connect(url)
          .data(
" query " " Java " )
          .userAgent(
" Mozilla " )
          .cookie(
" auth " " token " )
          .timeout(
6000 )
          .post();
        
return  doc;
    }
    
    
    
public   static   void  main(String[] args) {
        
// String url = " http://v.youku.com/v_show/id_XMjU0MjI2NzY0.html ";
        
// String url = " http://www.tudou.com/programs/view/pVploWOtCQM/ ";
        
// String url = " http://v.ku6.com/special/show_4024167/9t7p64bisV2A31Hz.html ";
        
// String url = " http://v.ku6.com/show/BpP5LeyVwvikbT1F.html ";
        
// String url = " http://6.cn/watch/14757577.html ";
        String url  =   " http://www.56.com/u64/v_NTkzMDEzMTc.html " ;
        Video video 
=  getVideoInfo(url);
        System.out.println(
" 视频缩略图: " + video.getPic());
        System.out.println(
" 视频地址: " + video.getFlash());
        System.out.println(
" 视频时长: " + video.getTime());
    }
}

视频封装类

public   class  Video {
    
private  String flash;
    
private  String pic;
    
private  String time;
    
public  String getFlash() {
        
return  flash;
    }
    
public   void  setFlash(String flash) {
        
this .flash  =  flash;
    }
    
public  String getPic() {
        
return  pic;
    }
    
public   void  setPic(String pic) {
        
this .pic  =  pic;
    }
    
public  String getTime() {
        
return  time;
    }
    
public   void  setTime(String time) {
        
this .time  =  time;
    }
}

其中要用到一个JAR包,链接地址如下:
http://jsoup.org/packages/jsoup-1.5.2.jar

你可能感兴趣的:(通过JAVA获取优酷、土豆、酷6、6间房等视频)